1
  2
  3
  4
  5
  6
  7
  8
  9
 10
 11
 12
 13
 14
 15
 16
 17
 18
 19
 20
 21
 22
 23
 24
 25
 26
 27
 28
 29
 30
 31
 32
 33
 34
 35
 36
 37
 38
 39
 40
 41
 42
 43
 44
 45
 46
 47
 48
 49
 50
 51
 52
 53
 54
 55
 56
 57
 58
 59
 60
 61
 62
 63
 64
 65
 66
 67
 68
 69
 70
 71
 72
 73
 74
 75
 76
 77
 78
 79
 80
 81
 82
 83
 84
 85
 86
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
//#pragma GCC optimize("Ofast")
//#pragma GCC optimize ("unroll-loops")
//#pragma GCC target("sse,sse2,sse3,ssse3,sse4,popcnt,abm,mmx,avx,tune=native")

#pragma warning(disable:4786)
#pragma warning(disable:4996)
#include <random>
#include <chrono>
#include <ctime>
#include<list>
#include <numeric>
#include<bitset>
#include<iostream>
#include<cstdio>
#include<algorithm>
#include<vector>
#include<set>
#include<map>
#include<functional>
#include<string>
#include<cstring>
#include<cstdlib>
#include<queue>
#include<utility>
#include<fstream>
#include<sstream>
#include<cmath>
#include<stack>
#include<assert.h>
#include<unordered_map>
#include<unordered_set>
#include <array>
#include <complex>
using namespace std;

// ---------------------------------------------------------------------------
// Convenience macros. They are plain textual substitutions, so arguments with
// side effects may be evaluated more than once (MAX, MIN, ABS, S, IN).
// ---------------------------------------------------------------------------

// Fill `a` with the byte value `b`; uses sizeof(a), so `a` must be a real
// array (not a pointer or a container).
#define MEM(a, b) memset(a, (b), sizeof(a))
// Zero-fill `a`; same sizeof(a) caveat as MEM.
#define CLR(a) memset(a, 0, sizeof(a))
// Larger / smaller of two values.
#define MAX(a, b) ((a) > (b) ? (a) : (b))
#define MIN(a, b) ((a) < (b) ? (a) : (b))
// Absolute value of X.
#define ABS(X) ( (X) > 0 ? (X) : ( -(X) ) )
// Square of X.
#define S(X) ( (X) * (X) )
// Container size cast to int. V is not parenthesized, so pass a simple name.
#define SZ(V) (int )V.size()
// for-loop with i running over 0 .. n-1.
#define FORN(i, n) for(int i = 0; i < n; i++)
// for-loop with i running over a .. b, both ends inclusive.
#define FORAB(i, a, b) for(int i = a; i <= b; i++)
// Expands to the begin/end iterator pair of V.
#define ALL(V) V.begin(), V.end()
// True when B <= A <= C.
#define IN(A, B, C)  ((B) <= (A) && (A) <= (C))
// Asserts that A lies in the closed range [B, C].
#define AIN(A, B, C) assert(IN(A, B, C))

// 64-bit signed integer used throughout the file.
typedef long long int LL;
// LLL is the "wide" integer alias; the 128-bit variant is commented out, so it
// is currently just another name for long long.
//typedef __int128 LLL;
typedef long long LLL;

// Shorthand aliases for common pair / vector instantiations.
typedef pair<int, int> PII;
typedef pair<LL, LL> PLL;
typedef pair<double, double> PDD;
typedef vector<int> VI;
typedef vector<LL> VL;
typedef vector<PLL> VPL;
typedef vector<PII> VP;
typedef vector<double> VD;
typedef vector<vector<int>> VVI;
typedef vector<string> VS;
typedef long double ld;

// Size limits for fixed-size tables.
// NOTE(review): MAXN2 expands to the unparenthesized text `MAXN*MAXN`, so an
// expression such as `x / MAXN2` would not group as intended — confirm before
// using it inside larger expressions.
#define MAXN 203
#define MAXN2 MAXN*MAXN
//#define MAXN 1006

// Default modulus constant (1e9 + 7); alternative values are kept commented out.
const LL MOD = 1000000007;
//const LL MOD = 998244353;
//const LL INF = 2000000000000000001LL; //2e18 + 1

// Runs the column-by-column recurrence for C columns over R rows and returns
// the final total reduced modulo p (result is always in [0, p)).
//
// Two tables are carried from one column to the next, both indexed 1..R with
// zero sentinels at 0 and R + 1:
//   colPrefix[i] = (v[1] + ... + v[i]) mod p     prefix sums of per-row values v
//   rowSuffix[i] = (w[i] + ... + w[R]) mod p     suffix sums of per-row values w
// For the first column v[i] = i and w[i] = R - i + 1. For every further
// column, with T = colPrefix[R] and j = R - i + 1:
//   v'[i] = i*T - i*rowSuffix[i+1] - (colPrefix[1] + ... + colPrefix[i-1])
//   w'[i] = j*T - j*colPrefix[i-1] - (rowSuffix[i+1] + ... + rowSuffix[R])
//
// Preconditions: R >= 0 and p >= 1. Products are formed in 64-bit arithmetic,
// so R * p must fit in a signed 64-bit integer.
static long long columnRecurrenceTotal(long long C, long long R, long long p) {
	std::vector<long long> colPrefix(R + 2, 0), rowSuffix(R + 2, 0);

	// Reduce with % rather than a single conditional subtraction: when p <= R
	// the term being added (i or R - i + 1) can itself exceed p, so one
	// subtraction would leave values outside [0, p).
	for (long long i = 1; i <= R; i++) {
		colPrefix[i] = (i + colPrefix[i - 1]) % p;
	}
	for (long long i = R; i >= 1; i--) {
		rowSuffix[i] = (R - i + 1 + rowSuffix[i + 1]) % p;
	}

	// Maps any (possibly negative) value to its representative in [0, p).
	auto normalize = [p](long long val) -> long long {
		val %= p;
		return val < 0 ? val + p : val;
	};

	for (long long col = 2; col <= C; col++) {
		std::vector<long long> nextColPrefix(R + 2, 0), nextRowSuffix(R + 2, 0);
		const long long total = colPrefix[R];

		// Forward pass: `running` holds colPrefix[1] + ... + colPrefix[i-1].
		long long running = 0;
		for (long long i = 1; i <= R; i++) {
			const long long value = normalize(i * total - i * rowSuffix[i + 1] - running);
			nextColPrefix[i] = (value + nextColPrefix[i - 1]) % p;
			running = (running + colPrefix[i]) % p;
		}

		// Backward pass: `running` holds rowSuffix[i+1] + ... + rowSuffix[R],
		// and j counts rows from the bottom (j = R - i + 1).
		running = 0;
		for (long long i = R, j = 1; i >= 1; i--, j++) {
			const long long value = normalize(j * total - running - j * colPrefix[i - 1]);
			nextRowSuffix[i] = (value + nextRowSuffix[i + 1]) % p;
			running = (running + rowSuffix[i]) % p;
		}

		colPrefix.swap(nextColPrefix);
		rowSuffix.swap(nextRowSuffix);
	}
	return colPrefix[R];
}

// Reads one test case "C R p" from stdin and prints the answer modulo p,
// followed by a newline, to stdout.
//
// ks: test-case index supplied by main(); not used by the computation.
//
// If the three integers cannot be read, or R < 0 or p <= 0, nothing is
// printed, because the tables cannot be sized and the modulus is undefined.
void solve(int ks) {
	(void)ks;
	long long C = 0, R = 0, p = 0;
	if (scanf("%lld %lld %lld", &C, &R, &p) != 3) return;
	if (R < 0 || p <= 0) return;
	printf("%lld\n", columnRecurrenceTotal(C, R, p));
}

// Hook called by main() before any solving starts; it currently performs no
// work and exists as a placeholder for precomputation.
void gen() {}

// Program entry point. In LOCAL builds stdin is redirected to a sample file.
// Runs gen(), then the solver (once, or once per test case when the flag
// below is enabled), and finally writes the time measured by clock() to stderr.
int main()
{
	const double started_at = clock();

#ifdef LOCAL
	freopen("C:\\Home\\Contests\\F\\sample.in", "r", stdin);
	//	freopen("out.out", "w", stdout);
#endif

	gen();

	// Set to true when the input starts with a test-case count.
	const bool has_case_count = false;
	if (!has_case_count) {
		solve(0);
	}
	else {
		int case_total;
		scanf("%d", &case_total);
		//AIN(case_total, 1, 5000);
		int case_no = 1;
		while (case_no <= case_total) {
			solve(case_no);
			++case_no;
		}
	}

	const double finished_at = clock();
	const double elapsed_seconds = (finished_at - started_at) / CLOCKS_PER_SEC;
	fprintf(stderr, "Time = %lf\n", elapsed_seconds);

	return 0;
}