P4245 【模板】任意模数NTT
不会 MTT,直接拆系数 FFT,也行。
但是要long double,否则会被卡精度,记得取模。
以及一些小细节问题。
// powered by c++11
// by Isaunoya
#include <bits/stdc++.h>
#define rep(i, x, y) for (register int i = (x); i <= (y); ++i)
#define Rep(i, x, y) for (register int i = (x); i >= (y); --i)
using namespace std;
using db = double;
using ll = long long;
using uint = unsigned int;
using ull = unsigned long long;
#define pii pair<int, int>
#define fir first
#define sec second
template <class T>
void cmax(T& x, const T& y) {
if (x < y) x = y;
}
template <class T>
void cmin(T& x, const T& y) {
if (x > y) x = y;
}
#define all(v) v.begin(), v.end()
#define sz(v) ((int)v.size())
#define pb emplace_back
template <class T>
void sort(vector<T>& v) {
sort(all(v));
}
template <class T>
void reverse(vector<T>& v) {
reverse(all(v));
}
template <class T>
void unique(vector<T>& v) {
sort(all(v)), v.erase(unique(all(v)), v.end());
}
void reverse(string& s) { reverse(s.begin(), s.end()); }
const int io_size = 1 << 23 | 233;
const int io_limit = 1 << 22;
struct io_in {
char ch;
#ifndef __WIN64
char getchar() {
static char buf[io_size], *p1 = buf, *p2 = buf;
return (p1 == p2) && (p2 = (p1 = buf) + fread(buf, 1, io_size, stdin), p1 == p2) ? EOF : *p1++;
}
#endif
io_in& operator>>(char& c) {
for (c = getchar(); isspace(c); c = getchar())
;
return *this;
}
io_in& operator>>(string& s) {
for (s.clear(); isspace(ch = getchar());)
;
if (!~ch) return *this;
for (s = ch; !isspace(ch = getchar()) && ~ch; s += ch)
;
return *this;
}
io_in& operator>>(char* str) {
char* cur = str;
while (*cur) *cur++ = 0;
for (cur = str; isspace(ch = getchar());)
;
if (!~ch) return *this;
for (*cur = ch; !isspace(ch = getchar()) && ~ch; *++cur = ch)
;
return *++cur = 0, *this;
}
template <class T>
void read(T& x) {
bool f = 0;
while ((ch = getchar()) < 48 && ~ch) f ^= (ch == 45);
x = ~ch ? (ch ^ 48) : 0;
while ((ch = getchar()) > 47) x = x * 10 + (ch ^ 48);
x = f ? -x : x;
}
io_in& operator>>(int& x) { return read(x), *this; }
io_in& operator>>(ll& x) { return read(x), *this; }
io_in& operator>>(uint& x) { return read(x), *this; }
io_in& operator>>(ull& x) { return read(x), *this; }
io_in& operator>>(db& x) {
read(x);
bool f = x < 0;
x = f ? -x : x;
if (ch ^ '.') return *this;
double d = 0.1;
while ((ch = getchar()) > 47) x += d * (ch ^ 48), d *= .1;
return x = f ? -x : x, *this;
}
} in;
struct io_out {
char buf[io_size], *s = buf;
int pw[233], st[233];
io_out() {
set(7);
rep(i, pw[0] = 1, 9) pw[i] = pw[i - 1] * 10;
}
~io_out() { flush(); }
void io_chk() {
if (s - buf > io_limit) flush();
}
void flush() { fwrite(buf, 1, s - buf, stdout), fflush(stdout), s = buf; }
io_out& operator<<(char c) { return *s++ = c, *this; }
io_out& operator<<(string str) {
for (char c : str) *s++ = c;
return io_chk(), *this;
}
io_out& operator<<(char* str) {
char* cur = str;
while (*cur) *s++ = *cur++;
return io_chk(), *this;
}
template <class T>
void write(T x) {
if (x < 0) *s++ = '-', x = -x;
do {
st[++st[0]] = x % 10, x /= 10;
} while (x);
while (st[0]) *s++ = st[st[0]--] ^ 48;
}
io_out& operator<<(int x) { return write(x), io_chk(), *this; }
io_out& operator<<(ll x) { return write(x), io_chk(), *this; }
io_out& operator<<(uint x) { return write(x), io_chk(), *this; }
io_out& operator<<(ull x) { return write(x), io_chk(), *this; }
int len;
ll lft, rig;
void set(int _length) { len = _length; }
io_out& operator<<(db x) {
bool f = x < 0;
x = f ? -x : x, lft = x, rig = 1. * (x - lft) * pw[len];
return write(f ? -lft : lft), *s++ = '.', write(rig), io_chk(), *this;
}
} out;
#define int long long
template <int sz, int mod>
struct math_t {
math_t() {
fac.resize(sz + 1), ifac.resize(sz + 1);
rep(i, fac[0] = 1, sz) fac[i] = fac[i - 1] * i % mod;
ifac[sz] = inv(fac[sz]);
Rep(i, sz - 1, 0) ifac[i] = ifac[i + 1] * (i + 1) % mod;
}
vector<int> fac, ifac;
int qpow(int x, int y) {
int ans = 1;
for (; y; y >>= 1, x = x * x % mod)
if (y & 1) ans = ans * x % mod;
return ans;
}
int inv(int x) { return qpow(x, mod - 2); }
int C(int n, int m) {
if (n < 0 || m < 0 || n < m) return 0;
return fac[n] * ifac[m] % mod * ifac[n - m] % mod;
}
};
int gcd(int x, int y) { return !y ? x : gcd(y, x % y); }
int lcm(int x, int y) { return x * y / gcd(x, y); }
#define double long double
struct cpx {
double x, y;
cpx(double _x = 0, double _y = 0) {
x = _x;
y = _y;
}
double real() { return x; }
};
cpx operator+(cpx x, cpx y) { return cpx(x.x + y.x, x.y + y.y); }
cpx operator-(cpx x, cpx y) { return cpx(x.x - y.x, x.y - y.y); }
cpx operator*(cpx x, cpx y) { return cpx(x.x * y.x - x.y * y.y, x.x * y.y + x.y * y.x); }
cpx operator*(cpx x, double y) { return cpx(x.x * y, x.y * y); }
cpx operator/(cpx x, double y) { return cpx(x.x / y, x.y / y); }
const int maxn = 6e5 + 56;
int limit = 1, rev[maxn];
const double pi = acosl(-1);
void FFT(cpx* a, int type) {
for (int i = 0; i < limit; i++)
if (i < rev[i]) swap(a[i], a[rev[i]]);
for (int len = 1; len < limit; len <<= 1) {
cpx Wn(cos(pi / len), sin(pi / len) * type);
for (int i = 0; i < limit; i += len << 1) {
cpx w(1, 0);
for (int j = 0; j < len; j++, w = w * Wn) {
cpx X = a[i + j];
cpx Y = a[i + j + len] * w;
a[i + j] = X + Y;
a[i + j + len] = X - Y;
}
}
}
if (type == -1) {
for (int i = 0; i < limit; i++) a[i] = a[i] / limit;
}
}
int n, m, p;
int a[maxn], b[maxn];
cpx A[maxn], B[maxn];
cpx A15[maxn], B15[maxn];
int ans[maxn];
const int qwq = (1 << 15) - 1;
signed main() {
// code begin.
in >> n >> m >> p;
rep(i, 0, n) { in >> a[i], a[i] %= p; }
rep(i, 0, m) { in >> b[i], b[i] %= p; }
int l = 0;
while (limit <= n + m) {
limit <<= 1, ++l;
}
rep(i, 0, limit) rev[i] = rev[i >> 1] >> 1 | (i & 1) << l - 1;
rep(i, 0, n) {
A[i] = cpx(a[i] & qwq);
A15[i] = cpx(a[i] >> 15);
}
rep(i, 0, m) {
B[i] = cpx(b[i] & qwq);
B15[i] = cpx(b[i] >> 15);
}
FFT(A, 1), FFT(A15, 1);
FFT(B, 1), FFT(B15, 1);
static cpx bit[maxn];
static cpx bit15[maxn];
static cpx bit30[maxn];
rep(i, 0, limit) {
bit[i] = A[i] * B[i];
bit15[i] = A15[i] * B[i] + B15[i] * A[i];
bit30[i] = A15[i] * B15[i];
}
FFT(bit, -1), FFT(bit15, -1), FFT(bit30, -1);
rep(i, 0, n + m) {
int ret = 0;
(ret += (int)(bit[i].real() + .5) % p) %= p;
(ret += (((int)(bit15[i].real() + .5) % p) << 15ll) % p) %= p;
(ret += (((int)(bit30[i].real() + .5) % p) << 30ll) % p) %= p;
(ret += p) %= p;
ans[i] = ret;
}
rep(i, 0, n + m) { out << ans[i] << ' '; }
return 0;
// code end.
}