#include <cstdio>
#include <cctype>
#include <algorithm>
typedef unsigned int uint;
typedef long long unsigned int uint64;
struct IO_Tp
{
const static int _I_Buffer_Size = 2 << 20;
char _I_Buffer[_I_Buffer_Size], *_I_pos = _I_Buffer;
const static int _O_Buffer_Size = 2 << 20;
char _O_Buffer[_O_Buffer_Size], *_O_pos = _O_Buffer;
IO_Tp() { fread(_I_Buffer, 1, _I_Buffer_Size, stdin); }
~IO_Tp() { fwrite(_O_Buffer, 1, _O_pos - _O_Buffer, stdout); }
IO_Tp &operator>>(int &res)
{
while (!isdigit(*_I_pos))
++_I_pos;
res = *_I_pos++ & 15;
while (isdigit(*_I_pos))
res = res * 10 + (*_I_pos++ & 15);
return *this;
}
IO_Tp &operator>>(uint &res)
{
while (!isdigit(*_I_pos))
++_I_pos;
res = *_I_pos++ & 15;
while (isdigit(*_I_pos))
res = res * 10 + (*_I_pos++ & 15);
return *this;
}
IO_Tp &operator<<(uint n)
{
static char _buf[10];
char* _pos = _buf;
do
*_pos++ = '0' + n % 10;
while (n /= 10);
while (_pos != _buf)
*_O_pos++ = *--_pos;
return *this;
}
IO_Tp &operator<<(char ch)
{
*_O_pos++ = ch;
return *this;
}
} IO;
constexpr uint Max_size = 1000001;
constexpr uint g = 3, Mod = 998244353;
inline uint norm_2(const uint x)
{
return x < Mod * 2 ? x : x - Mod * 2;
}
inline uint norm(const uint x)
{
return x < Mod ? x : x - Mod;
}
struct Z
{
uint v;
Z() { }
Z(const uint _v) : v(_v) { }
};
inline Z operator+(const Z &x1, const Z &x2) { return x1.v + x2.v < Mod ? x1.v + x2.v : x1.v + x2.v - Mod; }
inline Z operator-(const Z &x1, const Z &x2) { return x1.v >= x2.v ? x1.v - x2.v : x1.v + Mod - x2.v; }
inline Z operator*(const Z &x1, const Z &x2) { return static_cast<uint64>(x1.v) * x2.v % Mod; }
inline Z &operator*=(Z &x1, const Z &x2) { x1.v = static_cast<uint64>(x1.v) * x2.v % Mod; return x1; }
Z Power(Z Base, int Exp)
{
Z res = 1;
for (; Exp; Base *= Base, Exp >>= 1)
if (Exp & 1)
res *= Base;
return res;
}
inline uint mf(uint x)
{
return (static_cast<uint64>(x) << 32) / Mod;
}
int size;
uint w[Max_size], w_[Max_size];
inline uint mult_Shoup_2(const uint x, const uint y, const uint y_)
{
uint q = static_cast<uint64>(x) * y_ >> 32;
return x * y - q * Mod;
}
inline uint mult_Shoup(const uint x, const uint y, const uint y_)
{
return norm(mult_Shoup_2(x, y, y_));
}
inline void init(int n)
{
for (size = 2; size < n; size <<= 1)
;
Z pr = Power(g, (Mod - 1) / size);
size >>= 1;
w[size] = 1, w_[size] = (static_cast<uint64>(w[size]) << 32) / Mod;
if (size <= 8)
{
for (int i = 1; i < size; ++i)
w[size + i] = (w[size + i - 1] * pr).v, w_[size + i] = (static_cast<uint64>(w[size + i]) << 32) / Mod;
}
else
{
for (int i = 1; i < 8; ++i)
w[size + i] = (w[size + i - 1] * pr).v, w_[size + i] = (static_cast<uint64>(w[size + i]) << 32) / Mod;
pr *= pr, pr *= pr, pr *= pr;
for (int i = 8; i < size; i += 8)
{
w[size + i + 0] = (w[size + i - 8] * pr).v, w_[size + i + 0] = (static_cast<uint64>(w[size + i + 0]) << 32) / Mod;
w[size + i + 1] = (w[size + i - 7] * pr).v, w_[size + i + 1] = (static_cast<uint64>(w[size + i + 1]) << 32) / Mod;
w[size + i + 2] = (w[size + i - 6] * pr).v, w_[size + i + 2] = (static_cast<uint64>(w[size + i + 2]) << 32) / Mod;
w[size + i + 3] = (w[size + i - 5] * pr).v, w_[size + i + 3] = (static_cast<uint64>(w[size + i + 3]) << 32) / Mod;
w[size + i + 4] = (w[size + i - 4] * pr).v, w_[size + i + 4] = (static_cast<uint64>(w[size + i + 4]) << 32) / Mod;
w[size + i + 5] = (w[size + i - 3] * pr).v, w_[size + i + 5] = (static_cast<uint64>(w[size + i + 5]) << 32) / Mod;
w[size + i + 6] = (w[size + i - 2] * pr).v, w_[size + i + 6] = (static_cast<uint64>(w[size + i + 6]) << 32) / Mod;
w[size + i + 7] = (w[size + i - 1] * pr).v, w_[size + i + 7] = (static_cast<uint64>(w[size + i + 7]) << 32) / Mod;
}
}
for (int i = size - 1; i; --i)
w[i] = w[i * 2], w_[i] = w_[i * 2];
size <<= 1;
}
inline void DFT_fr_2(Z _A[], const int L)
{
if (L == 1)
return;
uint *A = reinterpret_cast<uint *>(_A);
#define butterfly1(a, b)\
do\
{\
uint _a = a, _b = b;\
uint x = norm_2(_a + _b), y = norm_2(_a + Mod * 2 - _b);\
a = x, b = y;\
} while (0)
if (L == 2)
{
butterfly1(A[0], A[1]);
return;
}
#define butterfly(a, b, _w, _w_)\
do\
{\
uint _a = a, _b = b;\
uint x = norm_2(_a + _b), y = mult_Shoup_2(_a + Mod * 2 - _b, _w, _w_);\
a = x, b = y;\
} while (0)
if (L == 4)
{
butterfly1(A[0], A[2]);
butterfly(A[1], A[3], w[3], w_[3]);
butterfly1(A[0], A[1]);
butterfly1(A[2], A[3]);
return;
}
for (int d = L >> 1; d != 4; d >>= 1)
for (int i = 0; i != L; i += d << 1)
for (int j = 0; j != d; j += 4)
{
butterfly(A[i + j], A[i + d + j], w[d + j], w_[d + j]);
butterfly(A[i + j + 1], A[i + d + j + 1], w[d + j + 1], w_[d + j + 1]);
butterfly(A[i + j + 2], A[i + d + j + 2], w[d + j + 2], w_[d + j + 2]);
butterfly(A[i + j + 3], A[i + d + j + 3], w[d + j + 3], w_[d + j + 3]);
}
for (int i = 0; i != L; i += 8)
{
butterfly1(A[i], A[i + 4]);
butterfly(A[i + 1], A[i + 5], w[5], w_[5]);
butterfly(A[i + 2], A[i + 6], w[6], w_[6]);
butterfly(A[i + 3], A[i + 7], w[7], w_[7]);
}
for (int i = 0; i != L; i += 8)
{
butterfly1(A[i], A[i + 2]);
butterfly(A[i + 1], A[i + 3], w[3], w_[3]);
butterfly1(A[i + 4], A[i + 6]);
butterfly(A[i + 5], A[i + 7], w[3], w_[3]);
}
for (int i = 0; i != L; i += 8)
{
butterfly1(A[i], A[i + 1]);
butterfly1(A[i + 2], A[i + 3]);
butterfly1(A[i + 4], A[i + 5]);
butterfly1(A[i + 6], A[i + 7]);
}
#undef butterfly1
#undef butterfly
}
inline void IDFT_fr(Z _A[], const int L)
{
if (L == 1)
return;
uint *A = reinterpret_cast<uint *>(_A);
#define butterfly1(a, b)\
do\
{\
uint _a = a, _b = b;\
uint x = norm_2(_a), t = norm_2(_b);\
a = x + t, b = x + Mod * 2 - t;\
} while (0)
if (L == 2)
{
butterfly1(A[0], A[1]);
A[0] = norm(norm_2(A[0])), A[0] = A[0] & 1 ? A[0] + Mod : A[0], A[0] /= 2;
A[1] = norm(norm_2(A[1])), A[1] = A[1] & 1 ? A[1] + Mod : A[1], A[1] /= 2;
return;
}
#define butterfly(a, b, _w, _w_)\
do\
{\
uint _a = a, _b = b;\
uint x = norm_2(_a), t = mult_Shoup_2(_b, _w, _w_);\
a = x + t, b = x + Mod * 2 - t;\
} while (0)
if (L == 4)
{
butterfly1(A[0], A[1]);
butterfly1(A[2], A[3]);
butterfly1(A[0], A[2]);
butterfly(A[1], A[3], w[3], w_[3]);
std::swap(A[1], A[3]);
for (int i = 0; i != L; ++i)
{
uint64 m = -A[i] & 3;
A[i] = norm((A[i] + m * Mod) >> 2);
}
return;
}
for (int i = 0; i != L; i += 8)
{
butterfly1(A[i], A[i + 1]);
butterfly1(A[i + 2], A[i + 3]);
butterfly1(A[i + 4], A[i + 5]);
butterfly1(A[i + 6], A[i + 7]);
}
for (int i = 0; i != L; i += 8)
{
butterfly1(A[i], A[i + 2]);
butterfly(A[i + 1], A[i + 3], w[3], w_[3]);
butterfly1(A[i + 4], A[i + 6]);
butterfly(A[i + 5], A[i + 7], w[3], w_[3]);
}
for (int i = 0; i != L; i += 8)
{
butterfly1(A[i], A[i + 4]);
butterfly(A[i + 1], A[i + 5], w[5], w_[5]);
butterfly(A[i + 2], A[i + 6], w[6], w_[6]);
butterfly(A[i + 3], A[i + 7], w[7], w_[7]);
}
for (int d = 8; d != L; d <<= 1)
for (int i = 0; i != L; i += d << 1)
for (int j = 0; j != d; j += 4)
{
butterfly(A[i + j], A[i + d + j], w[d + j], w_[d + j]);
butterfly(A[i + j + 1], A[i + d + j + 1], w[d + j + 1], w_[d + j + 1]);
butterfly(A[i + j + 2], A[i + d + j + 2], w[d + j + 2], w_[d + j + 2]);
butterfly(A[i + j + 3], A[i + d + j + 3], w[d + j + 3], w_[d + j + 3]);
}
#undef butterfly1
#undef butterfly
std::reverse(A + 1, A + L);
int k = __builtin_ctz(L);
for (int i = 0; i != L; ++i)
{
uint64 m = -A[i] & (L - 1);
A[i] = norm((A[i] + m * Mod) >> k);
}
}
int N, M, L;
Z A[Max_size], B[Max_size];
int main(int argc, char **argv)
{
IO >> N >> M;
--N, --M;
for (int i = 0; i != N; ++i)
IO >> A[i].v;
for (int i = 0; i != M; ++i)
IO >> B[i].v;
for (L = 2; L <= N + M - 2; L <<= 1)
;
init(L);
DFT_fr_2(A, L), DFT_fr_2(B, L);
for (int i = 0; i != L; ++i)
A[i] *= B[i];
IDFT_fr(A, L);
for (int i = 0; i <= N + M - 2; ++i)
IO << A[i].v << ' ';
return 0;
}
Compilation | N/A | N/A | Compile OK | Score: N/A | 显示更多 |
Subtask #1 Testcase #1 | 11.61 us | 44 KB | Wrong Answer | Score: 0 | 显示更多 |
Subtask #1 Testcase #2 | 15.337 ms | 7 MB + 276 KB | Wrong Answer | Score: 0 | 显示更多 |
Subtask #1 Testcase #3 | 5.916 ms | 2 MB + 632 KB | Wrong Answer | Score: 0 | 显示更多 |
Subtask #1 Testcase #4 | 5.944 ms | 2 MB + 632 KB | Wrong Answer | Score: 0 | 显示更多 |
Subtask #1 Testcase #5 | 12.38 us | 48 KB | Wrong Answer | Score: 0 | 显示更多 |
Subtask #1 Testcase #6 | 11.28 us | 44 KB | Wrong Answer | Score: 0 | 显示更多 |
Subtask #1 Testcase #7 | 10.7 us | 44 KB | Wrong Answer | Score: 0 | 显示更多 |
Subtask #1 Testcase #8 | 14.593 ms | 6 MB + 696 KB | Wrong Answer | Score: 0 | 显示更多 |
Subtask #1 Testcase #9 | 14.598 ms | 6 MB + 696 KB | Wrong Answer | Score: 0 | 显示更多 |
Subtask #1 Testcase #10 | 7.881 ms | 4 MB + 88 KB | Wrong Answer | Score: 0 | 显示更多 |
Subtask #1 Testcase #11 | 15.53 ms | 7 MB + 436 KB | Wrong Answer | Score: 0 | 显示更多 |
Subtask #1 Testcase #12 | 12.434 ms | 5 MB + 196 KB | Wrong Answer | Score: 0 | 显示更多 |
Subtask #1 Testcase #13 | 195.433 ms | 40 KB | Runtime Error | Score: 0 | 显示更多 |