P4245 【模板】任意模数NTT

不会 MTT,所以直接用拆系数 FFT(把每个系数拆成高 15 位和低 15 位)也可以通过。
但是必须使用 long double,否则会被卡精度;合并结果时记得取模。
此外还有一些小细节需要注意(见代码)。

// powered by c++11
// by Isaunoya
#include <bits/stdc++.h>

// Inclusive counting loops: rep walks i upward over [x, y], Rep walks i downward
// from x to y. The `register` storage class specifier was deprecated in C++11 and
// removed in C++17, so the loop variable is declared as a plain int.
#define rep(i, x, y) for (int i = (x); i <= (y); ++i)
#define Rep(i, x, y) for (int i = (x); i >= (y); --i)

using namespace std;
// Short aliases for the arithmetic types used by the I/O helpers below.
using db = double;
using ll = long long;
using uint = unsigned int;
using ull = unsigned long long;

// Shorthand for a pair of ints and for its two members.
#define pii pair<int, int>
#define fir first
#define sec second

// Raises x to y when x compares strictly less than y; otherwise x is left untouched.
template <class T>
void cmax(T& x, const T& y) {
  if (!(x < y)) return;
  x = y;
}

// Lowers x to y when x compares strictly greater than y; otherwise x is left untouched.
template <class T>
void cmin(T& x, const T& y) {
  if (!(x > y)) return;
  x = y;
}

// all(v) expands to the begin/end iterator pair of v (note: v is evaluated twice).
#define all(v) v.begin(), v.end()
// sz(v) is the element count of v converted to int.
#define sz(v) ((int)v.size())
// pb is shorthand for emplace_back.
#define pb emplace_back

// Whole-container convenience overload: sorts every element of v with std::sort.
template <class T>
void sort(vector<T>& v) {
  std::sort(v.begin(), v.end());
}

// Whole-container convenience overload: reverses the order of the elements of v in place.
template <class T>
void reverse(vector<T>& v) {
  std::reverse(v.begin(), v.end());
}

// Sorts v and then erases duplicates, leaving each distinct value exactly once.
template <class T>
void unique(vector<T>& v) {
  std::sort(v.begin(), v.end());
  auto tail = std::unique(v.begin(), v.end());
  v.erase(tail, v.end());
}

// Reverses the characters of s in place.
void reverse(string& s) {
  std::reverse(s.begin(), s.end());
}

// Size in bytes of the input buffer and of the output buffer used by io_in / io_out.
const int io_size = 1 << 23 | 233;
// io_out flushes once more than this many bytes are pending in its buffer.
const int io_limit = 1 << 22;
// Buffered reader over stdin with a stream-like operator>> interface.
struct io_in {
  char ch;  // last character consumed by the parsers below
#ifndef __WIN64
  // Shadows ::getchar(): refills a static io_size-byte buffer with fread and hands
  // out one character per call, returning EOF once fread yields nothing more.
  // When __WIN64 is defined this member is absent and the calls below resolve to
  // the global getchar().
  char getchar() {
    static char buf[io_size], *p1 = buf, *p2 = buf;

    return (p1 == p2) && (p2 = (p1 = buf) + fread(buf, 1, io_size, stdin), p1 == p2) ? EOF : *p1++;
  }
#endif
  // Reads the next non-whitespace character into c.
  io_in& operator>>(char& c) {
    for (c = getchar(); isspace(c); c = getchar())
      ;

    return *this;
  }
  // Reads one whitespace-delimited token into s; s stays empty when the end of
  // input is hit first (the `~ch` tests compare the stored char against -1).
  io_in& operator>>(string& s) {
    for (s.clear(); isspace(ch = getchar());)
      ;

    if (!~ch) return *this;

    for (s = ch; !isspace(ch = getchar()) && ~ch; s += ch)
      ;

    return *this;
  }

  // Reads one whitespace-delimited token into str and NUL-terminates it.
  // The current contents of str are zeroed first, so str must already hold a
  // NUL-terminated string and must be large enough for the token.
  io_in& operator>>(char* str) {
    char* cur = str;
    while (*cur) *cur++ = 0;

    for (cur = str; isspace(ch = getchar());)
      ;
    if (!~ch) return *this;

    for (*cur = ch; !isspace(ch = getchar()) && ~ch; *++cur = ch)
      ;

    return *++cur = 0, *this;
  }

  // Parses a decimal number into x. Characters below '0' are skipped, each '-'
  // among them toggling the sign; digits are then accumulated until a character
  // that is not above '/' (code 47) is read. That terminating character stays in ch.
  template <class T>

  void read(T& x) {
    bool f = 0;
    while ((ch = getchar()) < 48 && ~ch) f ^= (ch == 45);

    x = ~ch ? (ch ^ 48) : 0;
    while ((ch = getchar()) > 47) x = x * 10 + (ch ^ 48);
    x = f ? -x : x;
  }

  io_in& operator>>(int& x) { return read(x), *this; }

  io_in& operator>>(ll& x) { return read(x), *this; }

  io_in& operator>>(uint& x) { return read(x), *this; }

  io_in& operator>>(ull& x) { return read(x), *this; }

  // Reads a decimal floating-point value: the integer part via read(), then an
  // optional '.' followed by fractional digits.
  io_in& operator>>(db& x) {
    read(x);
    // read() turns a zero integer part into -0.0 for inputs such as "-0.5", and
    // `x < 0` is false for -0.0, so the sign is taken from the sign bit instead.
    const bool negative = std::signbit(x);
    if (negative) x = -x;

    if (ch == '.') {
      double d = 0.1;
      while ((ch = getchar()) > 47) x += d * (ch ^ 48), d *= .1;
    }

    // Re-apply the sign on every path, including inputs without a fractional part.
    if (negative) x = -x;
    return *this;
  }
} in;

struct io_out {
  char buf[io_size], *s = buf;
  int pw[233], st[233];

  io_out() {
    set(7);
    rep(i, pw[0] = 1, 9) pw[i] = pw[i - 1] * 10;
  }

  ~io_out() { flush(); }

  void io_chk() {
    if (s - buf > io_limit) flush();
  }

  void flush() { fwrite(buf, 1, s - buf, stdout), fflush(stdout), s = buf; }

  io_out& operator<<(char c) { return *s++ = c, *this; }

  io_out& operator<<(string str) {
    for (char c : str) *s++ = c;
    return io_chk(), *this;
  }

  io_out& operator<<(char* str) {
    char* cur = str;
    while (*cur) *s++ = *cur++;
    return io_chk(), *this;
  }

  template <class T>

  void write(T x) {
    if (x < 0) *s++ = '-', x = -x;

    do {
      st[++st[0]] = x % 10, x /= 10;
    } while (x);

    while (st[0]) *s++ = st[st[0]--] ^ 48;
  }

  io_out& operator<<(int x) { return write(x), io_chk(), *this; }

  io_out& operator<<(ll x) { return write(x), io_chk(), *this; }

  io_out& operator<<(uint x) { return write(x), io_chk(), *this; }

  io_out& operator<<(ull x) { return write(x), io_chk(), *this; }

  int len;
  ll lft, rig;

  void set(int _length) { len = _length; }

  io_out& operator<<(db x) {
    bool f = x < 0;
    x = f ? -x : x, lft = x, rig = 1. * (x - lft) * pw[len];
    return write(f ? -lft : lft), *s++ = '.', write(rig), io_chk(), *this;
  }
} out;
// From this line on every `int` token in the file is replaced by `long long`
// (which is why the entry point below is spelled `signed main`).
#define int long long

// Factorial-table helper for arithmetic modulo `mod`.
// Precomputes fac[i] = i! mod `mod` and ifac[i] = inverse of i! mod `mod` for
// 0 <= i <= sz. Inverses are computed as x^(mod-2), so `mod` is presumed to be a
// prime larger than sz — NOTE(review): confirm at each instantiation.
template <int sz, int mod>
struct math_t {
  math_t() {
    fac.resize(sz + 1), ifac.resize(sz + 1);
    fac[0] = 1;
    for (int i = 1; i <= sz; ++i) fac[i] = fac[i - 1] * i % mod;

    ifac[sz] = inv(fac[sz]);
    for (int i = sz - 1; i >= 0; --i) ifac[i] = ifac[i + 1] * (i + 1) % mod;
  }

  std::vector<int> fac, ifac;

  // Returns x^y mod `mod` by binary exponentiation, always in [0, mod).
  // The base is reduced first so large or negative bases neither overflow the
  // squaring step nor produce a negative result. A non-positive exponent yields
  // 1 % mod (the loop would otherwise never terminate for negative y).
  int qpow(int x, int y) {
    x %= mod;
    if (x < 0) x += mod;

    int ans = 1 % mod;
    for (; y > 0; y >>= 1, x = x * x % mod)
      if (y & 1) ans = ans * x % mod;
    return ans;
  }

  // Modular inverse of x via x^(mod-2).
  int inv(int x) { return qpow(x, mod - 2); }

  // Binomial coefficient C(n, m) mod `mod`; 0 when the arguments are out of range.
  // n must not exceed sz, the size of the precomputed tables.
  int C(int n, int m) {
    if (n < 0 || m < 0 || n < m) return 0;
    return fac[n] * ifac[m] % mod * ifac[n - m] % mod;
  }
};

// Greatest common divisor by the Euclidean algorithm; gcd(x, 0) == x.
int gcd(int x, int y) { return !y ? x : gcd(y, x % y); }

// Least common multiple. Divides by the gcd before multiplying so the
// intermediate value never exceeds the result, and returns 0 when both
// arguments are 0 instead of dividing by zero.
int lcm(int x, int y) {
  const int g = gcd(x, y);
  return g ? x / g * y : 0;
}

// From this line on every `double` token in the file is replaced by `long double`,
// so the complex type and FFT below run in extended precision.
#define double long double
// Minimal complex number: x is the real part, y the imaginary part.
struct cpx {
  double x, y;

  // Both parts default to 0, so a single real value converts implicitly.
  cpx(double _x = 0, double _y = 0) : x(_x), y(_y) {}

  // Real part; const-qualified so it can also be called on const objects.
  double real() const { return x; }
};

// Component-wise sum of two complex numbers.
cpx operator+(cpx x, cpx y) {
  return cpx(x.x + y.x, x.y + y.y);
}

// Component-wise difference of two complex numbers.
cpx operator-(cpx x, cpx y) {
  return cpx(x.x - y.x, x.y - y.y);
}

// Complex product: (a + bi)(c + di) = (ac - bd) + (ad + bc)i.
cpx operator*(cpx x, cpx y) {
  const double re = x.x * y.x - x.y * y.y;
  const double im = x.x * y.y + x.y * y.x;
  return cpx(re, im);
}

// Scales both parts by the real factor y.
cpx operator*(cpx x, double y) {
  return cpx(x.x * y, x.y * y);
}

// Divides both parts by the real divisor y.
cpx operator/(cpx x, double y) {
  return cpx(x.x / y, x.y / y);
}

// Capacity of every coefficient / transform array in this file.
const int maxn = 6e5 + 56;
// limit is the transform length used by FFT(); rev[] is the index permutation
// FFT() applies before its butterfly passes. Both are set up in main().
int limit = 1, rev[maxn];
const double pi = acosl(-1);

// In-place iterative FFT over the first `limit` entries of a.
// `type` scales the imaginary part of the twiddle factor: callers pass 1 for the
// forward transform and -1 for the inverse, which additionally divides every
// entry by `limit`. Relies on the global rev[] permutation table.
void FFT(cpx* a, int type) {
  // Reorder the input according to rev[]; each pair is swapped only once.
  for (int idx = 0; idx < limit; ++idx) {
    if (idx < rev[idx]) swap(a[idx], a[rev[idx]]);
  }

  // Butterfly passes: `half` is the half-width of the blocks merged in this pass.
  for (int half = 1; half < limit; half <<= 1) {
    const int width = half << 1;
    cpx Wn(cos(pi / half), sin(pi / half) * type);

    for (int base = 0; base < limit; base += width) {
      cpx w(1, 0);
      for (int k = 0; k < half; ++k) {
        cpx even = a[base + k];
        cpx odd = a[base + k + half] * w;
        a[base + k] = even + odd;
        a[base + k + half] = even - odd;
        w = w * Wn;  // advance the twiddle factor for the next position
      }
    }
  }

  if (type != -1) return;

  for (int idx = 0; idx < limit; ++idx) a[idx] = a[idx] / limit;
}

// n and m are the last coefficient indices of the two inputs; p is the modulus.
int n, m, p;
// Input coefficients, reduced modulo p when they are read.
int a[maxn], b[maxn];
// Low 15 bits of each coefficient of a / b, as complex values for the FFT.
cpx A[maxn], B[maxn];
// Remaining high bits (coefficient >> 15) of a / b.
cpx A15[maxn], B15[maxn];
// Result coefficients modulo p.
int ans[maxn];

// Mask selecting the low 15 bits of a coefficient.
const int qwq = (1 << 15) - 1;
signed main() {
  // code begin.
  in >> n >> m >> p;
  rep(i, 0, n) { in >> a[i], a[i] %= p; }
  rep(i, 0, m) { in >> b[i], b[i] %= p; }

  int l = 0;
  while (limit <= n + m) {
    limit <<= 1, ++l;
  }
  rep(i, 0, limit) rev[i] = rev[i >> 1] >> 1 | (i & 1) << l - 1;

  rep(i, 0, n) {
    A[i] = cpx(a[i] & qwq);
    A15[i] = cpx(a[i] >> 15);
  }
  rep(i, 0, m) {
    B[i] = cpx(b[i] & qwq);
    B15[i] = cpx(b[i] >> 15);
  }

  FFT(A, 1), FFT(A15, 1);
  FFT(B, 1), FFT(B15, 1);

  static cpx bit[maxn];
  static cpx bit15[maxn];
  static cpx bit30[maxn];

  rep(i, 0, limit) {
    bit[i] = A[i] * B[i];
    bit15[i] = A15[i] * B[i] + B15[i] * A[i];
    bit30[i] = A15[i] * B15[i];
  }

  FFT(bit, -1), FFT(bit15, -1), FFT(bit30, -1);

  rep(i, 0, n + m) {
    int ret = 0;
    (ret += (int)(bit[i].real() + .5) % p) %= p;
    (ret += (((int)(bit15[i].real() + .5) % p) << 15ll) % p) %= p;
    (ret += (((int)(bit30[i].real() + .5) % p) << 30ll) % p) %= p;
    (ret += p) %= p;
    ans[i] = ret;
  }
	
  rep(i, 0, n + m) { out << ans[i] << ' '; }
  return 0;
  // code end.
}

猜你喜欢

转载自www.cnblogs.com/Isaunoya/p/12677484.html