拆系数FFT(任意模数FFT)

拆系数FFT

对于任意模数 \(mod\)

设\(m=\sqrt {mod}\)

把多项式\(A(x)\)和\(B(x)\)的系数都拆成\(a\times m+b\)的形式,时\(a, b\)都小于\(m\)

提出,那么一个多项式就可以拆成两个多项式的加法

一个是\(a*m\)的,一个是\(b\)的

直接乘法分配律,\(aa\)一遍,\(ab\)一遍,\(ba\),\(bb\)一遍,四遍\(FFT\)

乘出来不会超过取模范围

然后合并直接

\[(a\times m+b)(c\times m+d)=a\times c\times m^2+(a\times c+b\times d)m+b\times d
\]

这样子要进行 \(7\) 次 \(DFT\)

如果研究一下 \(myy\) \(2016\) 年的集训队论文就会发现有 \(2\) 次 或者 \(1.5\) 次 \(DFT\) 的 \(FFT\) 算法

2次的够了吧

\(myy\) 巧妙的运用了复数的虚部,优化了算法

具体来说

\[C(x)=A(x)+iB(x)
\]

\[D(x)=A(x)-iB(x)
\]

假设

\(c(w_n^k)\) 表示将 \(C(x)\) \(DFT\) 后的点值

\(d(w_n^k)\) 表示将 \(D(x)\) \(DFT\) 后的点值

\(w\) 为 \(n\) 次单位复数根

设 \(conj(x)\) 表示 \(x\) 的共轭复数

那么

\[c(w_{2n}^{k})=A(w_{2n}^{k})+iB(w_{2n}^{k})=\sum_{j=0}^{2n-1}A_jw_{2n}^{jk}+iB_jw_{2n}^{jk}
\]

\[=\sum_{j=0}^{2n-1}(A_j+iB_j)(cos\frac{\pi jk}{n}+isin \frac{\pi jk}{n})
\]

\[d(w_{2n}^{k})=A(w_{2n}^{k})-iB(w_{2n}^{k})=\sum_{j=0}^{2n-1}(A_j-iB_j)(cos\frac{\pi jk}{n}+isin \frac{\pi jk}{n})
\]

设 \(x=\frac{\pi jk}{n}\)

那么

\[d(w_{2n}^{k})=\sum_{j=0}^{2n-1}(A_jcosx+B_jsinx)+i(A_jsinx-B_jcosx)
\]

\[=conj(\sum_{j=0}^{2n-1}(A_jcosx+B_jsinx)-i(A_jsinx-B_jcosx))
\]

\[=conj(\sum_{j=0}^{2n-1}(A_jcos(-x)-B_jsin(-x))+i(A_jsin(-x)+B_jcos(-x)))
\]

\[=conj(\sum_{j=0}^{2n-1}(A_j+iB_j)(cos(-x)+isin(-x)))
\]

\[=conj(\sum_{j=0}^{2n-1}(A_j+iB_j)(cos(2\pi-x)+isin(2\pi-x)))
\]

\[=conj(c(w_{2n}^{2n-k}))
\]

也就是说

只需要一次 \(DFT\) 求出 \(c\) 就可以求出 \(d\)

那么

\[DFT(A(k))=\frac{c(w^{k})+d(w^{k})}{2}
\]

\[DFT(B(k))=\frac{c(w^{k})-d(w^{k})}{2i}
\]

再用一次 \(DFT^{-1}\) 还原出多项式,多项式乘法只要两次 \(DFT\)

考虑拆系数 \(FFT\)

\(DFT\) 两两合并,从 \(4\) 次变成 \(2\) 次

\(DFT^{-1}\) 合并其中一个,从 \(3\) 次变成 \(2\) 次

一共 \(4\) 次

# include <bits/stdc++.h>
using namespace std;
typedef long long ll; namespace IO {
const int maxn((1 << 21) + 1); char ibuf[maxn], *iS, *iT, obuf[maxn], *oS = obuf, *oT = obuf + maxn - 1, c, st[65];
int f, tp; char Getc() {
return (iS == iT ? (iT = (iS = ibuf) + fread(ibuf, 1, maxn, stdin), (iS == iT ? EOF : *iS++)) : *iS++);
} void Flush() {
fwrite(obuf, 1, oS - obuf, stdout);
oS = obuf;
} void Putc(char x) {
*oS++ = x;
if (oS == oT) Flush();
} template <class Int> void In(Int &x) {
for (f = 1, c = Getc(); c < '0' || c > '9'; c = Getc()) f = c == '-' ? -1 : 1;
for (x = 0; c <= '9' && c >= '0'; c = Getc()) x = (x << 3) + (x << 1) + (c ^ 48);
x *= f;
} template <class Int> void Out(Int x) {
if (!x) Putc('0');
if (x < 0) Putc('-'), x = -x;
while (x) st[++tp] = x % 10 + '0', x /= 10;
while (tp) Putc(st[tp--]);
}
} using IO :: In;
using IO :: Out;
using IO :: Putc;
using IO :: Flush; const int maxn(1 << 18);
const double pi(acos(-1)); struct Complex {
double a, b; inline Complex() {
a = b = 0;
} inline Complex(double _a, double _b) {
a = _a, b = _b;
} inline Complex operator +(Complex x) const {
return Complex(a + x.a, b + x.b);
} inline Complex operator -(Complex x) const {
return Complex(a - x.a, b - x.b);
} inline Complex operator *(Complex x) const {
return Complex(a * x.a - b * x.b, a * x.b + b * x.a);
} inline Complex Conj() {
return Complex(a, -b);
}
}; Complex a[maxn], b[maxn], w[maxn], a1[maxn], a2[maxn];
int r[maxn], l, deg, g[maxn], h[maxn], mod; inline void FFT(Complex *p, int opt) {
register int i, j, k, t;
register Complex wn, x, y;
for (i = 0; i < deg; ++i) if (r[i] < i) swap(p[r[i]], p[i]);
for (i = 1; i < deg; i <<= 1)
for(t = i << 1, j = 0; j < deg; j += t)
for (k = 0; k < i; ++k) {
wn = w[deg / i * k];
if (opt == -1) wn.b *= -1;
x = p[j + k], y = wn * p[i + j + k];
p[j + k] = x + y, p[i + j + k] = x - y;
}
} inline void Mul(int n, int *p, int *q, int *f) {
register int i, k, v1, v2, v3;
register Complex ca, cb, da1, da2, db1, db2;
for (deg = 1, l = 0; deg < n; deg <<= 1) ++l;
for (i = 0; i < deg; ++i) r[i] = (r[i >> 1] >> 1) | ((i & 1) << (l - 1));
for (i = 0; i < deg; ++i) w[i] = Complex(cos(pi * i / deg), sin(pi * i / deg));
for (i = 0; i < n; ++i) a[i] = Complex(p[i] & 32767, p[i] >> 15), b[i] = Complex(q[i] & 32767, q[i] >> 15);
for (FFT(a, 1), FFT(b, 1), i = 0; i < deg; ++i) {
k = (deg - i) & (deg - 1), ca = a[k].Conj(), cb = b[k].Conj();
da1 = (ca + a[i]) * Complex(0.5, 0), da2 = (a[i] - ca) * Complex(0, -0.5);
db1 = (cb + b[i]) * Complex(0.5, 0), db2 = (b[i] - cb) * Complex(0, -0.5);
a1[i] = da1 * db1 + (da1 * db2 + da2 * db1) * Complex(0, 1), a2[i] = da2 * db2;
}
for (FFT(a1, -1), FFT(a2, -1), i = 0; i < deg; ++i) {
v1 = (ll)(a1[i].a / deg + 0.5) % mod, v2 = (ll)(a1[i].b / deg + 0.5) % mod;
v3 = (ll)(a2[i].a / deg + 0.5) % mod, f[i] = (((ll)v3 << 30) + ((ll)v2 << 15) + v1) % mod;
if (f[i] < 0) f[i] += mod;
}
} int main() {
register int len, i, n, m;
In(n), In(m), In(mod), ++n, ++m;
for (i = 0; i < n; ++i) In(h[i]), h[i] %= mod;
for (i = 0; i < m; ++i) In(g[i]), g[i] %= mod;
for (len = 1, n += m - 1; len < n; len <<= 1);
for (Mul(len, h, g, g), i = 0; i < n; ++i) Out(g[i]), Putc(' ');
return Flush(), 0;
}
上一篇:[洛谷P4245]【模板】任意模数NTT


下一篇:SQLAlchemy中表结构的一对一