This documentation is automatically generated by online-judge-tools/verification-helper
View the Project on GitHub shino16/cplib
#pragma once #include "math/ntt.cpp" #include "template.cpp" #include "math/modint.cpp" namespace Garner { static NTT<0> ntt0; static NTT<1> ntt1; static NTT<2> ntt2; static ll inv(ll x, ll md) { return power(x, md - 2, md); } ll garner(ll c0, ll c1, ll c2, ll m01, ll mod) { static ll r01 = inv(ntt0.md, ntt1.md); static ll r02 = inv(ntt0.md, ntt2.md); static ll r12 = inv(ntt1.md, ntt2.md); c1 = (ll)(c1 - c0) * r01 % ntt1.md; if (c1 < 0) c1 += ntt1.md; c2 = (ll)(c2 - c0) * r02 % ntt2.md; c2 = (ll)(c2 - c1) * r12 % ntt2.md; if (c2 < 0) c2 += ntt2.md; c0 %= mod; c0 += (ll)c1 * ntt0.md % mod; if (c0 >= mod) c0 -= mod; c0 += (ll)c2 * m01 % mod; if (c0 >= mod) c0 -= mod; return c0; } vector<ll> garner(vector<vector<ll>> &cs, ll mod) { ll m01 = (ll)ntt0.md * ntt1.md % mod; ll sz = cs[0].size(); vector<ll> res(sz); for (ll i = 0; i < sz; i++) res[i] = garner(cs[0][i], cs[1][i], cs[2][i], m01, mod); return res; } vector<ll> multiply(vector<ll> as, vector<ll> bs, ll mod) { vector<vector<ll>> cs(3); cs[0] = ntt0.multiply(as, bs); cs[1] = ntt1.multiply(as, bs); cs[2] = ntt2.multiply(as, bs); size_t sz = as.size() + bs.size() - 1; for (auto &v : cs) v.resize(sz); return garner(cs, mod); } template <ll Mod = 1000000007> vector<modint<Mod>> multiply(vector<modint<Mod>> am, vector<modint<Mod>> bm) { vector<ll> as(am.size()), bs(bm.size()); rep(i, am.size()) as[i] = am[i].v; rep(i, bm.size()) bs[i] = bm[i].v; vector<ll> cs = multiply(as, bs, Mod); vector<modint<Mod>> cm(cs.size()); rep(i, cs.size()) cm[i] = modint<Mod>(cs[i]); return cm; } }; // namespace Garner
#line 2 "math/garner-ntt.cpp" #line 2 "math/ntt.cpp" #line 2 "template.cpp" #ifndef LOCAL #pragma GCC optimize("O3") #pragma GCC optimize("unroll-loops") #pragma GCC target("avx") #endif #include <algorithm> #include <bitset> #include <cassert> #include <cmath> #include <functional> #include <iostream> #include <map> #include <numeric> #include <queue> #include <set> #include <stack> using namespace std; using ll = long long; using ull = unsigned long long; using VI = vector<int>; using VVI = vector<vector<int>>; using VLL = vector<ll>; using VVLL = vector<vector<ll>>; using VB = vector<bool>; using PII = pair<int, int>; using PLL = pair<ll, ll>; constexpr int INF = 1000000007; constexpr ll INF_LL = 1'000'000'000'000'000'007; #define all(x) begin(x), end(x) #define rall(x) rbegin(x), rend(x) #define newl '\n' // loops rep(until) / rep(var, until) / rep(var, from, until) / repr (reversed order) #define OVERLOAD3(_1, _2, _3, name, ...) name #define rep(...) OVERLOAD3(__VA_ARGS__, REPEAT_FROM_UNTIL, REPEAT_UNTIL, REPEAT)(__VA_ARGS__) #define REPEAT(times) REPEAT_CNT(_repeat, __COUNTER__, times) #define REPEAT_CNT(_repeat, cnt, times) REPEAT_CNT_CAT(_repeat, cnt, times) #define REPEAT_CNT_CAT(_repeat, cnt, times) REPEAT_FROM_UNTIL(_repeat ## cnt, 0, times) #define REPEAT_UNTIL(name, times) REPEAT_FROM_UNTIL(name, 0, times) #define REPEAT_FROM_UNTIL(name, from, until) for (int name = from, name ## __until = (until); name < name ## __until; name++) #define repr(...) OVERLOAD3(__VA_ARGS__, REPR_FROM_UNTIL, REPR_UNTIL, REPEAT)(__VA_ARGS__) #define REPR_UNTIL(name, times) REPR_FROM_UNTIL(name, 0, times) #define REPR_FROM_UNTIL(name, from, until) for (int name = (until)-1, name ## __from = (from); name >= name ## __from; name--) template <typename T, typename U> bool chmin(T& var, U x) { if (var > x) { var = x; return true; } else return false; } template <typename T, typename U> bool chmax(T& var, U x) { if (var < x) { var = x; return true; } else return false; } ll power(ll e, ll t, ll mod = INF_LL) { ll res = 1; for (; t; t >>= 1, (e *= e) %= mod) if (t & 1) (res *= e) %= mod; return res; } ll choose(ll n, int r) { chmin(r, n-r); if (r < 0) return 0; ll res = 1; rep(i, r) res *= n-i, res /= i+1; return res; } template <typename T, typename U> T divceil(T m, U d) { return (m + d - 1) / d; } template <typename T> vector<T> make_v(size_t a, T b) { return vector<T>(a, b); } template <typename... Ts> auto make_v(size_t a, Ts... ts) { return vector<decltype(make_v(ts...))>(a, make_v(ts...)); } // debugging stuff #pragma GCC diagnostic push #pragma GCC diagnostic ignored "-Wmisleading-indentation" #define repi(it, ds) for (auto it = ds.begin(); it != ds.end(); it++) class DebugPrint { public: template <typename T> DebugPrint& operator <<(const T& v) { #ifdef LOCAL cerr << v; #endif return *this; } } debugos; template <typename T> DebugPrint& operator<<(DebugPrint& os, const vector<T>& vec) { os << "{"; for (int i = 0; i < vec.size(); i++) os << vec[i] << (i + 1 == vec.size() ? "" : ", "); os << "}"; return os; } template <typename T, typename U> DebugPrint& operator<<(DebugPrint& os, const map<T, U>& map_var) { os << "{"; repi(itr, map_var) { os << * itr; itr++; if (itr != map_var.end()) os << ", "; itr--; } os << "}"; return os; } template < typename T> DebugPrint& operator<<(DebugPrint& os, const set<T>& set_var) { os << "{"; repi( itr, set_var) { os << *itr; itr++; if (itr != set_var.end()) os << ", "; itr--; } os << "}"; return os; } template <typename T, typename U> DebugPrint& operator<<(DebugPrint& os, const pair<T, U>& p) { os << "(" << p.first << ", " << p.second << ")"; return os; } void dump_func( ) { debugos << newl; } template <class Head, class... Tail> void dump_func(Head &&head, Tail &&... tail) { debugos << head; if (sizeof...(Tail) > 0) { debugos << ", "; } dump_func(forward <Tail>(tail)...); } #ifdef LOCAL #define dump(...) debugos << " " << string(#__VA_ARGS__) << ": " << "[" << to_string(__LINE__) \ << ":" << __FUNCTION__ << "]" << newl << " ", dump_func(__VA_ARGS__) #else #define dump(...) ({}) #endif #pragma GCC diagnostic pop #line 2 "math/modint.cpp" #line 4 "math/modint.cpp" template <ll> class modint; template <ll MOD> constexpr modint<MOD> pow(modint<MOD>, ll); template <ll MOD = 1000000007> class modint { public: ll value; static constexpr ll Mod = MOD; constexpr modint(const ll x = 0) noexcept : value(x) { value %= MOD; if (value < 0) value += MOD; } constexpr bool operator==(const modint& rhs) { return value == rhs.value; } constexpr bool operator!=(const modint& rhs) { return value != rhs.value; } constexpr modint operator-() const { return modint(0) - *this; } constexpr modint operator+(const modint& rhs) const { return modint(*this) += rhs; } constexpr modint operator-(const modint& rhs) const { return modint(*this) -= rhs; } constexpr modint operator*(const modint& rhs) const { return modint(*this) *= rhs; } constexpr modint operator/(const modint& rhs) const { return modint(*this) /= rhs; } constexpr modint& operator+=(const modint& rhs) { value += rhs.value; if (value >= MOD) value -= MOD; return *this; } constexpr modint& operator-=(const modint& rhs) { if (value < rhs.value) value += MOD; value -= rhs.value; return *this; } constexpr modint& operator*=(const modint& rhs) { value = value * rhs.value % MOD; return *this; } constexpr modint& operator/=(const modint& rhs) { return *this *= pow(rhs, MOD - 2); } constexpr modint& operator++() { return *this += 1; } constexpr modint operator++(int) { modint tmp(*this); ++(*this); return tmp; } constexpr modint& operator--() { return *this -= 1; } constexpr modint operator--(int) { modint tmp(*this); --(*this); return tmp; } constexpr operator int() const { return (int)value; } constexpr operator ll() const { return value; } }; template <typename OutStream, ll MOD> OutStream& operator<<(OutStream& out, modint<MOD> n) { out << n.value; return out; } template <typename InStream, ll MOD> InStream& operator>>(InStream& in, modint<MOD>& n) { ll var; in >> var; n = modint<MOD>(var); return in; } template <ll MOD> constexpr modint<MOD> pow(modint<MOD> base, ll exp) { modint<MOD> res = 1; while (exp) { if (exp % 2) res *= base; base *= base; exp /= 2; } return res; } // O(r + log MOD) template <ll MOD> modint<MOD> choose(int n, int r) { chmin(r, n-r); if (r < 0) return modint<MOD>(0); modint<MOD> nu = 1, de = 1; rep(i, r) nu *= n-i, de *= i+1; return nu / de; } #line 5 "math/ntt.cpp" constexpr ll mods(int x) { const ll v[] = {1012924417, 924844033, 998244353, 897581057, 645922817}; return v[x]; } constexpr int primitive_roots(int x) { const int v[] = {5, 5, 3, 3, 3}; return v[x]; } template <int X = 2> class NTT { public: static constexpr int md = mods(X); static constexpr int rt = primitive_roots(X); using mint = modint<md>; private: vector<vector<mint>> root, rroot; void prepare(int n) { if (root.size() >= n) return; root.resize(n); rroot.resize(n); for (int i = 1; i < n; i <<= 1) { if (!root[i].empty()) continue; mint w = pow(mint(rt), (md - 1) / (i << 1)); mint rw = mint(1) / w; root[i].resize(i); rroot[i].resize(i); root[i][0] = mint(1); rroot[i][0] = mint(1); rep(k, 1, i) root[i][k] = root[i][k - 1] * w, rroot[i][k] = rroot[i][k - 1] * rw; } } public: void ntt(vector<mint>& A, bool reverse) { int n = A.size(); assert((n & (n - 1)) == 0); prepare(n); for (int i = 0, j = 1; j + 1 < n; j++) { for (int k = n >> 1; k > (i ^= k); k >>= 1) {} if (i > j) swap(A[i], A[j]); } for (int i = 1; i < n; i <<= 1) { for (int j = 0; j < n; j += i * 2) { for (int k = 0; k < i; k++) { mint z = A[i + j + k] * (reverse ? rroot[i][k] : root[i][k]); A[i + j + k] = A[j + k] - z; A[j + k] += z; } } } if (reverse) { mint tmp = mint(1) / mint(n); rep(i, n) A[i] *= tmp; } } vector<mint> multiply(vector<mint> A, vector<mint> B) { int need = A.size() + B.size() - 1; int sz = need <= 1 ? 1 : 1 << (32 - __builtin_clz(need - 1)); A.resize(sz, mint(0)); B.resize(sz, mint(0)); ntt(A, 0); ntt(B, 0); rep(i, sz) A[i] *= B[i]; ntt(A, 1); A.resize(need); return A; } vector<ll> multiply(vector<ll> A, vector<ll> B) { vector<mint> am(A.size()), bm(B.size()); rep(i, am.size()) am[i] = mint(A[i]); rep(i, bm.size()) bm[i] = mint(B[i]); vector<mint> cm = multiply(am, bm); vector<ll> cs(cm.size()); rep(i, cs.size()) cs[i] = cm[i].value; return cs; } }; #line 6 "math/garner-ntt.cpp" namespace Garner { static NTT<0> ntt0; static NTT<1> ntt1; static NTT<2> ntt2; static ll inv(ll x, ll md) { return power(x, md - 2, md); } ll garner(ll c0, ll c1, ll c2, ll m01, ll mod) { static ll r01 = inv(ntt0.md, ntt1.md); static ll r02 = inv(ntt0.md, ntt2.md); static ll r12 = inv(ntt1.md, ntt2.md); c1 = (ll)(c1 - c0) * r01 % ntt1.md; if (c1 < 0) c1 += ntt1.md; c2 = (ll)(c2 - c0) * r02 % ntt2.md; c2 = (ll)(c2 - c1) * r12 % ntt2.md; if (c2 < 0) c2 += ntt2.md; c0 %= mod; c0 += (ll)c1 * ntt0.md % mod; if (c0 >= mod) c0 -= mod; c0 += (ll)c2 * m01 % mod; if (c0 >= mod) c0 -= mod; return c0; } vector<ll> garner(vector<vector<ll>> &cs, ll mod) { ll m01 = (ll)ntt0.md * ntt1.md % mod; ll sz = cs[0].size(); vector<ll> res(sz); for (ll i = 0; i < sz; i++) res[i] = garner(cs[0][i], cs[1][i], cs[2][i], m01, mod); return res; } vector<ll> multiply(vector<ll> as, vector<ll> bs, ll mod) { vector<vector<ll>> cs(3); cs[0] = ntt0.multiply(as, bs); cs[1] = ntt1.multiply(as, bs); cs[2] = ntt2.multiply(as, bs); size_t sz = as.size() + bs.size() - 1; for (auto &v : cs) v.resize(sz); return garner(cs, mod); } template <ll Mod = 1000000007> vector<modint<Mod>> multiply(vector<modint<Mod>> am, vector<modint<Mod>> bm) { vector<ll> as(am.size()), bs(bm.size()); rep(i, am.size()) as[i] = am[i].v; rep(i, bm.size()) bs[i] = bm[i].v; vector<ll> cs = multiply(as, bs, Mod); vector<modint<Mod>> cm(cs.size()); rep(i, cs.size()) cm[i] = modint<Mod>(cs[i]); return cm; } }; // namespace Garner