#line 2 "nachia\\fps\\formal-power-series-struct.hpp" #include #include #include #include #include #line 3 "nachia\\math-modulo\\modulo-primitive-root.hpp" #include namespace nachia{ template struct PrimitiveRoot{ static constexpr unsigned long long powm(unsigned long long a, unsigned long long i) { unsigned long long res = 1, aa = a; while(i){ if(i & 1) res = res * aa % MOD; aa = aa * aa % MOD; i /= 2; } return res; } static constexpr bool ExamineVal(unsigned int g){ unsigned int t = MOD - 1; for(unsigned long long d=2; d*d<=t; d++) if(t % d == 0){ if(powm(g, (MOD - 1) / d) == 1) return false; while(t % d == 0) t /= d; } if(t != 1) if(powm(g, (MOD - 1) / t) == 1) return false; return true; } static constexpr unsigned int GetVal(){ for(unsigned int x=2; x class Comb{ private: std::vector F; std::vector iF; public: void extend(int newN){ int prevN = (int)F.size() - 1; if(prevN >= newN) return; F.resize(newN+1); iF.resize(newN+1); for(int i=prevN+1; i<=newN; i++) F[i] = F[i-1] * Modint::raw(i); iF[newN] = F[newN].inv(); for(int i=newN; i>prevN; i--) iF[i-1] = iF[i] * Modint::raw(i); } Comb(int n = 1){ F.assign(2, Modint(1)); iF.assign(2, Modint(1)); extend(n); } Modint factorial(int n) const { return F[n]; } Modint invFactorial(int n) const { return iF[n]; } Modint invOf(int n) const { return iF[n] * F[n-1]; } Modint comb(int n, int r) const { if(n < 0 || n < r || r < 0) return Modint(0); return F[n] * iF[r] * iF[n-r]; } Modint invComb(int n, int r) const { if(n < 0 || n < r || r < 0) return Modint(0); return iF[n] * F[r] * F[n-r]; } Modint perm(int n, int r) const { if(n < 0 || n < r || r < 0) return Modint(0); return F[n] * iF[n-r]; } Modint invPerm(int n, int r) const { if(n < 0 || n < r || r < 0) return Modint(0); return iF[n] * F[n-r]; } Modint operator()(int n, int r) const { return comb(n,r); } }; } // namespace nachia #line 4 "nachia\\misc\\bit-operations.hpp" namespace nachia{ int Popcount(unsigned long long c) noexcept { #ifdef __GNUC__ return __builtin_popcountll(c); #else c = (c & (~0ull/3)) + ((c >> 1) & (~0ull/3)); c = (c & (~0ull/5)) + ((c >> 2) & (~0ull/5)); c = (c & (~0ull/17)) + ((c >> 4) & (~0ull/17)); c = (c * (~0ull/257)) >> 56; return c; #endif } // please ensure x != 0 int MsbIndex(unsigned long long x) noexcept { #ifdef __GNUC__ return 63 - __builtin_clzll(x); #else int res = 0; for(int d=32; d>0; d>>=1) if(x >> d){ res |= d; x >>= d; } return res; #endif } // please ensure x != 0 int LsbIndex(unsigned long long x) noexcept { #ifdef __GNUC__ return __builtin_ctzll(x); #else return MsbIndex(x & -x); #endif } } #line 2 "nachia\\fps\\ntt-interface.hpp" namespace nachia { template struct NttInterface{ template void Butterfly(Iter, int) const {} template void IButterfly(Iter, int) const {} template void BitReversal(Iter a, int N) const { for(int i=0, j=0; j>1; k > (i^=k); k>>=1); } } }; } // namespace nachia #line 5 "nachia\\fps\\ntt-acl.hpp" #include #line 8 "nachia\\fps\\ntt-acl.hpp" #include namespace nachia{ constexpr int bsf_constexpr(unsigned int n) { int x = 0; while (!(n & (1 << x))) x++; return x; } template struct NttFromAcl : NttInterface { using u32 = unsigned int; using u64 = unsigned long long; static int ceil_pow2(int n) { int x = 0; while ((1U << x) < (u32)(n)) x++; return x; } struct fft_info { static constexpr u32 g = nachia::PrimitiveRoot::val; static constexpr int rank2 = bsf_constexpr(mint::mod()-1); std::array root; std::array iroot; std::array rate2; std::array irate2; std::array rate3; std::array irate3; fft_info(){ root[rank2] = mint(g).pow((mint::mod() - 1) >> rank2); iroot[rank2] = root[rank2].inv(); for(int i=rank2-1; i>=0; i--){ root[i] = root[i+1] * root[i+1]; iroot[i] = iroot[i+1] * iroot[i+1]; } mint prod = 1, iprod = 1; for(int i=0; i<=rank2-2; i++){ rate2[i] = root[i+2] * prod; irate2[i] = iroot[i+2] * iprod; prod *= iroot[i+2]; iprod *= root[i+2]; } prod = 1; iprod = 1; for(int i=0; i<=rank2-3; i++){ rate3[i] = root[i+3] * prod; irate3[i] = iroot[i+3] * iprod; prod *= iroot[i+3]; iprod *= root[i+3]; } } }; template void Butterfly(RandomAccessIterator a, int n) const { int h = ceil_pow2(n); static const fft_info info; int len = 0; while(len < h){ if(h-len == 1){ int p = 1 << (h-len-1); mint rot = 1; for(int s=0; s<(1< void IButterfly(RandomAccessIterator a, int n) const { int h = ceil_pow2(n); static const fft_info info; constexpr int MOD = mint::mod(); int len = h; while(len){ if(len == 1){ int p = 1 << (h-len); mint irot = 1; for(int s=0; s<(1<<(len-1)); s++){ int offset = s << (h-len+1); for(int i=0; i> struct FormalPowerSeriesNTT { public: using Fps = FormalPowerSeriesNTT; using ElemTy = Elem; static constexpr unsigned int MOD = Elem::mod(); static constexpr int CONV_THRES = 30; static const NttInst nttInst; static const unsigned int zeta = nachia::PrimitiveRoot::GetVal(); private: using u32 = unsigned int; static Elem ZeroElem() noexcept { return Elem(0); } static Elem OneElem() noexcept { return Elem(1); } static Comb comb; std::vector a; public: int size() const noexcept { return a.size(); } Elem& operator[](int x) noexcept { return a[x]; } const Elem& operator[](int x) const noexcept { return a[x]; } Elem getCoeff(int x) const noexcept { return (0 <= x && x < size()) ? a[x] : ZeroElem(); } static Comb& GetComb() { return comb; } static int BestNttSize(int x) noexcept { assert(x); return 1 << MsbIndex(x*2-1); } Fps move(){ return std::move(*this); } Fps& set(int i, Elem c){ a[i] = c; return *this; } Fps& removeLeadingZeros(){ int newsz = size(); while(newsz && a[newsz-1].val() == 0) newsz--; a.resize(newsz); if((int)a.capacity() / 4 > newsz) a.shrink_to_fit(); return *this; } FormalPowerSeriesNTT(){} FormalPowerSeriesNTT(int sz) : a(sz, ZeroElem()) {} FormalPowerSeriesNTT(std::vector&& src) : a(std::move(src)) {} FormalPowerSeriesNTT(const std::vector& src) : a(src) {} Fps& ntt() { capSize(BestNttSize(size())); nttInst.Butterfly(a.begin(), size()); return *this; } Fps& intt() { nttInst.IButterfly(a.begin(), a.size()); return times(Elem::raw(size()).inv()); } Fps nttDouble(Fps vanilla) const { int n = size(); assert(n == (n&-n)); // n is a power of 2 Elem q = Elem::raw(zeta).pow((Elem::mod() - 1) / (n*2)); Elem qq = Elem::raw(1); for(int i=0; i srcR = max(srcL, size()); // if resSz is unspecified -> resSz = destL + srcR - srcL Fps clip(int srcL, int srcR = -1, int destL = 0, int resSz = -1) const { if(srcR < 0) srcR = std::max(srcL, size()); if(resSz < 0) resSz = destL + srcR - srcL; if(srcR > size()) srcR = size(); Fps res(resSz); for(int j=std::max(0, -srcL); j+destL < resSz && j+srcL < srcR; j++) res[j+destL] = a[j+srcL]; return res; } Fps clip() const { return *this; } Fps& capSize(int l, int r) { if(r <= (int)size()) a.resize(r); if(size() <= l) a.resize(l, ZeroElem()); return *this; } Fps& capSize(int z){ a.resize(z, ZeroElem()); return *this; } Fps& times(Elem x){ for(int i=0; i b.size()) return convolution(b, a, sz); if(sz < 0) sz = std::max(0, a.size() + b.size() - 1); std::vector res(sz); for(int i=0; i=1; i--) a[i] = a[i-1] * comb.invOf(i); return set(0, ZeroElem()); } Fps log(int sz = -1){ if(sz < 0) sz = size(); assert(sz != 0); assert(a[0].val() == 1); return convolution(inv(sz), clip().difference(), sz-1).integral(); } Fps exp(int sz = -1){ if(sz < 0) sz = size(); Fps res = Fps(1).set(0, OneElem()); while(res.size() < sz){ auto z = res.size(); auto tmp = res.capSize(z*2).log().set(0, -OneElem()).move(); for(int i=0; i= (n-1) / k + 1) return Fps(n); Fps res = clip(ctz, ctz+n-ctz*k); Elem a0 = res[0]; ctz *= k; n -= ctz; return res.times(a0.inv()).log(n).times(Elem(k)).exp(n).times(a0.pow(k)).clip(0, n, ctz); } auto begin(){ return a.begin(); } auto end(){ return a.end(); } auto begin() const { return a.begin(); } auto end() const { return a.end(); } std::string toString(std::string beg = "[ ", std::string delim = " ", std::string en = " ]") const { std::string res = beg; bool f = false; for(auto x : a){ if(f){ res += delim; } f = true; res += std::to_string(x.val()); } res += en; return res; } std::vector getVectorMoved(){ return std::move(a); } Fps& operator+=(const Fps& r){ capSize(std::max(size(), r.size())); for(int i=0; i=0; i--) res = res * x + a[i]; return res; } }; template Comb FormalPowerSeriesNTT::comb; template const NttInst FormalPowerSeriesNTT::nttInst; } // namespace nachia #line 5 "nachia\\linear\\matrix-on-ring.hpp" namespace nachia{ template struct MatrixOnRing{ private: int h; int w; std::vector elems; public: MatrixOnRing(int new_h=0, int new_w=0){ h = new_h; w = new_w; elems.resize(h * w); } MatrixOnRing(MatrixOnRing const&) = default; int numRow() const { return h; } int numColumn() const { return w; } int height() const { return numRow(); } int width() const { return numColumn(); } typename std::vector::iterator operator[](int y){ return elems.begin() + (y*w); } typename std::vector::const_iterator operator[](int y) const { return elems.begin() + (y*w); } static MatrixOnRing Identity(int idx, Elem One){ auto res = MatrixOnRing(idx, idx); for(int i=0; i MatrixOnRing PRecursiveMatrixProduct( MatrixOnRing> p, unsigned long long idx ){ struct ShiftOfSamplingPointsOfPolynomialUpdate{ using Fps = FormalPowerSeriesNTT; int n; int N2; Fps iF, F, iFI, iFIntt1, iFntt; std::vector iFIntt2s; ShiftOfSamplingPointsOfPolynomialUpdate(int n, std::vector sh){ auto& comb = Fps::GetComb(); comb.extend(n); this->n = n; N2 = Fps::BestNttSize(n*2); iF = F = iFI = Fps(n); for(int i=0; i> calc(const std::vector& points){ Fps P(N2); for(int i=0; i> res2(iFIntt2s.size()); for(size_t shi=0; shi> res; res.resize(h*h); for(auto& a : res) a.resize(h); u64 a = 1, b = 1; for(int i=0; i MatrixOnRing { MatrixOnRing res(h, h); for(int y=0; y MatrixOnRing { MatrixOnRing g(h, h); for(int y=0; y sh(3); sh[0] = Elem(b); sh[1] = Elem(a) / Elem(maxA); sh[2] = sh[0] + sh[1]; std::vector>> shbuf(h*h); auto shman = ShiftOfSamplingPointsOfPolynomialUpdate(b, sh); for(int i=0; i> resbuf; resbuf.assign(h*h, std::vector(b*2)); for(int i=0; i ans = MatrixOnRing::Identity(h, Elem::raw(1)); while(pos + maxA <= idx){ ans = EvalL(pos / maxA) * ans; pos += maxA; } while(pos < idx){ ans = EvalP(pos++) * ans; } return ans; } } // namespace nachia #line 2 "nachia\\fps\\ntt-setup-manager.hpp" namespace nachia{ template class FpsNttSetupManager { using ElemTy = Elem; using Fps = typename nachia::FormalPowerSeriesNTT; using MyType = FpsNttSetupManager; Fps raw; mutable Fps ntt; static const int THRESH = 30; FpsNttSetupManager(Fps _raw) : raw(_raw.move()) , ntt() {} public: FpsNttSetupManager() : FpsNttSetupManager(Fps()) {} FpsNttSetupManager(Fps _raw, Fps _ntt) : raw(_raw.move()) , ntt(_ntt.move()) {} const Fps& getRaw() const { return raw; } int size() const { return raw.size(); } int Least(){ return Fps::BestNttSize(raw.size()); } static MyType FromRaw(Fps _raw){ return FpsNttSetupManager(_raw.move()); } static MyType FromNtt(Fps _ntt){ Fps x = _ntt.clip(); return MyType(x.intt().removeLeadingZeros().move(), _ntt.move()); } void doubling() const { if(ntt.size() == 0) ntt = raw.clip(0, Fps::BestNttSize(raw.size())).ntt().move(); else ntt = ntt.nttDouble(raw.clip(0, ntt.size())); } Fps& ensureNtt(int sz) const { if(sz / 8 >= ntt.size()) ntt = raw.clip(0, sz).ntt().move(); while(ntt.size() < sz) doubling(); return ntt; } Fps nttClip(int sz) const { return ensureNtt(sz).clip(0,sz); } std::pair destruct(){ return std::make_pair(raw.move(), ntt.move()); } MyType operator+(const MyType& r) const { Fps nntt; int z1 = std::min(ntt.size(), r.ntt.size()); if(z1 >= std::max(size(), r.size())){ nntt.capSize(std::min(ntt.size(), r.ntt.size())); for(int i=0; i #include #include #line 6 "nachia\\misc\\fastio.hpp" namespace nachia{ struct CInStream{ private: static const unsigned int INPUT_BUF_SIZE = 1 << 17; unsigned int p = INPUT_BUF_SIZE; static char Q[INPUT_BUF_SIZE]; public: using MyType = CInStream; char seekChar() noexcept { if(p == INPUT_BUF_SIZE){ size_t len = fread(Q, 1, INPUT_BUF_SIZE, stdin); if(len != INPUT_BUF_SIZE) Q[len] = '\0'; p = 0; } return Q[p]; } void skipSpace() noexcept { while(isspace(seekChar())) p++; } uint32_t nextU32() noexcept { skipSpace(); uint32_t buf = 0; while(true){ char tmp = seekChar(); if('9' < tmp || tmp < '0') break; buf = buf * 10 + (tmp - '0'); p++; } return buf; } int32_t nextI32() noexcept { skipSpace(); if(seekChar() == '-'){ p++; return (int32_t)(-nextU32()); } return (int32_t)nextU32(); } uint64_t nextU64() noexcept { skipSpace(); uint64_t buf = 0; while(true){ char tmp = seekChar(); if('9' < tmp || tmp < '0') break; buf = buf * 10 + (tmp - '0'); p++; } return buf; } int64_t nextI64() noexcept { skipSpace(); if(seekChar() == '-'){ p++; return (int64_t)(-nextU64()); } return (int64_t)nextU64(); } char nextChar() noexcept { skipSpace(); char buf = seekChar(); p++; return buf; } std::string nextToken(){ skipSpace(); std::string buf; while(true){ char ch = seekChar(); if(isspace(ch) || ch == '\0') break; buf.push_back(ch); p++; } return buf; } MyType& operator>>(unsigned int& dest) noexcept { dest = nextU32(); return *this; } MyType& operator>>(int& dest) noexcept { dest = nextI32(); return *this; } MyType& operator>>(unsigned long& dest) noexcept { dest = nextU64(); return *this; } MyType& operator>>(long& dest) noexcept { dest = nextI64(); return *this; } MyType& operator>>(unsigned long long& dest) noexcept { dest = nextU64(); return *this; } MyType& operator>>(long long& dest) noexcept { dest = nextI64(); return *this; } MyType& operator>>(std::string& dest){ dest = nextToken(); return *this; } MyType& operator>>(char& dest) noexcept { dest = nextChar(); return *this; } } cin; struct FastOutputTable{ char LZ[1000][4] = {}; char NLZ[1000][4] = {}; constexpr FastOutputTable(){ using u32 = uint_fast32_t; for(u32 d=0; d<1000; d++){ LZ[d][0] = ('0' + d / 100 % 10); LZ[d][1] = ('0' + d / 10 % 10); LZ[d][2] = ('0' + d / 1 % 10); LZ[d][3] = '\0'; } for(u32 d=0; d<1000; d++){ u32 i = 0; if(d >= 100) NLZ[d][i++] = ('0' + d / 100 % 10); if(d >= 10) NLZ[d][i++] = ('0' + d / 10 % 10); if(d >= 1) NLZ[d][i++] = ('0' + d / 1 % 10); NLZ[d][i++] = '\0'; } } }; struct COutStream{ private: using u32 = uint32_t; using u64 = uint64_t; using MyType = COutStream; static const u32 OUTPUT_BUF_SIZE = 1 << 17; static char Q[OUTPUT_BUF_SIZE]; static constexpr FastOutputTable TB = FastOutputTable(); u32 p = 0; static constexpr u32 P10(u32 d){ return d ? P10(d-1)*10 : 1; } static constexpr u64 P10L(u32 d){ return d ? P10L(d-1)*10 : 1; } template static void Fil(T& m, U& l, U x) noexcept { m = l/x; l -= m*x; } void next_dig9(u32 x){ u32 y; Fil(y, x, P10(6)); nextCstr(TB.LZ[y]); Fil(y, x, P10(3)); nextCstr(TB.LZ[y]); nextCstr(TB.LZ[x]); } public: void nextChar(char c){ Q[p++] = c; if(p == OUTPUT_BUF_SIZE){ fwrite(Q, p, 1, stdout); p = 0; } } void nextEoln(){ nextChar('\n'); } void nextCstr(const char* s){ while(*s) nextChar(*(s++)); } void nextU32(uint32_t x){ u32 y = 0; if(x >= P10(9)){ Fil(y, x, P10(9)); nextCstr(TB.NLZ[y]); next_dig9(x); } else if(x >= P10(6)){ Fil(y, x, P10(6)); nextCstr(TB.NLZ[y]); Fil(y, x, P10(3)); nextCstr(TB.LZ[y]); nextCstr(TB.LZ[x]); } else if(x >= P10(3)){ Fil(y, x, P10(3)); nextCstr(TB.NLZ[y]); nextCstr(TB.LZ[x]); } else if(x >= 1) nextCstr(TB.NLZ[x]); else nextChar('0'); } void nextI32(int32_t x){ if(x >= 0) nextU32(x); else{ nextChar('-'); nextU32((u32)-x); } } void nextU64(uint64_t x){ u32 y = 0; if(x >= P10L(18)){ Fil(y, x, P10L(18)); nextU32(y); Fil(y, x, P10L(9)); next_dig9(y); next_dig9(x); } else if(x >= P10L(9)){ Fil(y, x, P10L(9)); nextU32(y); next_dig9(x); } else nextU32(x); } void nextI64(int64_t x){ if(x >= 0) nextU64(x); else{ nextChar('-'); nextU64((u64)-x); } } void writeToFile(bool flush = false){ fwrite(Q, p, 1, stdout); if(flush) fflush(stdout); p = 0; } COutStream(){ Q[0] = 0; } ~COutStream(){ writeToFile(); } MyType& operator<<(unsigned int tg){ nextU32(tg); return *this; } MyType& operator<<(unsigned long tg){ nextU64(tg); return *this; } MyType& operator<<(unsigned long long tg){ nextU64(tg); return *this; } MyType& operator<<(int tg){ nextI32(tg); return *this; } MyType& operator<<(long tg){ nextI64(tg); return *this; } MyType& operator<<(long long tg){ nextI64(tg); return *this; } MyType& operator<<(const std::string& tg){ nextCstr(tg.c_str()); return *this; } MyType& operator<<(const char* tg){ nextCstr(tg); return *this; } MyType& operator<<(char tg){ nextChar(tg); return *this; } } cout; char CInStream::Q[INPUT_BUF_SIZE]; char COutStream::Q[OUTPUT_BUF_SIZE]; } // namespace nachia #line 5 "Main.cpp" #include #line 7 "Main.cpp" int main(){ using Modint = atcoder::static_modint<998244353>; using Polynomial = nachia::FormalPowerSeriesNTT; using PolynomialMat = nachia::MatrixOnRing; using NttSetup = nachia::FpsNttSetupManager; using NttSetupMat = nachia::MatrixOnRing; using nachia::cin, nachia::cout; auto MatMod = [&](NttSetupMat mat, NttSetup mod) -> NttSetupMat { int n = mat.height(); NttSetupMat res(n, n); int maxlen = 0; for(int i=0; i> T; if(T <= 5){ for(int t=0; t> N >> K; if(K >= 998244353){ cout << "0\n"; continue; } PolynomialMat M_nX = PolynomialMat(2,2); M_nX[0][0] = std::vector{ Modint(N) * 2 , -Modint(2) }; // 2N - 2k M_nX[0][1] = std::vector{ 0, (Modint(N)*2+1) / 2, -Modint(1) / 2 }; // (2N+1)k/2 - k^2/2 M_nX[1][0] = std::vector{ 1 }; M_nX[1][1] = std::vector{}; auto ansMat = nachia::PRecursiveMatrixProduct(M_nX, K); Modint ans = ansMat[0][0]; cout << ans.val() << '\n'; } } else{ int MAX_K = 100000; int MATRIX_QUERY = 1001001001; std::vector> NK(T); for(auto& nk : NK) cin >> nk.first >> nk.second; std::vector> queries; for(int k=0; k x){ return NttSetup::FromRaw(x); }; std::vector FX; std::vector KX; FX.assign(segN*2, NttSetupMat::Identity(2, ConstructNttSetup({1}))); KX.assign(segN*2, ConstructNttSetup({1})); for(int q=0; q<(int)queries.size(); q++){ if(queries[q].second == MATRIX_QUERY){ int k = queries[q].first; FX[segN+q][0][0] = ConstructNttSetup({ -Modint(k)*2, Modint(2) }); // 2N - 2k FX[segN+q][0][1] = ConstructNttSetup({ Modint(k)*(1-k) / 2, Modint(k) }); // Nk + k(1-k)/2 FX[segN+q][1][0] = ConstructNttSetup({ 1 }); FX[segN+q][1][1] = ConstructNttSetup({}); } else{ unsigned long long N = NK[queries[q].second].first; KX[segN+q] = ConstructNttSetup({ -Modint(N), 1 }); // x - N } } for(int i=segN-1; i>=1; i--) FX[i] = FX[i*2+1] * FX[i*2]; for(int i=segN-1; i>=1; i--) KX[i] = KX[i*2+1] * KX[i*2]; std::vector FXmodKX(segN*2); FXmodKX[1] = MatMod(NttSetupMat::Identity(2, ConstructNttSetup({1})), std::move(KX[1])); for(int i=1; i<=segN-1; i++){ FXmodKX[i*2+1] = MatMod(FX[i*2] * FXmodKX[i], std::move(KX[i*2+1])); FXmodKX[i*2] = MatMod(std::move(FXmodKX[i]), std::move(KX[i*2])); } std::vector ans(T); for(int q=0; q<(int)queries.size(); q++){ if(queries[q].second != MATRIX_QUERY){ ans[queries[q].second] = FXmodKX[segN+q][0][0].getRaw().eval(0); } } for(int i=0; i