#pragma GCC optimize("O3") #include "bits/stdc++.h" #include #include "atcoder/all" #include using namespace boost::multiprecision; using namespace std; using namespace atcoder; using ll = long long; using ull = unsigned long long; using mint = modint998244353; using mint2 = modint1000000007; const double eps = 1e-9; #define OVERLOAD3(_1, _2, _3, call,...) call #define REP0(n) for (ll i = 0; i < ll(n); ++i) #define REP1(i, n) for (ll i = 0; i < ll(n); ++i) #define REP2(i, a, b) for (ll i = ll(a); i < ll(b); ++i) #define REP(...) OVERLOAD3(__VA_ARGS__, REP2, REP1, REP0)(__VA_ARGS__) #define RREP0(n) for (ll i = ll(n) - 1; i >= 0; --i) #define RREP1(i, n) for (ll i = ll(n) - 1; i >= 0; --i) #define RREP2(i, a, b) for (ll i = ll(a) - 1; i >= b; --i) #define RREP(...) OVERLOAD3(__VA_ARGS__, RREP2, RREP1, RREP0)(__VA_ARGS__) #define REPE(i, c) for (auto&& i : c) #define TCASE() ll _ttt; cin >> _ttt; while(_ttt--) template void COMMON_IN(T&... a) { (cin >> ... >> a); } #define LI(...) ll __VA_ARGS__; COMMON_IN(__VA_ARGS__); #define SI(...) string __VA_ARGS__; COMMON_IN(__VA_ARGS__); using vl = vector; using vvl = vector; using vvvl = vector; #define VLI(a, n) vector a; a.assign(n, 0); for(auto& x : a) cin >> x; #define DLI(a, n) deque a; a.assign(n, 0); for(auto& x : a) cin >> x; #define VSI(a, n) vector a; a.assign(n, ""); for(auto& x : a) cin >> x; #define VVLI(a, n, m) vector> a(n, vector(m)); for(auto& x : a) for(auto& y : x) cin >> y; using vd = vector; using pl = pair; using vpl = vector; using vvpl = vector; struct uv { ll u; ll v; }; struct uvc { ll u; ll v; ll c = 1; }; #define VUVI(a, n) vector a; a.assign(n, {0, 0}); for(auto& x : a) {cin >> x.u >> x.v; x.u--; x.v--;} #define VUVCI(a, n) vector a; a.assign(n, {0, 0, 0}); for(auto& x : a) {cin >> x.u >> x.v >> x.c; x.u--; x.v--;} vvl to_edge(const ll n, const vector& v) { vvl ret(n); for (auto& x : v) ret[x.u].emplace_back(x.v); return ret; } vvl to_edge_d(const ll n, const vector& v) { vvl ret(n); for (auto& x : v) { ret[x.u].emplace_back(x.v); ret[x.v].emplace_back(x.u); } return ret; } vvpl to_edge_d(const ll n, const vector& v) { vvpl ret(n); for (auto& x : v) { ret[x.u].emplace_back(x.v, x.c); ret[x.v].emplace_back(x.u, x.c); } return ret; } template using pql = priority_queue; template using pqg = priority_queue, greater>; using vm = vector; using vvm = vector; template requires std::is_base_of_v ostream& operator<<(ostream& os, const T& v) { os << v.val(); return os; } void yn(bool f) { std::cout << (f ? "Yes" : "No") << "\n"; }; template void ov(const T& v) { for (auto it = v.begin(); it != v.end(); it++) { if (it != v.begin()) cout << " "; cout << *it; } }; template void ovn(const T& v) { ov(v); cout << "\n"; }; const ll llhuge = 1LL << 61; //十分でかいが多少足しても溢れない数値 auto gmax(const auto& a, const auto& b) { return a > b ? a : b; }; auto gmin(const auto& a, const auto& b) { return a < b ? a : b; }; bool chmin(auto& a, const auto& b) { const auto olda = a; a = gmin(a, b); return olda != a; } bool chmax(auto& a, const auto& b) { const auto olda = a; a = gmax(a, b); return olda != a; } void sort(auto& v) { std::ranges::sort(v); }; void rev(auto& v) { std::ranges::reverse(v); }; template auto p_sum(const T& v) { T ret(v.size()); std::partial_sum(begin(v), end(v), ret.begin()); return ret; }; template [[nodiscard]] V myat(const T& mp, const K& key) { return mp.find(key) == mp.end() ? V() : mp.at(key); } long long ceil(const long long a, const long long b) { return (a + b - 1) / b; } vector to_binary_fast(const string& s) { const int BASE = 1000000000; vector a; for (int i = s.size(); i > 0; i -= 9) { int l = max(0, i - 9); int len = i - l; a.push_back(stoull(s.substr(l, len))); } vector bits; while (!a.empty()) { uint64_t rem = 0; for (int i = (int)a.size() - 1; i >= 0; --i) { uint64_t cur = a[i] + rem * BASE; a[i] = cur / 2; rem = cur % 2; } bits.push_back((uint8_t)rem); while (!a.empty() && a.back() == 0) a.pop_back(); } reverse(bits.begin(), bits.end()); return bits; } int main() { cin.tie(nullptr); ios::sync_with_stdio(false); TCASE() { LI(n, m); REP(m) { SI(k); if (k == "0") { cout << 1 << "\n"; continue; } if (n == 0) { cout << 1 << "\n"; continue; } // k++ (10進文字列でインクリメント) int carry = 1; for (int i = (int)k.size() - 1; i >= 0; --i) { int d = (k[i] - '0') + carry; k[i] = char('0' + (d % 10)); carry = d / 10; } if (carry) k.insert(k.begin(), '1'); vector bits = to_binary_fast(k); rev(bits); int rp = 1; int rs = 0; int cp = n; int cs = 1; for(auto b : bits) { if (b) { rs = (rs + (rp * cs) % 998) % 998; rp = (rp * cp) % 998; } int ncp = cp * cp % 998; int ncs = (cs * ((cp + 1) % 998)) % 998; cp = ncp; cs = ncs; } cout << rs << "\n"; } } }