// Single-file contest-style solution, documented as it appears here (all on one line).
//
// NOTE(review): this text does not look compilable as written and seems to have lost
// whatever sat between '<' and '>': `#include` names no header, `template` has no
// parameter list, `vector` has no element type, and the `rep` macro, `chmax`, `vec_out`
// and the beginning of `main` run straight into the next definition mid-expression.
// `#pragma` and the `#define`s are also not at the start of a line, and the tail ends
// inside an unterminated `/*` comment. Confirm against the original submission before
// building; the code below is unchanged.
//
// Visible pieces, in order:
//   - Aliases ll / ld and the constants ILL, INF and mod (998244353).
//   - LB / UB: offset from v.begin() of lower_bound / upper_bound for `a`; the vector
//     has to be ordered already for the result to be meaningful.
//   - chmin(a, b): assigns b to a when a > b and returns 1, otherwise returns 0.
//     chmax is presumably the mirror image; its body is not readable here.
//   - So / Sore: sort the vector ascending / with an `x>y` comparator (descending).
//   - yneos: prints "Yes\n" when the flag is true, "No\n" otherwise.
//   - vec_out: writes a single space before every element except the first; the rest of
//     its body is cut off.
//   - `rep(i,t) solve(); }`: presumably the end of main, calling solve() once per
//     iteration; everything before it in main is missing.
//   - solve(): reads N and M, creates `sum` with N+2 entries and M rows `seg[j]` of N+2
//     zeros, and seeds sum[0]=1, sum[1]=-1. For each i (presumably 0..N-1, the macro body
//     is cut) it multiplies X by M modulo mod and reduces sum[i] with `%= mod`. For each
//     j it reduces seg[j][i], takes tmp = sum[i]-seg[j][i], adds tmp at index i+1 and
//     subtracts it at min(i+j+1, N+1) in both seg[j] and sum, then carries seg[j][i] into
//     seg[j][i+1]. After the j loop sum[i] is carried into sum[i+1]. This looks like a
//     difference-array range add combined with a running prefix sum - TODO confirm.
//     `%=` on a negative ll keeps the sign, so entries can be negative at this point;
//     whether the result is normalised later is not visible. How X, sum and seg are
//     turned into output lies past the end of this view.
#include #pragma GCC optimize("Ofast") #define _GLIBCXX_DEBUG using namespace std; using std::cout; using std::cin; using std::endl; using ll=long long; using ld=long double; ll ILL=1167167167167167167; const int INF=2100000000; const ll mod=998244353; #define rep(i,a) for (ll i=0;i using _pq = priority_queue, greater>; template ll LB(vector &v,T a){return lower_bound(v.begin(),v.end(),a)-v.begin();} template ll UB(vector &v,T a){return upper_bound(v.begin(),v.end(),a)-v.begin();} template bool chmin(T &a,const T &b){if(a>b){a=b;return 1;}else return 0;} template bool chmax(T &a,const T &b){if(a void So(vector &v) {sort(v.begin(),v.end());} template void Sore(vector &v) {sort(v.begin(),v.end(),[](T x,T y){return x>y;});} void yneos(bool a){if(a) cout<<"Yes\n"; else cout<<"No\n";} template void vec_out(vector &p){for(int i=0;i<(int)(p.size());i++){if(i) cout<<" ";cout<>t; rep(i,t) solve(); } void solve(){ ll N,M; cin>>N>>M; vector sum(N+2); vector> seg(M); rep(i,M){ seg[i].resize(N+2,0); } sum[0]=1; sum[1]=-1; ll X=1; rep(i,N){ X=(X*M)%mod; sum[i]%=mod; rep(j,M){ seg[j][i]%=mod; ll tmp=sum[i]-seg[j][i]; seg[j][i+1]+=tmp; sum[i+1]+=tmp; ll x=(i+j+1); chmin(x,N+1); seg[j][x]-=tmp; sum[x]-=tmp; seg[j][i+1]+=seg[j][i]; } sum[i+1]+=sum[i]; } /*rep(i,N){ cout<