// NOTE(review): the line below is an entire C++ program collapsed onto one
// physical line, and parts of it are missing: `#include` names no header, both
// `template` declarations lack a parameter list, the body of chmax runs
// straight into the declaration of chmin, the loop header `for(x=1;x=j)` is
// incomplete, and the visible text stops at `cout<`. Presumably every span
// between a '<' and a later '>' was stripped during extraction -- TODO restore
// from the original source before building. As written, everything after the
// first `//` on the line is a single comment to the compiler.
//
// Contents, in order of appearance:
//   ll, _P, FOR, FORR, FORR2, ALL, ZERO, MINUS
//       Shorthand typedef and macros.
//   chmax, chmin
//       chmin assigns b to a and returns 1 when a>b, otherwise returns 0.
//       chmax's body is truncated; presumably the mirror image -- TODO confirm.
//   mo
//       The modulus; solve() reads it from standard input.
//   fact, factr, inv   (NUM_+1 entries each, NUM_ = 400001)
//       Filled by solve(): fact[i] = fact[i-1]*i % mo,
//       factr[i] = factr[i-1]*inv[i] % mo, and
//       inv[i] = inv[mo % i] * (mo - mo / i) % mo.
//       These are factorials, inverse factorials and modular inverses provided
//       mo is a prime larger than NUM_ -- assumption, TODO confirm.
//   comb(N_, C_)
//       Returns 0 when C_<0 or C_>N_, otherwise
//       factr[C_]*fact[N_]*factr[N_-C_] reduced mod mo. The
//       `if (fact[0]==0) { }` guard is empty, so the tables must already have
//       been filled before the call.
//   modpow(a, n)
//       Square-and-multiply loop returning a^n mod mo. The default exponent is
//       mo-2, which gives the modular inverse of a if mo is prime -- TODO confirm.
//   F, FS, G, sum1, sumA, sumB
//       Global work arrays used by solve().
//   solve()
//       Reads N and mo, fills the tables above, then computes
//         F[i]  = N^(N-i) * fact[N-2] * factr[N-i] mod mo   for 2 <= i <= N,
//         FS[i] = FS[i-1] + F[i] mod mo                     for 2 <= i <= 2*N,
//         G[i]  = G[i+1] + (F[i+2] + F[i+3] + ... + F[N+2]) mod mo, i = N..1.
//       The loop over L branches on L<=330 and updates sum1/sumA/sumB; most of
//       that loop is missing from the visible text. NOTE(review): with a second
//       array dimension of 332 this looks like a small/large split on L --
//       confirm against the original.
//       The answer is accumulated in ret and multiplied by N*(N-1) mod mo in
//       the last complete statement that is visible.
#include using namespace std; typedef signed long long ll; #define _P(...) (void)printf(__VA_ARGS__) #define FOR(x,to) for(x=0;x<(to);x++) #define FORR(x,arr) for(auto& x:arr) #define FORR2(x,y,arr) for(auto& [x,y]:arr) #define ALL(a) (a.begin()),(a.end()) #define ZERO(a) memset(a,0,sizeof(a)) #define MINUS(a) memset(a,0xff,sizeof(a)) template bool chmax(T &a, const T &b) { if(a bool chmin(T &a, const T &b) { if(a>b){a=b;return 1;}return 0;} //------------------------------------------------------- ll mo; const int NUM_=400001; static ll fact[NUM_+1],factr[NUM_+1],inv[NUM_+1]; ll comb(ll N_, ll C_) { if (fact[0]==0) { } if(C_<0 || C_>N_) return 0; return factr[C_]*fact[N_]%mo*factr[N_-C_]%mo; } ll modpow(ll a, ll n = mo-2) { ll r=1;a%=mo; while(n) r=r*((n%2)?a:1)%mo,a=a*a%mo,n>>=1; return r; } int N; ll F[201010]; ll FS[201010]; ll G[101010]; ll sum1[201010]; ll sumA[101010][332]; ll sumB[101010][332]; void solve() { int i,j,k,l,r,x,y; string s; cin>>N>>mo; inv[1]=fact[0]=factr[0]=1; for (int i=2;i<=NUM_;++i) inv[i] = inv[mo % i] * (mo - mo / i) % mo; for (int i=1;i<=NUM_;++i) fact[i]=fact[i-1]*i%mo, factr[i]=factr[i-1]*inv[i]%mo; for(i=2;i<=2*N;i++) { if(i<=N) F[i]=modpow(N,N-i)*fact[N-2]%mo*factr[N-i]%mo; (FS[i]=FS[i-1]+F[i])%=mo; } ll add=0; for(i=N;i>=1;i--) { (add+=F[i+2])%=mo; (G[i]=G[i+1]+add)%=mo; } for(int L=1;L<=N;L++) { // Positions below L are unreachable. sum1[1]+=N+1-L; sum1[L]-=N+1-L; if(L<=330) { for(int d=1;d*L<=N;d++) { int add=0; for(x=1;x=j) { sumA[i][j]+=sumA[i-j][j]; sumB[i][j]+=sumB[i-j][j]; } sumB[i][j]+=sumA[i][j]; sum1[i]+=sumB[i][j]; } } ll ret=0; ll pat=0; ll SR=0; ll SL=1LL*N*(N+1)/2%mo; for(i=1;i<=N;i++) { // 2 is outside the cycle. (ret+=(SL+mo-sum1[i])%mo*G[i])%=mo; // 2 is inside the cycle. (pat+=(1LL*i*(i+1)/2-1)%mo*F[i])%=mo; // Number of R with R>L when L=i. SR+=N-i; } // 2 is inside the cycle and L>R. (ret+=SR%mo*pat)%=mo; // 2 is inside the cycle and L=R. for(int d=1;d<=N-1;d++) for(int c=1;c<=N;c++) { ll g=(FS[d+c]+mo-FS[max(d,c-1)])%mo; for(int L=1;L<=N;L++) if(d%__gcd(c,L)==0) (ret+=g)%=mo; } ret=ret*N%mo*(N-1)%mo; cout<