// NOTE(review): this copy of the file is damaged and does not compile as shown.
//  * Header names after `#include` and every template parameter/argument list
//    are missing (e.g. `typedef vector vi;`, `templatebool chmax(...)`), and
//    some function bodies are cut mid-expression -- presumably everything
//    between a '<' and the next '>' was stripped by an extraction step.
//  * The original line breaks are gone, so the `#include`/`#define` directives
//    and the `//*/` marker now swallow the rest of the first physical line.
//  * The last statement stops at `cout<`; the end of the program is not present.
// Restore the file from the original submission before changing any logic.
//
// What the visible fragments show:
//  * Short aliases (ll, ld, vi/vl/vb/vm families, pl, ...) and helper macros:
//    rep/rrep (ascending/descending int loops over [a,b)), all, sz, F/S for
//    first/second, and bs/lb/ub/cou wrapping binary_search/lower_bound/
//    upper_bound over a whole container.
//  * Stream operators for mint, pair and vector. The definition of `mint` is
//    among the lost text -- presumably an AtCoder modint alias; TODO confirm.
//  * relaxed_convolution: keeps vectors F, G, H. query(x, y) appends x to F and
//    y to G, then loops over i and calls convolution() on sub-ranges of F and G
//    (a range [l, r) and a block addressed via n+1-(1<<i)). The index
//    computations, the accumulation loops and the return statement are lost;
//    presumably this is an online (relaxed) convolution returning the newest
//    product coefficient -- verify against the original.
//  * Trailing driver statements (presumably the body of main; its header is
//    lost): read N and M; fill ex with ex[0]=1, ex[i]=i*ex[i-1] (factorials)
//    and re[i]=1/ex[i] for i < 2e6 (re is not used in the visible remainder);
//    read the M values A and mark T[0] and every T[A[i]]; for i in [0, N) take
//    r = C.query(DP[i], -2*ex[i+2]) and, only when T[i+1] is set, store
//    DP[i+1] = r - 2*ex[i+1]; finally ans = 2*ex[N] + sum over i in [1, N] of
//    ex[N-i+1]*DP[i]. The statement that prints the result is truncated.
#include #include using namespace std; using namespace atcoder; typedef long long int ll; typedef long double ld; typedef vector vi; typedef vector vl; typedef vector vvl; typedef vector vvvl; typedef vector vvvvl; typedef vector vb; typedef vector vvb; typedef vector vvvb; typedef vector vvvvb; typedef pair pl; typedef pair ppl; typedef pair pppl; typedef pair pppppl; #define rep(i,a,b) for(int i=(a);i<(b);i++) #define rrep(i,a,b) for(int i=(b)-1;i>=(a);i--) #define all(a) begin(a),end(a) #define sz(a) (int)(a).size() #define F first #define S second #define bs(A,x) binary_search(all(A),x) #define lb(A,x) (ll)(lower_bound(all(A),x)-A.begin()) #define ub(A,x) (ll)(upper_bound(all(A),x)-A.begin()) #define cou(A,x) (ll)(upper_bound(all(A),x)-lower_bound(all(A),x)) templateusing min_priority_queue=priority_queue,greater>; templatebool chmax(T&a,T b){if(abool chmin(T&a,T b){if(b vm; typedef vector vvm; typedef vector vvvm; typedef vector vvvvm; ostream&operator<<(ostream&os,mint a){os<>(istream&is,mint&a){int x;is>>x;a=mint(x);return is;} //*/ templateostream&operator<<(ostream&os,pairp){os<istream&operator>>(istream&is,pair&p){is>>p.F>>p.S;return is;} templateostream&operator<<(ostream&os,vectorv){rep(i,0,sz(v))os<istream&operator>>(istream&is,vector&v){for(T&in:v)is>>in;return is;} template struct relaxed_convolution{ vectorF,G,H; mint query(mint x,mint y){ int n=F.size(); F.emplace_back(x); G.emplace_back(y); for(int i=0;;i++){ if((((n+2)>>i)<pr=convolution(vector(F.begin()+l,F.begin()+r),vector(G.begin()+l,G.begin()+r)); for(int j=0;jpr1=convolution(vector(F.begin()+l,F.begin()+r),vector(G.begin()+n+1-(1<pr2=convolution(vector(F.begin()+n+1-(1<(G.begin()+l,G.begin()+r)); for(int j=0;jsync_with_stdio(0); cin.exceptions(cin.failbit); ll N,M;cin>>N>>M; vm ex(2e6,1),re(2e6); rep(i,1,2e6)ex[i]=i*ex[i-1]; rep(i,0,2e6)re[i]=1/ex[i]; vl A(M);cin>>A; vl T(N+1); T[0]=1; rep(i,0,M)T[A[i]]=1; relaxed_convolutionC; vm DP(N+1); rep(i,0,N){ mint r=C.query(DP[i],-2*ex[i+2]); 
if(T[i+1])DP[i+1]=r-2*ex[i+1]; } mint ans=2*ex[N]; rep(i,1,N+1)ans+=ex[N-i+1]*DP[i]; cout<