#pragma GCC optimize ("Ofast")
// NOTE(review): the header name after `#include` was lost in the damaged
// original; the standard headers below cover every library name used here.
#include <algorithm>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <utility>

// Program summary (derived from main() below):
//   Reads N and then N integers A[0..N-1] from stdin and prints, modulo MD,
//   the sum of A[i] + A[j] + A[k] over all index triples i < j < k with
//   A[i] > A[j] > A[k].

#define MD (998244353U)

// Bump-pointer scratch arena. `wmem` is the current top; main() points it at
// `memarr` before anything is allocated.
void *wmem;
char memarr[96000000];

// Carves an array of `x` objects of type T out of the arena `*mem`.
// The arena top is first rounded up to a multiple of 16 bytes, `*arr` receives
// that address and `*mem` is advanced past the array. No constructors are run
// and nothing is ever released individually.
template<class T>
inline void walloc1d(T **arr, int x, void **mem = &wmem){
  const std::uintptr_t addr = reinterpret_cast<std::uintptr_t>(*mem);
  const std::uintptr_t pad = (16 - (addr & 15)) & 15;
  *mem = static_cast<char*>(*mem) + pad;
  *arr = static_cast<T*>(*mem);
  *mem = (*arr) + x;
}

// Same as above for an array addressed with indices x1 .. x2-1: allocates
// x2-x1 elements and shifts the returned pointer so that (*arr)[x1] is the
// first element.
template<class T>
inline void walloc1d(T **arr, int x1, int x2, void **mem = &wmem){
  walloc1d(arr, x2 - x1, mem);
  (*arr) -= x1;
}

// Sorts a[0..N-1] ascending. `mem` is accepted only for signature symmetry
// with the two-array overload and is not used.
template<class T1>
void sortA_L(int N, T1 a[], void *mem = wmem){
  (void)mem;
  std::sort(a, a + N);
}

// Sorts the pairs (a[i], b[i]) ascending (by a, ties broken by b) and writes
// the sorted columns back into a[] and b[]. The temporary pair array is carved
// from `mem`; because `mem` is passed by value the caller's arena top is left
// untouched, i.e. the scratch space is implicitly released on return.
template<class T1, class T2>
void sortA_L(int N, T1 a[], T2 b[], void *mem = wmem){
  std::pair<T1, T2> *arr;
  walloc1d(&arr, N, &mem);
  for(int i = 0; i < N; i++){
    arr[i].first = a[i];
    arr[i].second = b[i];
  }
  std::sort(arr, arr + N);
  for(int i = 0; i < N; i++){
    a[i] = arr[i].first;
    b[i] = arr[i].second;
  }
}

// Integer modulo MD. `val` is always kept in [0, MD).
struct Modint{
  unsigned val;

  Modint(){ val = 0; }
  Modint(int a){ val = ord(a); }
  Modint(unsigned a){ val = ord(a); }
  Modint(long long a){ val = ord(a); }
  Modint(unsigned long long a){ val = ord(a); }

  // ord(): reduce an arbitrary integer to its representative in [0, MD).
  inline unsigned ord(unsigned a) const { return a % MD; }
  inline unsigned ord(int a) const {
    a %= static_cast<int>(MD);
    if(a < 0){
      a += static_cast<int>(MD);
    }
    return static_cast<unsigned>(a);
  }
  inline unsigned ord(unsigned long long a) const {
    return static_cast<unsigned>(a % MD);
  }
  inline unsigned ord(long long a) const {
    a %= static_cast<long long>(MD);
    if(a < 0){
      a += static_cast<long long>(MD);
    }
    return static_cast<unsigned>(a);
  }

  inline unsigned get() const { return val; }

  inline Modint &operator+=(Modint a){
    val += a.val;
    if(val >= MD){
      val -= MD;
    }
    return *this;
  }
  inline Modint &operator-=(Modint a){
    if(val < a.val){
      val = val + MD - a.val;
    }
    else{
      val -= a.val;
    }
    return *this;
  }
  inline Modint &operator*=(Modint a){
    // Widen to 64 bits: the product of two values below MD does not fit in 32.
    val = static_cast<unsigned>((static_cast<unsigned long long>(val) * a.val) % MD);
    return *this;
  }
  inline Modint &operator/=(Modint a){
    return *this *= a.inverse();
  }

  inline Modint operator+(Modint a) const { return Modint(*this) += a; }
  inline Modint operator-(Modint a) const { return Modint(*this) -= a; }
  inline Modint operator*(Modint a) const { return Modint(*this) *= a; }
  inline Modint operator/(Modint a) const { return Modint(*this) /= a; }

  inline Modint operator+(int a) const { return Modint(*this) += Modint(a); }
  inline Modint operator-(int a) const { return Modint(*this) -= Modint(a); }
  inline Modint operator*(int a) const { return Modint(*this) *= Modint(a); }
  inline Modint operator/(int a) const { return Modint(*this) /= Modint(a); }

  inline Modint operator+(long long a) const { return Modint(*this) += Modint(a); }
  inline Modint operator-(long long a) const { return Modint(*this) -= Modint(a); }
  inline Modint operator*(long long a) const { return Modint(*this) *= Modint(a); }
  inline Modint operator/(long long a) const { return Modint(*this) /= Modint(a); }

  inline Modint operator-(void) const {
    Modint res;
    res.val = val ? MD - val : 0;
    return res;
  }

  inline operator bool(void) const { return val != 0; }
  inline operator int(void) const { return get(); }
  inline operator long long(void) const { return get(); }

  // Multiplicative inverse via the extended Euclidean algorithm on (val, MD).
  // For val == 0 the loop yields 0.
  inline Modint inverse() const {
    int a = val;
    int b = MD;
    int u = 1;
    int v = 0;
    while(b){
      const int t = a / b;
      a -= t * b;
      std::swap(a, b);
      u -= t * v;
      std::swap(u, v);
    }
    if(u < 0){
      u += MD;
    }
    Modint res;
    res.val = u;
    return res;
  }

  // *this raised to the power b, by binary exponentiation.
  inline Modint pw(unsigned long long b) const {
    Modint base(*this);
    Modint res;
    res.val = 1;
    while(b){
      if(b & 1){
        res *= base;
      }
      b >>= 1;
      base *= base;
    }
    return res;
  }

  inline bool operator==(int a) const { return ord(a) == val; }
  inline bool operator!=(int a) const { return ord(a) != val; }
};

inline Modint operator+(int a, Modint b){ return Modint(a) += b; }
inline Modint operator-(int a, Modint b){ return Modint(a) -= b; }
inline Modint operator*(int a, Modint b){ return Modint(a) *= b; }
inline Modint operator/(int a, Modint b){ return Modint(a) /= b; }
inline Modint operator+(long long a, Modint b){ return Modint(a) += b; }
inline Modint operator-(long long a, Modint b){ return Modint(a) -= b; }
inline Modint operator*(long long a, Modint b){ return Modint(a) *= b; }
inline Modint operator/(long long a, Modint b){ return Modint(a) /= b; }

// Returns the next byte of stdin (0..255) or EOF, reading through a 1 MiB
// buffer. The buffer is refilled only when the previous fill was complete;
// a short fill marks the end of the input.
// Standard std::fread replaces the glibc-only fread_unlocked: it is called
// once per megabyte, so the locking cost is irrelevant.
inline int my_getchar_unlocked(){
  static char buf[1048576];
  static int s = 1048576;
  static int e = 1048576;
  if(s == e && e == 1048576){
    e = static_cast<int>(std::fread(buf, 1, 1048576, stdin));
    s = 0;
  }
  if(s == e){
    return EOF;
  }
  // Cast so that byte 0xFF cannot be mistaken for EOF.
  return static_cast<unsigned char>(buf[s++]);
}

// Reads one decimal integer (optional leading '-') into x, skipping any other
// bytes in front of it. If the input ends before a number starts, x is left
// at 0 instead of spinning forever.
inline void rd(int &x){
  int k;
  bool negative = false;
  x = 0;
  for(;;){
    k = my_getchar_unlocked();
    if(k == EOF){
      return;
    }
    if(k == '-'){
      negative = true;
      break;
    }
    if('0' <= k && k <= '9'){
      x = k - '0';
      break;
    }
  }
  for(;;){
    k = my_getchar_unlocked();
    if(k < '0' || k > '9'){
      break;
    }
    x = x * 10 + k - '0';
  }
  if(negative){
    x = -x;
  }
}

// 1 MiB stdout buffer; whatever is still pending is written by the destructor
// of the global instance at program exit.
struct MY_WRITER{
  char buf[1048576];
  int s;
  int e;
  MY_WRITER(){
    s = 0;
    e = 1048576;
  }
  ~MY_WRITER(){
    if(s){
      std::fwrite(buf, 1, s, stdout);
    }
  }
};
MY_WRITER MY_WRITER_VAR;

// Appends one byte to the output buffer, flushing it first when full.
void my_putchar_unlocked(int a){
  if(MY_WRITER_VAR.s == MY_WRITER_VAR.e){
    std::fwrite(MY_WRITER_VAR.buf, 1, MY_WRITER_VAR.s, stdout);
    MY_WRITER_VAR.s = 0;
  }
  MY_WRITER_VAR.buf[MY_WRITER_VAR.s++] = a;
}

inline void wt_L(char a){
  my_putchar_unlocked(a);
}

// Writes x in decimal. The magnitude is computed in unsigned arithmetic so
// that INT_MIN is handled without signed overflow.
inline void wt_L(int x){
  char digits[10];
  int len = 0;
  unsigned mag = static_cast<unsigned>(x);
  if(x < 0){
    my_putchar_unlocked('-');
    mag = 0u - mag;
  }
  do{
    digits[len++] = static_cast<char>(mag % 10);
    mag /= 10;
  }while(mag);
  while(len--){
    my_putchar_unlocked(digits[len] + '0');
  }
}

inline void wt_L(Modint x){
  wt_L(static_cast<int>(x));
}

// Fenwick (binary indexed) tree over indices 0 .. size-1.
//   add(k, v)   : element k += v
//   get(k)      : sum of elements 0..k (0 when k < 0)
//   range(a, b) : sum of elements a..b; b == -1 means "up to the last element"
// Storage comes either from the C heap (malloc/free) or from the scratch
// arena (walloc); the `fg` variants also zero the tree via init().
template<class T>
struct fenwick{
  int size = 0;
  int memory = 0;
  T *data = nullptr;

  void malloc(int mem){
    memory = mem;
    data = static_cast<T*>(std::malloc(sizeof(T) * mem));
  }
  void malloc(int mem, int fg){
    memory = mem;
    data = static_cast<T*>(std::malloc(sizeof(T) * mem));
    if(fg){
      init(mem);
    }
  }
  void walloc(int mem, void **workMemory = &wmem){
    memory = mem;
    walloc1d(&data, mem, workMemory);
  }
  void walloc(int mem, int fg, void **workMemory = &wmem){
    memory = mem;
    walloc1d(&data, mem, workMemory);
    if(fg){
      init(mem);
    }
  }
  void free(void){
    memory = 0;
    // Must be qualified: an unqualified free(data) names this member function
    // itself and does not compile once instantiated.
    std::free(data);
  }
  void init(int N){
    size = N;
    std::memset(static_cast<void*>(data), 0, sizeof(T) * N);
  }
  void add(int k, T val){
    while(k < size){
      data[k] += val;
      k |= k + 1;
    }
  }
  T get(int k){
    T res = 0;
    while(k >= 0){
      res += data[k];
      k = (k & (k + 1)) - 1;
    }
    return res;
  }
  T range(int a, int b){
    if(b == -1){
      b = size - 1;
    }
    return get(b) - get(a - 1);
  }
  // NOTE(review): the original body was lost after `while(i`; this is a
  // reconstruction, not a recovery. It binary-searches the prefix sums and
  // returns the smallest index i with get(i) > k, or -1 if there is none
  // (meaningful only when all stored values are non-negative). Not called
  // anywhere in this file - confirm against the upstream library before use.
  int kth(T k){
    int lo = 0;
    int hi = size;
    while(lo < hi){
      const int mid = (lo + hi) / 2;
      if(get(mid) <= k){
        lo = mid + 1;
      }
      else{
        hi = mid;
      }
    }
    return lo == size ? -1 : lo;
  }
};

// Capacity of the fixed input arrays below.
static const int MAX_N = 200000;

int N;
int A[MAX_N];    // values; sorted ascending inside main()
int ind[MAX_N];  // ind[i] = original position of the value now stored in A[i]

// NOTE(review): the element types of the four trees were stripped from the
// original text. Counts are kept as int and value sums as long long here;
// main() reduces sums to Modint before multiplying, so the printed result does
// not depend on that choice.
fenwick<int> t1;        // per position: 1 while its value is still > current
fenwick<int> t2;        // per position: 1 once its value is < current
fenwick<long long> f1;  // same membership as t1, but holding the values
fenwick<long long> f2;  // same membership as t2, but holding the values

int main(){
  wmem = memarr;

  rd(N);
  if(N < 0 || N > MAX_N){
    // The fixed-size arrays cannot hold the input; refuse instead of
    // overrunning them.
    std::fputs("N out of range\n", stderr);
    return 1;
  }
  for(int i = 0; i < N; i++){
    rd(A[i]);
  }

  t1.walloc(N, 1);
  t2.walloc(N, 1);
  f1.walloc(N, 1);
  f2.walloc(N, 1);

  for(int i = 0; i < N; i++){
    ind[i] = i;
  }
  sortA_L(N, A, ind);

  // Initially every position counts as "greater than the current value".
  for(int i = 0; i < N; i++){
    t1.add(i, 1);
  }
  for(int i = 0; i < N; i++){
    f1.add(ind[i], A[i]);
  }

  Modint res = 0;

  // Walk the sorted array one group of equal values at a time.
  int groupBegin = 0;
  while(groupBegin < N){
    int groupEnd = groupBegin;
    while(groupEnd < N && A[groupEnd] == A[groupBegin]){
      groupEnd++;
    }

    // 1) Drop the group from the "greater" trees so that only strictly
    //    larger values remain there.
    for(int i = groupBegin; i < groupEnd; i++){
      t1.add(ind[i], -1);
      f1.add(ind[i], -static_cast<long long>(A[i]));
    }

    // 2) Treat each member as the middle element of a decreasing triple.
    for(int i = groupBegin; i < groupEnd; i++){
      const int pos = ind[i];
      const long long tmp1 = t1.get(pos - 1);           // larger values to the left
      const long long tmp2 = t2.range(pos + 1, N - 1);  // smaller values to the right
      res += Modint(A[i]) * tmp1 * tmp2;                // middle element's share
      res += Modint(f1.get(pos - 1)) * tmp2;            // left elements' share
      res += Modint(f2.range(pos + 1, N - 1)) * tmp1;   // right elements' share
    }

    // 3) Only now does the group become "smaller" for the values that follow.
    for(int i = groupBegin; i < groupEnd; i++){
      t2.add(ind[i], 1);
      f2.add(ind[i], A[i]);
    }

    groupBegin = groupEnd;
  }

  wt_L(res);
  wt_L('\n');
  return 0;
}

// Original higher-level source that this file appears to have been generated
// from. The beginning of the listing (up to and including the element type of
// the first fenwick declaration) was lost; `<?>` marks stripped text.
//
// fenwick<?> t1, t2;
// fenwick<?> f1,f2;
// {
//   int i, j, k;
//   ll tmp1, tmp2;
//   Modint res = 0;
//   rd(N,A(N));
//   t1.walloc(N,1);
//   t2.walloc(N,1);
//   f1.walloc(N,1);
//   f2.walloc(N,1);
//   rep(i,N) (val[i], ind[i]) = (A[i], i);
//   sortA(N, A, ind);
//
//   rep(i,N) t1.add(i,1);
//   rep(i,N) f1.add(ind[i],A[i]);
//   i = 0;
//   rep(k,N){
//     j = i;
//     while(i < N && A[i]==A[k]){
//       t1.add(ind[i],-1);
//       f1.add(ind[i],-A[i]);
//       i++;
//     }
//     i = j;
//     while(i < N && A[i]==A[k]){
//       tmp1 = t1.get(ind[i]-1);
//       tmp2 = t2.range(ind[i]+1,N-1);
//       res += Modint(A[i]) * tmp1 * tmp2;
//       res += f1.get(ind[i]-1) * tmp2;
//       res += f2.range(ind[i]+1,N-1) * tmp1;
//       // wt(ind[i],A[i],":",tmp1,tmp2,":",res);
//       i++;
//     }
//     i = j;
//     while(i < N && A[i]==A[k]){
//       t2.add(ind[i],1);
//       f2.add(ind[i],A[i]);
//       i++;
//     }
//   }
//
//   wt(res);
// }