#pragma GCC target("avx") #pragma GCC optimize("O3") #pragma GCC optimize("unroll-loops") #include // #include // #include // #include // using namespace __gnu_pbds; // #include // namespace multiprecisioninteger = boost::multiprecision; // using cint=multiprecisioninteger::cpp_int; using namespace std; using ll=long long; #define double long double using datas=pair; using ddatas=pair; using tdata=pair; using vec=vector; using mat=vector; using pvec=vector; using pmat=vector; // using llset=tree,rb_tree_tag,tree_order_statistics_node_update>; #define For(i,a,b) for(i=a;i<(ll)b;++i) #define bFor(i,b,a) for(i=b,--i;i>=(ll)a;--i) #define rep(i,N) For(i,0,N) #define rep1(i,N) For(i,1,N) #define brep(i,N) bFor(i,N,0) #define brep1(i,N) bFor(i,N,1) #define all(v) (v).begin(),(v).end() #define allr(v) (v).rbegin(),(v).rend() #define vsort(v) sort(all(v)) #define vrsort(v) sort(allr(v)) #define uniq(v) (v).erase(unique(all(v)),(v).end()) #define endl "\n" #define eb emplace_back #define print(x) cout< ostream& operator<<(ostream& os,const pair& p){return os<<"("< ostream& operator<<(ostream& os,const vector& v){ os<<"{";ll i; rep(i,v.size()){ if(i)os<<","; os< inline bool chmax(T& a,T b){bool x=a inline bool chmin(T& a,T b){bool x=a>b;if(x)a=b;return x;} #ifdef DEBUG void debugg(){cout<void debugg(const T& x,const Args&... args){cout<<" "<0){ if(n&1)res=res*a%m; a=a*a%m; n>>=1; } return res; } ll gcd(ll a,ll b){if(!b)return abs(a);return (a%b==0)?abs(b):gcd(b,a%b);} ll lcm(ll a,ll b){return a/gcd(a,b)*b;} ll countdigits(ll n){ ll ans=0; while(n){n/=10;ans++;} return ans; } ll sumdigits(ll n){ ll ans=0; while(n){ans+=n%10;n/=10;} return ans; } template struct mcf_graph{ public: mcf_graph(){} mcf_graph(int n):_n(n),g(n){} int add_edge(int from,int to,Cap cap,Cost cost){ assert(0<=from&&from<_n); assert(0<=to&&to<_n); int m=int(pos.size()); pos.push_back({from,int(g[from].size())}); int from_id=int(g[from].size()); int to_id=int(g[to].size())+int(from==to); g[from].push_back(_edge{to,to_id,cap,cost}); g[to].push_back(_edge{from,from_id,0,-cost}); return m; } struct edge{ int from,to; Cap cap,flow; Cost cost; }; edge get_edge(int i){ assert(0<=i&&i edges(){ int m=int(pos.size()); vector result(m); for(int i=0;i flow(int s,int t){ return flow(s,t,numeric_limits::max()); } pair flow(int s,int t,Cap flow_limit){ return slope(s,t,flow_limit).back(); } vector> slope(int s,int t){ return slope(s,t,numeric_limits::max()); } vector> slope(int s,int t,Cap flow_limit){ assert(0<=s&&s<_n); assert(0<=t&&t<_n); assert(s!=t); // variants(C=maxcost): //-(n-1)C<=dual[s]<=dual[i]<=dual[t]=0 // reduced cost(=e.cost+dual[e.from]-dual[e.to])>=0 for all edge vector dual(_n,0),dist(_n); vector pv(_n),pe(_n); vector vis(_n); auto dual_ref=[&](){ fill(dist.begin(),dist.end(),numeric_limits::max()); fill(pv.begin(),pv.end(),-1); fill(pe.begin(),pe.end(),-1); fill(vis.begin(),vis.end(),false); struct Q{ Cost key; int to; bool operator<(Q r)const{ return key>r.key;} }; priority_queue que; dist[s]=0; que.push(Q{0,s}); while(!que.empty()){ int v=que.top().to; que.pop(); if(vis[v])continue; vis[v]=true; if(v==t)break; // dist[v]=shortest(s,v)+dual[s]-dual[v] // dist[v]>=0(all reduced cost are positive) // dist[v]<=(n-1)C for(int i=0;icost){ dist[e.to]=dist[v]+cost; pv[e.to]=v; pe[e.to]=i; que.push(Q{dist[e.to],e.to}); } } } if(!vis[t])return false; for(int v=0;v<_n;++v){ if(!vis[v])continue; // dual[v]=dual[v]-dist[t]+dist[v] // =dual[v]-(shortest(s,t)+dual[s]-dual[t])+(shortest(s,v)+dual[s]-dual[v]) // =-shortest(s,t)+dual[t]+shortest(s,v) // =shortest(s,v)-shortest(s,t)>=0-(n-1)C dual[v]-=dist[t]-dist[v]; } return true; }; Cap flow=0; Cost cost=0,prev_cost_per_flow=-1; vector> result; result.push_back({flow,cost}); while(flow> pos; vector> g; }; template struct BinaryIndexedTree{ int size,bitn=0; T I; using func=function; func F; vector tree; BinaryIndexedTree(int N,T e,func f):size(N+1),I(e),F(f),tree(size,e){} BinaryIndexedTree(int N):size(N+1),I(0),F([](T a,T b){return a+b;}),tree(size,0){} void act(int i,T x){ for(++i;i0;i-=-i&i){ res=F(tree[i],res); } return res; } //sum([l,r)); T sum(int l,int r){ // if(--l>--r)return 0; assert(--l<=--r); if(l<0)return queli(r); else return queli(r)-queli(l); } //only(N,+) int lower_bound(int x){ int i=0; if(!bitn){ i=size;bitn=1; while(i){ i>>=1;bitn<<=1; } i=0; } for(int k=bitn;k;k>>=1){ if(i+k>codeforces;while(codeforces--){ ll i,j; cin>>N; pvec v(N); rep(i,N){cin>>v[i].first;v[i].second=i;} vec ans(N,0); BinaryIndexedTree ftree(N+1,0,sum),fsum(N+1,0,sum),stree(N+1,0,sum),ssum(N+1,0,sum); vrsort(v); rep(i,N){ debug(v[i]); if(v[i].second>1){ A=stree.queli(v[i].second-1); B=ssum.queli(v[i].second-1); debug(A,B); ans[v[i].second]+=B+v[i].first*A%mod; } if(v[i].second){ A=ftree.queli(v[i].second-1); B=fsum.queli(v[i].second-1); debug(A,B); stree.act(v[i].second,A); ssum.act(v[i].second,B+v[i].first*A%mod); } ftree.act(v[i].second,1); fsum.act(v[i].second,v[i].first); } debug(ans); print(accumulate(all(ans),0LL,[](ll a,ll b){return (a+b)%mod;})); }