#include #include using namespace std; namespace my{ using ml=atcoder::modint1000000007; auto&operator>>(istream&i,ml&x){int t;i>>t;x=t;return i;} auto&operator<<(ostream&o,const ml&x){return o<<(int)x.val();} #define eb emplace_back #define LL(...) ll __VA_ARGS__;lin(__VA_ARGS__) #define FO(n) for(ll ij=n;ij-->0;) #define FOR(i,...) for(auto[i,i##stop,i##step]=range(0,__VA_ARGS__);i=i##stop;i+=i##step) #define fe(a,i,...) for(auto&&__VA_OPT__([)i __VA_OPT__(,__VA_ARGS__]):a) #define bit_sizeof(T) ll(sizeof(T)*CHAR_BIT) #define base_operator(op,type) auto operator op(const type&v)const{auto copy=*this;return copy op##=v;} #define multiple_testcases void solve();}int main(){my::io();int T;std::cin>>T;while(T--)my::solve();}namespace my{ void io(){cin.tie(nullptr)->sync_with_stdio(0);cout<concept addable=requires(T a,T b){{a+b}->same_as;}; templatestruct pair{ A a;B b; pair()=default; pair(A a,B b):a(a),b(b){} pair(const std::pair&p):a(p.first),b(p.second){} auto operator<=>(const pair&)const=default; pair operator+(const pair&p)const{return{a+p.a,b+p.b};} friend istream&operator>>(istream&i,pair&p){return i>>p.a>>p.b;} friend ostream&operator<<(ostream&o,const pair&p){return o<using pack_kth_t=tuple_element_t>; templateauto pack_kth(const auto&...a){return get(make_tuple(a...));} templateauto pack_prefix_array(const auto&...a){return[&](index_sequence){return array{get(make_tuple(a...))...};}(make_index_sequence{});} templateconcept vectorial=is_base_of_v,V>; templatestruct vec_attr{using core_type=T;static constexpr int rank=0;}; templatestruct vec_attr{using core_type=typename vec_attr::core_type;static constexpr int rank=vec_attr::rank+1;}; templateistream&operator>>(istream&i,vector&v){fe(v,e)i>>e;return i;} templateostream&operator<<(ostream&o,const vector&v){fe(v,e)o<?newline:space);return o;} templatestruct vec; templatestruct tensor_helper{using type=vec::type>;}; templatestruct tensor_helper<0,T>{using type=T;}; templateusing tensor=typename tensor_helper::type; templatestruct vec:vector{ static constexpr int R=vec_attr::rank+1; using C=vec_attr::core_type; using vector::vector; vec(const vector&v){vector::operator=(v);} templaterequires(sizeof...(A)>=3)vec(const A&...a){resizes(pack_prefix_array(a...),pack_kth(a...));} void resizes(const array&s,C x={}){*this=std::move(make(s,x));} templatestatic auto make(const array&s,C x){if constexpr(i==R-1)return vec(s[i],x);else return tensor(s[i],make(s,x));} vec&operator^=(const vec&u){this->insert(this->end(),u.begin(),u.end());return*this;} vec&operator+=(const vec&u){vec&v=*this;assert(v.size()==u.size());fo(i,v.size())v[i]+=u[i];return v;} vec&operator-=(const vec&u){vec&v=*this;assert(v.size()==u.size());fo(i,v.size())v[i]-=u[i];return v;} base_operator(^,vec) base_operator(+,vec) base_operator(-,vec) vec&operator--(){fe(*this,e)--e;return*this;} ll size()const{return vector::size();} vec zeta()const{vec v=*this;if constexpr(vectorial)fe(v,e)e=e.zeta();fo(i,v.size()-1)v[i+1]+=v[i];return v;} auto transform(const auto&f)const{ tensorres(size()); if constexpr(vectorial)fo(i,size())res[i]=(*this)[i].transform(f); else std::transform(this->begin(),this->end(),res.begin(),f); return res; } templateauto cast_core_type()const{return transform([&](auto e){return static_cast(e);});} }; templaterequires(sizeof...(A)>=2)vec(const A&...a)->vec>>; vec(ll)->vec; void lin(auto&...a){(cin>>...>>a);} void pp(const auto&...a){ll n=sizeof...(a);((cout<0,space)),...);cout<r(n);fo(i,n)r[i]=f(i);return r;} constexpr uint64_t kth_root_floor(uint64_t a,ll k){ if (k==1)return a; auto within=[&](uint32_t x){uint64_t t=1;fo(k)if(__builtin_mul_overflow(t,x,&t))return false;return t<=a;}; uint64_t r=0; of(i,bit_sizeof(uint32_t))if(within(r|(1u<constexpr T sqrt_floor(T x){return kth_root_floor(x,2);} auto divmod(auto a,auto b){return pair{a/b,a%b};} auto mod(auto a,auto b){return(a%=b)<0?a+b:a;} templateT square_sum(T n){return n*(n+1)/2*(n*2+1)/3;} templateT square_sum(const vec&a){ T res=0; fe(a,e)res+=T(e)*e; return res; } templatestruct circle_vec:vec{ vecsu; circle_vec(ll n):vec(n){} circle_vec(const initializer_list&a={}){fe(a,e)this->eb(e);if constexpr(addable)build_zeta();} circle_vec(const vec&v){fe(v,e)this->eb(e);if constexpr(addable)build_zeta();} void build_zeta()requires(addable){su=this->zeta();} T&operator[](ll i){ll n=this->size();return vec::operator[]((i%n+n)%n);} T operator[](ll i)const{ll n=this->size();return vec::operator[]((i%n+n)%n);} T circle_sum(ll n)const requires(addable){auto[q,r]=divmod(n,this->size());return su.back()*q+schrodinger(r,su[r-1]);} }; multiple_testcases void solve(){ LL(a,N); ll M=sqrt_floor(a*N); auto f=[&](ll i){return mod(square(i+1)-1,a);}; circle_vecv=iota_lambda(a,f).cast_core_type(); pp(ml(N)*M-(square_sum(M)-M-v.circle_sum(M))/a); }}