#885155 (C++17) No.2362 Inversion Number of Mod of Linear

提出ソース
結果

問題	No.2362 Inversion Number of Mod of Linear
コンテスト
ユーザー	ecottea
提出日時	2023-06-28 02:35:03
言語	C++17 (gcc 15.2.0 + boost 1.89.0) コンパイル: `g++-15 -O2 -lm -std=c++17 -Wuninitialized -DONLINE_JUDGE -o a.out _filename_` 実行: `./a.out`
結果	AC
実行時間	139 ms / 2,000 ms
コード長	10,144 bytes
記録記録タグの例: 初AC ショートコード純ショートコード純主流ショートコード最速実行時間
コンパイル時間	4,059 ms
コンパイル使用メモリ	258,244 KB
最終ジャッジ日時	2025-02-15 02:47:49
ジャッジサーバーID （参考情報）	judge3 / judge3
このコードへのチャレンジ
（要ログイン）
ファイルパターン	結果
sample	AC * 2
other	AC * 8
権限があれば一括ダウンロードができます
ソースコード

raw source code
#ifndef HIDDEN_IN_VS // 折りたたみ用

// 警告の抑制
#define _CRT_SECURE_NO_WARNINGS

// ライブラリの読み込み
#include <bits/stdc++.h>
using namespace std;

// 型名の短縮
using ll = long long; // -2^63 ～ 2^63 = 9 * 10^18（int は -2^31 ～ 2^31 = 2 * 10^9）
using pii = pair<int, int>;	using pll = pair<ll, ll>;	using pil = pair<int, ll>;	using pli = pair<ll, int>;
using vi = vector<int>;		using vvi = vector<vi>;		using vvvi = vector<vvi>;
using vl = vector<ll>;		using vvl = vector<vl>;		using vvvl = vector<vvl>;
using vb = vector<bool>;	using vvb = vector<vb>;		using vvvb = vector<vvb>;
using vc = vector<char>;	using vvc = vector<vc>;		using vvvc = vector<vvc>;
using vd = vector<double>;	using vvd = vector<vd>;		using vvvd = vector<vvd>;
template <class T> using priority_queue_rev = priority_queue<T, vector<T>, greater<T>>;
using Graph = vvi;

// 定数の定義
const double PI = acos(-1);
const vi DX = { 1, 0, -1, 0 }; // 4 近傍（下，右，上，左）
const vi DY = { 0, 1, 0, -1 };
int INF = 1001001001; ll INFL = 4004004003104004004LL; // (int)INFL = 1010931620;
double EPS = 1e-15;

// 入出力高速化
struct fast_io { fast_io() { cin.tie(nullptr); ios::sync_with_stdio(false); cout << fixed << setprecision(18); } } fastIOtmp;

// 汎用マクロの定義
#define all(a) (a).begin(), (a).end()
#define sz(x) ((int)(x).size())
#define lbpos(a, x) (int)distance((a).begin(), std::lower_bound(all(a), x))
#define ubpos(a, x) (int)distance((a).begin(), std::upper_bound(all(a), x))
#define Yes(b) {cout << ((b) ? "Yes\n" : "No\n");}
#define YES(b) {cout << ((b) ? "YES\n" : "NO\n");}
#define rep(i, n) for(int i = 0, i##_len = int(n); i < i##_len; ++i) // 0 から n-1 まで昇順
#define repi(i, s, t) for(int i = int(s), i##_end = int(t); i <= i##_end; ++i) // s から t まで昇順
#define repir(i, s, t) for(int i = int(s), i##_end = int(t); i >= i##_end; --i) // s から t まで降順
#define repe(v, a) for(const auto& v : (a)) // a の全要素（変更不可能）
#define repea(v, a) for(auto& v : (a)) // a の全要素（変更可能）
#define repb(set, d) for(int set = 0; set < (1 << int(d)); ++set) // d ビット全探索（昇順）
#define repp(a) sort(all(a)); for(bool a##_perm = true; a##_perm; a##_perm = next_permutation(all(a))) // a の順列全て（昇順）
#define smod(n, m) ((((n) % (m)) + (m)) % (m)) // 非負mod
#define uniq(a) {sort(all(a)); (a).erase(unique(all(a)), (a).end());} // 重複除去
#define EXIT(a) {cout << (a) << endl; exit(0);} // 強制終了
#define inQ(x, y, u, l, d, r) ((u) <= (x) && (l) <= (y) && (x) < (d) && (y) < (r)) // 矩形内判定

// 汎用関数の定義
template <class T> inline ll pow(T n, int k) { ll v = 1; rep(i, k) v *= n; return v; }
template <class T> inline bool chmax(T& M, const T& x) { if (M < x) { M = x; return true; } return false; } // 最大値を更新（更新されたら true を返す）
template <class T> inline bool chmin(T& m, const T& x) { if (m > x) { m = x; return true; } return false; } // 最小値を更新（更新されたら true を返す）
template <class T> inline T get(T set, int i) { return (set >> i) & T(1); }

// 演算子オーバーロード
template <class T, class U> inline istream& operator>>(istream& is, pair<T, U>& p) { is >> p.first >> p.second; return is; }
template <class T> inline istream& operator>>(istream& is, vector<T>& v) { repea(x, v) is >> x; return is; }
template <class T> inline vector<T>& operator--(vector<T>& v) { repea(x, v) --x; return v; }
template <class T> inline vector<T>& operator++(vector<T>& v) { repea(x, v) ++x; return v; }

#endif // 折りたたみ用


#if __has_include(<atcoder/all>)
#include <atcoder/all>
using namespace atcoder;

#ifdef _MSC_VER
#include "localACL.hpp"
#endif

//using mint = modint1000000007;
//using mint = modint998244353;
using mint = modint; // mint::set_mod(m);

namespace atcoder {
	inline istream& operator>>(istream& is, mint& x) { ll x_; is >> x_; x = x_; return is; }
	inline ostream& operator<<(ostream& os, const mint& x) { os << x.val(); return os; }
}
using vm = vector<mint>; using vvm = vector<vm>; using vvvm = vector<vvm>;
#endif


#ifdef _MSC_VER // 手元環境（Visual Studio）
#include "local.hpp"
#else // 提出用（gcc）
inline int popcount(int n) { return __builtin_popcount(n); }
inline int popcount(ll n) { return __builtin_popcountll(n); }
inline int lsb(int n) { return n != 0 ? __builtin_ctz(n) : -1; }
inline int lsb(ll n) { return n != 0 ? __builtin_ctzll(n) : -1; }
inline int msb(int n) { return n != 0 ? (31 - __builtin_clz(n)) : -1; }
inline int msb(ll n) { return n != 0 ? (63 - __builtin_clzll(n)) : -1; }
#define gcd __gcd
#define dump(...)
#define dumpel(v)
#define dump_list(v)
#define dump_mat(v)
#define input_from_file(f)
#define output_to_file(f)
#define Assert(b) { if (!(b)) while (1) cout << "OLE"; }
#endif


#ifdef _MSC_VER
#define __int128 ll // デバッグ用
#endif


//【一次式の切り捨て和】O(log(n + m + a + b))
/*
* Σi∈[0..n) floor((a i + b) / m) を返す．
*/
template <class T>
T sum_of_floor_of_linear(T n, T m, T a, T b) {
	// 参考 : https://twitter.com/kyopro_friends/status/1304063876019793921?ref_src=twsrc%5Etfw
	// verify : https://judge.yosupo.jp/problem/sum_of_floor_of_linear

	//【方法】
	// m < 0 なら a, b, m をそれぞれ -1 倍して m > 0 とする．
	//		a = aq m + ar, b = bq m + br (0 ≦ ar, br < m)
	// と表すと，
	//		Σi∈[0..n) floor((a i + b) / m)
	//		= Σi∈[0..n) (floor((ar i + br) / m) + (aq i + bq))
	//		= Σi∈[0..n) floor((ar i + br) / m) + (aq n(n-1)/2 + bq n)
	// となるので 0 ≦ a < m, 0 ≦ b < m として一般性を失わない．
	// 
	// 求めるべき値は，領域
	//		{(x, y) | 0 ≦ x < n かつ 0 < y ≦ (a x + b) / m}
	// に含まれる格子点の個数である．u1 = floor((a x + b) / m) とおき，変数変換
	//		v = n - x, u = u1 - y
	// を施すと，直線 y = (a x + b) / m の式は
	//		u1 - u = (a (n - v) + b) / m
	//		⇔ m u1 - m u = a n - a v + b
	//		⇔ a v = m u + a n + b - m u1
	//		⇔ v = (m u + (a n + b - m u1)) / a
	// と書き換えられるので，先の領域は
	//		{(u, v) | 0 ≦ u < u1 かつ 0 < v ≦ (m u + (a n + b - m u1)) / a}
	// となる．ここに含まれる格子点の個数は
	//		Σi∈[0..u1) floor((m i + (a n + b - m u1)) / a)
	// であり，分母を m からより小さい a に書き換えられた．
	//
	// 次のステップに進む前に m ← m mod a とするので，収束の速さはユークリッドの互除法と同じである．

	Assert(m != 0);
	if (n <= 0) return 0;

	T res = 0;

	// m < 0 の場合，分母分子を -1 倍して m > 0 とする．
	if (m < 0) { a *= -1; b *= -1; m *= -1; }

	// a を m だけ増減させた場合の影響は floor なしの和で計算できるので，0 ≦ a < m とする．
	res += (a / m - (T)(a % m < 0)) * (n * (n - 1) / 2);
	a = smod(a, m);

	// b を m だけ増減させた場合の影響は floor なしの和で計算できるので，0 ≦ b < m とする．
	res += (b / m - (T)(b % m < 0)) * n;
	b = smod(b, m);

	while (a > 0) {
		T nn = (a * n + b) / m;
		T nm = a;
		T na = m;
		T nb = a * n + b - m * nn;

		res += (na / nm) * (nn * (nn - 1) / 2);
		na %= nm;

		res += (nb / nm) * nn;
		nb %= nm;

		n = nn; m = nm; a = na; b = nb;
	}

	return res;
}


//【一次式の線形加重切り捨て和】O(log(n + m + a + b))
/*
* Σi∈[0..n) i floor((a i + b) / m) を返す．
*/
template <class T>
T linear_floor_sum(T n, T m, T a, T b) {
	
	//【方法】
	//【一次式の切り捨て和】と同じように分母がより小さい問題への帰着を目指す．
	// ただし同じ形に帰着できるわけではないので，
	//		S1 = Σi∈[0..n) i floor((a i + b) / m)
	//		S2 = Σi∈[0..n) floor((a i + b) / m)^2
	//		S3 = Σi∈[0..n) floor((a i + b) / m) （通常の FloorSum）
	// の 3 つを並行して計算していく．

	Assert(m != 0);
	if (n <= 0) return 0;

	T res = 0;

	// m < 0 の場合，分母分子を -1 倍して m > 0 とする．
	if (m < 0) { a *= -1; b *= -1; m *= -1; }

	// a を m だけ増減させた場合の影響は floor なしの和で計算できるので，0 ≦ a < m とする．
	res += (a / m - (T)(a % m < 0)) * (n * (n - 1) * (2 * n - 1) / 6);
	a = smod(a, m);

	// b を m だけ増減させた場合の影響は floor なしの和で計算できるので，0 ≦ b < m とする．
	res += (b / m - (T)(b % m < 0)) * (n * (n - 1) / 2);
	b = smod(b, m);

	function<tuple<T, T, T>(T, T, T, T)> rf1, rf2;

	// a ≧ m, b ≧ 0 用
	rf1 = [&](T n, T m, T a, T b) {
		if (n == 0) return make_tuple(T(0), T(0), T(0));

		T A = a / m, B = b / m;
		T n3 = n * (n - 1) * (2 * n - 1) / 6, n2 = n * (n - 1) / 2;

		T s1 = A * n3 + B * n2;
		T s2 = A * A * n3 + 2 * A * B * n2 + B * B * n;
		T s3 = A * n2 + B * n;

		a %= m; b %= m;
		auto [ns1, ns2, ns3] = rf2(n, m, a, b);

		s1 += ns1;
		s2 += ns2 + 2 * A * ns1 + 2 * B * ns3;
		s3 += ns3;

		return make_tuple(s1, s2, s3);
	};

	// 0 ≦ a < m, 0 ≦ b < m 用
	rf2 = [&](T n, T m, T a, T b) {
		if (a == 0) return make_tuple(T(0), T(0), T(0));

		T nn = (a * n + b) / m;
		T nm = a;
		T na = m;
		T nb = a * n + b - m * nn;
		auto [ns1, ns2, ns3] = rf1(nn, nm, na, nb);

		T s1 = ((2 * n - 1) * ns3 - ns2) / 2;
		T s2 = (2 * nn - 1) * ns3 - 2 * ns1;
		T s3 = ns3;

		return make_tuple(s1, s2, s3);
	};

	auto [s1, s2, s3] = rf2(n, m, a, b);

	return res + s1;
}


void Main() {
	ll n_, m_, a_, b_;
	cin >> n_ >> m_ >> a_ >> b_;

	__int128 n = n_, m = m_, a = a_, b = b_;

	__int128 res = 0;
	res += 2 * linear_floor_sum(n, m, a, b);
	res += (1 - n) * sum_of_floor_of_linear(n, m, a, b);
	res += linear_floor_sum(n, m, a, __int128(0));
	res += -n * sum_of_floor_of_linear(n, m, a, __int128(0));

	cout << (ll)res << endl;
}

int main() {
	//	input_from_file("input.txt");
	//	output_to_file("output.txt");

	int t;
	cin >> t; // マルチテストケースの場合
	//	t = 1; // シングルテストケースの場合

	while (t--) {
		dump("------------------------------");
		Main();
	}
}
yukicoder

結果

ソースコード