#1013095 (C++17) No.1867 Partitions and Inversions

提出ソース
結果

問題	No.1867 Partitions and Inversions
コンテスト
ユーザー	ecottea
提出日時	2024-09-24 00:13:50
言語	C++17 (gcc 15.2.0 + boost 1.90.0) コンパイル: `g++-15 -O2 -lm -std=c++17 -Wuninitialized -DONLINE_JUDGE -o a.out _filename_` 実行: `./a.out`
結果	AC
実行時間	2,400 ms / 5,000 ms
コード長	16,798 bytes
記録記録タグの例: 初AC ショートコード純ショートコード純主流ショートコード最速実行時間
コンパイル時間	3,462 ms
コンパイル使用メモリ	306,616 KB
実行使用メモリ	92,416 KB
最終ジャッジ日時	2026-07-05 18:42:47
合計ジャッジ時間	101,144 ms
ジャッジサーバーID （参考情報）	judge3_0 / judge2_0
このコードへのチャレンジ
（要ログイン）
ファイルパターン	結果
sample	AC * 3
other	AC * 65
権限があれば一括ダウンロードができます
ソースコード

raw source code
#ifndef HIDDEN_IN_VS // 折りたたみ用

// 警告の抑制
#define _CRT_SECURE_NO_WARNINGS

// ライブラリの読み込み
#include <bits/stdc++.h>
using namespace std;

// 型名の短縮
using ll = long long; using ull = unsigned long long; // -2^63 ～ 2^63 = 9e18（int は -2^31 ～ 2^31 = 2e9）
using pii = pair<int, int>;	using pll = pair<ll, ll>;	using pil = pair<int, ll>;	using pli = pair<ll, int>;
using vi = vector<int>;		using vvi = vector<vi>;		using vvvi = vector<vvi>;	using vvvvi = vector<vvvi>;
using vl = vector<ll>;		using vvl = vector<vl>;		using vvvl = vector<vvl>;	using vvvvl = vector<vvvl>;
using vb = vector<bool>;	using vvb = vector<vb>;		using vvvb = vector<vvb>;
using vc = vector<char>;	using vvc = vector<vc>;		using vvvc = vector<vvc>;
using vd = vector<double>;	using vvd = vector<vd>;		using vvvd = vector<vvd>;
template <class T> using priority_queue_rev = priority_queue<T, vector<T>, greater<T>>;
using Graph = vvi;

// 定数の定義
const double PI = acos(-1);
int DX[4] = { 1, 0, -1, 0 }; // 4 近傍（下，右，上，左）
int DY[4] = { 0, 1, 0, -1 };
int INF = 1001001001; ll INFL = 4004004003094073385LL; // (int)INFL = INF, (int)(-INFL) = -INF;

// 入出力高速化
struct fast_io { fast_io() { cin.tie(nullptr); ios::sync_with_stdio(false); cout << fixed << setprecision(18); } } fastIOtmp;

// 汎用マクロの定義
#define all(a) (a).begin(), (a).end()
#define sz(x) ((int)(x).size())
#define lbpos(a, x) (int)distance((a).begin(), std::lower_bound(all(a), (x)))
#define ubpos(a, x) (int)distance((a).begin(), std::upper_bound(all(a), (x)))
#define Yes(b) {cout << ((b) ? "Yes\n" : "No\n");}
#define rep(i, n) for(int i = 0, i##_len = int(n); i < i##_len; ++i) // 0 から n-1 まで昇順
#define repi(i, s, t) for(int i = int(s), i##_end = int(t); i <= i##_end; ++i) // s から t まで昇順
#define repir(i, s, t) for(int i = int(s), i##_end = int(t); i >= i##_end; --i) // s から t まで降順
#define repe(v, a) for(const auto& v : (a)) // a の全要素（変更不可能）
#define repea(v, a) for(auto& v : (a)) // a の全要素（変更可能）
#define repb(set, d) for(int set = 0, set##_ub = 1 << int(d); set < set##_ub; ++set) // d ビット全探索（昇順）
#define repis(i, set) for(int i = lsb(set), bset##i = set; i < 32; bset##i -= 1 << i, i = lsb(bset##i)) // set の全要素（昇順）
#define repp(a) sort(all(a)); for(bool a##_perm = true; a##_perm; a##_perm = next_permutation(all(a))) // a の順列全て（昇順）
#define uniq(a) {sort(all(a)); (a).erase(unique(all(a)), (a).end());} // 重複除去
#define EXIT(a) {cout << (a) << endl; exit(0);} // 強制終了
#define inQ(x, y, u, l, d, r) ((u) <= (x) && (l) <= (y) && (x) < (d) && (y) < (r)) // 半開矩形内判定

// 汎用関数の定義
template <class T> inline ll powi(T n, int k) { ll v = 1; rep(i, k) v *= n; return v; }
template <class T> inline bool chmax(T& M, const T& x) { if (M < x) { M = x; return true; } return false; } // 最大値を更新（更新されたら true を返す）
template <class T> inline bool chmin(T& m, const T& x) { if (m > x) { m = x; return true; } return false; } // 最小値を更新（更新されたら true を返す）
template <class T> inline T getb(T set, int i) { return (set >> i) & T(1); }
template <class T> inline T smod(T n, T m) { n %= m; if (n < 0) n += m; return n; } // 非負mod

// 演算子オーバーロード
template <class T, class U> inline istream& operator>>(istream& is, pair<T, U>& p) { is >> p.first >> p.second; return is; }
template <class T> inline istream& operator>>(istream& is, vector<T>& v) { repea(x, v) is >> x; return is; }
template <class T> inline vector<T>& operator--(vector<T>& v) { repea(x, v) --x; return v; }
template <class T> inline vector<T>& operator++(vector<T>& v) { repea(x, v) ++x; return v; }

#endif // 折りたたみ用


#if __has_include(<atcoder/all>)
#include <atcoder/all>
using namespace atcoder;

#ifdef _MSC_VER
#include "localACL.hpp"
#endif

//using mint = modint1000000007;
using mint = modint998244353;
//using mint = static_modint<1234567891>;
//using mint = modint; // mint::set_mod(m);

string mint_to_frac(mint x, int v_max = 31595) {
	repi(dnm, 1, v_max) {
		int num = (x * dnm).val();
		if (num == 0) {
			return "0";
		}
		if (num <= v_max) {
			if (dnm == 1) return to_string(num);
			return to_string(num) + "/" + to_string(dnm);
		}
		if (mint::mod() - num <= v_max) {
			if (dnm == 1) return "-" + to_string(mint::mod() - num);
			return "-" + to_string(mint::mod() - num) + "/" + to_string(dnm);
		}
	}

	return to_string(x.val());
}

namespace atcoder {
	inline istream& operator>>(istream& is, mint& x) { ll x_; is >> x_; x = x_; return is; }
#ifdef _MSC_VER
	inline ostream& operator<<(ostream& os, const mint& x) { os << mint_to_frac(x); return os; }
#else
	inline ostream& operator<<(ostream& os, const mint& x) { os << x.val(); return os; }
#endif	
}
using vm = vector<mint>; using vvm = vector<vm>; using vvvm = vector<vvm>; using vvvvm = vector<vvvm>; using pim = pair<int, mint>;
#endif


#ifdef _MSC_VER // 手元環境（Visual Studio）
#include "local.hpp"
#else // 提出用（gcc）
inline int popcount(int n) { return __builtin_popcount(n); }
inline int popcount(ll n) { return __builtin_popcountll(n); }
inline int lsb(int n) { return n != 0 ? __builtin_ctz(n) : 32; }
inline int lsb(ll n) { return n != 0 ? __builtin_ctzll(n) : 64; }
template <size_t N> inline int lsb(const bitset<N>& b) { return b._Find_first(); }
inline int msb(int n) { return n != 0 ? (31 - __builtin_clz(n)) : -1; }
inline int msb(ll n) { return n != 0 ? (63 - __builtin_clzll(n)) : -1; }
#define dump(...)
#define dumpel(...)
#define dump_list(v)
#define dump_mat(v)
#define input_from_file(f)
#define output_to_file(f)
#define Assert(b) { if (!(b)) { vc MLE(1<<30); EXIT(MLE.back()); } } // RE の代わりに MLE を出す
#endif


//【座標圧縮】O(n log n)
/*
* a[0..n) を座標圧縮した結果を a_cp[0..n) に格納し，その値域の大きさを返す．
* また xs[j] に圧縮された座標 j に対応する元の座標を格納する．
*
* a に重複する要素がなければ，a_cp[i] は a[i] が昇順で何番目かを表し，
* xs[j] は昇順で j 番目の要素が何かを表す．
*/
template <class T>
int coordinate_compression(const vector<T>& a, vi& a_cp, vector<T>* xs = nullptr) {
	// verify : https://atcoder.jp/contests/tessoku-book/tasks/tessoku_book_o

	int n = sz(a);
	if (xs == nullptr) xs = new vector<T>;

	// *xs : a の x 座標のユニークな昇順列
	*xs = a;
	uniq(*xs);

	// a[i] が xs において何番目かを求める．
	a_cp.resize(n);
	rep(i, n) a_cp[i] = lbpos(*xs, a[i]);

	return sz(*xs);
}


//【転倒数（座圧）】O(n log n)
/*
* a[0..n) の転倒数を返す．
*
* 利用：【座標圧縮】
*/
template <class T>
vl inversion_number_cc(const vector<T>& a) {
	// verify : https://onlinejudge.u-aizu.ac.jp/courses/lesson/1/ALDS1/all/ALDS1_5_D

	int n = sz(a);

	// b : a を座標圧縮した結果
	vi b;
	int m = coordinate_compression(a, b);

	// fw[i] : 今まで見てきた範囲に値 i が何個あったか
	fenwick_tree<int> fw(m);
	vl res(n);

	// 位置について昇順に見ていく．
	rep(i, n) {
		fw.add(b[i], 1);

		// 自身より大きい数が今までに何個あったか調べ，加算する．
		res[i] = fw.sum(b[i] + 1, m) + (i > 0 ? res[i - 1] : 0);
	}
	return res;
}


vl TLE(int n, vi p) {
	vvl inv(n + 1, vl(n + 1));
	rep(i, n) {
		vi a(p.begin() + i, p.end());
		auto b = inversion_number_cc(a);
		repi(j, i + 1, n) inv[i][j] = b[j - (i + 1)];
	}
	dumpel(inv);

	// dp[i][j] : 頂点 i までの辺を j 本通る経路のスコアの最大値
	vvl dp(n + 1, vl(n + 1, -INFL));
	dp[0][0] = 0;

	rep(i, n) {
		repi(j, 0, n - 1) {
			repi(ni, i + 1, n) { // 遅い
				chmax(dp[ni][j + 1], dp[i][j] + inv[i][ni]);
			}
		}
	}
	dumpel(dp);

	vl res;
	repi(j, 1, n) res.push_back(inv[0][n] - dp[n][j]);

	return res;
}


//【行列（半環）】
/*
* Matrix<S, add, o, mul, e>(m, n) : O(m n)
*	m×n 零行列で初期化する．
*   成分は半環 <S, add, o, mul, e> の元とする．
*
* Matrix<S, add, o, mul, e>(n) : O(n^2)
*	n×n 単位行列で初期化する．
*
* Matrix<S, add, o, mul, e>(vvS a) : O(m n)
*	配列 a[0..m)[0..n) の要素で初期化する．
*
* A + B : O(m n)
*	m×n 行列 A, B の和を返す．+= も使用可．
*
* c * A ／ A * c : O(m n)
*	m×n 行列 A とスカラー c のスカラー積を返す．
*
* A * x ／ x * A : O(m n)
*	行列ベクトル積[ベクトル行列積]を返す．
*
* A * B : O(l m n)
*	l×m 行列 A と m×n 行列 B の積を返す．
*
* pow(d) : O(n^3 log d)
*	自身を d 乗した行列を返す．
*/
template <class S, S(*add)(S, S), S(*o)(), S(*mul)(S, S), S(*e)()>
struct Matrix {
	int m, n; // 行列のサイズ（m 行 n 列）
	vector<vector<S>> v; // 行列の成分

	// コンストラクタ（初期化なし，零行列，単位行列，二次元配列）
	Matrix() : m(0), n(0) {}
	Matrix(int m, int n) : m(m), n(n), v(m, vector<S>(n, o())) {}
	Matrix(int n) : m(n), n(n), v(n, vector<S>(n, o())) { rep(i, n) v[i][i] = e(); }
	Matrix(const vector<vector<S>>& a) : m(sz(a)), n(sz(a[0])), v(a) {}

	// 代入
	Matrix(const Matrix& b) = default;
	Matrix& operator=(const Matrix& b) = default;

	// 入力
	friend istream& operator>>(istream& is, Matrix& a) {
		rep(i, a.m) rep(j, a.n) is >> a[i][j];
		return is;
	}

	// アクセス
	vector<S> const& operator[](int i) const { return v[i]; }
	vector<S>& operator[](int i) { return v[i]; }

	// 比較
	bool operator==(const Matrix& b) const { return m == b.m && n == b.n && v == b.v; }
	bool operator!=(const Matrix& b) const { return !(*this == b); }

	// 加算
	Matrix& operator+=(const Matrix& b) {
		rep(i, m) rep(j, n) v[i][j] = add(v[i][j], b[i][j]);
		return *this;
	}
	Matrix operator+(const Matrix& b) const { Matrix a = *this; return a += b; }

	// 左右からのスカラー倍
	Matrix operator*(const S& c) const {
		Matrix res(*this);
		rep(i, m) rep(j, n) res[i][j] = mul(res[i][j], c);
		return res;
	}
	friend Matrix operator*(const S& c, const Matrix& a) {
		Matrix res(a);
		rep(i, a.m) rep(j, a.n) res[i][j] = mul(c, res[i][j]);
		return res;
	}

	// 行列ベクトル積 : O(m n)
	vector<S> operator*(const vector<S>& x) const {
		vector<S> y(m, o());
		rep(i, m) rep(j, n)	y[i] = add(y[i], mul(v[i][j], x[j]));
		return y;
	}

	// ベクトル行列積 : O(m n)
	friend vector<S> operator*(const vector<S>& x, const Matrix& a) {
		// verify : https://codeforces.com/contest/1681/problem/E

		vector<S> y(a.n, o());
		rep(i, a.m) rep(j, a.n) y[j] = add(y[j], mul(x[i], a[i][j]));
		return y;
	}

	// 積：O(n^3)
	Matrix operator*(const Matrix& b) const {
		// verify : https://codeforces.com/contest/1681/problem/E

		Matrix res(m, b.n);
		rep(i, res.m) rep(j, res.n) rep(k, n) res[i][j] = add(res[i][j], mul(v[i][k], b[k][j]));
		return res;
	}

	// 累乗：O(n^3 log d)
	Matrix pow(ll d) const {
		// verify : https://atcoder.jp/contests/abc009/tasks/abc009_4

		Matrix res(n), pow2(*this);
		while (d > 0) {
			if ((d & 1) != 0) res = res * pow2;
			pow2 = pow2 * pow2;
			d /= 2;
		}
		return res;
	}

#ifdef _MSC_VER
	friend ostream& operator<<(ostream& os, const Matrix& a) {
		rep(i, a.m) {
			rep(j, a.n) os << a[i][j] << " ";
			os << endl;
		}
		return os;
	}
#endif
};


//【max - plus 可環半環（トロピカル半環）】
/* verify : https://atcoder.jp/contests/abc310/tasks/abc310_h */
using S804 = ll;
S804 add804(S804 x, S804 y) { return max(x, y); }
S804 o804() { return -INFL; }
S804 mul804(S804 x, S804 y) { return x + y; }
S804 e804() { return 0; }
#define Max_plus_semiring S804, add804, o804, mul804, e804


// TLE() を max-plus 半環上の行列ベクトル積の繰り返しと解釈したもの
vl TLE2(int n, vi p) {
	using MAT = Matrix<Max_plus_semiring>;

	MAT M(n + 1, n + 1);
	rep(i, n) {
		vi a(p.begin() + i, p.end());
		auto b = inversion_number_cc(a);
		repi(j, i + 1, n) M[i][j] = b[j - (i + 1)];
	}
	dump("M:"); dumpel(M.v, 4);

	vl res(n, M[0][n]);

	vl vec(n + 1, o804());
	vec[0] = e804();
	dump("vec:", vec);

	rep(j, n) {
		vvl a(M.v);
		repi(x, 0, n) repi(y, 0, n) a[x][y] += vec[x];
		dump("A:"); dumpel(a, 4);

		vec = vec * M;
		dump("vec:", vec);

		res[j] -= vec[n];
	}

	return res;
}


//【Monge 性判定（上三角）】O(n^2)
/*
* 行列 a[0..n)[0..n) の狭義上三角部分が Monge かを返す
*/
template <class T>
bool mongeQ_UT(const vector<vector<T>>& a) {
	if (a.empty()) return true;

	int n = sz(a);
	repi(i, 0, n - 3) repi(j, i + 2, n - 2) {
		if (a[i][j] + a[i + 1][j + 1] > a[i][j + 1] + a[i + 1][j]) return false;
	}
	return true;
}


//【上三角 → 矩形集合】O(n log n)
/*
* n×n 格子の狭義上三角部分 S = {(i,j) | 0≦i<j<n} を矩形に分割し，矩形のリストを返す．
* strict = false にすると広義上三角部分 S = {(i,j) | 0≦i≦j<n} を矩形に分割する．
* 矩形 [i1..i2)×[j1..j2) は 4 つ組 {i1, i2, j1, j2} で表す．
*
*（分割統治法）
*/
vector<tuple<int, int, int, int>> trig_to_rects(int n, bool strict = true) {
	vector<tuple<int, int, int, int>> rects;

	// {(i,j) | l≦i<j<r} を矩形に分割する．
	function<void(int, int)> rf = [&](int l, int r) {
		if (r - l == 1) {
			if (!strict) rects.emplace_back(l, l + 1, l, l + 1);
			return;
		}

		int m = (l + r) / 2;
		rects.emplace_back(l, m, m, r);
		rf(l, m);
		rf(m, r);
	};
	rf(0, n);

	return rects;
}


//【SMAWK algorithm】O(h + w)
/*
* 与えられた totally monotone 行列 a[0..h)[0..w) について，各行の最小値の位置を並べたリストを返す．
*/
template <class FUNC>
vi smawk(int h, int w, const FUNC& a) {
	// 参考 : https://speakerdeck.com/tatyam_prime/monge-noshou-yin-shu
	// verify : https://atcoder.jp/contests/colopl2018-final/tasks/colopl2018_final_c

	int K = msb(h);

	// js[k][pt] : lsb が k 未満である行と，それまでの行最小値をとり得ない列を捨てた行列について，
	//		その pt 番目の列に対応する a の列番号
	vvi js(K + 2);
	js[0].resize(w);
	iota(all(js[0]), 0);
	repi(k, 0, K) js[k + 1].reserve((h >> k) + 1);

	repi(k, 0, K) {
		int di = 1 << k, i = di, pt = 0;
		while (pt < sz(js[k])) {
			if (js[k + 1].empty()) {
				js[k + 1].push_back(js[k][pt++]);
				continue;
			}

			if (i == 0 || a(i - 1, js[k + 1].back()) <= a(i - 1, js[k][pt])) {
				if (i + di <= h) {
					js[k + 1].push_back(js[k][pt]);
					i += di;
				}
				pt++;
			}
			else {
				js[k + 1].pop_back();
				i -= di;
			}
		}
	}

	vi j_min(h);

	repir(k, K, 0) {
		int di = 1 << k, pt = 0;

		for (int i = di; i <= h; i += di << 1) {
			ll a_min = 2 * INFL + 10;
			int jR = (i + di <= h ? j_min[i + di - 1] : w - 1);

			while (pt < sz(js[k + 1]) && js[k + 1][pt] < jR) {
				if (chmin(a_min, a(i - 1, js[k + 1][pt]))) j_min[i - 1] = js[k + 1][pt];
				pt++;
			}
			if (chmin(a_min, a(i - 1, jR))) j_min[i - 1] = jR;
		}
	}

	return j_min;

	/* a の定義の雛形
	auto a = [&](int i, int j) {
		return 0LL;
	};
	*/
}


//【Monge 性判定】O(h w)
/*
* 行列 a[0..h)[0..w) が Monge 行列かを返す
*/
template <class FUNC>
bool mongeQ_func(int h, int w, const FUNC& a) {
	// verify : https://yukicoder.me/problems/no/1867

	rep(i, h - 1) rep(j, w - 1) {
		if (a(i, j) + a(i + 1, j + 1) > a(i, j + 1) + a(i + 1, j)) return false;
	}
	return true;
}


vl solve(int n, vi p) {
	using MAT = Matrix<Max_plus_semiring>;

	MAT M(n + 1, n + 1);
	rep(i, n) {
		vi a(p.begin() + i, p.end());
		auto b = inversion_number_cc(a);
		repi(j, i + 1, n) M[i][j] = b[j - (i + 1)];
	}
	dumpel(M.v, 4);
	dump("Monge?:", mongeQ_UT(M.v));

	vl res(n, M[0][n]);

	vl vec(n + 1, o804());
	vec[0] = e804();
	dump(vec);

	auto rects = trig_to_rects(n + 1);
	
	rep(k, n) {
		dump("----- k:", k, "-----");
				
		vl nvec(n + 1, o804());

		for (auto [i1, i2, j1, j2] : rects) {
			dump("rect:", i1, i2, j1, j2);

			int h = i2 - i1;
			int w = j2 - j1;

			auto a = [&](int j, int i) {
//				dump("j, i:", j, i);
				return -(M[i1 + i][j2 - 1 - j] + vec[i1 + i]);
			};
//			rep(j, w) rep(i, h) cout << a(j, i) << " \n"[i == h - 1];
			dump("Monge?:", mongeQ_func(w, h, a));
			
			auto i_min = smawk(w, h, a);
			dump(i_min);

			rep(j, w) {
				chmax(nvec[j2 - 1 - j], -a(j, i_min[j]));
			}
			dump(nvec);
		}

		dump(vec * M);
		vec = move(nvec);
		dump(vec);

		res[k] -= vec[n];
	}

	return res;
}


int main() {
//	input_from_file("input.txt");
//	output_to_file("output.txt");

	dump(INFL = 499);

	int n;
	cin >> n;

	vi p(n);
	cin >> p;

	dump(TLE(n, p)); dump("-----");

	dump(TLE2(n, p)); dump("-----");

	auto res = solve(n, p);

	rep(i, n) cout << res[i] << "\n";
}