#include <algorithm>
#include <array>
#include <bitset>
#include <cassert>
#include <chrono>
#include <cmath>
#include <complex>
#include <deque>
#include <forward_list>
#include <fstream>
#include <functional>
#include <iomanip>
#include <ios>
#include <iostream>
#include <limits>
#include <list>
#include <map>
#include <numeric>
#include <queue>
#include <random>
#include <set>
#include <sstream>
#include <stack>
#include <string>
#include <tuple>
#include <type_traits>
#include <unordered_map>
#include <unordered_set>
#include <utility>
#include <vector>
using namespace std;
using lint = long long;
using pint = pair<int, int>;
using plint = pair<lint, lint>;

// Runs once before main(): unties cin from cout, disables C stdio sync and
// switches cout to fixed notation with 20 digits after the decimal point.
struct fast_ios {
    fast_ios() { cin.tie(nullptr), ios::sync_with_stdio(false), cout << fixed << setprecision(20); }
} fast_ios_;

#define ALL(x) (x).begin(), (x).end()
// FOR iterates i over [begin, end) ascending; IFOR iterates the same range descending.
#define FOR(i, begin, end) for(int i=(begin),i##_end_=(end);i<i##_end_;i++)
#define IFOR(i, begin, end) for(int i=(end)-1,i##_begin_=(begin);i>=i##_begin_;i--)
#define REP(i, n) FOR(i,0,n)
#define IREP(i, n) IFOR(i,0,n)

// Resize a (possibly nested) vector to the given dimensions and fill every leaf with `val`.
template <typename T, typename V> void ndarray(vector<T> &vec, const V &val, int len) { vec.assign(len, val); }
template <typename T, typename V, typename... Args>
void ndarray(vector<T> &vec, const V &val, int len, Args... args) {
    vec.resize(len), for_each(begin(vec), end(vec), [&](T &v) { ndarray(v, val, args...); });
}

// Assign q to m if it is strictly larger / smaller; return whether m changed.
template <typename T> bool chmax(T &m, const T q) { return m < q ? (m = q, true) : false; }
template <typename T> bool chmin(T &m, const T q) { return m > q ? (m = q, true) : false; }

// Index of the highest set bit of x, or -1 when x <= 0.
int floor_lg(long long x) { return x <= 0 ? -1 : 63 - __builtin_clzll(x); }

// Component-wise pair arithmetic.
template <typename T1, typename T2> pair<T1, T2> operator+(const pair<T1, T2> &l, const pair<T1, T2> &r) {
    return make_pair(l.first + r.first, l.second + r.second);
}
template <typename T1, typename T2> pair<T1, T2> operator-(const pair<T1, T2> &l, const pair<T1, T2> &r) {
    return make_pair(l.first - r.first, l.second - r.second);
}

// Return a sorted copy of vec with duplicates removed.
template <typename T> vector<T> sort_unique(vector<T> vec) {
    sort(vec.begin(), vec.end()), vec.erase(unique(vec.begin(), vec.end()), vec.end());
    return vec;
}
// Index of lower_bound / upper_bound of x in v (v must already be sorted for a meaningful result).
template <typename T> int arglb(const std::vector<T> &v, const T &x) {
    return std::distance(v.begin(), std::lower_bound(v.begin(), v.end(), x));
}
template <typename T> int argub(const std::vector<T> &v, const T &x) {
    return std::distance(v.begin(), std::upper_bound(v.begin(), v.end(), x));
}

// Stream helpers: read every element of a pre-sized vector / pretty-print containers.
template <typename T> istream &operator>>(istream &is, vector<T> &vec) {
    for (auto &v : vec) is >> v;
    return is;
}
template <typename T> ostream &operator<<(ostream &os, const vector<T> &vec) {
    os << '[';
    for (auto v : vec) os << v << ',';
    os << ']';
    return os;
}
template <typename T, size_t sz> ostream &operator<<(ostream &os, const array<T, sz> &arr) {
    os << '[';
    for (auto v : arr) os << v << ',';
    os << ']';
    return os;
}
#if __cplusplus >= 201703L
template <typename... T> istream &operator>>(istream &is, tuple<T...> &tpl) {
    std::apply([&is](auto &&... args) { ((is >> args), ...); }, tpl);
    return is;
}
template <typename... T> ostream &operator<<(ostream &os, const tuple<T...> &tpl) {
    os << '(';
    std::apply([&os](auto &&... args) { ((os << args << ','), ...); }, tpl);
    return os << ')';
}
#endif
template <typename T> ostream &operator<<(ostream &os, const deque<T> &vec) {
    os << "deq[";
    for (auto v : vec) os << v << ',';
    os << ']';
    return os;
}
template <typename T> ostream &operator<<(ostream &os, const set<T> &vec) {
    os << '{';
    for (auto v : vec) os << v << ',';
    os << '}';
    return os;
}
template <typename T, typename TH> ostream &operator<<(ostream &os, const unordered_set<T, TH> &vec) {
    os << '{';
    for (auto v : vec) os << v << ',';
    os << '}';
    return os;
}
template <typename T> ostream &operator<<(ostream &os, const multiset<T> &vec) {
    os << '{';
    for (auto v : vec) os << v << ',';
    os << '}';
    return os;
}
template <typename T> ostream &operator<<(ostream &os, const unordered_multiset<T> &vec) {
    os << '{';
    for (auto v : vec) os << v << ',';
    os << '}';
    return os;
}
template <typename T1, typename T2> ostream &operator<<(ostream &os, const pair<T1, T2> &pa) {
    os << '(' << pa.first << ',' << pa.second << ')';
    return os;
}
template <typename TK, typename TV> ostream &operator<<(ostream &os, const map<TK, TV> &mp) {
    os << '{';
    for (auto v : mp) os << v.first << "=>" << v.second << ',';
    os << '}';
    return os;
}
template <typename TK, typename TV, typename TH> ostream &operator<<(ostream &os, const unordered_map<TK, TV, TH> &mp) {
    os << '{';
    for (auto v : mp) os << v.first << "=>" << v.second << ',';
    os << '}';
    return os;
}

// Debug printing: active only when HITONANODE_LOCAL is defined; otherwise dbg(x) is just (x).
#ifdef HITONANODE_LOCAL
const string COLOR_RESET = "\033[0m", BRIGHT_GREEN = "\033[1;32m", BRIGHT_RED = "\033[1;31m", BRIGHT_CYAN = "\033[1;36m", NORMAL_CROSSED = "\033[0;9;37m", RED_BACKGROUND = "\033[1;41m", NORMAL_FAINT = "\033[0;2m";
#define dbg(x) cerr << BRIGHT_CYAN << #x << COLOR_RESET << " = " << (x) << NORMAL_FAINT << " (L" << __LINE__ << ") " << __FILE__ << COLOR_RESET << endl
#define dbgif(cond, x) ((cond) ? cerr << BRIGHT_CYAN << #x << COLOR_RESET << " = " << (x) << NORMAL_FAINT << " (L" << __LINE__ << ") " << __FILE__ << COLOR_RESET << endl : cerr)
#else
#define dbg(x) (x)
#define dbgif(cond, x) 0
#endif

// Range tree whose nodes hold binary indexed trees.
//
// Usage order: add_point() for every (x, y) that will ever be updated, then
// build() once, then any mix of add() and sum().
//
// Template parameters:
//   S          value type stored at each point
//   opadd      accumulates the second argument into the first
//   opsub      removes the second argument from the first; sum() relies on it
//              to turn two prefix queries into a y-range query
//   e          returns the identity value of opadd
//   Coordinate type of the x and y coordinates
template <class S, void (*opadd)(S &, S), void (*opsub)(S &, S), S (*e)(), class Coordinate = long long>
class rangetree_bit {
    int n;  // number of distinct registered points; set by build()
    std::vector<std::pair<Coordinate, Coordinate>> _pts;  // sorted, deduplicated after build()

    // Binary indexed tree over positions [0, len) with prefix queries.
    struct BIT {
        std::vector<S> data;
        BIT(int len) : data(len, e()) {}
        // Accumulate v into position pos.
        void add(int pos, S v) {
            for (pos++; pos and pos <= int(data.size()); pos += pos & -pos) opadd(data[pos - 1], v);
        }
        // Aggregate of positions [0, r).
        S sum(int r) const {
            S ret = e();
            while (r) opadd(ret, data[r - 1]), r -= r & -r;
            return ret;
        }
    };

    std::vector<std::vector<Coordinate>> _range2ys;  // per tree node: sorted distinct y values it covers
    std::vector<BIT> bits;                           // per tree node: BIT indexed by rank within _range2ys

    // Add val at coordinate y inside tree node v.
    void _add_singlenode(int v, Coordinate y, S val) {
        auto i = std::distance(_range2ys[v].begin(), std::lower_bound(_range2ys[v].begin(), _range2ys[v].end(), y));
        bits[v].add(i, val);
    }

    // Aggregate of all entries of tree node v whose y is strictly below the given y.
    S _get_singlenode(int v, Coordinate y) const {
        auto i = std::distance(_range2ys[v].begin(), std::lower_bound(_range2ys[v].begin(), _range2ys[v].end(), y));
        return bits[v].sum(i);
    }

    S _sum(Coordinate xl, Coordinate xr, Coordinate yr) const { // [xl, xr) * (-INF, yr)
        // Compare by x only, so the search lands on the first point with x >= bound.
        auto compx = [](std::pair<Coordinate, Coordinate> l, std::pair<Coordinate, Coordinate> r) {
            return l.first < r.first;
        };
        int l = n + std::distance(_pts.begin(), std::lower_bound(_pts.begin(), _pts.end(), std::make_pair(xl, yr), compx));
        int r = n + std::distance(_pts.begin(), std::lower_bound(_pts.begin(), _pts.end(), std::make_pair(xr, yr), compx));
        S ret = e();
        // Bottom-up walk over the implicit binary tree (leaves at indices n .. 2n-1).
        while (l < r) {
            if (l & 1) opadd(ret, _get_singlenode(l++, yr));
            if (r & 1) opadd(ret, _get_singlenode(--r, yr));
            l >>= 1, r >>= 1;
        }
        return ret;
    }

public:
    rangetree_bit() = default;

    // Register a point that may later receive add(); call before build().
    void add_point(Coordinate x, Coordinate y) noexcept { _pts.emplace_back(x, y); }

    // Sort and deduplicate the registered points, then build each node's y list and BIT.
    void build() {
        std::sort(_pts.begin(), _pts.end());
        _pts.erase(std::unique(_pts.begin(), _pts.end()), _pts.end());
        n = _pts.size();

        _range2ys.resize(n * 2);
        for (int i = 0; i < n; i++) _range2ys[n + i] = {_pts[i].second};
        for (int i = n - 1; i > 0; i--) {
            auto &lch = _range2ys[i * 2];
            auto &rch = _range2ys[i * 2 + 1];
            std::merge(lch.begin(), lch.end(), rch.begin(), rch.end(), std::back_inserter(_range2ys[i]));
            _range2ys[i].erase(std::unique(_range2ys[i].begin(), _range2ys[i].end()), _range2ys[i].end());
        }
        for (const auto &v : _range2ys) bits.push_back(BIT(v.size()));
    }

    // Accumulate val at point (x, y); the point must have been registered (asserted).
    void add(Coordinate x, Coordinate y, S val) {
        int i = std::distance(_pts.begin(), std::lower_bound(_pts.begin(), _pts.end(), std::make_pair(x, y)));
        assert(i < n and _pts[i] == std::make_pair(x, y));
        for (i += n; i; i >>= 1) _add_singlenode(i, y, val);
    }

    // Aggregate over points with xl <= x < xr and yl <= y < yr.
    S sum(Coordinate xl, Coordinate xr, Coordinate yl, Coordinate yr) const {
        auto ret_r = _sum(xl, xr, yr);
        auto ret_l = _sum(xl, xr, yl);
        opsub(ret_r, ret_l);
        return ret_r;
    }
};

// Integer-sum operations plugged into rangetree_bit.
void opadd(int &x, int y) { x += y; }
void opsub(int &x, int y) { x -= y; }
int ope() { return 0; }

// Reads M, K and a sequence A of length N = M * K (values are used as indices
// into arrays of size M), then prints the minimum of a running pair count
// maintained while keys are raised by M one value-group at a time.
int main() {
    int M, K;
    cin >> M >> K;
    const int N = M * K;
    vector<int> A(N);
    cin >> A;

    vector<int> ord(N);   // ord[i] = A[i] + (number of earlier occurrences of A[i]) * M
    vector<int> freq(M);  // occurrences of each value seen so far
    // NOTE(review): Coordinate is instantiated as int because every coordinate used
    // below is an int; confirm against the original instantiation.
    rangetree_bit<int, opadd, opsub, ope, int> tree;
    vector<vector<int>> v2i(M);  // positions of each value, in increasing order

    for (int i = 0; i < N; ++i) {
        ord[i] = A[i] + freq[A[i]] * M;
        v2i[A[i]].push_back(i);
        // Each position can hold its key either at ord[i] or, after the shift below, at ord[i] + M.
        tree.add_point(i, ord[i]);
        tree.add_point(i, ord[i] + M);
        freq[A[i]]++;
    }
    tree.build();

    // Initial count: pairs j < i with ord[j] > ord[i] (1 << 20 serves as the upper key bound).
    long long current = 0;
    for (int i = 0; i < N; ++i) {
        current += tree.sum(0, i, ord[i] + 1, 1 << 20);
        tree.add(i, ord[i], 1);
    }

    long long ret = current;
    for (auto &is : v2i) {
        // Process the positions of this value from right to left.
        reverse(is.begin(), is.end());
        for (int i : is) {
            int y = ord[i];
            tree.add(i, y, -1);
            // Raising the key from y to y + M flips the order against every key in [y, y + M):
            // those to the right become counted pairs, those to the left stop being counted.
            current += tree.sum(i, N, y, y + M);
            current -= tree.sum(0, i, y, y + M);
            tree.add(i, y + M, 1);
        }
        ret = min(ret, current);
    }
    cout << ret << '\n';
}