#include <stdio.h>
#include <stdlib.h>

/* Largest supported sequence length (M * K); matches the original array capacity. */
enum { MAX_N = 400000 };

/*
 * Point update on a 1-based Fenwick (binary indexed) tree.
 *
 * N    number of usable slots; BIT must hold at least N + 1 ints
 * BIT  tree storage, slot 0 unused
 * i    1-based position to update; positions below 1 are ignored
 * k    amount added to position i
 */
void add_BIT(int N, int BIT[], int i, int k)
{
    /* i & -i is 0 when i == 0, which would never advance the loop. */
    if (i < 1)
        return;

    while (i <= N) {
        BIT[i] += k;
        i += (i & -i); /* step by the lowest set bit of i */
    }
}

/*
 * Prefix sum of positions 1..r of a Fenwick tree.
 * Returns 0 when r <= 0. The caller guarantees r is within the tree.
 */
int sum_BIT(int BIT[], int r)
{
    int sum = 0;

    while (r > 0) {
        sum += BIT[r];
        r -= (r & -r); /* drop the lowest set bit of r */
    }
    return sum;
}

/* Store b into *a when b is strictly smaller than the current *a. */
void chmin(long long *a, long long b)
{
    if (*a > b)
        *a = b;
}

/*
 * Reads M and K, then N = M * K integers, each expected to lie in [0, M)
 * and to occur exactly K times.
 *
 * Every input value v whose occurrence number is c (counting from 0) is
 * remapped to the key v + M * c + 1, so the keys are distinct and cover
 * 1..N. The program then prints the minimum, over s = 0..M-1, of
 *
 *     base + sum of dif[] over all positions holding a value in M-s..M-1
 *
 * where base counts the pairs of positions whose keys are in decreasing
 * order, and dif[] is defined in the second loop below.
 *
 * Exits with EXIT_FAILURE and a message on stderr when the input is
 * malformed or out of the supported range.
 */
int main(void)
{
    /*
     * Static storage: roughly 8 MB in total, which does not fit in a
     * typical default stack. Static objects start zero-initialised.
     */
    static int A[MAX_N + 1];   /* remapped key of each position, 1-based */
    static int num[MAX_N + 1]; /* occurrences seen so far per input value */
    static int pos[MAX_N + 1]; /* position holding each remapped key */
    static int BIT[MAX_N + 1]; /* Fenwick tree over remapped keys */
    static int dif[MAX_N + 1]; /* per-position adjustment term */

    int M, K;
    if (scanf("%d %d", &M, &K) != 2 || M < 1 || K < 1 ||
        (long long)M * K > MAX_N) {
        fprintf(stderr, "invalid input: need M >= 1, K >= 1, M*K <= %d\n",
                (int)MAX_N);
        return EXIT_FAILURE;
    }
    const int N = M * K;

    for (int i = 1; i <= N; i++) {
        int v;
        /*
         * Rejecting a (K+1)-th occurrence keeps every key <= N; together
         * with the range check this forces each value to occur exactly K
         * times once all N values have been read.
         */
        if (scanf("%d", &v) != 1 || v < 0 || v >= M || num[v] >= K) {
            fprintf(stderr, "invalid input at element %d\n", i);
            return EXIT_FAILURE;
        }
        A[i] = v + M * num[v] + 1;
        num[v]++;
        pos[A[i]] = i;
    }

    long long ans = 0;
    for (int i = 1; i <= N; i++) {
        /* Keys band_lo+1 .. band_hi share the occurrence number of A[i]. */
        const int band_hi = ((A[i] - 1) / M + 1) * M;
        const int band_lo = band_hi - M;

        /* Earlier positions whose key is greater than A[i]. */
        ans += i - sum_BIT(BIT, A[i]) - 1;

        /* Twice the earlier keys in the same band, minus (M - 1). */
        dif[i] = (sum_BIT(BIT, band_hi) - sum_BIT(BIT, band_lo)) * 2 - (M - 1);

        add_BIT(N, BIT, A[i], 1);
    }

    long long tmp = ans;
    for (int v = M - 1; v >= 1; v--) {
        /* The K positions that hold input value v, by occurrence number. */
        for (int j = 0; j < K; j++)
            tmp += dif[pos[v + M * j + 1]];
        chmin(&ans, tmp);
    }

    printf("%lld\n", ans);
    fflush(stdout);
    return 0;
}