// #pragma GCC target("avx2")
// #pragma GCC optimize("O3")
// #pragma GCC optimize("unroll-loops")

// Explicit standard headers: everything this file uses comes from these.
#include <algorithm>
#include <functional>
#include <iostream>
#include <queue>
#include <string>
#include <utility>
#include <vector>
using namespace std;

using ll = long long;
using ull = unsigned long long;

// pq: default priority_queue; qp: priority_queue ordered with greater<T>.
template <class T>
using pq = priority_queue<T>;
template <class T>
using qp = priority_queue<T, vector<T>, greater<T>>;

// Declaration shorthands: vec(T, A, args...) declares `vector<T> A(args...)`,
// vvec / vvvec do the same for 2-D / 3-D nested vectors.
#define vec(T, A, ...) vector<T> A(__VA_ARGS__);
#define vvec(T, A, h, ...) vector<vector<T>> A(h, vector<T>(__VA_ARGS__));
#define vvvec(T, A, h1, h2, ...) vector<vector<vector<T>>> A(h1, vector<vector<T>>(h2, vector<T>(__VA_ARGS__)));

// Unless RIN__LOCAL is defined, `endl` is replaced by a plain newline string
// so that printing does not flush.
#ifndef RIN__LOCAL
#define endl "\n"
#endif
#define spa ' '

#define len(A) A.size()
#define all(A) begin(A), end(A)

// fori(...) dispatches on argument count:
//   fori(a)          : repeat a times (index named _)
//   fori(i, a)       : i = 0 .. a-1
//   fori(i, a, b)    : i = a .. b-1
//   fori(i, a, b, c) : i = a, a+c, ... while strictly before b in the direction of c
#define fori1(a) for (ll _ = 0; _ < (a); _++)
#define fori2(i, a) for (ll i = 0; i < (a); i++)
#define fori3(i, a, b) for (ll i = (a); i < (b); i++)
#define fori4(i, a, b, c) for (ll i = (a); ((c) > 0 || i > (b)) && ((c) < 0 || i < (b)); i += (c))
#define overload4(a, b, c, d, e, ...) e
#define fori(...) overload4(__VA_ARGS__, fori4, fori3, fori2, fori1)(__VA_ARGS__)

// Copies the characters of S into a vector<char> of the same length.
vector<char> stoc(string &S) {
    int n = S.size();
    vector<char> ret(n);
    for (int i = 0; i < n; i++) ret[i] = S[i];
    return ret;
}

// Declare-and-read shorthands; each declares the named variables and then
// reads them from stdin through inp().
#define INT(...) \
    int __VA_ARGS__; \
    inp(__VA_ARGS__);
#define LL(...) \
    ll __VA_ARGS__; \
    inp(__VA_ARGS__);
#define STRING(...) \
    string __VA_ARGS__; \
    inp(__VA_ARGS__);
#define CHAR(...) \
    char __VA_ARGS__; \
    inp(__VA_ARGS__);
#define VEC(T, A, n) \
    vector<T> A(n); \
    inp(A);
#define VVEC(T, A, n, m) \
    vector<vector<T>> A(n, vector<T>(m)); \
    inp(A);

const ll MOD1 = 1000000007;
const ll MOD9 = 998244353;

// Smallest / largest element of a container (the container must be non-empty,
// since the iterator returned by min_element/max_element is dereferenced).
template <class T>
auto min(const T &a) {
    return *min_element(all(a));
}
template <class T>
auto max(const T &a) {
    return *max_element(all(a));
}

// Returns a limited to [l, r]; the upper bound is checked first.
template <class T, class S>
auto clamp(T &a, const S &l, const S &r) {
    return (a > r ? r : a < l ? l : a);
}

// chmax / chmin / chclamp: update a in place and report whether it changed.
template <class T, class S>
inline bool chmax(T &a, const S &b) {
    return (a < b ? a = b, 1 : 0);
}
template <class T, class S>
inline bool chmin(T &a, const S &b) {
    return (a > b ? a = b, 1 : 0);
}
template <class T, class S>
inline bool chclamp(T &a, const S &l, const S &r) {
    auto b = clamp(a, l, r);
    return (a != b ? a = b, 1 : 0);
}

void FLUSH() { cout << flush; }

// print(): space-separated arguments followed by a newline.
void print() { cout << endl; }
template <class Head, class... Tail>
void print(Head &&head, Tail &&...tail) {
    cout << head;
    if (sizeof...(Tail)) cout << spa;
    print(forward<Tail>(tail)...);
}
// One line with the elements separated by single spaces.
template <class T>
void print(vector<T> &A) {
    int n = A.size();
    for (int i = 0; i < n; i++) {
        cout << A[i];
        if (i != n - 1) cout << ' ';
    }
    cout << endl;
}
// One line per inner vector.
template <class T>
void print(vector<vector<T>> &A) {
    for (auto &row : A) print(row);
}
template <class T, class S>
void print(pair<T, S> &A) {
    cout << A.first << spa << A.second << endl;
}
// One line per pair.
template <class T, class S>
void print(vector<pair<T, S>> &A) {
    for (auto &row : A) print(row);
}
// Like print(vector) but with a caller-chosen separator.
template <class T, class S>
void prisep(vector<T> &A, S sep) {
    int n = A.size();
    for (int i = 0; i < n; i++) {
        cout << A[i];
        if (i != n - 1) cout << sep;
    }
    cout << endl;
}
// Prints A followed by `end` (a single space when `end` is omitted).
template <class T, class S>
void priend(T A, S end) {
    cout << A << end;
}
template <class T>
void priend(T A) {
    priend(A, spa);
}
// Prints A when f is true, otherwise B; returns f.
template <class T, class S>
bool printif(bool f, T A, S B) {
    if (f)
        print(A);
    else
        print(B);
    return f;
}

// inp(): read one or more values / containers from stdin.
template <class... T>
void inp(T &...a) {
    (cin >> ... >> a);
}
template <class T>
void inp(vector<T> &A) {
    for (auto &a : A) cin >> a;
}
template <class T>
void inp(vector<vector<T>> &A) {
    for (auto &row : A) inp(row);
}
template <class T, class S>
void inp(pair<T, S> &A) {
    inp(A.first, A.second);
}
template <class T, class S>
void inp(vector<pair<T, S>> &A) {
    for (auto &row : A) inp(row.first, row.second);
}

// Sum of all elements, accumulated in T.
template <class T>
T sum(vector<T> &A) {
    T tot = 0;
    for (auto a : A) tot += a;
    return tot;
}

// Returns the sorted, de-duplicated values of X.
template <class T>
vector<T> compression(vector<T> X) {
    sort(all(X));
    X.erase(unique(all(X)), X.end());
    return X;
}

// Reads m edges "u v" from stdin into an adjacency list over n vertices.
// `indexed` is subtracted from every endpoint; unless `direct` is true each
// edge is stored in both directions.
vector<vector<int>> read_edges(int n, int m, bool direct = false, int indexed = 1) {
    vector<vector<int>> edges(n, vector<int>());
    for (int i = 0; i < m; i++) {
        INT(u, v);
        u -= indexed;
        v -= indexed;
        edges[u].push_back(v);
        if (!direct) edges[v].push_back(u);
    }
    return edges;
}

// Reads n - 1 undirected edges.
vector<vector<int>> read_tree(int n, int indexed = 1) { return read_edges(n, n - 1, false, indexed); }

// Weighted variant of read_edges: each input edge is "u v w" and adjacency
// entries are (neighbour, weight) pairs.
template <class T = ll>
vector<vector<pair<int, T>>> read_wedges(int n, int m, bool direct = false, int indexed = 1) {
    vector<vector<pair<int, T>>> edges(n, vector<pair<int, T>>());
    for (int i = 0; i < m; i++) {
        INT(u, v);
        T w;
        inp(w);
        u -= indexed;
        v -= indexed;
        edges[u].push_back({v, w});
        if (!direct) edges[v].push_back({u, w});
    }
    return edges;
}

// Reads n - 1 undirected weighted edges.
template <class T = ll>
vector<vector<pair<int, T>>> read_wtree(int n, int indexed = 1) {
    return read_wedges<T>(n, n - 1, false, indexed);
}

// yes / Yes / YES print the affirmative word when f is true; no / No / NO print
// it when f is false. All of them return f unchanged.
inline bool yes(bool f = true) {
    cout << (f ? "yes" : "no") << endl;
    return f;
}
inline bool Yes(bool f = true) {
    cout << (f ? "Yes" : "No") << endl;
    return f;
}
inline bool YES(bool f = true) {
    cout << (f ? "YES" : "NO") << endl;
    return f;
}
inline bool no(bool f = true) {
    cout << (!f ? "yes" : "no") << endl;
    return f;
}
inline bool No(bool f = true) {
    cout << (!f ? "Yes" : "No") << endl;
    return f;
}
inline bool NO(bool f = true) {
    cout << (!f ? "YES" : "NO") << endl;
    return f;
}

// Reads an h x w integer grid S and prints dp[0][0] of the suffix DP below.
//
// dp[i][j] is indexed by a top-left corner (i, j); every value it is built
// from lies in rows >= i or columns >= j. dp[h][w] = 0 is the base case.
// NOTE(review): the cost formula presumably assumes S holds only 0/1 values —
// confirm against the problem statement.
void solve() {
    INT(h, w);
    VVEC(int, S, h, w);
    // NOTE(review): an earlier revision also built a copy of S with the all-zero
    // rows and columns removed, but the swap that activated it was commented
    // out, so the copy was never used. It has been dropped here.
    if (h == 0) {
        print(0);
        return;
    }

    // cum[i][j] = sum of S over rows [0, i) and columns [0, j).
    vector<vector<int>> cum(h + 1, vector<int>(w + 1, 0));
    for (int i = 0; i < h; i++) {
        for (int j = 0; j < w; j++) {
            cum[i + 1][j + 1] = cum[i + 1][j] + cum[i][j + 1] - cum[i][j] + S[i][j];
        }
    }
    // Sum of S over rows [i0, i1) and columns [j0, j1).
    auto rect = [&](int i0, int i1, int j0, int j1) {
        return cum[i1][j1] - cum[i0][j1] - cum[i1][j0] + cum[i0][j0];
    };

    // tail_start[i]: found by walking left from w while the block of rows [i, h)
    // and columns [c - 1, w) still sums to zero.
    vector<int> tail_start(h + 1, w);
    for (int i = 0; i <= h; i++) {
        while (tail_start[i] > 0 && rect(i, h, tail_start[i] - 1, w) == 0) tail_start[i]--;
    }

    const int INF = 1 << 30;
    vector<vector<int>> dp(h + 1, vector<int>(w + 1, INF));
    dp[h][w] = 0;

    vector<int> row_cnt(h + 1, 0);  // prefix count of rows with a non-zero sum in columns [j, w)
    vector<int> col_cnt(w + 1, 0);  // prefix count of columns with a non-zero sum in rows [i, h)

    for (int i = h; i >= 0; i--) {
        // Depends on i only, so it is computed once per row of the DP table.
        for (int c = 0; c < w; c++) {
            col_cnt[c + 1] = col_cnt[c] + (rect(i, h, c, c + 1) > 0 ? 1 : 0);
        }

        for (int j = w; j >= 0; j--) {
            // Row i sums to zero from column j on: it can be skipped.
            if (i != h && rect(i, i + 1, j, w) == 0) chmin(dp[i][j], dp[i + 1][j]);
            // Column j sums to zero from row i on: it can be skipped.
            if (j != w && rect(i, h, j, j + 1) == 0) chmin(dp[i][j], dp[i][j + 1]);

            // With j == w the split below would use column index w + 1, which is
            // past the end of dp, col_cnt and cum. dp[i][w] is already 0 via the
            // row-skip rule above, so there is nothing left to do.
            if (j == w) continue;

            for (int r = 0; r < h; r++) {
                row_cnt[r + 1] = row_cnt[r] + (rect(r, r + 1, j, w) > 0 ? 1 : 0);
            }

            // Split off rows [i, i2) x columns [j, j2): pay (#counted rows) *
            // (#counted columns) minus the sum already inside that block, then
            // continue from (i2, j) and from (i, j2).
            for (int i2 = i; i2 <= h; i2++) {
                const int j2 = std::max(j + 1, tail_start[i2]);
                const int cand = dp[i2][j] + dp[i][j2]
                                 + (row_cnt[i2] - row_cnt[i]) * (col_cnt[j2] - col_cnt[j])
                                 - rect(i, i2, j, j2);
                chmin(dp[i][j], cand);
            }
        }
    }
    print(dp[0][0]);
}

int main() {
    cin.tie(nullptr)->sync_with_stdio(false);
    // cout << fixed << setprecision(12);
    int t;
    t = 1;
    // cin >> t;
    while (t--) solve();
    return 0;
}