// main.cpp -- single-file bundle: utility macros, a stdin reader, Modint,
// SubsetConvolution, and the solver itself.
//
// NOTE(review): this text was rebuilt from a copy in which every `<...>` span
// (include targets, template parameter lists, template arguments) had been
// stripped and all line breaks collapsed.  Restored tokens follow the names
// and usages that survived; places that remain a guess carry a NOTE(review).
// The bundler's `#line` directives are replaced by section comments because
// their line numbers no longer match this layout.

// NOTE(review): the original include target was lost; these are the standard
// headers the code below actually uses.
#include <algorithm>
#include <array>
#include <cstddef>
#include <functional>
#include <initializer_list>
#include <iostream>
#include <iterator>
#include <numeric>
#include <queue>
#include <string>
#include <tuple>
#include <utility>
#include <vector>
using namespace std;

#ifdef LOCAL
// NOTE(review): header name inferred from the debug_print:: namespace below.
#include <debug_print.hpp>
#define debug(...) debug_print::multi_print(#__VA_ARGS__, __VA_ARGS__)
#else
#define debug(...) (static_cast<void>(0))
#endif

// #pragma GCC target("avx,avx2")
// #pragma GCC optimize("O3")
// #pragma GCC optimize("unroll-loops")

// ---- type aliases --------------------------------------------------------
// NOTE(review): element types were stripped; restored from the alias names.
using ll = long long;
using ull = unsigned long long;
using ld = long double;
using pll = pair<ll, ll>;
using pii = pair<int, int>;
using vi = vector<int>;
using vvi = vector<vi>;
using vvvi = vector<vvi>;
using vl = vector<ll>;
using vvl = vector<vl>;
using vvvl = vector<vvl>;
using vul = vector<ull>;
using vpii = vector<pii>;
using vvpii = vector<vpii>;
using vpll = vector<pll>;
using vs = vector<string>;
// Priority queue ordered by greater<T>, i.e. the smallest element is on top.
template <class T>
using pq = priority_queue<T, vector<T>, greater<T>>;

// ---- loop / range macros -------------------------------------------------
// overloadN selects the macro name that follows the supplied arguments, which
// is how rep/rrep/all dispatch on their argument count.
#define overload4(_1, _2, _3, _4, name, ...) name
#define overload3(a, b, c, name, ...) name
// rep(n) | rep(i, n) | rep(i, a, b) | rep(i, a, b, step): ascending loops.
#define rep1(n) for (ll UNUSED_NUMBER = 0; UNUSED_NUMBER < (n); ++UNUSED_NUMBER)
#define rep2(i, n) for (ll i = 0; i < (n); ++i)
#define rep3(i, a, b) for (ll i = (a); i < (b); ++i)
#define rep4(i, a, b, c) for (ll i = (a); i < (b); i += (c))
#define rep(...) overload4(__VA_ARGS__, rep4, rep3, rep2, rep1)(__VA_ARGS__)
// rrep(...): the descending counterparts.  rrep1 exposes its counter as `i`.
#define rrep1(n) for (ll i = (n) - 1; i >= 0; i--)
#define rrep2(i, n) for (ll i = (n) - 1; i >= 0; i--)
#define rrep3(i, a, b) for (ll i = (b) - 1; i >= (a); i--)
// The step `c` is parenthesised everywhere so an expression argument keeps
// its own precedence.
#define rrep4(i, a, b, c)                                                    \
  for (ll i = (a) + (((b) - (a) - 1) / (c) -                                 \
                     (((b) - (a) - 1) % (c) && (((b) - (a) - 1) ^ (c)) < 0)) * \
                        (c);                                                 \
       i >= (a); i -= (c))
#define rrep(...) overload4(__VA_ARGS__, rrep4, rrep3, rrep2, rrep1)(__VA_ARGS__)
// all(x) | all(x, a) | all(x, a, b): iterator pairs over a whole container, a
// prefix of length a, or the index range [a, b).
#define all1(i) begin(i), end(i)
#define all2(i, a) begin(i), begin(i) + (a)
#define all3(i, a, b) begin(i) + (a), begin(i) + (b)
#define all(...) overload3(__VA_ARGS__, all3, all2, all1)(__VA_ARGS__)
// sum(...): accumulate over all(...) starting from 0LL.
#define sum(...) accumulate(all(__VA_ARGS__), 0LL)

// ---- small helpers -------------------------------------------------------
// Assigns b to a when b is smaller; returns whether a changed.
template <class T>
bool chmin(T &a, const T &b) {
  if (a > b) {
    a = b;
    return 1;
  } else
    return 0;
}
// Assigns b to a when b is larger; returns whether a changed.
template <class T>
bool chmax(T &a, const T &b) {
  if (a < b) {
    a = b;
    return 1;
  } else
    return 0;
}
// Smallest / largest element of a container (dereferences the iterator, so
// the container must not be empty).
template <class T>
auto min(const T &a) {
  return *min_element(all(a));
}
template <class T>
auto max(const T &a) {
  return *max_element(all(a));
}

// Reads every argument from stdin; defined after namespace IO.
template <class... Ts>
void in(Ts &...t);

// Declare-and-read macros: declare the listed variables, then read them.
#define INT(...) \
  int __VA_ARGS__; \
  in(__VA_ARGS__)
#define LL(...) \
  ll __VA_ARGS__; \
  in(__VA_ARGS__)
#define STR(...) \
  string __VA_ARGS__; \
  in(__VA_ARGS__)
#define CHR(...) \
  char __VA_ARGS__; \
  in(__VA_ARGS__)
#define DBL(...) \
  double __VA_ARGS__; \
  in(__VA_ARGS__)
#define LD(...) \
  ld __VA_ARGS__; \
  in(__VA_ARGS__)
#define VEC(type, name, size) \
  vector<type> name(size); \
  in(name)
#define VV(type, name, h, w) \
  vector<vector<type>> name(h, vector<type>(w)); \
  in(name)

// a^b by binary exponentiation, with no overflow checking.
ll intpow(ll a, ll b) {
  ll ans = 1;
  while (b) {
    if (b & 1) ans *= a;
    a *= a;
    b /= 2;
  }
  return ans;
}
// a^b mod p by binary exponentiation; a is first reduced into [0, p).
ll modpow(ll a, ll b, ll p) {
  ll ans = 1;
  a %= p;
  if (a < 0) a += p;
  while (b) {
    if (b & 1) (ans *= a) %= p;
    (a *= a) %= p;
    b /= 2;
  }
  return ans;
}
// True when low <= val < high (half-open interval).
bool is_clamp(ll val, ll low, ll high) { return low <= val && val < high; }
void Yes() {
  cout << "Yes\n";
  return;
}
void No() {
  cout << "No\n";
  return;
}
void YES() {
  cout << "YES\n";
  return;
}
void NO() {
  cout << "NO\n";
  return;
}
// Integer division rounded toward negative infinity: the truncated quotient
// is lowered by one when there is a remainder and the operand signs differ.
template <class T>
T floor(T a, T b) {
  return a / b - (a % b && (a ^ b) < 0);
}
// Defined as floor(x + y - 1, y).
template <class T>
T ceil(T x, T y) {
  return floor(x + y - 1, y);
}
// Remainder paired with floor(): x - y * floor(x, y).
template <class T>
T bmod(T x, T y) {
  return x - y * floor(x, y);
}
// Returns {floor(x, y), x - floor(x, y) * y}.
template <class T>
pair<T, T> divmod(T x, T y) {
  T q = floor(x, y);
  return {q, x - q * y};
}

// ---- input ---------------------------------------------------------------
namespace IO {
#define VOID(a) decltype(void(a))
// Static object whose constructor unties cin from cout, disables stdio
// synchronisation, and sets cout to fixed notation with precision 15.
struct setting {
  setting() {
    cin.tie(nullptr);
    ios::sync_with_stdio(false);
    fixed(cout);
    cout.precision(15);
  }
} setting;
// Priority tag: P<N> derives from P<N-1>, so overload resolution prefers the
// overload taking the highest viable tag.
template <int N>
struct P : P<N - 1> {};
template <>
struct P<0> {};
// Entry point: dispatch on the best matching overload below.
template <class T>
void i(T &t) {
  i(t, P<3>{});
}
// vector<bool> elements are proxy objects: read an int and assign it.
void i(vector<bool>::reference t, P<3>) {
  int a;
  i(a);
  t = a;
}
// Anything that supports `cin >> t`.
template <class T>
auto i(T &t, P<2>) -> VOID(cin >> t) {
  cin >> t;
}
// Ranges: read each element in order.
template <class T>
auto i(T &t, P<1>) -> VOID(begin(t)) {
  for (auto &&x : t) i(x);
}
// Tuple-likes: read each member in index order.
template <class T, size_t... idx>
void ituple(T &t, index_sequence<idx...>) {
  in(get<idx>(t)...);
}
template <class T>
auto i(T &t, P<0>) -> VOID(tuple_size<T>{}) {
  ituple(t, make_index_sequence<tuple_size<T>::value>{});
}
#undef VOID
}  // namespace IO

// Expands the pack inside a braced list so the reads happen left to right.
#define unpack(a) (void)initializer_list<int>{(a, 0)...}
template <class... Ts>
void in(Ts &...t) {
  unpack(IO ::i(t));
}
#undef unpack

constexpr long double PI = 3.141592653589793238462643383279L;

// Wraps a callable so it can recurse: operator() passes *this as the first
// argument, followed by the forwarded call arguments.
template <typename F>
struct REC {
  F f;
  REC(F &&f_) : f(forward<F>(f_)) {}
  template <typename... Args>
  auto operator()(Args &&...args) const {
    return f(*this, forward<Args>(args)...);
  }
};

constexpr int mod = 998244353;
// constexpr int mod = 1000000007;

// ---- bundled from library/modint/Modint.hpp ------------------------------
// Integer modulo the compile-time constant `mod`; x is kept in [0, mod).
template <int mod>
struct Modint {
  int x;
  Modint() : x(0) {}
  // Reduces y into [0, mod).  Written without negating y, so LLONG_MIN is
  // handled without signed overflow.
  Modint(long long y) : x(static_cast<int>((y % mod + mod) % mod)) {}
  Modint &operator+=(const Modint &p) {
    if ((x += p.x) >= mod) x -= mod;
    return *this;
  }
  Modint &operator-=(const Modint &p) {
    // Adds mod - p.x rather than subtracting, so x never goes negative.
    if ((x += mod - p.x) >= mod) x -= mod;
    return *this;
  }
  Modint &operator*=(const Modint &p) {
    x = (int)(1LL * x * p.x % mod);
    return *this;
  }
  Modint &operator/=(const Modint &p) {
    *this *= p.inverse();
    return *this;
  }
  Modint operator-() const { return Modint(-x); }
  Modint operator+(const Modint &p) const { return Modint(*this) += p; }
  Modint operator-(const Modint &p) const { return Modint(*this) -= p; }
  Modint operator*(const Modint &p) const { return Modint(*this) *= p; }
  Modint operator/(const Modint &p) const { return Modint(*this) /= p; }
  Modint &operator++() {
    if (x == mod - 1)
      x = 0;
    else
      x++;
    return *this;
  }
  Modint &operator--() {
    if (x == 0)
      x = mod - 1;
    else
      x--;
    return *this;
  }
  bool operator==(const Modint &p) const { return x == p.x; }
  bool operator!=(const Modint &p) const { return x != p.x; }
  // Extended Euclid on (x, mod); the coefficient of x is the result.
  Modint inverse() const {
    int a = x, b = mod, u = 1, v = 0, t;
    while (b > 0) {
      t = a / b;
      swap(a -= t * b, b);
      swap(u -= t * v, v);
    }
    return Modint(u);
  }
  // this^n by binary exponentiation; n <= 0 yields 1.
  Modint pow(long long n) const {
    Modint ret(1), mul(x);
    while (n > 0) {
      if (n & 1) ret *= mul;
      mul *= mul;
      n >>= 1;
    }
    return ret;
  }
  friend ostream &operator<<(ostream &os, const Modint &p) { return os << p.x; }
  friend istream &operator>>(istream &is, Modint &a) {
    long long t;
    is >> t;
    a = Modint(t);
    return (is);
  }
  int get() const { return x; }
  static constexpr int get_mod() { return mod; }
};

// ---- main.cpp ------------------------------------------------------------
using mint = Modint<mod>;
using vm = vector<mint>;
using vvm = vector<vm>;
using vvvm = vector<vvm>;

// ---- bundled from set-function/subset-convolution.hpp --------------------
/**
 * @brief Subset Convolution
 * @docs docs/set-function/subset-convolution.md
 *
 * Every set function is lifted to one array of _s + 1 coefficients per mask,
 * indexed by popcount ("rank"); zeta and mobius transform those arrays over
 * the subset lattice and prod multiplies them pointwise.
 * Input vectors are indexed by bitmask and must have a power-of-two length of
 * at most 2^_s (pc only covers masks below 1 << _s).
 */
template <typename mint, int _s>
struct SubsetConvolution {
  using fps = array<mint, _s + 1>;
  static constexpr int s = _s;
  // pc[i] = number of set bits in i, for i in [0, 2^s).
  vector<int> pc;

  SubsetConvolution() : pc(1 << s) {
    // i - (i & -i) clears the lowest set bit of i.
    for (int i = 1; i < (1 << s); i++) pc[i] = pc[i - (i & -i)] + 1;
  }

  // l[i] += r[i] for ranks below d.
  void add(fps &l, const fps &r, int d) {
    for (int i = 0; i < d; ++i) l[i] += r[i];
  }

  // l[i] -= r[i] for ranks d..s.
  void sub(fps &l, const fps &r, int d) {
    for (int i = d; i <= s; ++i) l[i] -= r[i];
  }

  // In place: for each bit, adds the entry without that bit into the entry
  // with it, restricted to ranks below the popcount of the receiving mask.
  void zeta(vector<fps> &a) {
    int n = a.size();
    for (int w = 1; w < n; w *= 2) {
      for (int k = 0; k < n; k += w * 2) {
        for (int i = 0; i < w; ++i) {
          add(a[k + w + i], a[k + i], pc[k + w + i]);
        }
      }
    }
  }

  // In place: same traversal with bits taken from high to low, subtracting on
  // ranks at or above the popcount of the receiving mask.
  void mobius(vector<fps> &a) {
    int n = a.size();
    for (int w = n >> 1; w; w >>= 1) {
      for (int k = 0; k < n; k += w * 2) {
        for (int i = 0; i < w; ++i) {
          sub(a[k + w + i], a[k + i], pc[k + w + i]);
        }
      }
    }
  }

  // Places a[i] at rank pc[i] of an otherwise zero coefficient array.
  vector<fps> lift(const vector<mint> &a) {
    vector<fps> A(a.size());
    for (int i = 0; i < (int)a.size(); i++) {
      fill(begin(A[i]), end(A[i]), mint());
      A[i][pc[i]] = a[i];
    }
    return A;
  }

  // Reads back the rank-pc[i] coefficient of every mask.
  vector<mint> unlift(const vector<fps> &A) {
    vector<mint> a(A.size());
    for (int i = 0; i < (int)A.size(); i++) a[i] = A[i][pc[i]];
    return a;
  }

  // A[i] <- A[i] * B[i] as polynomials truncated to degree d, where
  // d = __builtin_ctz(A.size()); A must therefore be non-empty.
  void prod(vector<fps> &A, const vector<fps> &B) {
    int n = A.size(), d = __builtin_ctz(n);
    for (int i = 0; i < n; i++) {
      fps c{};
      for (int j = 0; j <= d; j++) {
        for (int k = 0; k <= d - j; k++) {
          c[j + k] += A[i][j] * B[i][k];
        }
      }
      A[i].swap(c);
    }
  }

  // lift -> zeta -> pointwise product -> mobius -> unlift.
  vector<mint> multiply(const vector<mint> &a, const vector<mint> &b) {
    vector<fps> A = lift(a), B = lift(b);
    zeta(A), zeta(B);
    prod(A, B);
    mobius(A);
    return unlift(A);
  }
};

// ---- main.cpp ------------------------------------------------------------
// Reads n, m and an n x m int matrix a, then prints one value modulo `mod`.
//
// Rows are grouped by the value in their first column: `v` collects every row
// j with a[j][0] == a[i][0], and `used` stops a group being processed twice.
// Each group adds to `ans` through one of two strategies chosen by n:
//   n <= 20 : DP over subsets of the rows in the group.
//   n  > 20 : DP over subsets of the m columns via subset convolution.
void solve() {
  INT(n, m);
  VV(int, a, n, m);
  mint ans;
  if (n <= 20) {
    vi used(n);
    rep(i, n) {
      if (used[i]) continue;
      vi v;
      rep(j, n) {
        if (a[i][0] == a[j][0]) {
          used[j] = 1;
          v.emplace_back(j);
        }
      }
      // dp[mask]: bit l refers to row v[l]; only the full mask starts at 1.
      vm dp(1 << v.size());
      dp.back() = 1;
      rep(j, m) {
        vm ndp(1 << v.size());
        rep(k, 1 << v.size()) {
          if (dp[k] == 0) continue;
          rep(l, v.size()) {
            if (k >> l & 1) {
              // Keep the mask when this is the last step or row v[l] holds
              // the group's value in column j + 1; otherwise drop bit l.
              if (j + 1 == m || a[i][0] == a[v[l]][j + 1]) ndp[k] += dp[k];
              else ndp[k ^ (1 << l)] += dp[k];
            }
          }
        }
        dp = move(ndp);
      }
      rep(j, 1 << v.size()) ans += dp[j];
    }
    cout << ans << '\n';
  } else {
    vi used(n);
    // NOTE(review): the size argument was lost with the other template
    // arguments.  Any value >= m produces the same results (ranks above
    // log2 of the input length stay zero), so 20 is a stand-in to confirm.
    SubsetConvolution<mint, 20> sc;
    rep(i, n) {
      if (used[i]) continue;
      vi v;
      rep(j, n) {
        if (a[i][0] == a[j][0]) {
          used[j] = 1;
          v.emplace_back(j);
        }
      }
      // dp[mask] over column subsets; starts as the indicator of the empty
      // set, the identity for subset convolution.
      vm dp(1 << m);
      dp[0] = 1;
      rep(j, v.size()) {
        // dp2[k] is 1 when column set k passes the scan below for row v[j].
        vm dp2(1 << m);
        rep(k, 1 << m) {
          int ok = 1;
          // x starts at the row's first value; after each chosen column l it
          // becomes the row's value in column l + 1 (when that exists).
          int x = a[v[j]][0];
          rep(l, m) {
            if (k >> l & 1) {
              if (x != a[v[j]][0]) {
                ok = 0;
                break;
              }
              if (l + 1 < m) x = a[v[j]][l + 1];
            }
          }
          dp2[k] = ok;
        }
        dp = sc.multiply(dp, dp2);
      }
      // Coefficient of the full column set.
      ans += dp.back();
    }
    cout << ans << '\n';
  }
}

int main() {
  // INT(TT);
  int TT = 1;
  rep(i, TT) solve();
}