#include <algorithm>
#include <cassert>
#include <functional>
#include <iomanip>
#include <iostream>
#include <numeric>
#include <queue>
#include <utility>
#include <vector>
using namespace std;

// Loop shorthands: rep/rep2 count upwards, per/per2 count downwards.
// The range of rep2/per2 is the half-open interval [l, r).
#define rep(i, n) for (int i = 0; i < (n); i++)
#define per(i, n) for (int i = (n)-1; i >= 0; i--)
#define rep2(i, l, r) for (int i = (l); i < (r); i++)
#define per2(i, l, r) for (int i = (r)-1; i >= (l); i--)
#define each(e, v) for (auto &e : v)
#define MM << " " <<
#define pb push_back
#define eb emplace_back
#define all(x) begin(x), end(x)
#define rall(x) rbegin(x), rend(x)
#define sz(x) (int)x.size()

using ll = long long;
using pii = pair<int, int>;
using pil = pair<int, ll>;
using pli = pair<ll, int>;
using pll = pair<ll, ll>;

template <typename T>
using minheap = priority_queue<T, vector<T>, greater<T>>;

template <typename T>
using maxheap = priority_queue<T>;

// Sets x = y if y is larger; returns whether x was updated.
template <typename T>
bool chmax(T &x, const T &y) {
    return (x < y) ? (x = y, true) : false;
}

// Sets x = y if y is smaller; returns whether x was updated.
template <typename T>
bool chmin(T &x, const T &y) {
    return (x > y) ? (x = y, true) : false;
}

// Returns bit i of x (0 or 1).
template <typename T>
int flg(T x, int i) {
    return (x >> i) & 1;
}

// Prints v on one line, space separated, adding x to every element.
// An empty vector still produces a newline.
template <typename T>
void print(const vector<T> &v, T x = 0) {
    int n = v.size();
    for (int i = 0; i < n; i++) cout << v[i] + x << (i == n - 1 ? '\n' : ' ');
    if (v.empty()) cout << '\n';
}

// Prints v one element per line, adding x to every element.
template <typename T>
void printn(const vector<T> &v, T x = 0) {
    int n = v.size();
    for (int i = 0; i < n; i++) cout << v[i] + x << '\n';
}

// Index of the first element of v that is >= x (std::lower_bound as an index).
template <typename T>
int lb(const vector<T> &v, T x) {
    return lower_bound(begin(v), end(v), x) - begin(v);
}

// Index of the first element of v that is > x (std::upper_bound as an index).
template <typename T>
int ub(const vector<T> &v, T x) {
    return upper_bound(begin(v), end(v), x) - begin(v);
}

// Sorts v and removes duplicate values.
template <typename T>
void rearrange(vector<T> &v) {
    sort(begin(v), end(v));
    v.erase(unique(begin(v), end(v)), end(v));
}

// Returns the indices 0..n-1 ordered by the values of v
// (ascending by default, descending when `greater` is true).
template <typename T>
vector<int> id_sort(const vector<T> &v, bool greater = false) {
    int n = v.size();
    vector<int> ret(n);
    iota(begin(ret), end(ret), 0);
    sort(begin(ret), end(ret), [&](int i, int j) { return greater ? v[i] > v[j] : v[i] < v[j]; });
    return ret;
}

// Component-wise sum of two pairs.
template <typename S, typename T>
pair<S, T> operator+(const pair<S, T> &p, const pair<S, T> &q) {
    return make_pair(p.first + q.first, p.second + q.second);
}

// Component-wise difference of two pairs.
template <typename S, typename T>
pair<S, T> operator-(const pair<S, T> &p, const pair<S, T> &q) {
    return make_pair(p.first - q.first, p.second - q.second);
}

// Reads a pair as two whitespace-separated values.
template <typename S, typename T>
istream &operator>>(istream &is, pair<S, T> &p) {
    S a;
    T b;
    is >> a >> b;
    p = make_pair(a, b);
    return is;
}

// Writes a pair as "first second".
template <typename S, typename T>
ostream &operator<<(ostream &os, const pair<S, T> &p) {
    return os << p.first << ' ' << p.second;
}

// Configures the standard streams once, before main runs:
// unsynchronised stdio, untied cin, fixed notation with 15 decimals.
struct io_setup {
    io_setup() {
        ios_base::sync_with_stdio(false);
        cin.tie(NULL);
        cout << fixed << setprecision(15);
    }
} io_setup;

const int inf = (1 << 30) - 1;
const ll INF = (1LL << 60) - 1;
// const int MOD = 1000000007;
const int MOD = 998244353;

// Binary indexed tree (Fenwick tree) over n values of type T.
// The public interface is 0-indexed; `bit` itself is stored 1-indexed.
template <typename T>
struct Binary_Indexed_Tree {
    vector<T> bit;
    const int n;

    // Builds the tree from the initial values v.
    Binary_Indexed_Tree(const vector<T> &v) : n((int)v.size()) {
        bit.resize(n + 1);
        copy(begin(v), end(v), begin(bit) + 1);
        // Fold each half-width block into the node that covers it.
        for (int a = 2; a <= n; a <<= 1) {
            for (int b = a; b <= n; b += a) bit[b] += bit[b - a / 2];
        }
    }

    // Builds a tree of n elements, all equal to x.
    Binary_Indexed_Tree(int n, const T &x) : Binary_Indexed_Tree(vector<T>(n, x)) {}

    // Adds x to element i.
    void add(int i, const T &x) {
        for (i++; i <= n; i += (i & -i)) bit[i] += x;
    }

    // Sets element i to x.
    void change(int i, const T &x) { add(i, x - query(i, i + 1)); }

    // Sum of the first i elements, i.e. of the range [0, i); i is clamped to n.
    T sum(int i) const {
        i = min(i, n);
        T ret = 0;
        for (; i > 0; i -= (i & -i)) ret += bit[i];
        return ret;
    }

    // Sum of the half-open range [l, r); 0 when the range is empty.
    T query(int l, int r) const {
        if (l >= r) return 0;
        return sum(r) - sum(l);
    }

    // Current value of element i.
    T operator[](int i) const { return query(i, i + 1); }

    // Smallest r such that v[0]+...+v[r] >= x (n if there is none).
    int lower_bound(T x) const {
        if (n == 0) return 0;  // __builtin_clz(0) is undefined
        int ret = 0;
        for (int k = 31 - __builtin_clz(n); k >= 0; k--) {
            if (ret + (1 << k) <= n && bit[ret + (1 << k)] < x) x -= bit[ret += (1 << k)];
        }
        return ret;
    }

    // Smallest r such that v[0]+...+v[r] > x (n if there is none).
    int upper_bound(T x) const {
        if (n == 0) return 0;  // __builtin_clz(0) is undefined
        int ret = 0;
        for (int k = 31 - __builtin_clz(n); k >= 0; k--) {
            if (ret + (1 << k) <= n && bit[ret + (1 << k)] <= x) x -= bit[ret += (1 << k)];
        }
        return ret;
    }
};

// Number of inversions of a: pairs i < j with a[i] > a[j].
template <typename T>
long long inversion_number(const vector<T> &a) {
    int n = a.size();
    // Indices ordered by (value, index); equal values keep their original order,
    // so they never count as an inversion.
    vector<int> v(n);
    iota(begin(v), end(v), 0);
    sort(begin(v), end(v), [&](int i, int j) {
        if (a[i] != a[j]) return a[i] < a[j];
        return i < j;
    });
    Binary_Indexed_Tree<int> bit(n, 0);
    long long ret = 0;
    for (int i = 0; i < n; i++) {
        // Already inserted positions to the right of v[i] hold smaller values.
        ret += bit.query(v[i] + 1, n);
        bit.add(v[i], 1);
    }
    return ret;
}

// Minimum number of adjacent swaps (bubble-sort steps) needed to turn a into b.
// Returns -1 when a and b do not contain the same multiset of values.
template <typename T>
long long inversion_number(const vector<T> &a, const vector<T> &b) {
    int n = a.size();
    assert((int)b.size() == n);
    vector<int> u(n), v(n);
    iota(begin(u), end(u), 0);
    sort(begin(u), end(u), [&](int i, int j) {
        if (a[i] != a[j]) return a[i] < a[j];
        return i < j;
    });
    iota(begin(v), end(v), 0);
    sort(begin(v), end(v), [&](int i, int j) {
        if (b[i] != b[j]) return b[i] < b[j];
        return i < j;
    });
    // w[p] = position in a of the element that ends up at position p of b
    // (equal values are matched in their original relative order).
    vector<int> w(n);
    for (int i = 0; i < n; i++) {
        if (a[u[i]] != b[v[i]]) return -1;
        w[v[i]] = u[i];
    }
    Binary_Indexed_Tree<int> bit(n, 0);
    long long ret = 0;
    for (int i = 0; i < n; i++) {
        ret += bit.query(w[i] + 1, n);
        bit.add(w[i], 1);
    }
    return ret;
}

// Debug checker for a square grid a: computes the inversion number of every row
// and of every column, then returns the inversion number of the row results
// plus the inversion number of the column results.
// Only referenced from the commented-out checks in main.
int judge(const vector<vector<int>> &a) {
    int N = sz(a);
    vector<int> x(N), y(N);
    rep(i, N) x[i] = inversion_number(a[i]);
    rep(j, N) {
        vector<int> v(N);
        rep(i, N) v[i] = a[i][j];
        y[j] = inversion_number(v);
    }
    return inversion_number(x) + inversion_number(y);
}

// Reads N and K. Prints "No" when K > N * (N - 1); otherwise prints "Yes"
// followed by an N x N grid with entries in {0, 1, 2}.
// NOTE(review): the commented-out checks suggest the intended invariant is
// judge(a) == K -- confirm against the problem statement.
int main() {
    int N, K;
    cin >> N >> K;

    if (K > N * (N - 1)) {
        cout << "No\n";
        return 0;
    }

    cout << "Yes\n";

    // K == 1 and K == 3 use hand-built grids instead of the general construction.
    if (K == 1) {
        vector<vector<int>> a(N, vector<int>(N, 0));
        a[N - 2][N - 2] = 1;
        rep(i, N) a[N - 1][i] = 1;
        rep(i, N) print(a[i]);
        // if (judge(a) != K) cout << "-1\n";
        return 0;
    }

    if (K == 3) {
        vector<vector<int>> a(N, vector<int>(N, 0));
        rep(i, N) a[N - 2][i] = 1;
        rep(i, N) a[N - 1][i] = 2;
        a[N - 3][N - 3] = 1;
        a[N - 2][N - 2] = 2;
        rep(i, N) print(a[i]);
        // if (judge(a) != K) cout << "-1\n";
        return 0;
    }

    // General case: start from the identity permutation and apply K / 2
    // adjacent swaps, bubbling the last element towards the front each round.
    int L = K / 2;
    vector<int> P(N);
    iota(all(P), 0);

    rep(i, N) {
        per2(j, i, N - 1) {
            if (L > 0) {
                swap(P[j], P[j + 1]);
                L--;
            }
        }
    }
    // print(P);

    // Odd K: swap the right-most adjacent ascending pair of P.
    if (K & 1) {
        per(i, N - 1) {
            if (P[i] < P[i + 1]) {
                swap(P[i], P[i + 1]);
                break;
            }
        }
    }

    // Special case: the reversed permutation with its first two entries swapped.
    if (K == N * (N - 1) - 3) {
        rep(i, N) P[i] = N - 1 - i;
        swap(P[0], P[1]);
    }
    // print(P);

    // Grid of ones with a zero at (i, P[i]) in every row.
    vector<vector<int>> a(N, vector<int>(N, 1));
    rep(i, N) a[i][P[i]] = 0;

    // Odd K: place a single 2 in the row whose zero is in the last column,
    // at the column of the zero of row N - 2.
    if (K & 1) {
        int x = -1;
        rep(i, N) {
            if (P[i] == N - 1) x = i;
        }
        int y = P[N - 2];
        a[x][y] = 2;
    }

    rep(i, N) print(a[i]);
    // if (judge(a) != K) cout << "-1\n";
}