// Only the standard headers this translation unit actually uses.
#include <cstddef>
#include <iostream>
#include <limits>
#include <vector>

static const int MOD = 1000000007;
using ll = long long;
using namespace std;

/// Large sentinel for type T: 15/32 of the maximum plus a small offset, so
/// that (for int / long long) adding two such values still does not overflow.
template <class T>
constexpr T INF = ::numeric_limits<T>::max() / 32 * 15 + 208;

/// Returns a vector holding `size` copies of `init`.
template <class T, class U>
vector<T> make_v(U size, const T& init) {
    return vector<T>(static_cast<size_t>(size), init);
}

/// Returns a nested vector: the first argument is the outermost dimension,
/// the remaining arguments are forwarded recursively (the last one being the
/// fill value handled by the two-argument overload).
template <class... Ts, class U>
auto make_v(U size, Ts... rest) {
    return vector<decltype(make_v(rest...))>(static_cast<size_t>(size), make_v(rest...));
}

/// Assigns the smaller of `a` and `b` to `a`.
template <class T>
void chmin(T& a, const T& b) {
    a = (a < b ? a : b);
}

/// Assigns the larger of `a` and `b` to `a`.
template <class T>
void chmax(T& a, const T& b) {
    a = (a > b ? a : b);
}

/// Distributes the numbers 1..k*m over k groups of m numbers each.
///
/// When m is odd, the first 3*k numbers are placed so that every group
/// receives three numbers summing to 3*(3*k+1)/2; this expression is only an
/// exact integer for odd k, which the caller's divisibility check implies.
/// The remaining (even) number of rounds is dealt out in alternating
/// direction, so each pair of rounds adds the same amount to every group.
///
/// @param k number of groups (caller guarantees k >= 2)
/// @param m numbers per group (caller guarantees m >= 2)
/// @return k vectors of m values each
static vector<vector<ll>> build_groups(ll k, ll m) {
    vector<vector<ll>> groups(static_cast<size_t>(k));
    for (auto& group : groups) {
        group.reserve(static_cast<size_t>(m));
    }

    ll next = 1;
    if (m % 2 != 0) {
        // First value of each group: 1..k in order.
        for (ll i = 0; i < k; ++i) {
            groups[i].push_back(next++);
        }
        // Second value: k+1..2k, rotated by (k+1)/2 positions.
        const ll shift = (k + 1) / 2;
        for (ll i = 0; i < k; ++i) {
            groups[(i + shift) % k].push_back(next++);
        }
        // Third value: whatever completes the common three-element sum.
        const ll triple_sum = 3 * (3 * k + 1) / 2;
        for (ll i = 0; i < k; ++i) {
            groups[i].push_back(triple_sum - groups[i][0] - groups[i][1]);
        }
        next += k;  // the third round consumed 2k+1..3k
        m -= 3;
    }

    // Remaining rounds: descending group order on even rounds, ascending on odd.
    for (ll round = 0; round < m; ++round) {
        if (round & 1) {
            for (ll j = 0; j < k; ++j) {
                groups[j].push_back(next++);
            }
        } else {
            for (ll j = k - 1; j >= 0; --j) {
                groups[j].push_back(next++);
            }
        }
    }
    return groups;
}

/// Reads n and k, then prints "Yes" followed by k lines (one group per line,
/// space separated) or "No" when the checks below rule a split out.
/// NOTE(review): the construction assumes k divides n and k <= n; neither is
/// verified here — confirm against the problem constraints.
int main() {
    ios::sync_with_stdio(false);
    cin.tie(nullptr);

    ll n = 0;
    ll k = 0;
    if (!(cin >> n >> k) || k <= 0) {
        return 1;  // unreadable input or a divisor that would trap below
    }

    if (n == 1) {
        cout << "Yes\n" << 1 << "\n";
        return 0;
    }
    if (k == 1) {
        // A single group simply holds everything.
        cout << "Yes\n";
        for (ll i = 0; i < n; ++i) {
            if (i) cout << ' ';
            cout << i + 1;
        }
        cout << '\n';
        return 0;
    }
    if (n * (n + 1) / 2 % k != 0) {
        // Total sum is not divisible by the number of groups.
        cout << "No\n";
        return 0;
    }

    const ll m = n / k;
    if (m == 1) {
        // One number per group: all sums would be distinct.
        cout << "No\n";
        return 0;
    }

    cout << "Yes\n";
    const vector<vector<ll>> groups = build_groups(k, m);
    for (const auto& group : groups) {
        bool first = true;
        for (const ll value : group) {
            if (!first) cout << ' ';
            cout << value;
            first = false;
        }
        cout << '\n';
    }
    return 0;
}