結果
| 問題 | No.3567 Modulo Grid |
| コンテスト | |
| ユーザー |
Rubikun
|
| 提出日時 | 2026-06-05 23:11:50 |
| 言語 | C++17 (gcc 15.2.0 + boost 1.89.0) |
| 結果 |
AC
|
| 実行時間 | 65 ms / 2,000 ms |
| コード長 | 9,246 bytes |
| 記録 | |
| コンパイル時間 | 2,116 ms |
| コンパイル使用メモリ | 227,356 KB |
| 実行使用メモリ | 32,892 KB |
| 最終ジャッジ日時 | 2026-06-05 23:11:55 |
| 合計ジャッジ時間 | 4,351 ms |
|
ジャッジサーバーID (参考情報) |
judge3_1 / judge1_0 |
| 純コード判定待ち |
(要ログイン)
| ファイルパターン | 結果 |
|---|---|
| sample | AC * 2 |
| other | AC * 25 |
コンパイルメッセージ
main.cpp:44:9: warning: '#pragma once' in main file [-Wpragma-once-outside-header]
44 | #pragma once
| ^~~~
main.cpp:97:9: warning: '#pragma once' in main file [-Wpragma-once-outside-header]
97 | #pragma once
| ^~~~
main.cpp:109:9: warning: '#pragma once' in main file [-Wpragma-once-outside-header]
109 | #pragma once
| ^~~~
ソースコード
#include <bits/stdc++.h>
using namespace std;
typedef long long ll;
template<class T>bool chmax(T &a, const T &b) { if (a<b) { a=b; return true; } return false; }
template<class T>bool chmin(T &a, const T &b) { if (b<a) { a=b; return true; } return false; }
#define vi vector<int>
#define vl vector<ll>
#define vii vector<pair<int,int>>
#define vll vector<pair<ll,ll>>
#define vvi vector<vector<int>>
#define vvl vector<vector<ll>>
#define vvii vector<vector<pair<int,int>>>
#define vvll vector<vector<pair<ll,ll>>>
#define vst vector<string>
#define pii pair<int,int>
#define pll pair<ll,ll>
#define pb push_back
#define all(x) (x).begin(),(x).end()
#define mkunique(x) sort(all(x));(x).erase(unique(all(x)),(x).end())
#define fi first
#define se second
#define mp make_pair
#define si(x) int(x.size())
const int mod=998244353,MAX=300005,INF=15<<26;
//高速素因数分解
/**
* Author: chilli, Ramchandra Apte, Noam527, Simon Lindholm
* Date: 2019-04-24
* License: CC0
* Source: https://github.com/RamchandraApte/OmniTemplate/blob/master/modulo.hpp…
* Description: Calculate $a\cdot b\bmod c$ (or $a^b \bmod c$) for $0 \le a, b \le c \le 7.2\cdot 10^{18}$.
* Time: O(1) for \texttt{modmul}, O(\log b) for \texttt{modpow}
* Status: stress-tested, proven correct
* Details:
* This runs ~2x faster than the naive (__int128_t)a * b % M.
* A proof of correctness is in doc/modmul-proof.tex. An earlier version of the proof,
* from when the code used a * b / (long double)M, is in doc/modmul-proof.md.
* The proof assumes that long doubles are implemented as x87 80-bit floats; if they
* are 64-bit, as on e.g. MSVC, the implementation is only valid for
* $0 \le a, b \le c < 2^{52} \approx 4.5 \cdot 10^{15}$.
*/
#pragma once
typedef unsigned long long ull;
ull modmul(ull a, ull b, ull M) {
ll ret = a * b - M * ull(1.L / M * a * b);
return ret + M * (ret < 0) - M * (ret >= (ll)M);
}
ull modpow(ull b, ull e, ull mod) {
ull ans = 1;
for (; e; b = modmul(b, b, mod), e /= 2)
if (e & 1) ans = modmul(ans, b, mod);
return ans;
}
/**
* Author: chilli, SJTU, pajenegod
* Date: 2020-03-04
* License: CC0
* Source: own
* Description: Pollard-rho randomized factorization algorithm. Returns prime
* factors of a number, in arbitrary order (e.g. 2299 -> \{11, 19, 11\}).
* Time: $O(n^{1/4})$, less for numbers with small factors.
* Status: stress-tested
*
* Details: This implementation uses the improvement described here
* (https://en.wikipedia.org/wiki/Pollard%27s_rho_algorithm#Variants…), where
* one can accumulate gcd calls by some factor (40 chosen here through
* exhaustive testing). This improves performance by approximately 6-10x
* depending on the inputs and speed of gcd. Benchmark found here:
* (https://ideone.com/nGGD9T)
*
* GCD can be improved by a factor of 1.75x using Binary GCD
* (https://lemire.me/blog/2013/12/26/fastest-way-to-compute-the-greatest-common-divisor/…).
* However, with the gcd accumulation the bottleneck moves from the gcd calls
* to the modmul. As GCD only constitutes ~12% of runtime, speeding it up
* doesn't matter so much.
*
* This code can probably be sped up by using a faster mod mul - potentially
* montgomery reduction on 128 bit integers.
* Alternatively, one can use a quadratic sieve for an asymptotic improvement,
* which starts being faster in practice around 1e13.
*
* Brent's cycle finding algorithm was tested, but doesn't reduce modmul calls
* significantly.
*
* Subtle implementation notes:
* - we operate on residues in [1, n]; modmul can be proven to work for those
* - prd starts off as 2 to handle the case n = 4; it's harmless for other n
* since we're guaranteed that n > 2. (Pollard rho has problems with prime
* powers in general, but all larger ones happen to work.)
* - t starts off as 30 to make the first gcd check come earlier, as an
* optimization for small numbers.
*/
#pragma once
/**
* Author: chilli, c1729, Simon Lindholm
* Date: 2019-03-28
* License: CC0
* Source: Wikipedia, https://miller-rabin.appspot.com
* Description: Deterministic Miller-Rabin primality test.
* Guaranteed to work for numbers up to $7 \cdot 10^{18}$; for larger numbers, use Python and extend A randomly.
* Time: 7 times the complexity of $a^b \mod c$.
* Status: Stress-tested
*/
#pragma once
bool isPrime(ull n) {
if (n < 2 || n % 6 % 4 != 1) return (n | 1) == 3;
ull A[] = {2, 325, 9375, 28178, 450775, 9780504, 1795265022},
s = __builtin_ctzll(n-1), d = n >> s;
for (ull a : A) { // ^ count trailing zeroes
ull p = modpow(a%n, d, n), i = s;
while (p != 1 && p != n - 1 && a % n && i--)
p = modmul(p, p, n);
if (p != n-1 && i != s) return 0;
}
return 1;
}
ull pollard(ull n) {
auto f = [n](ull x) { return modmul(x, x, n) + 1; };
ull x = 0, y = 0, t = 30, prd = 2, i = 1, q;
while (t++ % 40 || __gcd(prd, n) == 1) {
if (x == y) x = ++i, y = f(x);
if ((q = modmul(prd, max(x,y) - min(x,y), n))) prd = q;
x = f(x), y = f(f(y));
}
return __gcd(prd, n);
}
vector<ull> factor(ull n) {
if (n == 1) return {};
if (isPrime(n)) return {n};
ull x = pollard(n);
auto l = factor(x), r = factor(n / x);
l.insert(l.end(), all(r));
return l;
}
vector<int> prime;//i番目の素数
bool is_prime[MAX+1];
void sieve(int n){
for(int i=0;i<=n;i++){
is_prime[i]=true;
}
is_prime[0]=is_prime[1]=false;
for(int i=2;i<=n;i++){
if(is_prime[i]){
prime.push_back(i);
for(int j=2*i;j<=n;j+=i){
is_prime[j] = false;
}
}
}
}
vvi X;
vi A;
void DFS(int u,int st,int seki){
if(u==si(X)){
A.pb(seki);
return;
}
if(st%2==0){
for(int j=0;j<si(X[u]);j++){
DFS(u+1,st*si(X[u])+j,seki*X[u][j]);
}
}else{
for(int j=0;j<si(X[u]);j++){
DFS(u+1,st*si(X[u])+j,seki*X[u][si(X[u])-1-j]);
}
}
}
vi F(int N){
X.clear();
A.clear();
int NN=N;
for(int p:prime){
if(NN%p==0){
vi Y={1};
while(NN%p==0){
Y.pb(Y.back()*p);
NN/=p;
}
X.pb(Y);
}
}
DFS(0,0,1);
vi res;
vi CN(N+1);
for(int i=1;i<=N;i++) CN[gcd(i,N)]++;
for(int x:A){
for(int t=0;t<CN[x];t++) res.pb(x);
}
return res;
}
int main(){
std::ifstream in("text.txt");
std::cin.rdbuf(in.rdbuf());
cin.tie(0);
ios::sync_with_stdio(false);
sieve(MAX-2);
int H,W;cin>>H>>W;
auto X=F(H),Y=F(W);
vvi ans(H,vi(W)),B(H,vi(W,1));
vvi Z(H*W+1);
for(int a=1;a<=H*W;a++) Z[gcd(a,H*W)].pb(a);
{
int N=H*W;
for(int p:prime){
if(N%p==0){
if(H%p==0){
if(W%p==0){
int ma=-1;
for(int i=0;i<H;i++){
int now=X[i],kake=1;
while(now%p==0){
now/=p;
kake*=p;
}
chmax(ma,kake);
}
for(int i=0;i<H;i++){
for(int j=0;j<W;j++){
int now=X[i],kake=1;
while(now%p==0){
now/=p;
kake*=p;
}
if(kake==ma){
now=Y[j];
while(now%p==0){
now/=p;
kake*=p;
}
B[i][j]*=kake;
}else{
B[i][j]*=kake;
}
}
}
}else{
for(int i=0;i<H;i++){
for(int j=0;j<W;j++){
int now=X[i],kake=1;
while(now%p==0){
now/=p;
kake*=p;
}
B[i][j]*=kake;
}
}
}
}else{
for(int i=0;i<H;i++){
for(int j=0;j<W;j++){
int now=Y[j],kake=1;
while(now%p==0){
now/=p;
kake*=p;
}
B[i][j]*=kake;
}
}
}
}
}
}
for(int i=0;i<H;i++){
for(int j=0;j<W;j++){
cout<<Z[B[i][j]].back()<<" ";
//cout<<B[i][j]<<" ";
Z[B[i][j]].pop_back();
}
cout<<"\n";
}
}
Rubikun