// Single-file competitive-programming solution: a small utility template, a
// Fenwick tree, a range-add/range-sum wrapper, a slope-trick container, and
// the problem-specific solve()/main().
#include <algorithm>
#include <cassert>
#include <functional>
#include <iomanip>
#include <iostream>
#include <limits>
#include <numeric>
#include <queue>
#include <utility>
#include <vector>
using namespace std;

// ---------------------------------------------------------------------------
// Shorthand macros
// ---------------------------------------------------------------------------
#define rep(i, n) for (int i = 0; i < (n); i++)
#define per(i, n) for (int i = (n)-1; i >= 0; i--)
#define rep2(i, l, r) for (int i = (l); i < (r); i++)
#define per2(i, l, r) for (int i = (r)-1; i >= (l); i--)
#define each(e, v) for (auto &e : v)
#define MM << " " <<
#define pb push_back
#define eb emplace_back
#define all(x) begin(x), end(x)
#define rall(x) rbegin(x), rend(x)
#define sz(x) (int)(x).size()

using ll = long long;
using pii = pair<int, int>;
using pil = pair<int, ll>;
using pli = pair<ll, int>;
using pll = pair<ll, ll>;

template <typename T>
using minheap = priority_queue<T, vector<T>, greater<T>>;
template <typename T>
using maxheap = priority_queue<T>;

// Sets x = max(x, y); returns true iff x was changed.
template <typename T>
bool chmax(T &x, const T &y) {
    return (x < y) ? (x = y, true) : false;
}

// Sets x = min(x, y); returns true iff x was changed.
template <typename T>
bool chmin(T &x, const T &y) {
    return (x > y) ? (x = y, true) : false;
}

// Returns bit i of x (0 or 1).
template <typename T>
int flg(T x, int i) {
    return (x >> i) & 1;
}

// Population count.
int pct(int x) { return __builtin_popcount(x); }
int pct(ll x) { return __builtin_popcountll(x); }

// Index of the highest set bit, or -1 when x == 0.
int topbit(int x) { return (x == 0 ? -1 : 31 - __builtin_clz(x)); }
int topbit(ll x) { return (x == 0 ? -1 : 63 - __builtin_clzll(x)); }

// Index of the lowest set bit, or -1 when x == 0.
int botbit(int x) { return (x == 0 ? -1 : __builtin_ctz(x)); }
int botbit(ll x) { return (x == 0 ? -1 : __builtin_ctzll(x)); }

// Prints v[i] + x separated by spaces and terminated by a newline
// (an empty vector prints just the newline).
template <typename T>
void print(const vector<T> &v, T x = 0) {
    int n = v.size();
    for (int i = 0; i < n; i++) cout << v[i] + x << (i == n - 1 ? '\n' : ' ');
    if (v.empty()) cout << '\n';
}

// Prints v[i] + x, one value per line.
template <typename T>
void printn(const vector<T> &v, T x = 0) {
    int n = v.size();
    for (int i = 0; i < n; i++) cout << v[i] + x << '\n';
}

// Index of the first element of (sorted) v that is >= x.
template <typename T>
int lb(const vector<T> &v, T x) {
    return lower_bound(begin(v), end(v), x) - begin(v);
}

// Index of the first element of (sorted) v that is > x.
template <typename T>
int ub(const vector<T> &v, T x) {
    return upper_bound(begin(v), end(v), x) - begin(v);
}

// Sorts v and removes duplicates (coordinate-compression helper).
template <typename T>
void rearrange(vector<T> &v) {
    sort(begin(v), end(v));
    v.erase(unique(begin(v), end(v)), end(v));
}

// Returns the indices 0..n-1 ordered by v's values (descending if `greater`).
template <typename T>
vector<int> id_sort(const vector<T> &v, bool greater = false) {
    int n = v.size();
    vector<int> ret(n);
    iota(begin(ret), end(ret), 0);
    sort(begin(ret), end(ret), [&](int i, int j) { return greater ? v[i] > v[j] : v[i] < v[j]; });
    return ret;
}

// Replaces a with the sequence a[ord[0]], a[ord[1]], ...
template <typename T>
void reorder(vector<T> &a, const vector<int> &ord) {
    int n = a.size();
    vector<T> b(n);
    for (int i = 0; i < n; i++) b[i] = a[ord[i]];
    swap(a, b);
}

// Integer division rounded toward negative infinity; y must be non-zero.
template <typename T>
T floor(T x, T y) {
    assert(y != 0);
    if (y < 0) x = -x, y = -y;
    return (x >= 0 ? x / y : (x - y + 1) / y);
}

// Integer division rounded toward positive infinity; y must be non-zero.
template <typename T>
T ceil(T x, T y) {
    assert(y != 0);
    if (y < 0) x = -x, y = -y;
    return (x >= 0 ? (x + y - 1) / y : x / y);
}

// Component-wise pair arithmetic and stream I/O.
template <typename S, typename T>
pair<S, T> operator+(const pair<S, T> &p, const pair<S, T> &q) {
    return make_pair(p.first + q.first, p.second + q.second);
}

template <typename S, typename T>
pair<S, T> operator-(const pair<S, T> &p, const pair<S, T> &q) {
    return make_pair(p.first - q.first, p.second - q.second);
}

template <typename S, typename T>
istream &operator>>(istream &is, pair<S, T> &p) {
    S a;
    T b;
    is >> a >> b;
    p = make_pair(a, b);
    return is;
}

template <typename S, typename T>
ostream &operator<<(ostream &os, const pair<S, T> &p) {
    return os << p.first << ' ' << p.second;
}

// Configures the standard streams once, during static initialisation.
struct io_setup {
    io_setup() {
        ios_base::sync_with_stdio(false);
        cin.tie(nullptr);
        cout << fixed << setprecision(15);
        cerr << fixed << setprecision(15);
    }
} io_setup;

constexpr int inf = (1 << 30) - 1;
constexpr ll INF = (1LL << 60) - 1;
// constexpr int MOD = 1000000007;
constexpr int MOD = 998244353;

// ---------------------------------------------------------------------------
// Fenwick tree (binary indexed tree) over n values; the public API is
// 0-indexed and uses half-open ranges [l, r).
// ---------------------------------------------------------------------------
template <typename T>
struct Binary_Indexed_Tree {
    vector<T> bit;  // 1-indexed internal array
    const int n;

    // Builds the tree from the initial values v.
    Binary_Indexed_Tree(const vector<T> &v) : n((int)v.size()) {
        bit.resize(n + 1);
        copy(begin(v), end(v), begin(bit) + 1);
        build();
    }

    // Builds a tree of n copies of x.
    Binary_Indexed_Tree(int n, T x = 0) : Binary_Indexed_Tree(vector<T>(n, x)) {}

    // Writes a raw slot without updating ancestors; call build() afterwards.
    void set(int i, const T &x) { bit[i + 1] = x; }

    // Turns the raw values stored in bit[1..n] into Fenwick partial sums.
    void build() {
        for (int a = 2; a <= n; a <<= 1) {
            for (int b = a; b <= n; b += a) bit[b] += bit[b - a / 2];
        }
    }

    // v[i] += x
    void add(int i, const T &x) {
        for (i++; i <= n; i += (i & -i)) bit[i] += x;
    }

    // v[i] = x
    void change(int i, const T &x) { add(i, x - query(i, i + 1)); }

    // v[0] + ... + v[i-1]; i is clamped to [0, n].
    T sum(int i) const {
        i = min(i, n);
        if (i <= 0) return 0;
        T ret = 0;
        for (; i > 0; i -= (i & -i)) ret += bit[i];
        return ret;
    }

    // v[l] + ... + v[r-1]; the range is clamped to [0, n).
    T query(int l, int r) const {
        l = max(l, 0), r = min(r, n);
        if (l >= r) return 0;
        return sum(r) - sum(l);
    }

    // v[i]
    T operator[](int i) const { return query(i, i + 1); }

    // Smallest r such that v[0] + ... + v[r] >= x (n if there is none).
    // NOTE(review): the binary descent presumably relies on non-decreasing
    // prefix sums, i.e. non-negative stored values — confirm at call sites.
    int lower_bound(T x) const {
        if (n == 0) return 0;  // __builtin_clz(0) is undefined
        int ret = 0;
        for (int k = 31 - __builtin_clz(n); k >= 0; k--) {
            if (ret + (1 << k) <= n && bit[ret + (1 << k)] < x) x -= bit[ret += (1 << k)];
        }
        return ret;
    }

    // Smallest r such that v[0] + ... + v[r] > x (n if there is none).
    int upper_bound(T x) const {
        if (n == 0) return 0;  // __builtin_clz(0) is undefined
        int ret = 0;
        for (int k = 31 - __builtin_clz(n); k >= 0; k--) {
            if (ret + (1 << k) <= n && bit[ret + (1 << k)] <= x) x -= bit[ret += (1 << k)];
        }
        return ret;
    }
};

// ---------------------------------------------------------------------------
// Range add / range sum built from two Fenwick trees:
// prefix(i) = bit0.sum(i) + bit1.sum(i) * i.
// ---------------------------------------------------------------------------
template <typename T>
struct Range_Add_Range_Sum {
    Binary_Indexed_Tree<T> bit0, bit1;
    const int n;

    // Initialiser list follows declaration order (bit0, bit1, n).
    Range_Add_Range_Sum(const vector<T> &v) : bit0(v), bit1((int)v.size(), 0), n((int)v.size()) {}

    Range_Add_Range_Sum(int n, const T &x) : Range_Add_Range_Sum(vector<T>(n, x)) {}

    // v[i] += x for every i in [l, r); the range is clamped to [0, n).
    void add(int l, int r, const T &x) {
        l = max(l, 0), r = min(r, n);
        if (l >= r) return;
        bit0.add(l, -x * T(l)), bit1.add(l, x);
        if (r < n) bit0.add(r, x * T(r)), bit1.add(r, -x);
    }

    // v[0] + ... + v[i-1]
    T sum(int i) const {
        i = min(i, n);
        if (i < 0) return 0;
        return bit0.sum(i) + bit1.sum(i) * T(i);
    }

    // v[l] + ... + v[r-1]
    T query(int l, int r) const {
        l = max(l, 0), r = min(r, n);
        if (l >= r) return 0;
        return sum(r) - sum(l);
    }
};

// ---------------------------------------------------------------------------
// Slope trick: maintains a convex piecewise-linear function f through two
// heaps of breakpoints (l: max-heap for the left part, r: min-heap for the
// right part), each with a lazily applied offset (add_l / add_r), plus the
// current minimum value min_f.
// ---------------------------------------------------------------------------
template <typename T>
struct Slope_Trick {
    priority_queue<T> l;
    priority_queue<T, vector<T>, greater<T>> r;
    const T INF_T = numeric_limits<T>::max() / 2;
    T add_l, add_r;
    T min_f = 0;

    // Initialised as f(x) = 0; sentinels keep both heaps non-empty.
    Slope_Trick() : add_l(0), add_r(0) {
        l.push(-INF_T);
        r.push(INF_T);
    }

    // Minimum value of f.
    T get_min() const { return min_f; }

    // f(x) += c
    void add_constant(const T &c) { min_f += c; }

    // f(x) += max(-x + a, 0)
    void add_line_left(const T &a) {
        if (a > r.top() + add_r) {
            min_f += -(r.top() + add_r) + a;
            l.push(r.top() + add_r - add_l);
            r.pop();
            r.push(a - add_r);
        } else {
            l.push(a - add_l);
        }
    }

    // f(x) += max(x - a, 0)
    void add_line_right(const T &a) {
        if (a < l.top() + add_l) {
            min_f += (l.top() + add_l) - a;
            r.push(l.top() + add_l - add_r);
            l.pop();
            l.push(a - add_l);
        } else {
            r.push(a - add_r);
        }
    }

    // f(x) += |x - a|
    void add_abs(const T &a) {
        add_line_left(a);
        add_line_right(a);
    }

    // f(x) <- min{ f(y) | y <= x }
    void left_min() {
        while ((int)r.size() > 1) r.pop();
    }

    // f(x) <- min{ f(y) | y >= x }
    void right_min() {
        while ((int)l.size() > 1) l.pop();
    }

    // f(x) <- min{ f(y) | x - b <= y <= x - a }
    void slide_min(const T &a, const T &b) {
        assert(a <= b);
        add_l += a;
        add_r += b;
    }

    // f(x) <- f(x - a)
    void shift(const T &a) {
        add_l += a;
        add_r += a;
    }

    // Evaluates f(x). Destructive: both heaps are emptied in the process.
    T get(const T &x) {
        T ret = min_f;
        while (!l.empty()) {
            ret += max(T(0), -x + (l.top() + add_l));
            l.pop();
        }
        while (!r.empty()) {
            ret += max(T(0), x - (r.top() + add_r));
            r.pop();
        }
        return ret;
    }
};

// Reads N, K, LEFT, RIGHT and N values a[i] from stdin and prints one number:
// the minimum of get_ans() over offsets j = 0 .. K-1.
//
// For each offset j a multiset of 2N values is kept:
//   floor((a[i] - j) / K)      and      ceil((a[i] - D - j) / K),
// where D = RIGHT - LEFT. The multiset lives in two Fenwick trees indexed by
// the compressed coordinates xs (b_cnt = multiplicities, b_plus = value sums),
// and `sum` tracks the total of the ceil-type values.
//
// NOTE(review): assumes N >= 1 and K >= 1 (K is a divisor and a container
// size; get_ans() reads xs[t]) — confirm against the problem constraints.
void solve() {
    ll N, K, LEFT, RIGHT;
    cin >> N >> K >> LEFT >> RIGHT;

    vector<ll> a(N);
    rep(i, N) cin >> a[i];

    ll D = RIGHT - LEFT;

    // Bucket the values by residue mod K. The residue is normalised into
    // [0, K) so a negative a[i] cannot produce a negative index; the sweep
    // below normalises its residues the same way.
    vector<vector<ll>> ids(K);
    rep(i, N) {
        ll m = a[i] % K;
        if (m < 0) m += K;
        ids[m].eb(a[i]);
    }

    // Coordinate candidates. As j runs over 0..K-1 each quotient changes by at
    // most one, so its j = 0 and j = K-1 values cover everything inserted.
    vector<ll> xs;
    each(e, a) {
        xs.eb(ceil(e - D, K));
        xs.eb(ceil(e - D - (K - 1), K));
        xs.eb(floor(e, K));
        xs.eb(floor(e - (K - 1), K));
    }
    rearrange(xs);
    int L = sz(xs);

    Binary_Indexed_Tree<ll> b_cnt(L, 0), b_plus(L, 0);
    ll sum = 0;

    // Removes one copy of value l; type != 0 marks a ceil-type value, which is
    // also tracked in `sum`.
    auto erase = [&](ll l, int type = 0) {
        int t = lb(xs, l);
        assert(xs[t] == l);
        b_cnt.add(t, -1);
        b_plus.add(t, -l);
        if (type) sum -= l;
    };

    // Adds one copy of value l (same `type` convention as erase).
    auto insert = [&](ll l, int type = 0) {
        int t = lb(xs, l);
        assert(xs[t] == l);
        b_cnt.add(t, 1);
        b_plus.add(t, l);
        if (type) sum += l;
    };

    // With m = xs[t], where t is the first index whose prefix count reaches N
    // (of the 2N stored values), returns
    //   sum_{v <= m} (m - v)  -  m * N  +  sum.
    // NOTE(review): presumably the minimum of a convex piecewise-linear cost,
    // attained at the median breakpoint — confirm against the intended
    // derivation.
    auto get_ans = [&]() {
        int t = b_cnt.lower_bound(N);
        return -b_plus.query(0, t + 1) + b_cnt.query(0, t + 1) * xs[t] - xs[t] * N + sum;
    };

    // Offset j = 0.
    rep(i, N) {
        insert(ceil(a[i] - D, K), 1);
        insert(floor(a[i], K));
    }
    ll ans = get_ans();

    // Sweep j = 1 .. K-1, updating only the elements whose quotient changes.
    rep2(j, 1, K) {
        {
            // floor((e - j) / K) differs from floor((e - (j-1)) / K) exactly
            // when e == j - 1 (mod K).
            int m = (j - 1) % K;
            if (m < 0) m += K;
            each(e, ids[m]) {
                erase(floor(e - (j - 1), K));
                insert(floor(e - j, K));
            }
        }
        {
            // ceil((e - D - j) / K) differs from ceil((e - D - (j-1)) / K)
            // exactly when e == D + j (mod K).
            int m = (D + j) % K;
            if (m < 0) m += K;
            each(e, ids[m]) {
                erase(ceil(e - D - (j - 1), K), 1);
                insert(ceil(e - D - j, K), 1);
            }
        }
        chmin(ans, get_ans());
    }

    cout << ans << '\n';
}

int main() {
    int T = 1;
    // cin >> T;
    while (T--) solve();
}