QOJ.ac
QOJ
ID | Problem | Submitter | Result | Time | Memory | Language | File size | Submit time | Judge time |
---|---|---|---|---|---|---|---|---|---|
#508452 | #7632. Balanced Arrays | pandapythoner | TL | 0ms | 0kb | C++23 | 15.4kb | 2024-08-07 15:43:32 | 2024-08-07 15:43:32 |
answer
#include <bits/stdc++.h>
using namespace std;
// 64-bit signed integer used for all modular arithmetic in this file.
using ll = long long;
// Floating-point alias.
#define flt double
// Iterator-pair shorthands: forward and reverse range of a container.
#define all(a) a.begin(), a.end()
#define rall(a) a.rbegin(), a.rend()
// Counted loop: i takes the values 0, 1, ..., n - 1.
// `n` is pasted textually into the loop condition `i < n`.
#define rep(i, n) for(int i = 0; i < n; i += 1)
// Size of a container converted to int.
#define len(a) ((int)(a).size())
// Pseudo-random generator with the fixed seed 234; stress() draws its test sizes from it.
mt19937 rnd(234);
// Modulus used by every modular computation below.
const ll mod = 998244353;
// Computes x^n modulo `mod` by binary exponentiation.
//
// x : base; any 64-bit value. It is reduced into [0, mod) first, so large or
//     negative bases can neither overflow the intermediate products nor
//     produce a negative result.
// n : exponent. For n <= 0 the function returns 1 (empty product).
// Returns a value in [0, mod).
ll bin_pow(ll x, ll n) {
    ll base = x % mod;
    if (base < 0) {
        base += mod;
    }
    ll result = 1;
    // Consume the exponent bit by bit; shifting n avoids a separate bit mask
    // that could overflow for very large exponents.
    for (; n > 0; n >>= 1) {
        if (n & 1) {
            result = result * base % mod;
        }
        base = base * base % mod;
    }
    return result;
}
// Modular inverse of x, computed as x^(mod - 2) modulo `mod`
// (Fermat's little theorem; relies on `mod` being prime).
ll inv(ll x) {
    const ll fermat_exponent = mod - 2;
    return bin_pow(x, fermat_exponent);
}
namespace fft {
// Exponent of the largest supported transform length; assigned in build().
int mxpw;
// Largest supported transform length, 1 << mxpw; assigned in build().
int mxn;
// g^((mod - 1) / 2^mxpw) for the first generator g found by build_w().
// NOTE(review): this is a primitive 2^mxpw-th root of unity only if 2^mxpw divides mod - 1.
ll w;
void build_w() {
ll phi = mod - 1;
ll f = phi;
vector<ll> p;
for (ll i = 2; i * i <= f; i += 1) {
if (f % i == 0) {
p.push_back(i);
while (f % i == 0) {
f /= i;
}
}
}
if (f > 1) {
p.push_back(f);
}
for (int i = 1; i < mod; i += 1) {
bool ok = true;
for (auto q : p) {
if (bin_pow(i, phi / q) == 1) {
ok = false;
break;
}
}
if (ok) {
w = bin_pow(i, phi / (1 << mxpw));
break;
}
}
}
vector<ll> rvx;
void build_rvx(int n) {
rvx.resize(n + 1);
for (int i = 1; i <= n; i += 1) {
rvx[i] = inv(i);
}
}
vector<ll> rvi, wpws;
void build(int _mxpw) {
mxpw = _mxpw;
mxn = (1 << mxpw);
build_w();
int n = (1 << mxpw);
rvi.resize(n);
rvi[0] = 0;
for (int i = 1; i < n; i += 1) {
rvi[i] = (rvi[i >> 1] >> 1);
if (i & 1) {
rvi[i] += (1 << (mxpw - 1));
}
}
wpws.resize(n + 1);
wpws[0] = 1;
for (int i = 1; i <= n; i += 1) {
wpws[i] = (wpws[i - 1] * w) % mod;
}
build_rvx(mxn);
}
// In-place transform of the first 2^nk entries of `a` modulo `mod`.
// The entries are first permuted by the bit-reversal table, then combined by
// butterflies of doubling width using the precomputed powers of w.
// Expects nk <= mxpw, a.size() >= 2^nk and entries already in [0, mod).
void fft(vector<ll>& a, int nk) {
    const int size = (1 << nk);
    const int shift = mxpw - nk;

    for (int pos = 0; pos < size; pos += 1) {
        const int mirrored = (rvi[pos] >> shift);
        if (mirrored < pos) {
            swap(a[mirrored], a[pos]);
        }
    }

    for (int half = 1; half < size; half *= 2) {
        const int block = half + half;
        // Step between consecutive twiddle factors for this butterfly width.
        const int stride = mxn / block;
        for (int start = 0; start < size; start += block) {
            for (int j = 0; j < half; j += 1) {
                ll& lo = a[start + j];
                ll& hi = a[start + j + half];
                const ll twiddled = hi * wpws[stride * j] % mod;
                ll difference = lo - twiddled;
                if (difference < 0) {
                    difference += mod;
                }
                ll sum = lo + twiddled;
                if (sum >= mod) {
                    sum -= mod;
                }
                hi = difference;
                lo = sum;
            }
        }
    }
}
// Inverse of fft(): applies the forward transform, reverses everything after
// the first element, and multiplies the first 2^nk entries by 1 / 2^nk.
// NOTE(review): the reversal spans the whole vector, so a.size() is expected to equal 2^nk.
void rev_fft(vector<ll>& a, int nk) {
    const int size = (1 << nk);
    fft(a, nk);
    const ll scale = inv(size);
    reverse(a.begin() + 1, a.end());
    for (auto it = a.begin(); it != a.begin() + size; ++it) {
        *it = (*it * scale) % mod;
    }
}
// Returns a(x)^2 modulo `mod`, with trailing zero coefficients removed
// (so the zero polynomial comes back as an empty vector).
vector<ll> square(vector<ll> a) {
    const int result_len = (int)a.size() + (int)a.size() - 1;
    int nk = 0;
    while ((1 << nk) < result_len) {
        nk += 1;
    }
    const int size = (1 << nk);

    a.resize(size, 0);
    fft(a, nk);
    for (ll& value : a) {
        value = (value * value) % mod;
    }
    rev_fft(a, nk);

    while (!a.empty() && a.back() == 0) {
        a.pop_back();
    }
    return a;
}
// Returns the product a(x) * b(x) modulo `mod`, with trailing zero
// coefficients removed (the zero polynomial comes back as an empty vector).
vector<ll> mul(vector<ll> a, vector<ll> b) {
    const int result_len = (int)a.size() + (int)b.size() - 1;
    int nk = 0;
    while ((1 << nk) < result_len) {
        nk += 1;
    }
    const int size = (1 << nk);

    a.resize(size, 0);
    b.resize(size, 0);
    fft(a, nk);
    fft(b, nk);
    // Pointwise product in the transformed domain.
    for (int pos = 0; pos < size; pos += 1) {
        a[pos] = (a[pos] * b[pos]) % mod;
    }
    rev_fft(a, nk);

    while (!a.empty() && a.back() == 0) {
        a.pop_back();
    }
    return a;
}
// a += k * b, coefficient-wise modulo `mod`. `a` is grown with zeros when it
// is shorter than `b`.
void add_inplace(vector<ll>& a, const vector<ll>& b, ll k = 1) {
    if (a.size() < b.size()) {
        a.resize(b.size(), 0);
    }
    const int count = (int)b.size();
    for (int pos = 0; pos < count; pos += 1) {
        a[pos] = (a[pos] + b[pos] * k) % mod;
    }
}
// Returns a + k * b, coefficient-wise modulo `mod`. The result has the length
// of the longer operand.
vector<ll> add(vector<ll> a, const vector<ll>& b, ll k = 1) {
    if (a.size() < b.size()) {
        a.resize(b.size(), 0);
    }
    int pos = 0;
    for (const ll term : b) {
        a[pos] = (a[pos] + term * k) % mod;
        pos += 1;
    }
    return a;
}
// Returns a - k * b, coefficient-wise modulo `mod`. The result has the length
// of the longer operand.
vector<ll> sub(vector<ll> a, const vector<ll>& b, ll k = 1) {
    if (a.size() < b.size()) {
        a.resize(b.size(), 0);
    }
    const int count = (int)b.size();
    for (int pos = 0; pos < count; pos += 1) {
        const ll scaled = b[pos] * k % mod;
        a[pos] = (a[pos] + mod - scaled) % mod;
    }
    return a;
}
// Composition a(b(x)) computed term by term: sum over i of a[i] * b(x)^i,
// using one polynomial multiplication per coefficient of `a`.
vector<ll> replace_x_slow(vector<ll>& a, const vector<ll>& b) {
    vector<ll> composed;
    vector<ll> power = { 1 };  // b(x)^i for the current i
    const int terms = (int)a.size();
    for (int i = 0; i < terms; i += 1) {
        if (i != 0) {
            power = mul(power, b);
        }
        add_inplace(composed, power, a[i]);
    }
    return composed;
}
// Composition a(b(x)) by pairwise merging.
//
// Every coefficient of `a` starts as a constant polynomial. In each round
// neighbouring pieces are merged as even + odd * bpw, where bpw is b(x)
// raised to the current power of two, and bpw is squared for the next round.
//
// a : coefficients of the outer polynomial (not modified).
// b : coefficients of the inner polynomial.
// Returns the coefficients of a(b(x)); an empty vector for an empty `a`
// (previously this case indexed into an empty vector).
vector<ll> replace_x(vector<ll>& a, const vector<ll>& b) {
    if (a.empty()) {
        return {};
    }
    int n = a.size();
    vector<vector<ll>> d(n);
    for (int i = 0; i < n; i += 1) {
        d[i] = { a[i] };
    }
    vector<ll> bpw = b;
    while (n > 1) {
        int m = (n + 1) / 2;
        vector<vector<ll>> nd(m);
        for (int i = 0; i < n; i += 1) {
            if (i % 2 == 0) {
                nd[i / 2] = std::move(d[i]);
            } else {
                add_inplace(nd[i / 2], mul(d[i], bpw));
            }
        }
        n = m;
        d.swap(nd);
        // The squared power is only needed if another round follows.
        if (n != 1) {
            bpw = square(bpw);
        }
    }
    return d[0];
}
// Returns the coefficients of a(x + t) modulo `mod`.
//
// Uses the identity
//   [x^j] a(x + t) = t^(-j) / j! * sum_i (a[i] * t^i * i!) / (i - j)!,
// where the sum is one polynomial product.
//
// a : coefficients, entries in [0, mod); a.size() must not exceed `mod`.
// t : shift; any 64-bit value, reduced into [0, mod) first.
// Returns a vector of the same length as `a` (empty for empty input).
//
// Differences from the earlier version:
//  * t congruent to 0 returns `a` unchanged (the identity above needs 1 / t);
//  * the product is padded back to 2n + 1 entries before it is indexed,
//    because mul() strips trailing zeros;
//  * inverse factorials come from one inversion plus a downward recurrence.
vector<ll> shift_x(vector<ll> a, ll t) {
    if (a.empty()) {
        return {};
    }
    t %= mod;
    if (t < 0) {
        t += mod;
    }
    if (t == 0) {
        return a;
    }
    const int n = (int)a.size() - 1;
    vector<ll> f(n + 1), rf(n + 1);
    f[0] = 1;
    for (int i = 1; i <= n; i += 1) {
        f[i] = (f[i - 1] * i) % mod;
    }
    rf[n] = inv(f[n]);
    for (int i = n; i > 0; i -= 1) {
        rf[i - 1] = (rf[i] * i) % mod;
    }
    vector<ll> b(n + 1), c(n + 1);
    ll tpw = 1;
    for (int i = 0; i <= n; i += 1) {
        b[i] = (a[i] * tpw % mod * f[i] % mod);
        tpw = (tpw * t) % mod;
    }
    // Reversed inverse factorials, so that the product's coefficient n + j
    // collects the terms b[i] / (i - j)!.
    for (int i = 0; i <= n; i += 1) {
        c[n - i] = rf[i];
    }
    vector<ll> product = mul(b, c);
    product.resize(2 * n + 1, 0);
    vector<ll> d(n + 1);
    const ll rvt = inv(t);
    ll rvt_pw = 1;
    for (int i = 0; i <= n; i += 1) {
        d[i] = rvt_pw * rf[i] % mod * product[i + n] % mod;
        rvt_pw = (rvt_pw * rvt) % mod;
    }
    return d;
}
// First n coefficients of the power-series inverse 1 / a(x) modulo `mod`.
// Starts from 1 / a[0] and doubles the number of known coefficients with the
// step b <- 2b - a * b^2, evaluated pointwise in the transformed domain.
// Reads a[0] unconditionally, so `a` must be non-empty.
// NOTE(review): a[0] presumably has to be non-zero for the result to be a true inverse.
vector<ll> rev_polynom(const vector<ll>& a, int n) {
    const int given = a.size();
    vector<ll> inverse = { inv(a[0]) };
    int log_len = 0;
    for (int known = 1; known < n; known *= 2, log_len += 1) {
        const int next_len = known + known;
        const int fft_len = next_len + next_len;
        const int fft_log = log_len + 2;

        // Prefix of `a` that matters for the next precision, zero-padded.
        vector<ll> work(fft_len);
        for (int i = 0; i < given && i < next_len; i += 1) {
            work[i] = a[i];
        }

        inverse.resize(fft_len);
        fft(inverse, fft_log);
        fft(work, fft_log);
        for (int i = 0; i < fft_len; i += 1) {
            ll value = (2 * inverse[i] - work[i] * inverse[i] % mod * inverse[i]) % mod;
            if (value < 0) {
                value += mod;
            }
            work[i] = value;
        }
        rev_fft(work, fft_log);

        work.resize(next_len);
        inverse.swap(work);
    }
    inverse.resize(n);
    return inverse;
}
// First n coefficients of a power series b(x) obtained by iterating
// b <- (b + a / b) / 2 from b = 1, doubling the precision each round.
// NOTE(review): starting from 1 suggests a[0] is expected to be 1 — confirm with callers.
vector<ll> square_root(const vector<ll>& a, int n) {
    const ll given = a.size();
    const ll half = inv(2);
    vector<ll> root = { 1 };
    int known = 1;
    while (known < n) {
        const ll doubled = known + known;
        vector<ll> root_inverse = rev_polynom(root, doubled);

        // a / root, truncated to the new precision.
        vector<ll> quotient(doubled);
        for (int i = 0; i < doubled && i < given; i += 1) {
            quotient[i] = a[i];
        }
        quotient = mul(quotient, root_inverse);
        quotient.resize(doubled);

        root.resize(doubled);
        for (int i = 0; i < doubled; i += 1) {
            root[i] = (half * ((root[i] + quotient[i]) % mod)) % mod;
        }
        known = doubled;
    }
    root.resize(n);
    return root;
}
// Formal derivative of a(x) modulo `mod`; the result is one coefficient
// shorter than the input (empty input gives an empty result).
vector<ll> derivative(vector<ll> a) {
    if (a.empty()) {
        return {};
    }
    const int degree = (int)a.size() - 1;
    for (int power = 1; power <= degree; power += 1) {
        a[power - 1] = (a[power] * power) % mod;
    }
    a.pop_back();
    return a;
}
// Formal antiderivative of a(x) with constant term 0, modulo `mod`.
// Divides by the exponent through the inverse table rvx, so the table must
// cover indices up to a.size().
vector<ll> integrate(vector<ll> a) {
    a.push_back(0);
    for (int power = (int)a.size() - 1; power >= 1; power -= 1) {
        a[power] = (a[power - 1] * rvx[power]) % mod;
    }
    a[0] = 0;
    return a;
}
// First n Taylor coefficients of sin(x) modulo `mod`:
// odd i carries +1/i! or -1/i! with alternating sign, even i carries 0.
vector<ll> sin_polynomial(int n) {
    vector<ll> coeffs(n, 0);
    ll factorial = 1;  // i! modulo `mod`
    for (int i = 0; i < n; i += 1) {
        if (i > 0) {
            factorial = (factorial * i) % mod;
        }
        if (i % 2 != 1) {
            continue;
        }
        const ll term = inv(factorial);
        const bool negative = ((i / 2) % 2 == 1);
        coeffs[i] = (negative ? mod - term : mod + term) % mod;
    }
    return coeffs;
}
// First n Taylor coefficients of cos(x) modulo `mod`:
// even i carries +1/i! or -1/i! with alternating sign, odd i carries 0.
vector<ll> cos_polynomial(int n) {
    vector<ll> coeffs(n, 0);
    ll factorial = 1;  // i! modulo `mod`
    for (int i = 0; i < n; i += 1) {
        if (i > 0) {
            factorial = (factorial * i) % mod;
        }
        if (i % 2 != 0) {
            continue;
        }
        const ll term = inv(factorial);
        const bool negative = ((i / 2) % 2 == 1);
        coeffs[i] = (negative ? mod - term : mod + term) % mod;
    }
    return coeffs;
}
// Generalisation of cos_polynomial with step k: among the first n
// coefficients, index i divisible by k carries 1/i!, negated when i / k is
// odd; every other coefficient is 0. k must be non-zero.
vector<ll> super_cos_polynomial(int n, int k) {
    vector<ll> coeffs(n, 0);
    ll factorial = 1;  // i! modulo `mod`
    for (int i = 0; i < n; i += 1) {
        if (i > 0) {
            factorial = (factorial * i) % mod;
        }
        if (i % k != 0) {
            continue;
        }
        const ll term = inv(factorial);
        const bool negative = ((i / k) % 2 == 1);
        coeffs[i] = (negative ? mod - term : mod + term) % mod;
    }
    return coeffs;
}
// First n coefficients of the integral of a'(x) / a(x), i.e. the power-series
// logarithm of a(x). Returns an empty vector for n == 0.
// NOTE(review): the usual precondition a[0] == 1 is not checked here.
vector<ll> logarithm(const vector<ll>& a, int n) {
    if (n == 0) {
        return {};
    }
    vector<ll> slope = derivative(a);
    vector<ll> reciprocal = rev_polynom(a, n);
    vector<ll> result = integrate(mul(std::move(slope), std::move(reciprocal)));
    result.resize(n);
    return result;
}
// First n coefficients of the power-series exponential of a(x), found by the
// iteration b <- b - b * (log(b) - a) starting from b = 1 and doubling the
// precision each round.
// NOTE(review): presumably requires a[0] == 0 — confirm with callers.
vector<ll> exponent(const vector<ll>& a, int n) {
    const int given = (int)a.size();
    vector<ll> result = { 1 };
    for (int known = 1; known < n; known *= 2) {
        const int doubled = known + known;

        // residual = log(result) - a, to the new precision.
        vector<ll> residual = logarithm(result, doubled);
        for (int i = 0; i < doubled && i < given; i += 1) {
            residual[i] -= a[i];
            if (residual[i] < 0) {
                residual[i] += mod;
            }
        }

        vector<ll> correction = fft::mul(residual, result);
        correction.resize(doubled);
        result.resize(doubled);
        for (int i = 0; i < doubled; i += 1) {
            result[i] -= correction[i];
            if (result[i] < 0) {
                result[i] += mod;
            }
        }
    }
    result.resize(n);
    return result;
}
// Computes e(x) * integral(b(x) / e(x)) truncated to n coefficients, where
// e(x) = exp(integral(a(x))).
// NOTE(review): this looks like the solution of y' = a*y + b with y(0) = 0 — confirm.
vector<ll> solve_differential(const vector<ll>& a, const vector<ll>& b, int n) {
    const vector<ll> e = exponent(integrate(a), n);
    vector<ll> inner = integrate(mul(b, rev_polynom(e, n)));
    vector<ll> result = mul(e, inner);
    result.resize(n);
    return result;
}
// First n coefficients of exp(k * x) modulo `mod`: entry i equals k^i / i!.
// k may be any 64-bit value; it is reduced into [0, mod) first.
// Uses the inverse table rvx, which must cover indices below n.
vector<ll> pure_exponent(int n, ll k = 1) {
    if (n == 0) {
        return {};
    }
    k = (k % mod + mod) % mod;
    vector<ll> rs(n);
    rs[0] = 1;
    for (int i = 1; i < n; i += 1) {
        // k^i / i! = (k^(i-1) / (i-1)!) * (1 / i) * k
        rs[i] = (rs[i - 1] * rvx[i]) % mod * k % mod;
    }
    return rs;
}
} // namespace fft
// f[i]    : i! modulo `mod`.
// invf[i] : modular inverse of i!.
vector<ll> f, invf;
// Fills f[0..n] and invf[0..n].
//
// Only n! is inverted by exponentiation; the remaining inverse factorials
// follow from 1 / (i-1)! = (1 / i!) * i. This replaces one modular
// exponentiation per entry with a single one. Requires 0 <= n < mod so that
// n! is invertible.
void build_f(int n) {
    f.resize(n + 1);
    invf.resize(n + 1);
    f[0] = 1;
    for (int i = 1; i <= n; i += 1) {
        f[i] = (f[i - 1] * i) % mod;
    }
    invf[n] = inv(f[n]);
    for (int i = n; i > 0; i -= 1) {
        invf[i - 1] = (invf[i] * i) % mod;
    }
}
// Binomial coefficient C(n, k) modulo `mod` from the factorial tables.
// Returns 0 unless 0 <= k <= n. The tables must already cover index n.
ll cnk(ll n, ll k) {
    const bool in_range = (0 <= k && k <= n);
    if (!in_range) {
        return 0;
    }
    const ll denominator = invf[k] % mod * invf[n - k] % mod;
    return f[n] * denominator % mod;
}
// n-th Catalan number modulo `mod`: C(2n, n) / (n + 1).
ll catalan(ll n) {
    const ll central = cnk(2 * n, n);
    return central * inv(n + 1) % mod;
}
// Number of multisets of size k drawn from n kinds, modulo `mod`:
// C(n + k - 1, k).
ll choose_repeating(ll n, ll k) {
    const ll top = n + k - 1;
    return cnk(top, k);
}
// Direct double-sum evaluation of the answer for (n, m), modulo `mod`.
// Runs in O(m * min(n, m)) binomial evaluations.
//
// The factorial tables are sized from n + 2 * m because the binomials below
// use arguments up to 2 * m + n - 1; the earlier n + m + 1e5 bound was too
// small once m exceeded roughly 1e5. The inverse of 2t + 1 does not depend on
// cnt and is therefore computed once per t.
ll solve_smart(int n, int m) {
    build_f(n + 2 * m + 100000);
    ll result = 1;
    for (int t = 1; t <= m; t += 1) {
        result = (result + choose_repeating(2 * t + 1, n - 1)) % mod;
        const ll inv_odd = inv(2 * t + 1);
        for (int cnt = 1; 2 * cnt + 1 <= n and cnt <= t - 1; cnt += 1) {
            ll coeff = (cnk(t, cnt) * cnk(t - 1, cnt) % mod * 2 +
                        cnk(t, cnt + 1) * cnk(t - 1, cnt) % mod +
                        cnk(t - 1, cnt + 1) * cnk(t, cnt)) % mod;
            coeff = coeff * inv_odd % mod;
            result = (result + coeff * cnk(2 * t + n - 2 * cnt - 1, n - 2 * cnt - 1)) % mod;
        }
    }
    return result;
}
// Answer for (n, m) modulo `mod`.
// The base part is 1 plus the sum of choose_repeating(2t + 1, n - 1) over
// t = 1..m. The remaining part is accumulated from three polynomial products
// (mask = 0, 1, 2), each multiplying a sequence indexed by cnt with a
// sequence indexed by t_cnt.
// Requires fft::build() to have been called with a large enough size.
ll solve(int n, int m) {
    build_f(2 * n + 2 * m + 1e5);

    ll result = 1;
    for (int t = 1; t <= m; t += 1) {
        result = (result + choose_repeating(2 * t + 1, n - 1)) % mod;
    }

    const int mx_cnt = (n - 1) / 2;
    for (int mask = 0; mask <= 2; mask += 1) {
        const int x = mask & 1;
        const int y = (mask >> 1) & 1;
        // The mask == 0 term is counted twice.
        const ll weight = (mask == 0) ? 2 : 1;

        vector<ll> a(mx_cnt + 1);
        for (int cnt = 1; cnt <= mx_cnt; cnt += 1) {
            ll value = invf[cnt + x] * invf[cnt + y] % mod;
            value = (value * weight) % mod;
            a[cnt] = value * invf[n - 2 * cnt - 1] % mod;
        }

        vector<ll> b(m);
        for (int t_cnt = y + 1; t_cnt <= m - 1; t_cnt += 1) {
            const ll value = invf[t_cnt - x] * invf[t_cnt - 1 - y] % mod;
            b[t_cnt] = value * f[n - 1 + 2 * t_cnt] % mod;
        }

        auto c = fft::mul(a, b);
        const int c_len = (int)c.size();
        for (int t = 1; t <= m and t < c_len; t += 1) {
            const ll scale = f[t] % mod * f[t - 1] % mod * invf[2 * t] % mod;
            result += c[t] * scale % mod * inv(2 * t + 1) % mod;
        }
        result %= mod;
    }
    return result;
}
// Brute-force reference for solve(): a dynamic program over n steps with
// states (x, y), 0 <= x, 0 <= y, x + y <= m. The start state is (0, m).
// Each step either raises x from any smaller value or lowers y from any value
// that is at least y. Returns the sum over all final states, modulo `mod`.
ll solve_slow(int n, int m) {
    vector<vector<vector<ll>>> dp(n + 1, vector<vector<ll>>(m + 1, vector<ll>(m + 1)));
    if (m >= 0) {
        dp[0][0][m] = 1;
    }

    for (int step = 0; step < n; step += 1) {
        const auto& previous = dp[step];
        auto& current = dp[step + 1];
        for (int x = 0; x <= m; x += 1) {
            for (int y = 0; x + y <= m; y += 1) {
                ll total = current[x][y];
                for (int k = 0; k < x; k += 1) {
                    total += previous[k][y];
                }
                for (int k = y; k <= m; k += 1) {
                    total += previous[x][k];
                }
                current[x][y] = total % mod;
            }
        }
    }

    ll result = 0;
    for (int x = 0; x <= m; x += 1) {
        for (int y = 0; x + y <= m; y += 1) {
            result += dp[n][x][y];
        }
    }
    return result % mod;
}
// Randomised cross-check of solve() against solve_slow() on sizes 1..100.
// Prints the iteration number before every round and never returns while the
// two agree; on the first mismatch it prints the offending "n m" and stops.
void stress() {
    for (int iteration = 1;; iteration += 1) {
        cout << iteration << "\n";
        const int n = rnd() % 100 + 1;
        const int m = rnd() % 100 + 1;
        const auto my_rs = solve(n, m);
        const auto right_rs = solve_slow(n, m);
        if (my_rs == right_rs) {
            continue;
        }
        cout << n << " " << m << "\n";
        return;
    }
}
// Entry point: reads n and m from standard input and prints solve(n, m).
//
// The debugging call to stress() that used to run here has been removed. It
// loops for as long as solve() and solve_slow() agree, so the program never
// reached the input and wrote iteration counters to stdout instead of the
// answer. stress() remains available for manual use.
int32_t main() {
    ios::sync_with_stdio(false);
    cin.tie(nullptr);

    // Transform tables for lengths up to 2^22.
    fft::build(22);

    int n, m;
    if (!(cin >> n >> m)) {
        return 0;
    }
    cout << solve(n, m) << "\n";
    return 0;
}
Details
Tip: Click on the bar to expand more detailed information
Test #1:
score: 0
Time Limit Exceeded
input:
2 2