#	User	Rating
1	Benq	3792
2	VivaciousAubergine	3647
3	Kevin114514	3611
4	jiangly	3583
5	strapple	3515
6	tourist	3470
7	Radewoosh	3415
8	Um_nik	3376
9	maroonrk	3361
10	XVIII	3345

#	User	Contrib.
1	Qingyu	162
2	adamant	148
3	Um_nik	145
4	Dominater069	143
5	errorgorn	141
6	cry	138
7	Proof_by_QED	136
8	YuukiS	135
9	chromate00	134
10	soullless	132

Sorry for the long wait. All problems were written, prepared, and editorialized by Yam, hyforces, culver0412, HaccerKat, alexlikemath007, jay_jayjay, n685, Mustela_Erminea, Jasonwei08, eysbutno, training4usaco, nyctivoe, and gg_gong. The problems (with problem credits) can be found in the Novice Gym and Advanced Gym. Also thanks to our testers for providing valuable feedback and to our logistics and web team for making TeamsCode possible!

Novice A/Advanced A: Lily Pads

Hint 1

Hint 2

Hint 3

Solution

Code (Python)

# Read one integer from standard input and echo it back.
print(int(input()))

Novice B: Sacrifice the Rook

Hint 1

Hint 2

Hint 3

Solution

Code

#include <bits/stdc++.h>
using namespace std;

#define pii pair<int, int>
#define fi first
#define se second

// Returns true when the two squares differ by at most one in each coordinate
// (so a square also counts as adjacent to itself).
bool isAdjacent(pii p1, pii p2) {
    const int firstGap = abs(p1.fi - p2.fi);
    const int secondGap = abs(p1.se - p2.se);
    if (firstGap > 1) return false;
    return secondGap <= 1;
}

// Checks the squares strictly between `start` and `end` when the two share
// their second coordinate (.se) or, failing that, their first coordinate (.fi).
// Returns false if either king (wk, bk) stands on one of those squares and
// true otherwise. When the endpoints share neither coordinate nothing is
// inspected and the result is true.
bool pathClear(pii start, pii end, pii wk, pii bk) {
    // True when one of the two kings occupies (first, second).
    auto kingOn = [&](int first, int second) {
        return (wk.fi == first && wk.se == second) || (bk.fi == first && bk.se == second);
    };

    if (start.se == end.se) {
        const int lo = min(start.fi, end.fi);
        const int hi = max(start.fi, end.fi);
        for (int first = lo + 1; first < hi; ++first)
            if (kingOn(first, start.se)) return false;
        return true;
    }
    if (start.fi == end.fi) {
        const int lo = min(start.se, end.se);
        const int hi = max(start.se, end.se);
        for (int second = lo + 1; second < hi; ++second)
            if (kingOn(start.fi, second)) return false;
    }
    return true;
}

signed main() {
    ios::sync_with_stdio(0), cin.tie(0);
    int t;
    cin >> t;
    for(int tc = 0; tc < t; tc++){
        string wks, wrs, bks;
        cin >> wks >> wrs >> bks;
    
        auto toPos = [&](string s) -> pii { return {s[0] - 'a' + 1, s[1] - '0'}; };
    
        pii wk = toPos(wks), wr = toPos(wrs), bk = toPos(bks);
        bool flg = 0;
        for (int dc = -1; dc <= 1; dc++) {
            for (int dr = -1; dr <= 1; dr++) {
                if (dc == 0 && dr == 0)
                    continue;
                pii cur = {bk.fi + dc, bk.se + dr};
    
                if (cur.fi < 1 || cur.fi > 8 || cur.se < 1 || cur.se > 8)
                    continue;
                if (cur.fi != wr.fi && cur.se != wr.se)
                    continue;
                if ((cur.fi == wk.fi && cur.se == wk.se) ||
                    (cur.fi == bk.fi && cur.se == bk.se))
                    continue;
                if (!pathClear(wr, cur, wk, bk))
                    continue;
                if (isAdjacent(cur, wk))
                    continue;
    
                flg = true;
            }
        }
    
        cout << (flg ? "YES" : "NO") << "\n";
    }
    return 0;
}

Novice C: Fill the world with Argon

Hint 1

Hint 2

Hint 3

Solution

Code

/**
 * @author n685
 * @date 2025-03-22 19:02:42
 */
#include <bits/stdc++.h>

#ifdef LOCAL
#include "dd/debug.h"
#else
#define dbg(...) 42
#define dbg_proj(...) 420
#define dbg_rproj(...) 420420
void nline() {}
void bar() {}
void start_clock() {}
void end_clock() {}
#endif

namespace rs = std::ranges;
namespace rv = std::views;

using u32 = unsigned int;
using i64 = long long;
using u64 = unsigned long long;

const std::array<int, 4> dx{-1, 0, 1, 0}, dy{0, 1, 0, -1};

int main() {
#ifndef LOCAL
  std::ios::sync_with_stdio(false);
  std::cin.tie(nullptr);
#endif

  int n, m;
  std::cin >> n >> m;

  std::vector a(n, std::vector<int>(m));
  for (std::vector<int>& arr : a) {
    for (int& val : arr) {
      std::cin >> val;
    }
  }

  int ans = 0;
  for (int i = 0; i < n; ++i) {
    for (int j = 0; j < m; ++j) {
      bool good = true;
      for (int d = 0; d < 4; ++d) {
        int x = i + dx[d];
        int y = j + dy[d];
        if (x < 0 || x >= n || y < 0 || y >= m) {
          continue;
        }
        if (a[i][j] < a[x][y]) {
          good = false;
          break;
        }
      }
      if (good) {
        ++ans;
      }
    }
  }

  std::cout << ans << '\n';
}

Alternative Solution

Code (Alternative Solution)

/**
 * @author n685
 * @date 2025-03-22 19:10:16
 */
#include <bits/stdc++.h>

#ifdef LOCAL
#include "dd/debug.h"
#else
#define dbg(...) 42
#define dbg_proj(...) 420
#define dbg_rproj(...) 420420
void nline() {}
void bar() {}
void start_clock() {}
void end_clock() {}
#endif

using u32 = unsigned int;
using i64 = long long;
using u64 = unsigned long long;

const std::array<int, 4> dx{-1, 0, 1, 0}, dy{0, 1, 0, -1};

int main() {
#ifndef LOCAL
  std::ios::sync_with_stdio(false);
  std::cin.tie(nullptr);
#endif

  int n, m;
  std::cin >> n >> m;

  std::vector a(n, std::vector<int>(m));
  for (std::vector<int>& arr : a) {
    for (int& val : arr) {
      std::cin >> val;
    }
  }

  std::vector<std::pair<int, int>> coord;
  for (int i = 0; i < n; ++i) {
    for (int j = 0; j < m; ++j) {
      coord.emplace_back(i, j);
    }
  }

  std::sort(
    coord.begin(),
    coord.end(),
    [&](const std::pair<int, int>& lhs, const std::pair<int, int>& rhs) {
      return a[lhs.first][lhs.second] > a[rhs.first][rhs.second];
    }
  );

  std::vector fl(n, std::vector<bool>(m));
  auto dfs = [&](auto&& self, int i, int j) -> void {
    for (int d = 0; d < 4; ++d) {
      int x = i + dx[d];
      int y = j + dy[d];
      if (x < 0 || x >= n || y < 0 || y >= m || fl[x][y] || a[i][j] < a[x][y]) {
        continue;
      }
      fl[x][y] = true;
      self(self, x, y);
    }
  };
  int ans = 0;
  for (auto [i, j] : coord) {
    if (!fl[i][j]) {
      ++ans;
      fl[i][j] = true;
      dfs(dfs, i, j);
    }
  }
  std::cout << ans << '\n';
}

Novice D: Please solve this in O(N^3)

There are two ways to solve this problem — the normal way, and the cool $$$O(N^3)$$$ way.

Normal Way:

Hint 1

Hint 2

Solution

Code

#include <bits/stdc++.h>
using namespace std;

#define pii pair<int, int>
#define fi first
#define se second

const int N = 755;

// Disjoint-set union over the ids 0..n-1 with path compression (no union by
// rank or size).
struct DSU {
    vector<int> fa;  // fa[x] is the parent of x; a root is its own parent

    DSU(int n) : fa(n) {
        for (int i = 0; i < n; ++i) fa[i] = i;
    }

    // Returns the representative of a's set and re-points every node on the
    // walked path directly at that representative.
    int find(int a) {
        int root = a;
        while (fa[root] != root) root = fa[root];
        while (fa[a] != root) {
            const int up = fa[a];
            fa[a] = root;
            a = up;
        }
        return root;
    }

    // Joins the sets of a and b by hanging b's root beneath a's root.
    void merge(int a, int b) {
        const int ra = find(a);
        const int rb = find(b);
        if (ra == rb) return;
        fa[rb] = ra;
    }
};

int n, m, cm[N];
vector<pii> G;
bitset<N> vis[N];

signed main() {
    ios::sync_with_stdio(0), cin.tie(0);

    cin >> n >> m;
    for (int i = 0; i < n; i++)
        cin >> cm[i];

    for (int i = 1, u, v; i <= m; i++) {
        cin >> u >> v, u--, v--;
        G.push_back({u, v});
    }

    for (int i = 0; i < n; i++)
        vis[i].reset(), vis[i].set(i, 1);

    for (int c = 0; c < 30; c++) {
        DSU dsu(N);

        for (auto &[u, v] : G) {
            if ((cm[u] & (1 << c)) && (cm[v] & (1 << c)))
                dsu.merge(u, v);
        }

        unordered_map<int, vector<int>> mp;
        for (int i = 0; i < n; i++) {
            if (cm[i] & (1 << c)) {
                int rt = dsu.find(i);
                mp[rt].push_back(i);
            }
        }

        for (auto &p : mp) {
            vector<int> &lc = p.se;
            for (auto u : lc)
                for (auto v : lc)
                    vis[u].set(v, 1);
        }
    }

    for (int i = 0; i < n; i++) {
        for (int j = 0; j < n; j++)
            cout << (vis[i].test(j) ? '1' : '0');
        cout << "\n";
    }

    return 0;
}

Cool way:

Hint 1

Hint 2

Solution

Code

#include <iostream>
using namespace std;

// Reads n values and m edges, builds an n x n matrix of bitmasks and closes it
// with a Floyd-Warshall style triple loop in which "multiply" is bitwise AND
// and "add" is bitwise OR. Prints 1 for every non-zero entry and 0 otherwise.
int main()
{
    ios::sync_with_stdio(0), cin.tie(0);
    int n, m;
    cin >> n >> m;
    int a [n];
    for(int v = 0; v < n; v++){
        cin >> a[v];
    }

    // Diagonal entries start as the vertex's own mask, all others as 0.
    int edg [n][n];
    for(int r = 0; r < n; r++){
        for(int c = 0; c < n; c++){
            edg[r][c] = (r == c) ? a[r] : 0;
        }
    }

    // An edge carries the bits common to both endpoints.
    for(int e = 0; e < m; e++){
        int x, y;
        cin >> x >> y;
        --x;
        --y;
        const int shared = a[x] & a[y];
        edg[x][y] = shared;
        edg[y][x] = shared;
    }

    for(int mid = 0; mid < n; mid++){
        for(int from = 0; from < n; from++){
            for(int to = 0; to < n; to++){
                edg[from][to] |= edg[from][mid] & edg[mid][to];
            }
        }
    }

    for(int r = 0; r < n; r++){
        for(int c = 0; c < n; c++){
            cout << (edg[r][c] ? 1 : 0);
        }
        cout << '\n';
    }
    return 0;
}

Novice E: Mingle

Hint 1

Hint 2

Solution

Code (C++)

#include <bits/stdc++.h>

using ll = long long;

// Reads an undirected graph with n vertices and m edges, runs a DFS from every
// unvisited vertex and pairs vertices up bottom-up. Prints the number of pairs
// followed by the pairs themselves (1-based).
int main() {
    std::ios_base::sync_with_stdio(false);
    std::cin.tie(nullptr);

    int n, m;
    std::cin >> n >> m;
    std::vector<std::vector<int>> adj(n);
    for (int e = 0; e < m; e++) {
        int u, v;
        std::cin >> u >> v;
        adj[u - 1].push_back(v - 1);
        adj[v - 1].push_back(u - 1);
    }

    std::vector<std::array<int, 2>> res;
    std::vector<bool> vis(n);

    // Returns 1 when u ends up without a partner, 0 otherwise. `pending`
    // holds the DFS children that came back unpaired, followed by u itself;
    // consecutive entries are paired, so u stays alone exactly when the list
    // has odd length.
    const auto dfs = [&](int u, auto &&self) -> int {
        vis[u] = true;
        std::vector<int> pending;
        for (const int v : adj[u]) {
            if (vis[v]) { continue; }
            if (self(v, self)) { pending.push_back(v); }
        }
        pending.push_back(u);

        const int total = static_cast<int>(pending.size());
        for (int i = 0; i + 1 < total; i += 2) {
            res.push_back({pending[i], pending[i + 1]});
        }
        return total % 2;
    };

    for (int root = 0; root < n; root++) {
        if (vis[root]) { continue; }
        dfs(root, dfs);
    }

    std::cout << res.size() << '\n';
    for (const auto &pr : res) {
        std::cout << pr[0] + 1 << ' ' << pr[1] + 1 << '\n';
    }
}

Code (Python)

import sys
sys.setrecursionlimit(10**6)

# Read the undirected graph; vertices are stored 0-based.
n, m = map(int, input().split())
adj = [[] for _ in range(n)]
for _ in range(m):
    u, v = (int(tok) - 1 for tok in input().split())
    adj[u].append(v)
    adj[v].append(u)

res = []
vis = [False] * n


def dfs(u):
    """Visit u's DFS subtree and pair vertices bottom-up.

    Children that come back unpaired are collected, u is appended last, and
    consecutive entries are paired. Returns 1 when u is left without a partner
    (odd list length) and 0 otherwise.
    """
    vis[u] = True
    ok = []
    for v in adj[u]:
        if not vis[v] and dfs(v):
            ok.append(v)
    ok.append(u)

    res.extend(zip(ok[0::2], ok[1::2]))
    return len(ok) & 1


for start in range(n):
    if not vis[start]:
        dfs(start)

print(len(res))
sys.stdout.write("".join(f"{u + 1} {v + 1}\n" for u, v in res))

Novice F: Keys

Hint 1

Hint 2

Hint 3

Solution

Code

#include<bits/stdc++.h>
using namespace std;
 
// Reads n, m, k, then m pairs of integers, then k pairs (x, y). Each (x, y)
// toggles the x lowest bits of one accumulator and the y lowest bits of a
// second one; finally every stored pair is printed XOR-ed with the two
// accumulators.
int main(){
    ios_base::sync_with_stdio(0); cin.tie(0);
    int n,m,k;
    cin >> n >> m >> k;

    // mask[i] has exactly its i lowest bits set.
    vector<long long> mask(n+1, 0);
    for(int i=1;i<=n;i++) mask[i]=(mask[i-1]<<1)|1;

    vector<pair<long long,long long>> pts(m);
    for(auto &pt : pts) cin >> pt.first >> pt.second;

    long long flipFirst=0, flipSecond=0;
    for(int q=0;q<k;q++){
        int x,y;
        cin >> x >> y;
        flipFirst^=mask[x];
        flipSecond^=mask[y];
    }

    for(const auto &pt : pts){
        cout << (pt.first^flipFirst) << ' ' << (pt.second^flipSecond) << '\n';
    }
}

Novice G: Path on Big Grid

Hint 1

Hint 2

Hint 3

Solution

Code

#include <iostream>
using namespace std;

int grid [1000][1000];
int dp [2000][2000];

// Reads an n x m grid plus two factors N and M and runs a right/down shortest
// path DP on a 2n x 2m grid in which every input cell is represented by a
// 2 x 2 group. Entering an even row or column costs the cell value once;
// entering an odd row costs it N-1 times and an odd column M-1 times.
int main(){
    ios_base::sync_with_stdio(false);
    cin.tie(NULL);
    int n, m, N, M;
    cin >> n >> m >> N >> M;
    for(int r = 0; r < n; r++){
        for(int c = 0; c < m; c++){
            cin >> grid[r][c];
        }
    }

    const int rows = 2 * n, cols = 2 * m;
    dp[0][0] = grid[0][0];
    for(int i = 0; i < rows; i++){
        for(int j = 0; j < cols; j++){
            if(i == 0 && j == 0){
                continue;  // start cell already holds its cost
            }
            int best = 2000500000;  // "unreached" marker
            const int cell = grid[i/2][j/2];
            if(i > 0){
                best = min(best, dp[i-1][j] + cell * (i % 2 ? N-1 : 1));
            }
            if(j > 0){
                best = min(best, dp[i][j-1] + cell * (j % 2 ? M-1 : 1));
            }
            dp[i][j] = best;
        }
    }
    cout << dp[rows-1][cols-1] << endl;
}

Novice H: Fibocchi Sequence

Hint 1

Hint 2

Solution

Code

#include "bits/stdc++.h"
using namespace std;
const int N = 5000005;
const int inf = 1e9;
int n, m, k, qq;
int dp[N];
// Reads n and the query count, builds the Fibonacci-style sequence f and its
// prefix sums, runs an unbounded min-count knapsack over the prefix sums
// (after overwriting the last one), then answers each query (a, b, x) from
// the table.
void solve() {
    cin >> n >> qq;

    // f[i] = f[i-1] + f[i-2] with f[0] = f[1] = 1; pref[i] = f[0] + ... + f[i].
    vector<int> f(n), pref(n);
    f[0] = 1;
    f[1] = 1;
    pref[0] = 1;
    pref[1] = 2;
    for (int i = 2; i < n; i++) {
        f[i] = f[i - 1] + f[i - 2];
        pref[i] = pref[i - 1] + f[i];
    }

    // The last weight is replaced before it is used anywhere below.
    pref[n - 1] = pref[n - 3] + 1;

    // dp[v] = fewest weights (each usable any number of times) that sum to v.
    for (int v = 0; v < N; v++) dp[v] = inf;
    dp[0] = 0;
    for (const int w : pref) {
        for (int v = w; v < N; v++) {
            const int viaW = dp[v - w] + 1;
            if (viaW < dp[v]) dp[v] = viaW;
        }
    }

    while (qq-- != 0) {
        int a, b, x;
        cin >> a >> b >> x;
        // Remove the part fixed by a and b; a negative remainder prints -1.
        const int rest = x - (pref[n - 1] * a + pref[n - 2] * b);
        if (rest < 0) cout << -1 << "\n";
        else cout << dp[rest] << "\n";
    }
}
 
// Entry point: switch the streams to fast mode, then run the single test.
int32_t main() {
    cin.tie(nullptr);
    std::ios::sync_with_stdio(false);
    solve();
    return 0;
}

Novice I/Advanced B: Cell Towers

Hint 1

Hint 2

Solution

Code

#include <iostream>
#include <algorithm>
#include <vector>
#define ll long long
using namespace std;

int main(){
    int n;
    cin >> n;
    vector <pair<ll,ll>> v;
    for(int i = 0; i < n; i++){
        ll r; ll c;
        cin >> r >> c;
        v.push_back(make_pair(c, r+c));
    }
    sort(v.begin(), v.end());
    ll minL = v[0].first;
    ll maxR = 0;
    for(int i = 0; i < n; i++){
        maxR = max(maxR, v[i].second);
    }
    vector <ll> gaps;
    ll curMxR = v[0].second;
    int cnt = 0;
    for(int i = 1; i < n; i++){
        if((v[i].first - curMxR) > 0){
            cnt++;
        }
        gaps.push_back(max(0ll, v[i].first - curMxR));
        curMxR = max(curMxR, v[i].second);
    }
    sort(gaps.begin(), gaps.end());
    reverse(gaps.begin(), gaps.end());
    ll ans = maxR - minL;
    cout << ans << " ";
    for(int i = 0; i < (n-1); i++){
        ans -= gaps[i];
        cout << ans << " ";
    }
    cout << endl;
}

Novice J/Advanced C: Walk

Hint 1

Hint 2

Solution

Code

#include "bits/stdc++.h"
using namespace std;
typedef long long ll;
const int mod = 998244353;
const int N = 1000005;
int fact[N], inv_fact[N];
int mul(int x, int y) {
    return (ll)x * y % mod;
}

// Binary exponentiation: returns b raised to the power p, using mul() for
// every multiplication.
int qpow(int b, int p) {
    int acc = 1;
    while (p != 0) {
        if (p & 1) {
            acc = mul(acc, b);
        }
        b = mul(b, b);
        p >>= 1;
    }
    return acc;
}

// Binomial coefficient "n choose k" from the precomputed fact / inv_fact
// tables, reduced by mul(). Returns 0 when k lies outside [0, n]; this also
// covers negative n. Without the k > n check, inv_fact[n - k] would be read
// at a negative index.
int C(int n, int k) {
    if (k < 0 || k > n) return 0;
    return mul(fact[n], mul(inv_fact[k], inv_fact[n - k]));
}

// Handles one test: reads a, b, c, d, decrements a, and prints 0 unless
// a + d == b + c, in which case it prints C(a+d-1, a-1) * C(b+c, b).
void solve() {
    int a, b, c, d;
    cin >> a >> b >> c >> d;
    --a;

    const bool balanced = (a + d == b + c);
    if (!balanced) {
        cout << "0\n";
        return;
    }
    const int firstFactor = C(a + d - 1, a - 1);
    const int secondFactor = C(b + c, b);
    cout << mul(firstFactor, secondFactor) << "\n";
}

// Fills the factorial and inverse-factorial tables for 0..N-1, then runs
// solve() once per test case.
int32_t main() {
    std::ios::sync_with_stdio(false);
    cin.tie(NULL);

    fact[0] = 1;
    for (int i = 1; i < N; i++) {
        fact[i] = mul(fact[i - 1], i);
    }

    // One modular inverse at the top, then walk down: 1/(i-1)! = (1/i!) * i.
    inv_fact[N - 1] = qpow(fact[N - 1], mod - 2);
    for (int i = N - 1; i > 0; i--) {
        inv_fact[i - 1] = mul(inv_fact[i], i);
    }

    int tt;
    cin >> tt;
    while (tt-- != 0) {
        solve();
    }
}

Novice K/Advanced D: Not Japanese Triangle

Hint 1

Hint 2

Hint 3

Solution

Compute Spans:
For each $$$b[i]$$$ (the $$$i$$$'th element in the bottom row), compute:

$$$A_i = i - L[i] - 1$$$, where $$$L[i]$$$ is the index of the last element to the left that is smaller than $$$b[i]$$$,
$$$B_i = R[i] - i - 1$$$, where $$$R[i]$$$ is the index of the next element to the right that is less than or equal to $$$b[i]$$$.

To actually calculate $$$L[i]$$$ and $$$R[i]$$$, we maintain a monotonic stack. When processing the current element, we keep popping elements that are bigger than it until a smaller one is found (which must be the closest one, because it is on top of the stack). We do this from left to right for $$$L[i]$$$ and from right to left for $$$R[i]$$$.

Finding Contribution Function:
Recognize that $$$b[i]$$$ contributes to every subarray (of lengths $$$t+1$$$ for $$$t$$$ from 0 to $$$A_i+B_i$$$) with weight $$$b[i] \times g_i(t)$$$, where $$$g_i(t)$$$ is:

$$$t + 1$$$ for $$$0 \le t \le m$$$,
$$$m + 1$$$ for $$$m \lt t \le M$$$,
$$$A_i + B_i - t + 1$$$ for $$$M \lt t \le A_i + B_i$$$,

with $$$m = \min(A_i, B_i)$$$ and $$$M = \max(A_i, B_i)$$$.

Range Updates of Piece-wise Function:
For each element $$$b[i]$$$, break its contribution into three parts and “range update” an auxiliary array (or, equivalently, update two difference arrays for polynomial updates).

The standard prefix sum update only deals with constant update values, such as adding $$$4$$$ to range $$$[1, 23]$$$. However, we have a piece-wise, linear function to add. So, suppose we want to add function $$$F(i) = a \cdot i + b$$$ to range $$$[L, R]$$$, we perform the following updates:

$$$p_1[L] += a$$$ and $$$p_1[R + 1] -= a$$$
$$$p_0[L] += b$$$ and $$$p_0[R + 1] -= b$$$

After computing prefix sums of $$$p_0$$$ and $$$p_1$$$, our answer for $$$i$$$ will be $$$(i - 1) \cdot p_1[i] + p_0[i]$$$ (with $$$1$$$-indexing).

We essentially do this $$$3$$$ times because our function has $$$3$$$ pieces.

The total time complexity is $$$O(n)$$$, which is more than enough to pass this problem.

Note

Code

#include <bits/stdc++.h>
using namespace std;

#define ll long long
#define pll pair<ll, ll>
#define fi first
#define se second
#define uwu make_pair

const int N = 1e5 + 5;

ll n, a[N];
int l[N], r[N];

signed main() {
    ios::sync_with_stdio(0), cin.tie(0);

    cin >> n;
    for (int i = 1; i <= n; i++)
        cin >> a[i];

    pll stk[N];
    ll tp = 0;
    stk[0] = uwu(-1, 0);
    for (ll i = 1; i <= n; i++) {
        while (stk[tp] > uwu(a[i], i))
            tp--;
        l[i] = stk[tp].se;
        stk[++tp] = uwu(a[i], i);
    }

    tp = 0;
    stk[0] = uwu(-1, n + 1);
    for (ll i = n; i >= 1; i--) {
        while (stk[tp] > uwu(a[i], i))
            tp--;
        r[i] = stk[tp].se;
        stk[++tp] = uwu(a[i], i);
    }

    vector<ll> p1(n + 2, 0), p0(n + 2, 0), res(n + 2, 0);

    auto upd = [&](int pl, int pr, ll a, ll b) {
        p1[pl] += a, p1[pr + 1] -= a;
        p0[pl] += b, p0[pr + 1] -= b;
    };

    for (int i = 1; i <= n; i++) {
        int st = i - l[i] - 1, ed = r[i] - i - 1;
        int mi = min(st, ed), mx = max(st, ed), T = st + ed;

        upd(1, mi + 1, a[i], a[i]);
        if (mi + 1 <= mx) upd(mi + 2, mx + 1, 0, a[i] * (mi + 1));
        if (mx + 1 <= T) upd(mx + 2, T + 1, -a[i], a[i] * (st + ed + 1));
    }

    for (int t = 2; t <= n; t++) {
        p1[t] = p1[t - 1] + p1[t];
        p0[t] = p0[t - 1] + p0[t];
    }

    for (int t = 1; t <= n; t++)
        res[t] = (t - 1) * p1[t] + p0[t];

    for (int t = n; t >= 1; t--)
        cout << res[t] << " ";
    cout << "\n";

    return 0;
}

Novice L/Advanced E: Robot Racing

Hint 1

Hint 2

Solution

First, let's replace each $$$a_i$$$ with $$$\left\lfloor \frac{L}{a_i} \right\rfloor$$$: the latest possible second you have to shoot this robot by. For convenience, reverse $$$a$$$ so that it stays sorted in non-decreasing order.

Let’s consider solving the problem on one array. How can we check if we can make $$$k$$$ groups?

Say we have some arbitrary division of the robots into $$$k$$$ groups. For each group, we essentially only care about the robot $$$i$$$ with the smallest value $$$a_i$$$ out of all the robots in this group, because we must shoot this group before the fastest robot passes the end. Let this value for $$$j$$$-th group be $$$t_j$$$, meaning we have to shoot this group at time $$$t_j$$$ or before. Optimally, we should shoot the groups from smallest to greatest value of $$$t_j$$$. So to check if we can divide the robots into $$$k$$$ groups, we see if $$$t_1 \geq 1$$$, $$$t_2 \geq 2$$$, $$$t_3 \geq 3$$$, $$$\ldots$$$, $$$t_k \geq k$$$ is satisfied.

When dividing the robots into $$$k$$$ groups, it is optimal to have the last $$$k - 1$$$ robots in individual groups and the remaining prefix of $$$n - (k - 1)$$$ robots in one group.

Proof

Using this, we can write the condition as $$$a_1 \geq 1$$$, $$$a_{n - k + 2} \geq 2$$$, $$$a_{n - k + 3} \geq 3$$$, $$$\ldots$$$, $$$a_n \geq k$$$.

Since all $$$a_i \geq 1$$$, we can replace the first condition, giving us $$$a_{n - k + 1} \geq 1$$$, $$$a_{n - k + 2} \geq 2$$$, $$$a_{n - k + 3} \geq 3$$$, $$$\ldots$$$, $$$a_n \geq k$$$. In other words, $$$a_{n - k + i} \geq i$$$ for all $$$1 \leq i \leq k$$$.

Looping through each subarray from left to right and maintaining the maximal $$$k$$$ value allows us to solve the first subtask in $$$O\left(N^3\right)$$$. We can even loop through the array once for each left subarray index while maintaining the maximum $$$k$$$ value, giving us a $$$O\left(N^2\right)$$$ solution.

To fully optimize this, we can notice that subarrays ending at the same index $$$r$$$ hold the same maximal $$$k$$$ value. To find the maximum $$$k$$$ where $$$a_{r - k + i} \geq i$$$ holds for $$$1 \leq i \leq k$$$, we can take the prefix minimum of $$$a_l + r - l$$$ among $$$1 \leq l \lt i$$$. Now we can calculate the answer for each subarray ending at $$$i$$$, which will be $$$\displaystyle\sum_{l=1}^{i}\text{min}(k, r - l + 1).$$$

Time Complexity: $$$O\left(N\right)$$$

Code

// {{{1
extern "C" int __lsan_is_turned_off() { return 1; }
#include <bits/stdc++.h>
using namespace std;
 
#include <tr2/dynamic_bitset>
using namespace tr2;
#include <ext/pb_ds/assoc_container.hpp>
 
#define ll long long
#define inf 0x3f3f3f3f
#define infl 0x3f3f3f3f3f3f3f3fll
 
#include <assert.h>
#ifdef DEBUG
#define dprintf(args...) fprintf(stderr,args)
#endif
#ifndef DEBUG
#define dprintf(args...) 69
#endif
#define all(x) (x).begin(), (x).end()
// Read-on-conversion helper: converting a cintype to T extracts one T from cin.
struct cintype {
    template<typename T>
    operator T() {
        T value;
        cin >> value;
        return value;
    }
};
// 1}}}
cintype in;
 
// Reads n and L followed by n values, transforms the values and prints one
// accumulated 64-bit sum.
int main()
{
        // Each conversion from `in` reads one value from cin: first n, then L,
        // then the n array entries.
        int n=in,L=in;vector<int>a(n);for(auto&x:a)x=in;
        // Replace every entry by the integer quotient L / entry, then reverse
        // the array order.
        for(auto&x:a)x=L/x;reverse(all(a));
 
        // b[i] becomes the minimum of a[j] - j over all j <= i.
        auto b=a;for(int i=0;i<n;i++)b[i]-=i;
        for(int i=1;i<n;i++)b[i]=min(b[i],b[i-1]);
        ll ans=0;
        for(int i=0;i<n;i++){
                // x = minimum of a[j] + (i - j) over all j <= i.
                int x = b[i]+i;
                ll s=0;
                // x <= i: add 1 + 2 + ... + x plus (i + 1 - x) further copies of x.
                if(i-x>=0) s+=1ll*x*(x+1)/2+1ll*(i+1-x)*x;
                // x > i: add (i + 1) * (2x + i) / 2, i.e. x + (x+1) + ... + (x+i).
                else s+=1ll*(i+1)*(x+x+i)/2;
                ans+=s;
        }
        printf("%lld\n",ans);
}

Advanced F: Binary Function

Definitions

Hint 1

Hint 2

Hint 3

Hint 4

Hint 5

Solution

Code

#include "bits/stdc++.h"
using namespace std;
// Extended Euclid: returns a coefficient u with a * u == 1 (mod m). The result
// may be negative; callers are expected to normalise it. Asserts that a and m
// are coprime (the final gcd must be 1).
template <typename T>
T inverse(T a, T m) {
  T coefPrev = 0, coefCur = 1;
  for (; a != 0;) {
    const T quotient = m / a;
    const T remainder = m - quotient * a;
    m = a;
    a = remainder;
    const T coefNext = coefPrev - quotient * coefCur;
    coefPrev = coefCur;
    coefCur = coefNext;
  }
  assert(m == 1);
  return coefPrev;
}
 
// Residue class modulo T::value. T is any type exposing a `value` member
// (the file uses std::integral_constant); Type is the decayed type of that
// member and is also the storage type of the residue.
template <typename T>
class Modular {
 public:
  using Type = typename decay<decltype(T::value)>::type;

  // Default construction value-initialises the stored residue.
  constexpr Modular() : value() {}
  // Construction from any U normalises x before storing it.
  template <typename U>
  Modular(const U& x) {
    value = normalize(x);
  }

  // Maps x to a residue: inputs already in [-mod(), mod()) are cast directly,
  // anything else is reduced with %, and a negative result is shifted up by
  // mod().
  template <typename U>
  static Type normalize(const U& x) {
    Type v;
    if (-mod() <= x && x < mod()) v = static_cast<Type>(x);
    else v = static_cast<Type>(x % mod());
    if (v < 0) v += mod();
    return v;
  }

  // Call operator exposes the stored residue.
  const Type& operator()() const { return value; }
  template <typename U>
  explicit operator U() const { return static_cast<U>(value); }
  constexpr static Type mod() { return T::value; }

  // Addition / subtraction correct the result with a single +- mod() step.
  Modular& operator+=(const Modular& other) { if ((value += other.value) >= mod()) value -= mod(); return *this; }
  Modular& operator-=(const Modular& other) { if ((value -= other.value) < 0) value += mod(); return *this; }
  template <typename U> Modular& operator+=(const U& other) { return *this += Modular(other); }
  template <typename U> Modular& operator-=(const U& other) { return *this -= Modular(other); }
  Modular& operator++() { return *this += 1; }
  Modular& operator--() { return *this -= 1; }
  Modular operator++(int) { Modular result(*this); *this += 1; return result; }
  Modular operator--(int) { Modular result(*this); *this -= 1; return result; }
  Modular operator-() const { return Modular(-value); }

  // Multiplication when Type is int: the product is formed in 64 bits. On
  // _WIN32 the remainder is taken with an inline `divl`; elsewhere the
  // product goes through normalize().
  template <typename U = T>
  typename enable_if<is_same<typename Modular<U>::Type, int>::value, Modular>::type& operator*=(const Modular& rhs) {
#ifdef _WIN32
    uint64_t x = static_cast<int64_t>(value) * static_cast<int64_t>(rhs.value);
    uint32_t xh = static_cast<uint32_t>(x >> 32), xl = static_cast<uint32_t>(x), d, m;
    asm(
      "divl %4; \n\t"
      : "=a" (d), "=d" (m)
      : "d" (xh), "a" (xl), "r" (mod())
    );
    value = m;
#else
    value = normalize(static_cast<int64_t>(value) * static_cast<int64_t>(rhs.value));
#endif
    return *this;
  }
  // Multiplication when Type is long long: the quotient is estimated in long
  // double, and value * rhs.value - q * mod() is then normalised.
  template <typename U = T>
  typename enable_if<is_same<typename Modular<U>::Type, long long>::value, Modular>::type& operator*=(const Modular& rhs) {
    long long q = static_cast<long long>(static_cast<long double>(value) * rhs.value / mod());
    value = normalize(value * rhs.value - q * mod());
    return *this;
  }
  // Multiplication for non-integral Type: plain product, then normalize().
  template <typename U = T>
  typename enable_if<!is_integral<typename Modular<U>::Type>::value, Modular>::type& operator*=(const Modular& rhs) {
    value = normalize(value * rhs.value);
    return *this;
  }

  // Division multiplies by inverse(other.value, mod()).
  Modular& operator/=(const Modular& other) { return *this *= Modular(inverse(other.value, mod())); }

  // abs() simply returns the stored residue.
  friend const Type& abs(const Modular& x) { return x.value; }

  // The friends below are defined after the class and need access to `value`.
  template <typename U>
  friend bool operator==(const Modular<U>& lhs, const Modular<U>& rhs);

  template <typename U>
  friend bool operator<(const Modular<U>& lhs, const Modular<U>& rhs);

  template <typename V, typename U>
  friend V& operator>>(V& stream, Modular<U>& number);

 private:
  Type value;  // the stored residue
};
 
// Equality: compares stored residues; the mixed overloads first convert the
// non-Modular operand to Modular<T>.
template <typename T> bool operator==(const Modular<T>& lhs, const Modular<T>& rhs) { return lhs.value == rhs.value; }
template <typename T, typename U> bool operator==(const Modular<T>& lhs, U rhs) { return lhs == Modular<T>(rhs); }
template <typename T, typename U> bool operator==(U lhs, const Modular<T>& rhs) { return Modular<T>(lhs) == rhs; }

// Inequality: the negation of the matching operator==.
template <typename T> bool operator!=(const Modular<T>& lhs, const Modular<T>& rhs) { return !(lhs == rhs); }
template <typename T, typename U> bool operator!=(const Modular<T>& lhs, U rhs) { return !(lhs == rhs); }
template <typename T, typename U> bool operator!=(U lhs, const Modular<T>& rhs) { return !(lhs == rhs); }

// Ordering by stored residue.
template <typename T> bool operator<(const Modular<T>& lhs, const Modular<T>& rhs) { return lhs.value < rhs.value; }

// Binary arithmetic: each overload copies (or converts) the left operand into
// a Modular<T> and applies the corresponding compound assignment.
template <typename T> Modular<T> operator+(const Modular<T>& lhs, const Modular<T>& rhs) { return Modular<T>(lhs) += rhs; }
template <typename T, typename U> Modular<T> operator+(const Modular<T>& lhs, U rhs) { return Modular<T>(lhs) += rhs; }
template <typename T, typename U> Modular<T> operator+(U lhs, const Modular<T>& rhs) { return Modular<T>(lhs) += rhs; }

template <typename T> Modular<T> operator-(const Modular<T>& lhs, const Modular<T>& rhs) { return Modular<T>(lhs) -= rhs; }
template <typename T, typename U> Modular<T> operator-(const Modular<T>& lhs, U rhs) { return Modular<T>(lhs) -= rhs; }
template <typename T, typename U> Modular<T> operator-(U lhs, const Modular<T>& rhs) { return Modular<T>(lhs) -= rhs; }

template <typename T> Modular<T> operator*(const Modular<T>& lhs, const Modular<T>& rhs) { return Modular<T>(lhs) *= rhs; }
template <typename T, typename U> Modular<T> operator*(const Modular<T>& lhs, U rhs) { return Modular<T>(lhs) *= rhs; }
template <typename T, typename U> Modular<T> operator*(U lhs, const Modular<T>& rhs) { return Modular<T>(lhs) *= rhs; }

template <typename T> Modular<T> operator/(const Modular<T>& lhs, const Modular<T>& rhs) { return Modular<T>(lhs) /= rhs; }
template <typename T, typename U> Modular<T> operator/(const Modular<T>& lhs, U rhs) { return Modular<T>(lhs) /= rhs; }
template <typename T, typename U> Modular<T> operator/(U lhs, const Modular<T>& rhs) { return Modular<T>(lhs) /= rhs; }
 
// Raises a to the non-negative power b by repeated squaring.
template<typename T, typename U>
Modular<T> power(const Modular<T>& a, const U& b) {
  assert(b >= 0);
  Modular<T> result = 1;
  Modular<T> base = a;
  for (U e = b; e > 0; e >>= 1) {
    if (e & 1) {
      result *= base;
    }
    base *= base;
  }
  return result;
}
 
// True when the stored residue equals 0.
template <typename T>
bool IsZero(const Modular<T>& number) {
  const auto& residue = number();
  return residue == 0;
}
 
// Text form of the stored residue, delegating to to_string for the raw value.
template <typename T>
string to_string(const Modular<T>& number) {
  const auto& residue = number();
  return to_string(residue);
}
 
// The stream type is a template parameter (rather than std::ostream) so that
// custom fast-output streams work as well. Writes the stored residue.
template <typename U, typename T>
U& operator<<(U& stream, const Modular<T>& number) {
  const auto& residue = number();
  return stream << residue;
}
 
// U == std::istream? but done this way because of fastinput
template <typename U, typename T>
U& operator>>(U& stream, Modular<T>& number) {
  typename common_type<typename Modular<T>::Type, long long>::type x;
  stream >> x;
  number.value = Modular<T>::normalize(x);
  return stream;
}

// using ModType = int;
// struct VarMod { static ModType value; };
// ModType VarMod::value;
// ModType& md = VarMod::value;
// using Mint = Modular<VarMod>;
 
constexpr int md = (int) 998244353;
using Mint = Modular<std::integral_constant<decay<decltype(md)>::type, md>>;
 
vector<Mint> fact;
vector<Mint> inv_fact;
 
// Binomial coefficient "n choose k" as a Mint; 0 when k is outside [0, n].
// The factorial and inverse-factorial tables grow lazily up to index n.
Mint C(int n, int k) {
    const bool outside = k < 0 || n < k;
    if (outside) {
        return 0;
    }

    if (fact.empty()) {
        fact.push_back(1);
        inv_fact.push_back(1);
    }

    for (int next = (int) fact.size(); next <= n; ++next) {
        fact.push_back(fact.back() * next);
        inv_fact.push_back(1 / fact.back());
    }

    return fact[n] * inv_fact[k] * inv_fact[n - k];
}

// Handles one test: reads a string and scans it from its last character to
// its first, maintaining `cur` through the recurrence below and adding `cur`
// to the answer at every '1'.
void solve() {
    string s;
    cin >> s;
    const int n = s.size();

    int pc = 0;  // incremented for every character other than '0' seen so far
    Mint cur = 0, out = 0;
    // l counts how many characters lie to the right of the current one.
    for (int l = 0; l < n; l++) {
        const char bit = s[n - 1 - l];
        cur = 2 * cur - C(l - 1, pc + 1);
        if (bit == '0') cur += C(l, pc + 1);
        else pc++;
        if (bit == '1') out += cur;
    }

    cout << out << "\n";
}

// Entry point: reads the number of test cases and runs solve() for each.
int32_t main() {
    std::ios::sync_with_stdio(false);
    cin.tie(NULL);

    int tt;
    cin >> tt;
    while (tt-- != 0) {
        solve();
    }
}

Advanced G: Binary Function II

Hint 1

Hint 2

Hint 3

Hint 4

Hint 5

Solution

Let $$$sumf(n)$$$ be the sum of $$$f(x)$$$ for $$$x=1...n-1$$$. Then, the answer would just be $$$sumf(r+1)-sumf(l)$$$. Let's see how to calculate $$$sumf(n)$$$ with the following example:

Let $$$n=10100$$$. Let set $$$A$$$ be the numbers that have $$$0$$$ as their first bit ($$$00001, 00010, 00011, 00100$$$, etc.) and set $$$B$$$ be the numbers that have $$$100$$$ as their first 3 bits ($$$10000, 10001, 10010, 10011$$$). Every number in both sets is less than $$$n$$$. We also know that every number in $$$A$$$ is less than every number in $$$B$$$, so now we need to find how many numbers in $$$A$$$ have a higher popcount than numbers in $$$B$$$.

Using casework and grouping, we find $$${2 \choose 0} ({4 \choose 2} + {4 \choose 3} + {4 \choose 4}) + {2 \choose 1} ({4 \choose 3} + {4 \choose 4}) + {2 \choose 2} {4 \choose 4}$$$. Note that $$${n \choose k} = {n \choose {n-k}}$$$.

We can rewrite this to be: $$${2 \choose 2} ({4 \choose 2} + {4 \choose 3} + {4 \choose 4}) + {2 \choose 1} ({4 \choose 3} + {4 \choose 4}) + {2 \choose 0} {4 \choose 4}$$$.

Regrouping, we get $$$({2 \choose 2}{4 \choose 2} + {2 \choose 1}{4 \choose 3} + {2 \choose 0}{4 \choose 4}) + ({2 \choose 2}{4 \choose 3} + {2 \choose 1}{4 \choose 4}) + ({2 \choose 2}{4 \choose 4})$$$.

Applying Vandermonde's, we get: $$${6 \choose 4} + {6 \choose 5} + {6 \choose 6}$$$. This form can be generalized into: $$${n \choose k} + {n \choose k + 1} + ... + {n \choose n}$$$.

Next, we've considered the interaction between the two sets, but what about the values within the sets themselves? Well, since all the numbers in a set share the same prefix, we only have to worry about their suffix because the prefix shares the number of 1s. This is now no different than solving $$$sumf(2^k)$$$ where there are $$$2^k$$$ numbers in the set. To do that, we use a similar technique of breaking the set up into two smaller sets: numbers that start with $$$0$$$ and numbers that start with $$$1$$$. Call this function $$$solvepart(k)$$$.

For instance, consider $$$k=4$$$.

0000   1000
0001   1001
0010   1010
0011   1011
0100   1100
0101   1101
0110   1110
0111   1111

Within each set, $$$\sum{f(x)} = solvepart(k-1)$$$. To find the interaction, the calculation is almost identical to the previous and we use Vandermonde's identity to simplify. Then, $$$solvepart(k)=2 \cdot solvepart(k-1) + \sum_{x=k+1}^{2k-2}{{2k-2} \choose {x}}$$$.

Combining everything together, we create a new set for every time there is a 1 bit by finding numbers that share the prefix but turn that bit into a 0. Then, we calculate the individual contribution of that set. Next, for each pair of sets, we calculate their interaction, and summing everything together would get the final answer. To speed up the process, I precomputed consecutive summations of combinations. My solution alters $$$solvepart$$$ just a bit by changing $$$k$$$ to $$$k-1$$$, but it works the same way.

Code

#include <iostream>
#include <vector>
#include <functional>
#include <string>
#include <cmath>

using namespace std;

// Modulus used for every arithmetic result in this solution.
const int MOD = 998244353;
// Tables below are sized from this bound (binomials go up to 2 * MAX_N).
const int MAX_N = 1010;

// factorial[i] == i! mod MOD for 0 <= i <= 2 * MAX_N after
// precompute_factorials() has run; every entry starts out as 1.
vector<long long> factorial(2 * MAX_N + 1, 1);

// Fills the factorial table in increasing order of the argument.
void precompute_factorials() {
    long long running = factorial[0];
    const int last = 2 * MAX_N;
    int idx = 1;
    while (idx <= last) {
        running = running * idx % MOD;
        factorial[idx] = running;
        ++idx;
    }
}

// Returns a^b mod MOD by recursive squaring (b == 0 yields 1).
long long pow_(long long a, long long b) {
    if (b == 0) return 1;
    const long long half = pow_(a, b / 2);
    long long result = half * half % MOD;
    // An odd exponent needs one extra factor of a.
    if (b % 2 != 0) result = result * a % MOD;
    return result;
}

// Modular inverse of x, computed as x^(MOD - 2) mod MOD
// (Fermat's little theorem; MOD is prime and x must not be a multiple of it).
long long inv(long long x) {
    const long long exponent = MOD - 2;
    return pow_(x, exponent);
}

// Binomial coefficient "n choose k" modulo MOD, built from the factorial table.
// Returns 0 when k is outside [0, n] instead of indexing the table with a
// negative subscript. n must not exceed the table bound (2 * MAX_N).
long long C(int n, int k) {
    if (k < 0 || k > n) return 0;
    const long long denominator = factorial[n - k] * factorial[k] % MOD;
    return factorial[n] * inv(denominator) % MOD;
}

vector<vector<long long>> precomp(2 * MAX_N + 1);
long long solve_part[MAX_N + 1];
void precompute() {
    for (int n = 0; n <= 2 * MAX_N; ++n) {
        vector<long long> arr;
        for (int k = n; k >= 0; --k) {
            if (!arr.empty()) arr.push_back((arr.back() + C(n, k)) % MOD);
            else arr.push_back(C(n, k) % MOD);
        }
        precomp[n] = vector<long long>(arr.rbegin(), arr.rend());
    }
    for (int i = 2; i <= MAX_N; i++) {
        solve_part[i] = precomp[2 * i][i + 2];
        solve_part[i] += 2 * solve_part[i - 1] % MOD;
        solve_part[i] %= MOD;
    }
}

// Evaluates the editorial's prefix sum for the binary string x (most
// significant bit first; presumably the total over all values below x).
//
// For every '1' bit with `low` bits below it, the set's own contribution
// solve_part[low - 1] is added (nothing when low == 0), and the pair
// (low, number of '1' bits already seen below it) is recorded. Every pair of
// recorded sets then contributes a suffix sum of binomials from precomp.
//
// The original guard `x.size() - i - 2 >= 0` was evaluated in unsigned
// arithmetic, so it was always true and a '1' in the last position read
// solve_part out of bounds; the index is now computed as a signed int.
long long sum_f(const string &x) {
    long long res = 0;
    vector<pair<int, int>> pairs;
    const int len = static_cast<int>(x.size());
    int count = 0;
    for (int i = len - 1; i >= 0; --i) {
        if (x[i] != '1') continue;
        const int low = len - i - 1;  // number of bits below position i
        if (low >= 1) {
            res = (res + solve_part[low - 1]) % MOD;
        }
        pairs.emplace_back(low, count);
        count++;
    }
    for (size_t i = 0; i < pairs.size(); ++i) {
        for (size_t j = i + 1; j < pairs.size(); ++j) {
            int a = pairs[i].first, d1 = pairs[i].second;
            int b = pairs[j].first, d2 = pairs[j].second;
            int n = a + b;
            int min_k = a + abs(d1 - d2) + 1;
            // An empty range (min_k > n) contributes nothing.
            if (min_k <= n) {
                res += precomp[n][min_k];
                res %= MOD;
            }
        }
    }
    return res;
}

// Adds one, in place, to a binary number stored as a string (MSB first).
// Trailing non-'0' characters are reset to '0' while the carry propagates;
// if the carry runs off the front, a leading '1' is prepended.
void binIncr(string& bin) {
    int pos = static_cast<int>(bin.length()) - 1;
    while (pos >= 0 && bin[pos] != '0') {
        bin[pos] = '0';
        --pos;
    }
    if (pos >= 0) {
        bin[pos] = '1';
    } else {
        bin = '1' + bin;
    }
}

// Reads binary strings l and r and prints sum_f(r + 1) - sum_f(l) modulo MOD.
int main() {
    ios::sync_with_stdio(false);
    cin.tie(nullptr);

    precompute_factorials();
    precompute();

    // Single test case; the loop shape is kept for easy extension.
    for (int remaining = 1; remaining > 0; --remaining) {
        string l, r;
        cin >> l >> r;
        binIncr(r);  // turn the inclusive bound r into the exclusive bound r + 1
        const long long upper = sum_f(r);
        const long long lower = sum_f(l);
        cout << (upper - lower + MOD) % MOD << '\n';
    }

    return 0;
}

Advanced H: Permutation Composition

Definitions

Hint 1

Hint 2

Hint 3

Hint 4

Solution

Code

#include <iostream>
#include <vector>
#include <map>

using namespace std;

int main(){
    int n;
    cin >> n;
    int a [n+1];
    int b [n+1];
    for(int i = 1; i <= n; i++){
        cin >> a[i];
    }
    for(int i = 1; i <= n; i++){
        cin >> b[i];
    }
    int q;
    cin >> q;
    vector <bool> ops;
    for(int qt = 0; qt < q; qt++){
        int s;
        cin >> s;
        if(s == 1){
            ops.push_back(false);
        }else{
            ops.push_back(true);
        }
    }
    bool vis [n+1];
    int a2 [n+1];
    int b2 [n+1];
    for(int i = 1; i <= n; i++){
        vis[i] = false;
    }
    pair<int,int> mp [n+1];

    for(int i = 1; i <= n; i++){
        mp[i] = make_pair(-1, -1);
    }

    for(int i = 1; i <= n; i++){
        if(!vis[i]){
            int cur = i;
            vector <int> aside;
            vector <int> bside;
            do{
                aside.push_back(cur);
                bside.push_back(a[cur]);
                cur = b[a[cur]];
                vis[cur] = true;
            }while(cur != i);
            int cyc =  2 * aside.size();
            int len = aside.size();
            if(mp[len] == make_pair(-1, -1)){
                int ashift = 1;
                int bshift = 1;
                for(int j = 0; j < q; j++){
                    if(ops[j]){
                        bshift = (2 * bshift + ashift)%cyc;
                    }else{
                        ashift = (2 * ashift + bshift)%cyc;
                    }    
                }
                mp[len] = make_pair(ashift, bshift);
            }
            int ashift = mp[len].first/2;
            int bshift = mp[len].second/2 + 1;
            for(int j = 0; j < aside.size(); j++){
                a2[aside[j]] = bside[(j+ashift)%len];
                b2[bside[j]] = aside[(j+bshift)%len];
            }
        }
    }
    for(int i = 1; i <= n; i++){
        cout << a2[i] << " ";
    }
    cout << endl;
    for(int i = 1; i <= n; i++){
        cout << b2[i] << " ";
    }
    cout << endl;
    
}

Advanced I: Permutation Online

Hint 1

Hint 2

Hint 3

Hint 4

Solution

Code

#include <iostream>
#define ll long long
using namespace std;

// Reads N, K, O, the K weights w, and then N values a[1..N]; prints one
// answer per position. When O == 1 each input value is decoded using the
// previous answer.
//
// For position i the chain i-1 -> prev[i-1] -> ... is walked. Each visited
// index with a larger value contributes w[ind] * index, for at most K such
// indices. Each visited index that is not larger loses one "life"; an index
// with no lives left is unlinked from the chain.
//
// lives and prev are indexed 1..N, so they need N + 1 slots; the original
// size of N made every access at index N out of bounds.
int main(){
    ios_base::sync_with_stdio(false);
    cin.tie(NULL);
    int N, K, O;
    cin >> N >> K >> O;
    ll w [K];
    ll a [N+1];
    ll lives [N+1];
    ll prev [N+1];
    for(int i = 1; i <= N; i++){
        lives[i] = K;
    }
    for(int i = 0; i < K; i++){
        cin >> w[i];
    }
    ll last = 0;
    for(int i = 1; i <= N; i++){
        cin >> a[i];
        if(O == 1){
            a[i] = (last + a[i])%N + 1;
        }
        prev[i] = i-1;
        ll ans = 0;
        int pcu = i;      // chain node visited just before cur
        int cur = i-1;
        int ind = 0;      // how many larger elements have been counted so far
        while(cur != 0){
            if(a[cur] > a[i]){
                ans += w[ind] * (cur);
                ind++;
                if(ind == K){
                    break;
                }
            }else{
                lives[cur]--;
                if(lives[cur] == 0){
                    // Splice cur out: its predecessor in the walk now skips it.
                    prev[pcu] = prev[cur];
                    cur = pcu;
                }
            }
            pcu = cur;
            cur = prev[cur];
        }
        last = ans;
        cout << ans << ' ';
    }
}

Advanced J: Triangle Constructive

Hint 1

Hint 2

Hint 3

Solution

Code

#include <iostream>
#include <vector>
#define ll long long
using namespace std;

struct op{
    char type;
    int a;
    int b;
    ll c;
    op(char type_, int a_, int b_, ll c_){
        type = type_;
        a = a_;
        b = b_;
        c = c_;
    }
};

vector <op> ops;

// Records an 'X' operation at (y, z) with coefficient c; calls with a
// negative coordinate are dropped.
void X(int y, int z, ll c){
    if(y < 0 || z < 0) return;
    ops.emplace_back('X', y, z, c);
}

// Records a 'Y' operation at (z, x) with coefficient c; calls with a
// negative coordinate are dropped.
void Y(int z, int x, ll c){
    if(z < 0 || x < 0) return;
    ops.emplace_back('Y', z, x, c);
}

// Records a 'Z' operation at (x, y) with coefficient c; calls with a
// negative coordinate are dropped.
void Z(int x, int y, ll c){
    if(x < 0 || y < 0) return;
    ops.emplace_back('Z', x, y, c);
}

// Emits the four signed corner 'X' operations (inclusion-exclusion style)
// for the rectangle [ly, ry] x [lz, rz] with coefficient c.
void pX(int ly, int lz, int ry, int rz, ll c){
    const int y_before = ly - 1;
    const int z_before = lz - 1;
    X(y_before, z_before, c);
    X(y_before, rz, -c);
    X(ry, z_before, -c);
    X(ry, rz, c);
}

// Emits the four signed corner 'Y' operations (inclusion-exclusion style)
// for the rectangle [lz, rz] x [lx, rx] with coefficient c.
void pY(int lz, int lx, int rz, int rx, ll c){
    const int z_before = lz - 1;
    const int x_before = lx - 1;
    Y(z_before, x_before, c);
    Y(z_before, rx, -c);
    Y(rz, x_before, -c);
    Y(rz, rx, c);
}

// Emits the four signed corner 'Z' operations (inclusion-exclusion style)
// for the rectangle [lx, rx] x [ly, ry] with coefficient c.
void pZ(int lx, int ly, int rx, int ry, ll c){
    const int x_before = lx - 1;
    const int y_before = ly - 1;
    Z(x_before, y_before, c);
    Z(x_before, ry, -c);
    Z(rx, y_before, -c);
    Z(rx, ry, c);
}

// Appends to `ops` the operations for the query point (qx, qy, qz) with
// coefficient c.
//  - qx + qy + qz == n: a single-cell pX.
//  - otherwise: let size be the distance of the coordinate sum from n; emit
//    pX/pY/pZ over ranges of extent size / 2 towards n, then (unless
//    size == 1) recurse on the point moved by size / 2 with coefficient -2c.
void solve(int n, int qx, int qy, int qz, ll c){
    const int total = qx + qy + qz;
    if(total == n){
        pX(qy, qz, qy, qz, c);
        return;
    }
    if(total > n){
        const int size = total - n;
        const int half = size / 2;
        pX(qy - half, qz - half, qy, qz, c);
        pY(qz - half, qx - half, qz, qx, c);
        pZ(qx - half, qy - half, qx, qy, c);
        if(size != 1){
            solve(n, qx - half, qy - half, qz - half, -2 * c);
        }
        return;
    }
    const int size = n - total;
    const int half = size / 2;
    pX(qy, qz, qy + half, qz + half, c);
    pY(qz, qx, qz + half, qx + half, c);
    pZ(qx, qy, qx + half, qy + half, c);
    if(size != 1){
        solve(n, qx + half, qy + half, qz + half, -2 * c);
    }
}

int main()
{
    int n, qx, qy, qz;
    cin >> n >> qx >> qy >> qz;
    solve(n, qx, qy, qz, 1);
    cout << ops.size() << endl;
    for(int i = 0; i < ops.size(); i++){
        cout << ops[i].type << " " << ops[i].a << " " << ops[i].b << " " << ops[i].c << endl;
    }
    return 0;
}

Advanced K: Bocchi The Tour

Hint 1

Hint 2

Solution

Code

#include <algorithm>
#include <iostream>
#include <vector>
using namespace std;

const int MAXN = 2e5 + 5;
const int LOG = 19;
const int INF = 1e9 + 7;

int n, q, k;
int a[MAXN], b[MAXN], w[MAXN];
int ord[MAXN];
int par[MAXN];
int up[MAXN][LOG];
int timer = 1;
int tin[MAXN], tout[MAXN];
vector<int> adj[MAXN];

struct Query {
    int l, r, d;
};

Query queries[MAXN];

// Orders edge indices by ascending edge weight w[].
bool comp(int a, int b) {
    return w[b] > w[a];
}

// Segment-tree node: minimum value in the range, how many positions attain
// that minimum, and a pending additive update for the children.
// A default-constructed node is the identity for merge(): mn = INF, cnt = 0.
struct Node {
    int cnt, mn, lazy;
    // Initializers are listed in declaration order (the order they run in).
    Node() : cnt{0}, mn{INF}, lazy{0} {}
};

Node tree[4 * MAXN];

// Combines two child summaries: the smaller minimum wins, and the counts of
// every side attaining that minimum are added. The result has lazy == 0.
Node merge(Node a, Node b) {
    Node combined;
    combined.mn = min(a.mn, b.mn);
    const int from_a = (a.mn == combined.mn) ? a.cnt : 0;
    const int from_b = (b.mn == combined.mn) ? b.cnt : 0;
    combined.cnt += from_a;
    combined.cnt += from_b;
    return combined;
}

// Pushes the pending addition of node u down to both children and clears it.
void push(int u) {
    const int pending = tree[u].lazy;
    for(int child = 2 * u; child <= 2 * u + 1; ++child) {
        tree[child].lazy += pending;
        tree[child].mn += pending;
    }
    tree[u].lazy = 0;
}

// Returns the (min, count-of-min) summary of positions [ql, qr] within the
// subtree of node u, which covers [l, r]. Disjoint ranges yield the identity
// node.
Node query(int u, int l, int r, int ql, int qr) {
    const bool disjoint = (qr < l) || (r < ql);
    if(disjoint) return Node();
    const bool covered = (ql <= l) && (r <= qr);
    if(covered) return tree[u];
    push(u);
    const int mid = (l + r) / 2;
    const Node left_part = query(2 * u, l, mid, ql, qr);
    const Node right_part = query(2 * u + 1, mid + 1, r, ql, qr);
    return merge(left_part, right_part);
}

// Adds x to every position in [ql, qr] within the subtree of node u, which
// covers [l, r]. Fully covered nodes are updated lazily.
void update(int u, int l, int r, int ql, int qr, int x) {
    if(qr < l || r < ql) return;
    if(l >= ql && r <= qr) {
        tree[u].mn += x;
        tree[u].lazy += x;
        return;
    }
    push(u);
    const int mid = (l + r) / 2;
    const int left = 2 * u;
    const int right = left + 1;
    update(left, l, mid, ql, qr, x);
    update(right, mid + 1, r, ql, qr, x);
    tree[u] = merge(tree[left], tree[right]);
}

// Initializes the subtree of node u over [l, r]: every leaf starts with
// value 0 and count 1, and inner nodes are merged bottom-up.
void build(int u, int l, int r) {
    if(l == r) {
        tree[u].cnt = 1;
        tree[u].mn = 0;
        return;
    }
    const int mid = (l + r) / 2;
    const int left = 2 * u;
    const int right = left + 1;
    build(left, l, mid);
    build(right, mid + 1, r);
    tree[u] = merge(tree[left], tree[right]);
}

// DFS over adj that numbers only the leaves: a leaf consumes one timer value,
// and [tin[u], tout[u]] becomes the range of leaf numbers under u.
void euler(int u) {
    tin[u] = timer;
    if(adj[u].empty()) ++timer;
    for(int child : adj[u]) euler(child);
    tout[u] = timer - 1;
}

// Disjoint-set lookup with full path compression: returns the representative
// of u and points every node on the walked path directly at it.
int find(int u) {
    int root = u;
    while(par[root] != root) root = par[root];
    // Second pass: re-point every node on the path at the representative.
    while(par[u] != root) {
        const int next = par[u];
        par[u] = root;
        u = next;
    }
    return root;
}

// Builds a Kruskal reconstruction tree over the n - 1 weighted edges (edges
// sorted by weight; edge e becomes node e + n and the parent of the two
// components it joins). Then q queries (d, u, s) are answered online with a
// segment tree over the leaves.
//
// Per query: u is lifted to its highest ancestor whose edge weight is <= s,
// which gives a contiguous leaf range. Earlier queries with d_old + k <= d
// are expired (their +1 is undone). The answer is the number of leaves in
// the range whose value is 0, and the range is then incremented.
//
// Changes from the original: the expiry loop is bounded by the current query
// index (it used to start at the unused slot queries[0] and had no upper
// bound, so it ran away for k <= 0), and answers are written with '\n'
// instead of endl to avoid one flush per query.
// NOTE(review): node ids reach 2n - 1 while the arrays hold MAXN entries;
// presumably the constraints keep 2n within MAXN -- confirm.
int main() {
    cin.tie(0)->sync_with_stdio(false);
    cin >> n >> q >> k;

    for(int i = 0; i < MAXN; ++i) par[i] = i;

    for(int i = 1; i < n; ++i) {
        cin >> a[i] >> b[i] >> w[i];
        ord[i] = i;
    }

    sort(ord + 1, ord + n, comp);

    for(int i = 1; i < n; ++i) {
        int u = find(a[ord[i]]), v = find(b[ord[i]]);
        par[u] = par[v] = up[u][0] = up[v][0] = ord[i] + n;
    }

    // Nodes without a recorded parent (including the root) land in adj[0],
    // which is never traversed.
    for(int i = 1; i <= 2 * n; ++i) adj[up[i][0]].push_back(i);

    int krtroot = ord[n - 1] + n;
    up[krtroot][0] = krtroot;
    euler(krtroot);

    for(int j = 0; j < LOG - 1; ++j) {
        for(int i = 1; i < 2 * n; ++i) {
            up[i][j + 1] = up[up[i][j]][j];
        }
    }

    build(1, 1, n);

    int idx = 1;  // oldest query whose increment is still applied
    for(int i = 1; i <= q; ++i) {
        int d, u, s; cin >> d >> u >> s;

        for(int j = LOG - 1; j >= 0; --j) {
            if(w[up[u][j] - n] <= s) u = up[u][j];
        }

        queries[i] = {tin[u], tout[u], d};
        while(idx < i && queries[idx].d + k <= d) {
            update(1, 1, n, queries[idx].l, queries[idx].r, -1);
            ++idx;
        }

        Node ret = query(1, 1, n, queries[i].l, queries[i].r);
        if(ret.mn != 0) cout << 0 << '\n';
        else cout << ret.cnt << '\n';
        update(1, 1, n, queries[i].l, queries[i].r, 1);
    }
}

Advanced L: Can you Count?

Hint 1

Hint 2

Solution

By algebra,

$$$ \displaystyle\sum^{\infty}_{k=0} S_{n,m,k}\cdot\frac{x^k}{k!} =\displaystyle\sum^{\infty}_{k=0} \left(\displaystyle\sum_{1\le a_i\le m}\left(\displaystyle\sum^{n}_{i=1}a_i\right)^k\right)\cdot\frac{x^k}{k!} =\displaystyle\sum_{1\le a_i\le m}\displaystyle\sum^{\infty}_{k=0}\left(\displaystyle\sum^{n}_{i=1}a_i\right)^k\cdot\frac{x^k}{k!} $$$ $$$ =\displaystyle\sum_{1\le a_i\le m}\displaystyle\sum^{\infty}_{k=0}\left(\displaystyle\sum^{n}_{i=1}a_i x\right)^k\cdot\frac{1}{k!} =\displaystyle\sum_{1\le a_i\le m}e^{\sum^{n}_{i=1}a_i x} =\displaystyle\sum_{1\le a_i\le m}\prod^{n}_{i=1}e^{a_i x} =\prod^{n}_{i=1}\displaystyle\sum_{1\le a_i\le m}e^{a_i x} =\prod^{n}_{i=1}\left(\frac{1-e^{mx}}{e^{-x}-1}\right) =\left(\frac{1-e^{mx}}{e^{-x}-1}\right)^n. $$$

For a fixed sum $$$s$$$, the number of arrays $$$b$$$ of length $$$k$$$ such that $$$\max^k_{j=1} b_j = s$$$ is precisely the number of arrays $$$b$$$ with each element at most $$$s$$$ minus the number of arrays $$$b$$$ with each element at most $$$s-1$$$, which is equal to $$$s^k-(s-1)^k=s^k-\displaystyle\sum^{k}_{j=0} (-1)^{k-j}\binom{k}{j}s^j$$$. Hence, the total number of pairs $$$(a,b)$$$, which we denote as $$$p_{n,m,k}$$$, is given by

$$$ \displaystyle\sum_{1\le a_i\le m}\left(\left(\displaystyle\sum^{n}_{i=1}a_i\right)^k-\displaystyle\sum^{k}_{j=0} (-1)^{k-j}\binom{k}{j}\left(\displaystyle\sum^{n}_{i=1}a_i\right)^j\right) =\displaystyle\sum_{1\le a_i\le m}\left(\displaystyle\sum^{n}_{i=1}a_i\right)^k-\displaystyle\sum^{k}_{j=0} (-1)^{k-j}\binom{k}{j}\displaystyle\sum_{1\le a_i\le m}\left(\displaystyle\sum^{n}_{i=1}a_i\right)^j $$$ $$$ =S_{n,m,k}-\displaystyle \sum^{k}_{j=0} (-1)^{k-j}\binom{k}{j}S_{n,m,j} $$$

as mentioned in Hint $$$2$$$.

Let $$$P(x)=\displaystyle\sum^{\infty}_{k=0} p_{n,m,k}x^k$$$ and $$$Q(x)=\displaystyle\sum^{\infty}_{k=0} S_{n,m,k}x^{k\color{red}{+1}}$$$. We find

$$$ P(x)=\displaystyle\sum^{\infty}_{k=0} p_{n,m,k}x^k =\displaystyle\sum^{\infty}_{k=0} \left(S_{n,m,k}-\displaystyle \sum^{k}_{j=0} (-1)^{k-j}\binom{k}{j}S_{n,m,j}\right)x^k =\displaystyle\sum^{\infty}_{k=0} S_{n,m,k}x^k-\displaystyle\sum^{\infty}_{k=0} \displaystyle \sum^{\infty}_{j=0} (-1)^{k-j}\binom{k}{j}S_{n,m,j}x^k $$$ $$$ =\displaystyle\sum^{\infty}_{k=0} S_{n,m,k}x^k - \displaystyle\sum^{\infty}_{j=0} S_{n,m,j} \left(\displaystyle\sum^{\infty}_{k=0} (-1)^{k-j}\binom{k}{j}x^k\right) =\frac{1}{x} \displaystyle\sum^{\infty}_{k=0} S_{n,m,k}x^{k+1} - \frac{1}{x} \displaystyle\sum^{\infty}_{j=0} S_{n,m,j} \left(\frac{x}{1+x}\right)^{j+1} $$$ $$$ =\dfrac{1}{x} \left(Q(x)-Q\left(\dfrac{x}{1+x}\right)\right). $$$

Let $$$K$$$ be the maximum $$$k_i$$$ queried. We need the values of $$$S_{n,m,0},S_{n,m,1},...,S_{n,m,K}$$$. Hence, we need to extract the coefficients up to $$$x^K$$$ term in

$$$\displaystyle\sum^{\infty}_{k=0} S_{n,m,k}\cdot\frac{x^k}{k!}=\left(\frac{1-e^{mx}}{e^{-x}-1}\right)^n$$$

Division up till $$$x^K$$$ term can be done in $$$O(K\log K)$$$. Taking $$$S(x)=\frac{1-e^{mx}}{e^{-x}-1}$$$ to the $$$n$$$-th power is equivalent to computing $$$e^{n\ln S(x)}$$$. Since exponentiation and logarithms up till $$$x^K$$$ term can also be done in $$$O(K\log K)$$$, all of $$$S_{n,m,0},S_{n,m,1},...,S_{n,m,K}$$$ can be extracted in $$$O(K\log K)$$$. We substitute those values in to find $$$Q(x)$$$ up till $$$x^{K+1}$$$ term. Terms of $$$Q\left(\frac{x}{1+x}\right)=Q\left(1-\frac{1}{1+x}\right)$$$ up till $$$x^{K+1}$$$ can also be obtained in $$$O(K\log K)$$$ time from $$$Q(x)$$$ by doing the compositions $$$Q(x)\circ (1+x)\circ x^{-1}\circ (-x)\circ (1+x)$$$. Hence, terms of $$$P(x)$$$ up till $$$x^K$$$ can be obtained in $$$O(K\log K)$$$ time, and for each query on $$$k_i$$$ just return the coefficient of $$$x^{k_i}$$$ in $$$P(x)$$$.

Time complexity: $$$O(q+K \log K)$$$ where $$$K$$$ is the maximum $$$k_i$$$ queried.

Partial scores:

$$$q=1$$$ and $$$k_i\le 2\cdot 10^4$$$: See below.

$$$q=1$$$: Allows computing $$$p_{n,m,k}=S_{n,m,k}-\displaystyle \sum^{k}_{j=0} (-1)^{k-j}\binom{k}{j}S_{n,m,j}$$$ naively after obtaining the values of $$$S_{n,m,0},S_{n,m,1},...,S_{n,m,k}$$$. Time complexity is $$$O(K \log K)$$$.

$$$k_i\le 2\cdot 10^4$$$: Allows binary lifting to take the $$$n$$$-th power. Time complexity is $$$O(q+K \log K\log n)$$$.

Useful materials

Code

#include<bits/stdc++.h>
using namespace std;
#define int long long
const int MOD=998244353;
const int lim=200010; // *
int fact[lim+1],ifact[lim+1],inve[lim+1]; // *
vector <int> root={31},iroot; // #

// * denotes factorial related functions
// # denotes ntt related functions
// $ denotes more gen func stuff
// delete if not needed

// Reduces a into the canonical range [0, MOD).
int mod(int a){
    a%=MOD;
    if(a<0) a+=MOD;
    return a;
} // use when stuff might get negative

// Returns a^k mod MOD by binary exponentiation (k is consumed bit by bit).
int bigmod(int a,int k){
    int result=1;
    for(int base=a;k;k>>=1){
        if(k&1) result=result*base%MOD;
        base=base*base%MOD;
    }
    return result;
}

// Fills fact[i] = i!, ifact[i] = (i!)^-1 and inve[i] = i^-1 (all mod MOD)
// for 0 <= i <= lim; inve[0] is set to 0.
void init_fact(){
    fact[0]=1;
    for(int i=0;i<lim;i++){
        fact[i+1]=fact[i]*(i+1)%MOD;
    }
    // One modular inverse at the top, then walk down: (i-1)!^-1 = i!^-1 * i.
    ifact[lim]=bigmod(fact[lim],MOD-2);
    for(int i=lim-1;i>=0;i--){
        ifact[i]=ifact[i+1]*(i+1)%MOD;
    }
    inve[0]=0;
    for(int i=1;i<=lim;i++){
        inve[i]=ifact[i]*fact[i-1]%MOD;
    }
} // *

// Binomial coefficient C(n, r) mod MOD; 0 for arguments outside 0 <= r <= n.
// n must not exceed lim (the size of the factorial tables).
int nCr(int n,int r){
    const bool valid=(n>=0&&r>=0&&r<=n);
    if(!valid) return 0;
    int res=fact[n]*ifact[r]%MOD;
    return res*ifact[n-r]%MOD;
} // *

// Modular inverse of C(n, r); 0 for arguments outside 0 <= r <= n.
// n must not exceed lim (the size of the factorial tables).
int inCr(int n,int r){
    const bool valid=(n>=0&&r>=0&&r<=n);
    if(!valid) return 0;
    int res=ifact[n]*fact[r]%MOD;
    return res*fact[n-r]%MOD;
} // *

// Extends `root` by repeated squaring until it reaches 1, and builds `iroot`
// with the matching inverses: root[p + 1] = root[p]^2, iroot[p] = root[p]^-1.
void init_ntt(){
    iroot.push_back(bigmod(root[0],MOD-2));
    for(int ptr=0;root[ptr]!=1;ptr++){
        const int r=root[ptr];
        const int ir=iroot[ptr];
        root.push_back(r*r%MOD);
        iroot.push_back(ir*ir%MOD);
    }
} // #

// In-place number-theoretic transform of f, whose size must be a power of
// two. With inv == false the twiddles come from iroot; with inv == true they
// come from root and the result is scaled by n^-1, so ntt(f,0) followed by
// ntt(f,1) restores f.
//
// Changes from the original: sums are reduced with >= MOD (a result equal to
// MOD used to stay unreduced), the twiddle table is a heap vector instead of
// a stack variable-length array, and the XOR-swap chain is std::swap.
void ntt(vector <int> &f,bool inv){
    int n=f.size();
    // Bit-reversal permutation. ptr is decremented once per doubling of s so
    // that it ends up selecting the root matching the transform size.
    int i=1,j=0,ptr=root.size()-1,s=1;
    while(i<n){
        if(i==s){
            s<<=1;
            ptr--;
        }
        int bit=(n>>1);
        while(j&bit){
            j^=bit;
            bit>>=1;
        }
        j^=bit;
        if(i<j) swap(f[i],f[j]);
        i++;
    }
    int mult=inv?root[ptr]:iroot[ptr];
    // poww[t] = mult^t; stage twiddles are read from it with stride jmp.
    vector <int> poww(n,1);
    for(int k=1;k<n;k++) poww[k]=poww[k-1]*mult%MOD;
    int k=1,jmp=n>>1;
    for(int K=2;K<=n;K<<=1){
        for(int L=0;L<n;L+=K){
            int idx=0;
            // L is a multiple of K = 2k, so L^k == L + k and l^k == l + k.
            for(int l=L;l<(L^k);l++){
                int u=f[l],v=f[l^k]*poww[idx]%MOD;
                f[l]=u+v; if(f[l]>=MOD) f[l]-=MOD;
                f[l^k]=u-v; if(f[l^k]<0) f[l^k]+=MOD;
                idx+=jmp;
            }
        }
        k=K; jmp>>=1;
    }
    if(inv){
        int in=bigmod(n,MOD-2);
        for(int k=0;k<n;k++) f[k]=in*f[k]%MOD;
    }
}

// Polynomial product f * g mod MOD via NTT; the result has
// f.size() + g.size() - 1 coefficients.
vector <int> conv(vector<int> f,vector<int> g){
    const int out_len=f.size()+g.size()-1;
    int n=1;
    while(n<out_len) n*=2;
    f.resize(n,0);
    g.resize(n,0);
    ntt(f,0);
    ntt(g,0);
    for(int i=0;i<n;i++){
        f[i]=f[i]*g[i]%MOD;
    }
    ntt(f,1);
    return vector <int>(f.begin(),f.begin()+out_len);
} // #

// Coefficient-wise sum of two polynomials mod MOD; the shorter one is
// zero-padded. Inputs are expected to be reduced to [0, MOD).
// The reduction uses >= MOD so that a sum equal to MOD becomes 0 (the
// original `> MOD` left that value unreduced).
vector <int> add(vector<int> f,vector<int> g){
    int k=max(f.size(),g.size());
    f.resize(k,0);
    g.resize(k,0);
    for(int i=0;i<k;i++){
        f[i]+=g[i];
        if(f[i]>=MOD) f[i]-=MOD;
    }
    return f;
} // $

// Coefficient-wise negation mod MOD (zero stays zero).
vector <int> neg(vector<int> f){
    for(int &coef:f){
        if(coef) coef=MOD-coef;
    }
    return f;
} // $

// Power-series inverse of f modulo x^(f.size()), by Newton iteration:
// ret <- ret * (2 - f * ret), doubling the precision each round.
// f must be non-empty with an invertible constant term.
// The constant-term fix-up reduces with >= MOD (the original `> MOD` left
// the value MOD unreduced).
vector <int> inverse(vector<int> f){
    vector<int> ret={bigmod(f[0],MOD-2)};
    int k=f.size();
    f=neg(f); // f now holds -f, so conv(f, ret) + 2 is 2 - f*ret
    while(ret.size()<k){
        int d=ret.size()*2;
        if(k<d) f.resize(d);
        vector <int> temp=conv({f.begin(),f.begin()+d},ret);
        temp[0]+=2;
        if(temp[0]>=MOD) temp[0]-=MOD;
        ret=conv({temp.begin(),temp.begin()+d},ret);
        ret={ret.begin(),ret.begin()+d};
    }
    return {ret.begin(),ret.begin()+k};
} // $

// Power-series quotient f / g, truncated to max(f.size(), g.size()) terms.
vector <int> divide(vector<int> f,vector<int> g){
    const int len=max(f.size(),g.size());
    f.resize(len,0);
    g.resize(len,0);
    const vector <int> product=conv(f,inverse(g));
    return vector <int>(product.begin(),product.begin()+len);
} // $

// Formal derivative of f mod MOD; a constant polynomial yields {0}.
vector <int> derivative(vector<int> f){
    const int len=f.size();
    if(len==1) return {0};
    vector <int> ret(len-1);
    for(int i=0;i+1<len;i++){
        ret[i]=f[i+1]*(i+1)%MOD;
    }
    return ret;
} // $

// Formal antiderivative of f with constant term 0; the result has
// f.size() + 1 coefficients: ret[i] = f[i-1] / i.
//
// Changes from the original:
//  - the loop now runs to i == k, so the highest coefficient is filled in
//    (it used to stay 0);
//  - inve[] only covers indices up to lim, but expo() calls ln() on series
//    longer than that; larger indices now get their inverse from bigmod
//    instead of reading past the end of the table.
vector <int> integrate(vector<int> f){
    int k=f.size();
    vector <int> ret(k+1); ret[0]=0;
    for(int i=1;i<=k;i++){
        int inv_i=(i<=lim)?inve[i]:bigmod(i,MOD-2);
        ret[i]=f[i-1]*inv_i%MOD;
    }
    return ret;
} // $

// Integral of f'/f with constant term 0, truncated to f.size() terms; this
// is the power-series logarithm of f when f has constant term 1.
vector <int> ln(vector<int> f){
    const int len=f.size();
    const vector <int> quotient=divide(derivative(f),f);
    const vector <int> ret=integrate(quotient);
    return vector <int>(ret.begin(),ret.begin()+len);
} // $

// Power-series exponential of f modulo x^(f.size()), by Newton iteration:
// ret <- ret * (1 + f - ln(ret)), doubling the precision each round.
// Starts from ret = {1}, so f is expected to have constant term 0.
// The constant-term fix-up reduces with >= MOD (the original `> MOD` left
// the value MOD unreduced).
vector <int> expo(vector<int> f){
    vector<int> ret={1};
    int k=f.size();
    while(ret.size()<k){
        int d=ret.size()*2;
        if(k<d) f.resize(d);
        vector <int> temp(f.begin(),f.begin()+d);
        ret.resize(d,0);
        temp=add(temp,neg(ln(ret)));
        temp[0]+=1;
        if(temp[0]>=MOD) temp[0]-=MOD;
        ret=conv(temp,ret);
        ret={ret.begin(),ret.begin()+d};
    }
    return {ret.begin(),ret.begin()+k};
} // $

// Taylor shift: returns the coefficients of f(x + a), same length as f.
// f[i] * i! is convolved with the reversed sequence a^i / i!, and the upper
// half of the product is divided by i!. f.size() - 1 must not exceed lim.
vector <int> ead(vector <int> f,int a){
    const int n=f.size()-1;
    vector <int> g(n+1);
    int powa=1;
    for(int i=0;i<=n;i++){
        f[i]=f[i]*fact[i]%MOD;
        g[n-i]=powa*ifact[i]%MOD;
        powa=powa*a%MOD;
    }
    g=conv(f,g);
    for(int i=0;i<=n;i++){
        g[n+i]=g[n+i]*ifact[i]%MOD;
    }
    return vector <int>(g.begin()+n,g.end());
} // $

// Reads n, m, q, precomputes the answers for every exponent below k = 200010
// and then answers the q queries by table lookup.
//
// Changes from the original: two stray `cout << '\n';*/` lines (leftovers of
// commented-out debug output whose opening `/*` was lost) were removed, since
// they made the program uncompilable; the dead store `neg=0` was dropped and
// the sign flag renamed so it no longer shadows the function neg().
void solve(){
    int n,m,q,k=200010;
    cin >> n >> m >> q;
    // f = (1 - e^{mx}) / x and g = (e^{-x} - 1) / x as truncated series.
    vector <int> f(k),g(k);
    int powm=1;
    bool odd_term=0;
    for(int i=0;i<k;i++){
        powm=powm*m%MOD; odd_term=!odd_term;
        f[i]=MOD-powm*ifact[i+1]%MOD;
        g[i]=(odd_term)?(MOD-ifact[i+1]):ifact[i+1];
    }
    // n-th power of f/g via exp(n * ln(.)). ln() drops the constant term m of
    // the quotient, so the missing factor m^n is multiplied back afterwards.
    f=divide(f,g);
    f=ln(f);
    for(int i=0;i<k;i++){
        f[i]=f[i]*n%MOD;
    }
    f=expo(f);
    int mult=bigmod(m,n);
    for(int i=0;i<k;i++){
        f[i]=f[i]*mult%MOD;
    }
    // Undo the 1/i! of the exponential generating function and shift by one
    // position, so f holds the coefficients of the editorial's Q(x).
    f.resize(k+1);
    for(int i=k;i>0;i--){
        f[i]=f[i-1]*fact[i-1]%MOD;
    }
    f[0]=0;
    // Presumably the composition chain from the editorial that turns Q(x)
    // into Q(x / (1 + x)): shift by 1, substitute -x, reverse, shift by 1,
    // then multiply by a binomial-type series.
    vector <int> P=ead(f,1),Q(k+1);
    for(int i=1;i<=k;i+=2){
        if(P[i]>0) P[i]=MOD-P[i];
    }
    reverse(P.begin(),P.end());
    P=ead(P,1);
    int curc=1;
    for(int i=0;i<=k;i++){
        if(i){
            curc=MOD-curc*(k+i-1)%MOD;
        }
        Q[i]=curc;
    }
    curc=ifact[k];
    for(int i=k;i>=0;i--){
        Q[i]=Q[i]*curc%MOD;
        curc=curc*i%MOD;
    }
    P=conv(P,Q);
    // Answer for exponent i is the difference of the two series at index
    // i + 1 (the 1/x factor in the editorial's formula for P(x)).
    for(int i=0;i<k;i++){
        f[i]=f[i+1]-P[i+1];
        if(f[i]<0) f[i]+=MOD;
    }
    for(int i=0;i<q;i++){
        int K; cin >> K;
        cout << f[K] << ' ';
    }
}

// Entry point: sets up fast I/O and the lookup tables, then runs the single
// test case.
int32_t main(){
    ios_base::sync_with_stdio(0);
    cin.tie(0); cout.tie(0);
    init_fact(); // *
    init_ntt(); // #
    for(int t=1;t>0;t--){
        solve();
    }
}

Rev.	By	When	Δ	Comment
en8	HaccerKat	2025-04-15 02:22:01	206
en7	HaccerKat	2025-04-14 20:11:14	1507
en6	HaccerKat	2025-04-14 18:47:35	0	(published)
en5	HaccerKat	2025-04-14 18:40:42	4792
en4	HaccerKat	2025-04-14 06:46:19	34
en3	HaccerKat	2025-04-14 06:45:08	5484
en2	HaccerKat	2025-04-14 06:28:18	58764
en1	HaccerKat	2025-04-14 05:43:13	16525	Initial revision (saved to drafts)

History