#	User	Rating
1	ecnerwala	3650
2	Benq	3582
3	Geothermal	3570
3	orzdevinwang	3570
5	cnnfls_csy	3569
6	tourist	3565
7	maroonrk	3532
8	Radewoosh	3522
9	Um_nik	3483
10	jiangly	3468

#	User	Contrib.
1	maomao90	174
2	awoo	164
3	adamant	163
4	TheScrasse	159
5	nor	158
6	maroonrk	156
7	-is-this-fft-	151
8	SecondThread	147
9	orz	146
10	pajenegod	145

willy108's blog

Teamscode Spring 2024 Contest Official Editorial

By willy108, history, 2 weeks ago, In English

Sorry for the long wait. These problems were brought to you by Esomer, danx, dutin, jay_jayjay, oursaco, superhelen, thehunterjames, willy108, and yash_9a3b. Also, massive thanks to omeganot for his unofficial editorial (which was posted a lot sooner than ours).

Novice A/Advanced A: It's Time to Submit

Solution

Solution Code

print("NO")

Novice B: A Bit of Monkeying

Hint 1

Hint 2

Solution

Solution Code

#include <iostream>
#include <vector>
#include <map>
using namespace std;
int main(){
    cin.tie(0) -> sync_with_stdio(0);
    int T; cin >> T;
    while(T--){
	int n;
	cin >> n;
	vector<int> arr(n);
	map<int, int> cnt;
    	for(int&x : arr){
    	    cin >> x;
	    cnt[x]++;
	}
    	int or_sum = arr[0], and_sum = arr[0];
    	for(int i = 1; i<n; i++){
    	    or_sum = or_sum|arr[i];
    	    and_sum = and_sum&arr[i];
    	}
	if(cnt[or_sum] == cnt[and_sum]){
	    cout << "sad\n";
    	}else if(cnt[or_sum] > cnt[and_sum]){
	   cout << "or\n";
    	}else{
	   cout << "and\n";
	}	
    }
 
}

Novice C: Alternet Is Cheating

Solution

Solution Code


// {{{1 my template
extern "C" int __lsan_is_turned_off() { return 1; }
#include <bits/stdc++.h>
using namespace std;

#include <tr2/dynamic_bitset>
using namespace tr2;
#include <ext/pb_ds/assoc_container.hpp>

#define ll long long
#define inf 0x3f3f3f3f
#define infl 0x3f3f3f3f3f3f3f3fll

#include <assert.h>
#ifdef DEBUG
#define dprintf(args...) fprintf(stderr,args)
#endif
#ifndef DEBUG
#define dprintf(args...) 69
#endif
#define all(x) (x).begin(), (x).end()
// 1}}}
struct { template<typename T> operator T() { T x; cin>>x; return x; } } in;

int main()
{
        int tt = in;
        for(int ttn=0;ttn<tt;ttn++)
        {
                int n=in;
                vector<char> a(2*n-1);
                for (int i=0;i<n;i++) a[i+n-1] = in;
                // A is alternet
                // R is orz person
                // F is friend
                // P is friend but already chosen
                for(int i=n-2;~i;i--) {
                        int x = a[i*2+1], y = a[i*2+2];

                        char& z = a[i];
                        if (x == 'A')
                                z = y=='R'? 'R' : 'A';
                        else if (y == 'A')
                                z = x=='R'? 'R' : 'A';

                        else if (x == 'F')
                                z = y=='R'? 'P' : 'F';
                        else if (y == 'F')
                                z = x=='R'? 'P' : 'F';

                        else if (x == 'R' || y == 'R')
                                z = 'R';

                        else z = 'P';
                }

                printf("%s\n", a[0] == 'A'? "Yes" : "No");
        }
}

Novice D: Haagandaz is Justice

Hint 1

Solution

Solution code


#include <iostream>

using namespace std;

int answer(long long x){
	long long a = 1, b = 1;
	long long total = 0;
	int turns = 0;
	while(total < x){
		total += a;
		turns++;
		a += b;
		b = a - b;
	}
	return turns;
}

int main(){
	cin.tie(0) -> sync_with_stdio(0);
	int n;
	cin >> n;
	for(int i = 1; i<=n; i++){
		long long a; cin >> a;
		int t = answer(a);
		cerr << t << "\n";
		if(t%2 == 1){
			cout << "T";
		}else{
			cout << "K";
		}
	}
}

Novice E/Advanced B: Richard Lore

Hint 1

Solution

Solution Code


#include <iostream>
#include <utility>
#include <algorithm>
#include <vector>

using namespace std;

int main(){
  cin.tie(0) -> sync_with_stdio(0);
    int n, m, q;
	cin >> n >> m >> q;
	vector<int> p(n);	
	vector<pair<int, int>> arr(m);
	for(int i = 0; i<n; i++){
		cin >> p[i];
	}
	for(int i = 0; i<m; i++){
		int a, b;
		cin >> a >> b;
		a--, b--;
		arr[i] = pair(a, b);
	}
	vector<int> srt(n);
	for(int i = 0; i<n; i++){
		srt[i] = p[i];
	}
	sort(srt.begin(), srt.end());
	reverse(arr.begin(), arr.end());
	for(auto [a, b] : arr){
		swap(srt[a], srt[b]);
	}
	int cnt = 0;
	for(int i = 0; i<n; i++){
		if(srt[i] == p[i]) cnt++;
	}
	string ans;
	for(int i = 0; i<q; i++){
		int a, b;
		cin >> a >> b;
		a--, b--;
		cnt -= (srt[a] == p[a]);
		cnt -= (srt[b] == p[b]);
		swap(p[a], p[b]);
		cnt += (srt[a] == p[a]);
		cnt += (srt[b] == p[b]);
		if(cnt == n) ans.push_back('Y');
		else ans.push_back('N');
	}
	cout << ans << "\n";
  
  return 0;
}

Novice E/Advanced C: Unique Subsequences

Hint 1

Solution

Solution Code

 
#include <iostream>
#include <string>
#include <array>
using namespace std;

int main(){
	cin.tie(0) -> sync_with_stdio(0);
	int T;
	cin >> T;
	while(T--){
		int n, k;
		cin >> n >> k;
		string s;
		cin >> s;
		array<int, 26> occ;
		occ.fill(-1);
		int work = 1;
		for(int i = 0; i<n; i++){
			char c = s[i];
			if(occ[c-'a'] != -1){
				if((i - occ[c-'a']) <= (n - k)){
					work = 0;
				}
			}
			occ[c-'a'] = i;
		}	
		if(work) cout << "Yes\n";
		else cout << "No\n";
	}
}

Novice G/Advanced D: Sleepy Pandas

Hint 1

Hint 2

Solution

Solution Code

def ceil10(x):
    y = 1
    while y <= x:
        y *= 10
    return y

assert ceil10(0) == 1
assert ceil10(9) == 10
assert ceil10(19) == 100
assert ceil10(1e9) == 10000000000

T = int(input())

for _ in range(T):
    N, K = map(int, input().split())
    a = list(map(int, input().split()))

    cnt = 0
    for tp in [10**p for p in range(1, 10)]:  # Similar to 1e10 in C++
        mp = {}
        for i in range(N):
            x = (K - tp % K * a[i] % K) % K  # -a[i]*tp
            mp[x] = mp.get(x, 0) + 1

        for i in range(N):
            if ceil10(a[i]) != tp:
                continue
            x = (K - tp % K * a[i] % K) % K  # -a[i]*tp
            mp[x] -= 1
            cnt += mp.get(a[i] % K, 0)
            mp[x] += 1

    print(str(cnt))

Novice H: Afterimages

Hint 1

Hint 2

Solution

Solution Code

 
#include <iostream>
#include <vector>
#include <set>
#include <utility>
#include <algorithm>
#include <cmath>
#include <iterator>
#define all(x) x.begin(), x.end()

using namespace std;


long long answer(vector<int> A, vector<int> B, int steps){
	//same parity
	int n = A.size();
	multiset<int> ms;
	for(int i = 0; i<steps; i++){
		ms.insert(A[i]);
	}
	long long ret = 0;
	for(int i = 0; i<B.size(); i++){
		auto [mn, mx] = make_pair(*ms.begin(), *prev(ms.end()));
		ret += max(B[i] - mn, mx - B[i]);
		ms.erase(ms.lower_bound(A[i%n]));
		ms.insert(A[steps%n]);
		steps++;
	}
	return ret;
}



void solve(){
	int n; cin >> n;
	long long k; cin >> k;
	k--;
	vector<int> A(n), B(n);
	vector<int> Ao, Ae, Bo, Be; //A odd, A even, etc
	for(int i = 0; i<n; i++){
		cin >> A[i];
		if(i%2 == 0) Ae.push_back(A[i]);
		else Ao.push_back(A[i]);
	}
	for(int i = 0; i<n; i++){
		cin >> B[i];
		if(i%2 == 0) Be.push_back(B[i]);
		else Bo.push_back(B[i]);
	}

	auto ansAo = answer(Bo, Ao, min(k+1, (long long)n/2));
	auto ansAe = answer(Be, Ae, min(k+1, (long long)n/2));
	reverse(all(Ao)); reverse(all(Ae));
	reverse(all(Bo)); reverse(all(Be));
	auto ansBo = answer(Ao, Bo, min(k+1, (long long)n/2));
	auto ansBe = answer(Ae, Be, min(k+1, (long long)n/2));
	cout << ansAo + ansBo + ansAe + ansBe << "\n";
}


int main(){
	cin.tie(0) -> sync_with_stdio(0);
	int T; cin >> T;
	for(int i = 0; i<T; i++){
		solve();
	}
	return 0;
}

Novice I/Advanced F: Another Bitwise Problem

Solution

Solution Code

#include <bits/stdc++.h>
using namespace std;
#define int int64_t
typedef vector<int> vi;
typedef pair<int, int> pi;
typedef vector<pi> vpi;
#define all(x) x.begin(), x.end()
#define pb push_back
#define endl '\n'
#define f first
#define s second
#define FOR(i, a, b) for (int i = (a); i < (b); i++)
template <class T> istream &operator>>(istream& in, vector<T> &v) {for (auto& i : v) in >> i; return in;}

#ifdef HORI
#include "../../lib/debug.h"
#else
#define dbg(...)
#endif

const int M = 18;

signed main() {
  ios::sync_with_stdio(0); cin.tie(0);
  int n, l, r; cin >> n >> l >> r;
  vi a(n); cin >> a;
  vpi s;
  FOR(b, 0, M) {
    int z = 0, o = 0;
    FOR(i, 0, n) {
      if (a[i] & (1 << b)) {
        o++;
      } else {
        z++;
      }
    }
    s.pb({z * (1 << b), o * (1 << b)});
  }
  int ans = 0;
  set<int> st;
  FOR(mask, 0, (1 << M)) {
    int sum = 0;
    FOR(i, 0, M) {
      if ((1 << i) & mask) {
        sum += s[i].f;
      } else {
        sum += s[i].s;
      }
    }
    st.insert(sum);
  }
  for (int sum : st) {
    int nr = r - sum;
    int nl = l - sum;

    if (nr >= 0) {
      ans += nr / ((1 << M) * n) + 1;
    } 
    if (nl > 0) {
      ans -= (nl - 1) / ((1 << M) * n) + 1;
    }
  }
  cout << ans << endl;
}

Novice J: Everyone Loves Threes Magic (Easy Version)

Hint 1

Hint 2

Hint 3

Solution

Solution Code

 
#include <iostream>
using namespace std;
#define ll long long 

const int MX = 1e6+10;
const ll mod = 998244353;

ll pre[MX], prelin[MX], presq[MX];

int f(int x){
	if(x == 0) return 0;
	return (x%10 == 3) + f(x/10);
}

//(r - i + 1)(i - l + 1)f(i)
//(r+1)(-l+1)sum[i] + (-(-l+1) + r+1)*i*sum[i] + -i^2*sum[i]

void solve(){
	int l, r;
	cin >> l >> r;
	ll a = 1ll*(r+1)*(1+mod-l)%mod*(pre[r] + mod - pre[l-1])%mod;
	ll b = 1ll*(mod + -(-l + 1) + r + 1)*(prelin[r] + mod - prelin[l-1])%mod;
	ll c = 1ll*(mod -1)*(presq[r] + mod - presq[l-1])%mod;
	cout << (a + b + c)%mod << "\n";
}

int main(){
	cin.tie(0) -> sync_with_stdio(0);
	for(int i = 1; i<=(int)(1e6); i++){
		if(i%3 == 0){
			int F = f(i);
			pre[i] = F;
			prelin[i] = F*i;
			presq[i] = 1ll*F*i*i%mod;
		}
		pre[i] += pre[i-1];
		prelin[i] += prelin[i-1];
		presq[i] += presq[i-1];
		if(prelin[i] >= mod) prelin[i] %= mod;
		if(presq[i] >= mod) presq[i] %= mod;
	}
	int T; cin >> T;
	while(T--){
		solve();
	}
	return 0;
}

Novice K/Advanced E: Another Ordering Problem

Hint 1

Hint 2

Hint 3

Solution

Solution Code

The code may look long but the transitions are almost all the same.


#include <iostream>
#include <cmath>
#include <utility>
#include <cassert>
#include <algorithm>
#include <vector>
#include <array>


#define sz(x) ((int)(x.size()))
#define all(x) x.begin(), x.end()
#define pb push_back

using ll = long long;
const int MX = 2e5 +10, int_max = 0x3f3f3f3f;

using namespace std;

int par[MX];

ll dp[MX][2][2]; //took/not took | took good node/took bad node

vector<int> adj[MX];

int cost[MX], vis[MX], dsu[MX];
int n;

int find(int u){
	if(dsu[u] != u) dsu[u] = find(dsu[u]);
	return dsu[u];
}

void gpar(int u, int p){ //generate the parents
	par[u] = p;
	for(int v : adj[u]){
		if(v == p) continue;
		gpar(v, u);
	}
}

void gvis(int u){ //mark all the ancestors of a node
	if(u == 0) return ;
	vis[u] = 1;
	gvis(par[u]);
}	

void dfs(int u, int p, int bad){
	for(int v : adj[u]){
		if(v == p) continue;
		dfs(v, u, bad);
	}
	if(vis[u] == 0){
		ll sum0 = 0, sum1 = 0;
		for(int v : adj[u]){
			if(v == p) continue;
			sum0 += max(dp[v][0][0], dp[v][1][0]);
			sum1 += dp[v][0][0];
		}
		dp[u][0][0] = sum0;
		dp[u][1][0] = sum1 + cost[u];
	}else if(u == bad){
		ll sum0 = 0, sum1 = 0;
		for(int v : adj[u]){
			if(v == p) continue;
			sum0 += max(dp[v][0][0], dp[v][1][0]);
			sum1 += dp[v][0][0];
		}
		dp[u][0][0] = sum0;
		dp[u][1][1] = sum1 + cost[u];	
	}else{
		for(int j = 0; j<2; j++){
			ll sum0 = 0, sum1 = 0;
			for(int v : adj[u]){
				if(v == p) continue;
				if(vis[v]){
					sum0 += max(dp[v][0][j], dp[v][1][j]);
					sum1 += dp[v][0][j];
				}else{
					sum0 += max(dp[v][0][0], dp[v][1][0]);
					sum1 += dp[v][0][0];
				}
			}
			dp[u][0][j] = sum0;
			dp[u][1][j] = sum1 + cost[u];
		}
	}
}

ll go(pair<int, int> bad){
	auto [u, v] = bad;
	if(u == v) return 0;
	gpar(u, 0);
	gvis(v);
	dfs(u, 0, v);
	return max({dp[u][0][0], dp[u][0][1], dp[u][1][0]});
}

int main(){
	cin >> n;
	for(int i = 1; i<=n; i++) dsu[i] = i;
	vector<pair<int, int>> bad;
	for(int i =1; i<=n; i++){
		cin >> cost[i];
		int j;
		cin >> j;
		if(find(i) == find(j)){
			bad.push_back({i, j});
		}else{
			dsu[find(i)] = find(j);
			adj[i].pb(j);
			adj[j].pb(i);
		}
	}
	ll ans = 0;
	for(auto p : bad){
		ans += go(p);
	}
	cout << ans << "\n";
}

Novice L/Advanced H: Gaslighting

Hint 1

Hint 2

For each $$$l$$$, we can first generate all the intervals of $$$len$$$ for each $$$l'$$$. Then we can do a sweep where we maintain a set of "active" intervals for each $$$len$$$. At $$$len = c+1$$$, we can insert $$$l'$$$ to our active set, then at $$$len = lcp(l + c + 1, l' + c + 1) + 1$$$, we can remove it from our set. For each $$$len$$$, we check if any interval is active, and if so, store its $$$l'$$$ as a valid answer for a query with that $$$l$$$ and $$$len$$$.

vector<int> process(vector<array<int, 3>> arr){ //stores the intervals as [lo, hi, l']
	set<int> pres;
	vector<vector<int>> events(n+2);
	for(auto [a, b, c] : arr){
		events[a].pb(c);
		events[b+1].pb(-c);
	}
	vector<int> ans(n+1, 0);
	for(int i = 0; i<=n; i++){
		for(int x : events[i]){
			if(x < 0) pres.erase(-x);
			else pres.insert(x);
		}
		if(pres.size()) ans[i] = *pres.begin();
		else ans[i] = 0;
	}
	return ans;
}

This gives an $$$O(n^2 \log n + q)$$$ solution as we need a set.

Hint 3

Solution

Solution Code

The contestant yam had such a clean code, I just stole his instead of the model. :thumbs:

#include<bits/stdc++.h>
using namespace std;
using ll = long long;
#define all(x) (x).begin(), (x).end()

const int N = 7007;
int n, q;
string s;
int p[N][N], ans[N][N];

int main() {
    cin.tie(0)->sync_with_stdio(false);

    cin >> n >> q >> s;
    s = " " + s;

    for (int i = n; i >= 1; i--)
        for (int j = n; j >= 1; j--)
            p[i][j] = (s[i] == s[j] ? p[i + 1][j + 1] + 1 : 0);

    for (int i = 1; i <= n; i++) {
        vector<array<int, 2>> pts(n + 1);

        for (int j = 1; j <= n; j++) {
            int l = i + p[i][j], r = j + p[i][j];

            if (max(l, r) > n)
                continue;

            // range: l -> l + p[l + 1][r + 1]
            pts[l] = max(pts[l], {l + p[l + 1][r + 1], j});
        }

        int r = -1;
        for (int j = 1; j <= n; j++) {
            for (int k = max(r + 1, j); k <= pts[j][0]; k++)
                ans[i][k] = pts[j][1];
            r = max(r, pts[j][0]);
        }
    }

    while (q--) {
        int l, r;
        cin >> l >> r;

        if (!ans[l][r])
            cout << 0 << ' ' << 0 << '\n';
        else {
            cout << ans[l][r] << ' ' << ans[l][r] + (r - l) << '\n';
        }
    }

    return 0;
}

Advanced G: Mayoi Tree

Hint 1

Hint 2

Solution

Let $$$P_u(v)$$$ be the probability you go to node $$$v$$$ in $$$1$$$ step if you start at node $$$u$$$.

Let $$$E_u(v)$$$ denote the expected number of steps needed to go from node $$$u$$$ to node $$$v$$$ (note that $$$E_u(v)$$$ is not necessarily equal to $$$E_v(u)$$$).

Let $$$p_u$$$ denote the parent of node $$$u$$$ ($$$p_1$$$ is undefined).

Let $$$c_u$$$ denote the children of node $$$u$$$, or all the nodes adjacent to node $$$u$$$ other than $$$p_u$$$ (if it exists).

Let $$$up_u$$$ denote the expected number of steps needed to go from $$$u$$$ to $$$p_u$$$ (as before, $$$up_1$$$ is undefined). The most important observation is that we can define $$$up_u$$$ as a linear equation consisting of $$$up_u$$$, $$$up_v$$$ for $$$v \in c_u$$$ and $$$P_u(v)$$$ (with $$$up_u$$$ on both sides of the equation).

$$$up_u = P_u(p)(1) + \sum\limits_{v \in c_u} P_u(v)(1 + up_v + up_u)$$$

This is because there is a $$$P_u(p)$$$ chance to "escape" instantly and a $$$P_v(u)$$$ chance to go into the subtree of any $$$v$$$ which is a child of $$$u$$$. Most important, the expected amount of steps it takes is $$$1 + up_v + up_u$$$. You take $$$1$$$ step to go to node $$$v$$$, then you take $$$up_v$$$ steps to get back to node $$$u$$$, and finally, you take $$$up_u$$$ steps to "escape."

Let $$$down_u$$$ denote the expected number of steps needed to go from $$$p_u$$$ to $$$u$$$ (as before, $$$down_1$$$ is undefined). The same trick works for defining $$$down_u$$$.

Let $$$prob(u)$$$ denote the probability you go from node $$$p_u$$$ to node $$$u$$$. In particular, $$$prob(1) = 0$$$.

$$$down_u = P_{p_u}(u)(1) + prob(p_u)(1 + down_{p_u} + down_u) + \sum\limits_{v \in c_{p_u}, v \neq u} P_{p_u}(v)(1 + up_v + down_u)$$$

We can precompute $$$up_u$$$ with a bottom-up dfs and $$$down_u$$$ with a top-down dfs.

Finally, to answer a query of $$$s \ t$$$, let's first find the lca (least common ancestor) $$$l$$$ of $$$s$$$ and $$$t$$$. We then need to sum $$$up_u$$$ on the path from $$$s$$$ to $$$l$$$ (excluding $$$l$$$) and sum $$$down_u$$$ on the path from $$$l$$$ to $$$t$$$ (excluding $$$l$$$).

This can be done with prefix sums and any reasonable lca algorithm like binlifting or HLD. The final complexity is $$$O(n \log mod + n \log n)$$$.

Solution Code



#include <iostream>
#include <cmath>
#include <utility>
#include <cassert>
#include <algorithm>
#include <vector>
#include <array>
#include <functional>

#define sz(x) ((int)(x.size()))
#define all(x) x.begin(), x.end()
#define pb push_back

#ifndef LOCAL
#define cerr while(0) cerr
#endif

using ll = long long;

const ll mod = (1 << (23)) * 119 +1, ll_max = 1e18;
const int MX = 2e5 +10, int_max = 0x3f3f3f3f;

struct {
  template<class T>
  operator T() {
    T x; std::cin >> x; return x;
  }
} in;

using namespace std;



struct hld{
	vector<int> dep, sz, par, head, tin, out, tour;
	vector<vector<int>> adj;
	int n, ind;
	hld(){}
	hld(vector<pair<int, int>> edges, int rt = 1){
		n = sz(edges) + 1;
		ind = 0;
		dep = sz = par = head = tin = out = tour = vector<int>(n+1, 0);
		adj = vector<vector<int>>(n+1);
		for(auto [a, b] : edges){
			adj[a].pb(b);
			adj[b].pb(a);
		}
		dfs(rt, 0);
		head[rt] = rt;
		dfs2(rt, 0);
	}
	void dfs(int x, int p){
		sz[x] = 1;
		dep[x] = dep[p] + 1;
		par[x] = p;
		for(auto &i : adj[x]){
			if(i == p) continue;
			dfs(i, x);
			sz[x] += sz[i];
			if(adj[x][0] == p || sz[i] > sz[adj[x][0]]) swap(adj[x][0], i);
		}
	}
	void dfs2(int x, int p){
		tour[ind] = x;
		tin[x] = ind++;
		for(auto &i : adj[x]){
			if(i == p) continue;
			head[i] = (i == adj[x][0] ? head[x] : i);
			dfs2(i, x);
		}
		out[x] = ind;
	}
	
	int k_up(int u, int k){
		if(dep[u] <= k) return -1;
		while(k > dep[u] - dep[head[u]]){
			k -= dep[u] - dep[head[u]] + 1;
			u = par[head[u]];
		}
		return tour[tin[u] - k];
	}

	int lca(int a, int b){
		while(head[a] != head[b]){
			if(dep[head[a]] > dep[head[b]]) swap(a, b);
			b = par[head[b]];
		}
		if(dep[a] > dep[b]) swap(a, b);
		return a;
	}
} tr;

ll sum[MX], inv[MX], weight[MX]; //1/sum[u], weight to escape
vector<pair<int, ll>> adj[MX]; //node v and weight from u -> v
int par[MX], dep[MX];

ll up[MX], down[MX];
ll pup[MX], pdown[MX];

int n, q;

ll binpow(ll a, ll b = mod-2){
	if(a == 0 && b == mod-2){
		cout << "-1\n";
		exit(1);
	}
	ll ans = 1;
	for(int i = 1; i<=b; i*=2){
		if(i&b) (ans *= a) %= mod;
		(a *= a) %= mod;
	}
	return ans;
}

void dfs(int u, int p){
	par[u] = p;
	dep[u] = dep[p]+1;
	sum[u] = 0;
	for(auto [v, w] : adj[u]){
		sum[u] += w;
		if(v == p){
			weight[u] = w;
		}else{
			dfs(v, u);
		}
	}
	inv[u] = binpow(sum[u]);
}
//up[u] denotes the EV to start at node u and escape to the parent
//up[1] is undefined

//up[u] = sum(prob(of going to v)(up[v] + up[u] + 1)) + (prob of escaping now)
//up[u](1 + sum of probs) = sum of prob * (up[v] + 1) + prob of escaping now

//down[u] denotes the EV to start at the parent of node u and escape to node u
//down[1] is undefined
//down[u] = (prob of going up)(down[par[u]] (or 0 if u is the root) + down[u] + 1) + (prob of going to v when v != u)(up[v] + down[u] + 1) + (prob of going to u)
//(1 - prob of going up -prob of going to v for v != u from p)down[u] = prob of going up*(down[par[u]]+1) + prob of going to v * (up[v] + 1) + prob of going to u


void get_up(int u, int p){
	ll go_down = 0, prob = 0;
	for(auto [v, w] : adj[u]){
		if(v == p) continue;
		get_up(v, u);
		ll pr = 1ll*w*inv[u]%mod;
		go_down += pr*(up[v] + 1)%mod;
		prob += pr;
	}
	go_down %= mod;
	prob %= mod;
	if(p != 0){
		ll escape = weight[u]*inv[u]%mod;
		up[u] = (go_down + escape)*binpow(1 + mod - prob)%mod;
	}
}

void get_down(int u, int p){
	//find it for all the children
	ll go_down = 0;
	ll go_up = (p == 0 ? 0 : (weight[u]*inv[u])%mod*(down[u] + 1)%mod);
	ll prob = (p == 0 ? 0 : (weight[u]*inv[u]%mod));
	for(auto [v, w] : adj[u]){
		if(v == p) continue;
		ll pr = 1ll*w*inv[u]%mod;
		go_down += pr*(up[v]+1)%mod;
		prob += pr;
	}
	go_down %= mod;
	prob %= mod;
	for(auto [v, w] : adj[u]){
		if(v == p) continue;
		ll pr = 1ll*w*inv[u]%mod;
		go_down += mod - pr*(up[v]+1)%mod; 
		prob += mod - pr;
		prob %= mod;
		go_down %= mod;
		down[v] = (go_up + go_down + pr)*binpow(1 + mod - prob)%mod;
		prob += pr;
		go_down += pr*(up[v]+1)%mod;
		prob %= mod;
		go_down %= mod;
		get_down(v, u);
	}
}

void get_psum(int u, int p){
	for(auto [v, w] : adj[u]){
		if(p == v) continue;
		pup[v] = (pup[u] + up[v])%mod;
		pdown[v] = (pdown[u] + down[v])%mod;
		get_psum(v, u);
	}
}	


ll answer(int s, int t){
	int l = tr.lca(s, t);
	ll u = pup[s] + mod - pup[l];
	ll d = pdown[t] + mod - pdown[l];
	return (u + d)%mod;
}

void cl(){
	for(int i = 1; i<=n; i++){
		adj[i].clear();
		par[i] = weight[i] = inv[i] = dep[i] = 0;
		up[i] = down[i] = pup[i] = pdown[i] = 0;
	}
}

void solve(){
	n = in, q = in;
	vector<pair<int, int>> edges;
	for(int i = 2; i<=n; i++){
		int u = in, v = in;
		int a = in, b = in;
		adj[u].pb({v, a});
		adj[v].pb({u, b});
		edges.push_back({u, v});
	}
	tr = hld(edges);
	dfs(1, 0);
	get_up(1, 0);
	get_down(1, 0);
	get_psum(1, 0);

	for(int i = 1; i<=q; i++){
		int s = in, t = in;
		cout << answer(s, t) << "\n";
	}
	cl();
}

signed main(){
  cin.tie(0) -> sync_with_stdio(0);

  int T = 1;
	cin >> T;
  for(int i = 1; i<=T; i++){
		solve();
	}
  return 0;
}

Advanced I: Fire Fighters

Hint 1

Hint 2

Hint 3

Solution

Solution Code

#include <bits/stdc++.h>
using namespace std;
 
const int N = 69e4 + 4, inf = INT_MAX;
 
int t, n, q, a[N], nxt[N], dp[N], pre[N];
pair<int, int> sufMx[N];
stack<int> st;
 
int solve(int idx, int x, int r) {
    if (x > sufMx[r].first) return idx;
    else if (x == sufMx[r].first) return dp[sufMx[r].second+1];
    else return dp[r];
}
 
signed main() {
  ios::sync_with_stdio(false); cin.tie(nullptr);
 
  cin >> t;
  while (t--) {
    cin >> n >> q;
    for (int i = 0; i < n; i++) {
      cin >> a[i];
    }
 
    st = stack<int>();
    for (int i = n-1; i >= 0; i--) {
      while (!st.empty() && a[st.top()] < a[i]) st.pop();
      
      int x = (st.empty() ? n : st.top());
 
      if (st.empty()) {
        dp[i] = i;
        nxt[i] = n;
      }
      else if (a[x] == a[i]) {
        dp[i] = (x+1 < n ? dp[x+1] : n);
        nxt[i] = x+1;
      }
      else {
        dp[i] = dp[x];
        nxt[i] = x;
      }
 
      st.push(i);
    }
    nxt[n] = dp[n] = pre[n] = n;
 
    int x = 0;
    for (int i = 0; i < n; i++) {
        if (nxt[x] == i) x = nxt[x];
        pre[i] = x;
    }
    
    sufMx[n] = make_pair(-inf, n);
    for (int i = n-1; i >= 0; i--) {
        if (a[i] > sufMx[i+1].first) sufMx[i] = make_pair(a[i], i);
        else sufMx[i] = sufMx[i+1];
    }
    
    while (q--) {
        int l, r, x;
        cin >> l >> r >> x;
        l--; r--;
        
        int y = (l ? pre[l-1] : -1);
        
        if (y == -1 || a[y] < x) {
            if (!((r-l+1) & 1)) cout << dp[r+1]+1 << "\n";
            else {
                cout << solve(r, x, r+1)+1 << "\n";
            }
        }
        else if (a[y] == x) {
            if (!((r-l+2) & 1)) cout << dp[r+1]+1 << "\n";
            else {
                cout << solve(r, x, r+1)+1 << "\n";
            }
        }
        else { // a[y] > x
            cout << solve(y, a[y], r+1)+1 << "\n";
        }
    }
  }
}

Advanced J: Arknights Chips

Hint 1

Hint 2

Hint 3

Solution

For simplicity, let's have $$$i$$$ enumerate the number of caster chips instead of the sniper chips.

$$$E = \sum_{i = 0}^{n} {{n}\choose{i}}p^{n - i} q^{i} ((n - i) + y \cdot \lfloor {\frac{i}{x}} \rfloor)$$$

Then using the definition of floor, we can rewrite this as

$$$E = \sum_{i = 0}^{n} {{n}\choose{i}}p^{n - i} q^{i} ((n - i) + y \cdot (\frac{i}{x} - \frac{i \text{ mod } x}{x})$$$

$$$\sum_{i = 0}^{n} {n \choose i}p^{i}q^{n - i} i = pn$$$ (this can be interpreted as "If you have a coin that flips heads with probability $$$p$$$ and tails with probability $$$1 - p$$$, what is the expected number of heads you obtain after $$$n$$$ flips?")

$$$E = np + {\frac{y}{x}}nq -y \sum_{i = 0}^{n} {{n}\choose{i}}p^{n - i} q^{i} (\frac{i \text{ mod } x}{x})$$$

So now the question boils down to finding the expected value of $$$ \text{# caster chips mod } x$$$.

Let $$$f_m(n)$$$ denote the probability that after $$$n$$$ clears, the number of caster chips is $$$m \text{ mod } x$$$. We can observe that $$$f_0(0) = 1$$$ and $$$f_m(n) = p f_{m}(n-1) + q f_{(m + x - 1) \text { mod }}^(n-1)$$$. With probability $$$p$$$, we can get a sniper chip from a state where $$$\text{# caster chips} \equiv m \pmod{x}$$$ and with probability $$$q$$$, we can get a caster chip from a state where $$$\text{# caster chips} \equiv m - 1 \pmod{x}$$$. Additionally, with $$$0$$$ stage clears, there is a probability of $$$1$$$ that the number of caster chips is $$$0 \text {mod } x$$$ (as it is $$$0$$$).

This motivates matrix exponentiation as the method to compute $$$f_m(n)$$$, as the sum we desire is $$$\sum_{i = 0}^{x-1} if_{i}(n)$$$. We can make a matrix $$$A$$$ where on row $$$i$$$, $$$A_{i}{i} = p$$$ and $$$a_{i}{(i + 1) \text{ mod } x} = q$$$ and all other cells are $$$0$$$. By raising this to the power of $$$n$$$, we can find $$$f_m(n)$$$ as $$$A_{0}{m}$$$.

The final sum is

$$$E = np + {\frac{y}{x}}nq -y \sum_{i = 0}^{x-1} if_{i}(n)$$$

The total complexity is $$$O(x^3 \log n)$$$ with binary exponentiation for the matrix.

Solution Code

 
#include <iostream>
#include <cmath>
#include <utility>
#include <cassert>
#include <algorithm>
#include <vector>
#include <array>


#define sz(x) ((int)(x.size()))
#define all(x) x.begin(), x.end()
#define pb push_back

using ll = long long;
const ll mod = (1 << (23)) * 119 +1; 

using namespace std;


ll binpow(ll a, ll b = mod-2){
	a %= mod;
	ll ans = 1;
	for(ll i = 1; i<=b; i*=2ll){
		if(i&b){
			(ans *= a) %= mod;
		}
		(a *= a) %= mod;
	}
	return ans;
}


#define matrix vector<vector<ll>>

matrix mult(matrix& a, matrix& b){
	matrix c = a;
	for(auto& x : c){
		fill(all(x), 0);
	}
	for(int i = 0; i<sz(a); i++){
		for(int j = 0; j<sz(a); j++){
			if(a[i][j] == 0) continue;
			for(int k = 0; k<sz(a); k++){
				c[i][k] += a[i][j]*b[j][k]%mod;
			}
		}
	}
	for(int i = 0; i<sz(c); i++){
		for(int j = 0; j<sz(c); j++){
			c[i][j] %= mod;
		}
	}
	return c;
}

matrix binpow(matrix a, ll b){
	matrix ans = a;
	for(int i = 0; i<sz(ans); i++){
		fill(all(ans[i]), 0);
		ans[i][i] = 1;
	}
	for(ll i = 1; i<=b; i*=2){
		if(i&b){
			ans = mult(ans, a);
		}
		a = mult(a, a);
	}
	return ans;
}

void solve(){
	int a;
	ll x, y, n;
	cin >> a >> x >> y >> n;
	ll inv = binpow(x);
	ll p = a*binpow(100)%mod;
	ll q = 1 + mod - p;
	ll ans = p*(n%mod)%mod + inv*y%mod*q%mod*(n%mod);
	ans %= mod;
	matrix base(x, vector<ll>(x, 0));
	for(int i = 0; i<x; i++){
		base[i][i] = p;
		base[i][(i + 1)%x] = q;
	}
	auto mat = binpow(base, n);
	for(int i = 0; i<x; i++){
		ans += (mod - inv)*y%mod*i%mod*mat[0][i]%mod;
		ans %= mod;
	}
	cout << ans << "\n";
}

signed main(){
  cin.tie(0) -> sync_with_stdio(0);

    int T = 1;
    cin >> T;
    for(int i = 1; i<=T; i++){
		solve();
	}
    return 0;
}

Bonus 1

Bonus 2

Advanced K: ANDtreew

Hint 1

Hint 2

Hint 3

Hint 4

Solution

The hints briefly sum up the solution of the problem step by step, but we will provide a more detailed explanation now.

For the minimum value of a tree to change, so that the value of the whole forest can increment, it is needed that the minimum node is removed. With this in mind, we can build another tree recursively in the following way (we will call it $$$G$$$ for clarity):

Given a tree, if the tree consists of a single node, we stop there.
If there it consists of at least $$$2$$$ nodes, we take the node with the minimum value and and remove it from the tree, decomposing it into several other trees. We take the minimum nodes of those trees and add them as children in $$$G$$$ to the node we removed from the original tree. Then, do the same for the decomposed trees.

$$$G$$$ is also known as the Kruskal Reconstruction Tree, so we will refer to it as Kruskal Tree from now on.

Once we've build the Kruskal tree, we will iterate for each query over the bits of the answer from most significant bit to less significant bit, and try to add those to the AND as we progress. For a specific desired value of AND $$$mask$$$, we will define each node $$$v$$$ as good if and only if $$$mask$$$ is a submask of its value (i.e. $$$v \ AND \ mask = mask$$$) or it can be removed (i.e. there's some $$$i$$$ such that $$$x_i = v$$$) and all of its children are good. If we manage to quickly compute if the root of the Kruskal Tree is good, we can know whether it is possible to have $$$mask$$$ as a submask of the answer or not.

There are multiple ways to do this in $$$O(k)$$$, resuling in a total complexity of $$$O(k \log n)$$$ per query. I will present two.

The first one, which was the original intended solution proposed by the author, is to build an AND sparse table for each adjacency list. Therefore, for each value of $$$mask$$$, one can do a DFS and, for each node, check if it is good. Firstly, we check if it has $$$mask$$$ as a submask, because if it does it is already good. If it doesn't, we will proceed with the DFS with the children that are in the query, and check if those are good, if any of those is not good, then the node will already not be good. Additionally, to check that the children which are not in the query (and therefore cannot be removed) have $$$mask$$$ as a submask, we will query for each interval between the indices of the children in the query the AND of those children, to get the AND of all the children that are not in the query. All that is left to check is that $$$mask$$$ is a submask of the AND the children for the node to be good.

The second way to check if a node is good fast is to precalculate for each node the count of the ocurrences of each bit in its children. Then, in a query, you can precalculate before checking if any $$$mask$$$ is good a "bad mask", which will contain all of the bits that $$$mask$$$ cannot have for that node to be good. In other words, we will store for which bits there exists a children of the node which cannot be removed and does not have that bit on. To do so, we go over every node in the query and, for each node, we iteare over all the bits. For each bit, we will iterate over all the children that are in the query and, if they do not have that bit on add it to the count of children with the bit on (because, as we only want to know if the children which can't be removed have the bit on, this does not affect us and makes the implementation easier). Therefore, each bit will not be bad if and only if its count is equal to the number of children (both in and not in the query) of the node, because all the children that are in the query will have added to the count, therefore if it is not equal to the number of children one child which is not in the query must not have it.

Solution Code 1

#include <bits/stdc++.h>

using namespace std;

const int LOG = 20;

struct DSU{
	vector<int> v, mn;
	void init(int n){
		v.assign(n, -1);
		mn.resize(n);
		for(int i = 0; i < n; i++) mn[i] = i;
	}
	int get(int x){return v[x] < 0 ? x : v[x] = get(v[x]);}
	void unite(int x, int y){
		x = get(x); y = get(y);
		if(x == y) return;
		if(v[x] > v[y]) swap(x, y);
		v[x] += v[y]; v[y] = x;
		mn[x] = min(mn[x], mn[y]);
	}
	int getMn(int i){
		return mn[get(i)];
	}
};

void buildSparse(vector<int>& v, vector<vector<int>>& sparse){
	int n = (int)v.size();
	sparse.assign(LOG, vector<int>(n));
	for(int k = 0; k < LOG; k++){
		for(int i = 0; i < n; i++){
			if(k == 0) sparse[k][i] = v[i]+1;
			else{
				if(i - (1 << (k-1)) < 0) sparse[k][i] = sparse[k-1][i];
				else sparse[k][i] = (sparse[k-1][i] & sparse[k-1][i - (1 << (k-1))]);
			}
		}
	}
}

int getAnd(int l, int r, vector<vector<int>>& sparse){
	if(l > r) return (1 << LOG) - 1;
	int k = 31 - __builtin_clz(r-l+1);
	return (sparse[k][r] & sparse[k][l + (1 << k) - 1]);
}

int taken;

bool DFS(int x, vector<vector<int>>& adj, vector<vector<int>>& specialAdj, vector<vector<vector<int>>>& sparses, int curr){
	if(((x+1) & curr) == curr) {taken++; return true;}
	//It needs to be removed;
	int lst = -1;
	int ans = (1 << LOG) - 1;
	for(int ind : specialAdj[x]){
		if(!DFS(adj[x][ind], adj, specialAdj, sparses, curr)) return false;
		ans &= getAnd(lst + 1, ind-1, sparses[x]);
		lst = ind;
	}
	ans &= getAnd(lst + 1, (int)adj[x].size() - 1, sparses[x]);
	if((ans & curr) == curr) return true;
	else return false;
}

void undo(vector<int>& x, vector<int>& parent, vector<vector<int>>& specialAdj){
	for(int i : x){
		if(parent[i] != -1) specialAdj[parent[i]].pop_back();
	}
}

int main(){
	ios_base::sync_with_stdio(0);
	cin.tie(0);

	int tt; cin >> tt;
	while(tt--){
		int n, q; cin >> n >> q;
		vector<vector<int>> originalAdj(n);
		for(int i = 0; i < n - 1; i++){
			int u, v; cin >> u >> v; u--; v--;
			originalAdj[u].push_back(v);
			originalAdj[v].push_back(u);
		}
		vector<vector<int>> adj(n);
		vector<int> ind(n, -1), parent(n, -1);
		DSU UF; UF.init(n);
		for(int i = n - 1; i >= 0; i--){
			for(int node : originalAdj[i]){
				if(node < i) continue;
				adj[i].push_back(UF.getMn(node));
				UF.unite(i, node);
			}
			sort(adj[i].begin(), adj[i].end());
			for(int j = 0; j < (int)adj[i].size(); j++){
				ind[adj[i][j]] = j;
				parent[adj[i][j]] = i;
			}
		}
		vector<vector<vector<int>>> sparses(n);
		for(int i = 0; i < n; i++){
			buildSparse(adj[i], sparses[i]);
		}
		vector<vector<int>> specialAdj(n);
		while(q--){
			int k; cin >> k;
			vector<int> x(k);
			bool zero = false;
			for(int i = 0; i < k; i++){
				cin >> x[i]; x[i]--;
				if(!x[i]) zero = true;
				if(parent[x[i]] != -1){
					specialAdj[parent[x[i]]].push_back(ind[x[i]]);
				}
			}
			if(!zero){
				cout << 1 << "\n";
				undo(x, parent, specialAdj);
				continue;
			}
			int ans = 0;
			int curr = 0;
			for(int b = LOG - 1; b >= 0; b--){
				curr += (1 << b);
				taken = 0;
				if(DFS(0, adj, specialAdj, sparses, curr) && (taken > 0 || k != n)) ans = curr;
				else curr -= (1 << b);
			}
			cout << ans << "\n";
			undo(x, parent, specialAdj);
		}
	}
}

Solution Code 2

#include <bits/stdc++.h>

using namespace std;

const int LOG = 20;

struct DSU{
	vector<int> v, mn;
	void init(int n){
		v.assign(n, -1);
		mn.resize(n);
		for(int i = 0; i < n; i++) mn[i] = i;
	}
	int get(int x){return v[x] < 0 ? x : v[x] = get(v[x]);}
	void unite(int x, int y){
		x = get(x); y = get(y);
		if(x == y) return;
		if(v[x] > v[y]) swap(x, y);
		v[x] += v[y]; v[y] = x;
		mn[x] = min(mn[x], mn[y]);
	}
	int getMn(int i){
		return mn[get(i)];
	}
};

int taken;

bool DFS(int x, vector<vector<int>>& specialAdj, vector<int>& badMask, int curr){
	if(((x+1) & curr) == curr) {taken++; return true;}
	if(badMask[x] & curr) return false;
	//It needs to be removed;
	for(int node : specialAdj[x]){
		if(!DFS(node, specialAdj, badMask, curr)) return false;
	}
	return true;
}

void setBad(int x, vector<vector<int>>& adj, vector<vector<int>>& specialAdj, vector<vector<int>>& cnt, vector<int>& badMask){
	for(int k = 0; k < LOG; k++){
		int hvTotal = cnt[k][x];
		for(int node : specialAdj[x]){
			if(!((1 << k) & (node+1))) hvTotal++;
		}
		if(hvTotal != (int)adj[x].size()) badMask[x] += (1 << k);
	}
	for(int node : specialAdj[x]){
		setBad(node, adj, specialAdj, cnt, badMask);
	}
}

void undo(vector<int>& x, vector<int>& parent, vector<vector<int>>& specialAdj, vector<int>& badMask){
	for(int i : x){
		badMask[i] = 0;
		if(parent[i] != -1) specialAdj[parent[i]].pop_back();
	}
}

int main(){
	ios_base::sync_with_stdio(0);
	cin.tie(0);

	int tt; cin >> tt;
	while(tt--){
		int n, q; cin >> n >> q;
		vector<vector<int>> originalAdj(n);
		for(int i = 0; i < n - 1; i++){
			int u, v; cin >> u >> v; u--; v--;
			originalAdj[u].push_back(v);
			originalAdj[v].push_back(u);
		}
		vector<vector<int>> adj(n);
		vector<int> parent(n, -1);
		DSU UF; UF.init(n);
		for(int i = n - 1; i >= 0; i--){
			for(int node : originalAdj[i]){
				if(node < i) continue;
				adj[i].push_back(UF.getMn(node));
				UF.unite(i, node);
			}
			sort(adj[i].begin(), adj[i].end());
			for(int j = 0; j < (int)adj[i].size(); j++){
				parent[adj[i][j]] = i;
			}
		}
		vector<vector<int>> cnt(LOG, vector<int>(n, 0));
		for(int k = 0; k < LOG; k++){
			for(int i = 0; i < n; i++){
				for(int node : adj[i]){
					if((1 << k) & (node+1)) cnt[k][i]++;
				}
			}
		}
		vector<vector<int>> specialAdj(n);
		vector<int> badMask(n, 0);
		while(q--){
			int k; cin >> k;
			vector<int> x(k);
			bool zero = false;
			for(int i = 0; i < k; i++){
				cin >> x[i]; x[i]--;
				if(!x[i]) zero = true;
				if(parent[x[i]] != -1){
					specialAdj[parent[x[i]]].push_back(x[i]);
				}
			}
			if(!zero){
				cout << 1 << "\n";
				undo(x, parent, specialAdj, badMask);
				continue;
			}
			setBad(0, adj, specialAdj, cnt, badMask);
			int ans = 0;
			int curr = 0;
			for(int b = LOG - 1; b >= 0; b--){
				curr += (1 << b);
				taken = 0;
				if(DFS(0, specialAdj, badMask, curr) && (taken > 0 || k != n)) ans = curr;
				else curr -= (1 << b);
			}
			cout << ans << "\n";
			undo(x, parent, specialAdj, badMask);
		}
	}
}

Advanced L: Everyone Loves Threes Magic (Hard)

Hint 1

Hint 2

Solution

We can reduce the problem to finding $$$\sum_{i = 1}^{x-1} f(i)$$$, $$$\sum_{i = 1}^{x-1} if(i)$$$, and $$$\sum_{i = 1}^{x-1} i^2f(i)$$$ for a very large $$$x$$$.

Let $$$d(x)$$$ denote the sum of digits in the base-$$$10$$$ representation $$$\text{ mod } 3$$$. For instance $$$d(1) = 1, d(55) = 1, d(3366) = 0$$$.

Let $$$val(i, j) = \sum\limits_{d(x) = j, \log_{10}(x) < i} x^0$$$.

Let $$$lin(i, j) = \sum\limits_{d(x) = j, \log_{10}(x) < i} x^1$$$.

Let $$$squ(i, j) = \sum\limits_{d(x) = j, \log_{10}(x) < i} x^2$$$.

Let $$$sum(i, j) = \sum\limits_{d(x) = j, \log_{10}(x) < i} x^0f(x)$$$.

Let $$$slin(i, j) = \sum\limits_{d(x) = j, \log_{10}(x) < i} x^1f(x)$$$.

Let $$$ssqu(i, j) = \sum\limits_{d(x) = j, \log_{10}(x) < i} x^2f(x)$$$.

I would give math formulas for all of these, but its easier to just attach code.

Transitions

void precomp(int n){
	ll p = 1;
	for(int i = 0; i<=n; i++){
		ip10[i] = p;
		(p *= 10ll) %= mod;
	}
	p = 1;
	val[0][0] = 1;
	for(int i = 0; i<=n; i++){
		for(int j = 0; j<3; j++){
			for(int k = 0; k<10; k++){
				ll d = p*k%mod;
				if(k == 3){
					//(cnt(i) + 1)
					//1
					(sum[i+1][(j+k)%3] += val[i][j]) %= mod;
					//(i + d)(cnt(i) + 1)
					//i
					//d
					(slin[i+1][(j+k)%3] += val[i][j]*d%mod + lin[i][j]) %= mod;
					//(i + d)(i + d)(cnt(i) + 1)
					//i^2
					//id
					//di
					//d^2
					(ssqu[i+1][(j+k)%3] += val[i][j]*d%mod*d%mod + 2ll*lin[i][j]*d%mod + squ[i][j]) %= mod;
				}
				//(cnt(i))
				//cnt(i)
				(sum[i+1][(j+k)%3] += sum[i][j]) %= mod;
				//(i + d)(cnt(i))
				//icnt(i)
				//dcnt(i)
				(slin[i+1][(j+k)%3] += sum[i][j]*d%mod + slin[i][j]) %= mod;
				//(i + d)(i + d)(cnt(i))
				//i^2 cnt[i]
				//idcnt(i)
				//dicnt(i)
				//d^2cnt(i)
				(ssqu[i+1][(j+k)%3] += sum[i][j]*d%mod*d%mod + 2ll*slin[i][j]*d%mod + ssqu[i][j]) %= mod;
				(val[i+1][(j+k)%3] += val[i][j]) %= mod;
				(lin[i+1][(j+k)%3] += val[i][j]*d%mod + lin[i][j]) %= mod;
				(squ[i+1][(j+k)%3] += val[i][j]*d%mod*d%mod + 2ll*lin[i][j]*d%mod + squ[i][j]) %= mod;
			}
		}
		(p *= 10) %= mod;
	}
}

Let's fix some numbers $$$y$$$ and $$$k$$$ such that $$$y + 10^k \leq x$$$. We can easily obtain the sum of $$$f(i)$$$, $$$if(i)$$$, and $$$i^2f(i)$$$ for this range $$$[y, y+10^k)$$$ with the precomputed six precomputed functions above as we have no restrictions on the digits; The sum of $$$f(i)$$$, $$$if(i)$$$, and $$$i^2f(i)$$$ within this range depends solely on $$$y$$$, $$$d(y)$$$, $$$k$$$, and the precomputed functions above.

Let $$$n$$$ denote the number of digits in $$$x$$$.

To use this fact efficiently, let's enumerate the number of digits $$$y$$$ has in common with $$$x$$$. If at the $$$k$$$'th digit from the left, the digit in $$$y$$$ is strictly less than the digit $$$x$$$ (it cannot be strictly more, and if they are the same, $$$k$$$ will increase). We can set the last $$$n - k$$$ of $$$y$$$ to be $$$0$$$ and evaluate the sum for $$$[y, y + 10^{n - k})$$$.

This way, every number $$$ < x$$$ will be accounted for.

This takes $$$O(\log_{10}(R))$$$ precompute and $$$O(\log_{10}(R))$$$ per testcase. Read the code for more impl details. Note that a traditional digit dp where you store a flag of whether or not the current digit is strictly less than $$$x$$$ or not also works, but it runs slower.

Solution Code

//misaka, hitori, and elaina will carry me to red

#pragma GCC optimize("O3,unroll-loops")
#pragma GCC target("avx2,bmi,bmi2,lzcnt,popcnt")

#include <iostream>
#include <cmath>
#include <utility>
#include <cassert>
#include <algorithm>
#include <vector>
#include <array>
#include <cstdio>
#include <cstring>
#include <functional>
#include <numeric>
#include <set>
#include <queue>
#include <map>
#include <chrono>
#include <random>

#define sz(x) ((int)(x.size()))
#define all(x) x.begin(), x.end()
#define pb push_back
#define eb emplace_back
#define kill(x, s) {if(x){ cout << s << "\n"; return ; }}

//#ifndef LOCAL
#define cerr while(0) cerr
//#endif

using ll = long long;
using lb = long double;

const lb eps = 1e-9;
//const ll mod = 1e9 + 7, ll_max = 1e18;
const ll mod = (1 << (23)) * 119 +1, ll_max = 1e18;
const int MX = 2e5 +10, int_max = 0x3f3f3f3f;

struct {
  template<class T>
  operator T() {
    T x; std::cin >> x; return x;
  }
} in;

using namespace std;


//(r - i+1)(i - l+1)sum[i]
//(r+1)(-l+1)sum[i] + (-(-l+1) + r+1)*i*sum[i] + -i^2*sum[i]

ll val[MX][3]; //the number of ways to pick i digits such that they sum to j mod 3
ll sum[MX][3]; //the number of 3's across all those ways
ll lin[MX][3]; //sum of dig for all x that satisfy (i, j)
ll squ[MX][3]; //sum of dig*dig for all x that satisify (i, j)
ll slin[MX][3]; //sum of sum*dig for all x
ll ssqu[MX][3]; //sum of sum*dig*dig for all x

ll ip10[MX]; //ipman orz!


void precomp(int n){
	ll p = 1;
	for(int i = 0; i<=n; i++){
		ip10[i] = p;
		(p *= 10ll) %= mod;
	}
	p = 1;
	val[0][0] = 1;
	for(int i = 0; i<=n; i++){
		for(int j = 0; j<3; j++){
			for(int k = 0; k<10; k++){
				ll d = p*k%mod;
				if(k == 3){
					//(cnt(i) + 1)
					//1
					(sum[i+1][(j+k)%3] += val[i][j]) %= mod;
					//(i + d)(cnt(i) + 1)
					//i
					//d
					(slin[i+1][(j+k)%3] += val[i][j]*d%mod + lin[i][j]) %= mod;
					//(i + d)(i + d)(cnt(i) + 1)
					//i^2
					//id
					//di
					//d^2
					(ssqu[i+1][(j+k)%3] += val[i][j]*d%mod*d%mod + 2ll*lin[i][j]*d%mod + squ[i][j]) %= mod;
				}
				//(cnt(i))
				//cnt(i)
				(sum[i+1][(j+k)%3] += sum[i][j]) %= mod;
				//(i + d)(cnt(i))
				//icnt(i)
				//dcnt(i)
				(slin[i+1][(j+k)%3] += sum[i][j]*d%mod + slin[i][j]) %= mod;
				//(i + d)(i + d)(cnt(i))
				//i^2 cnt[i]
				//idcnt(i)
				//dicnt(i)
				//d^2cnt(i)
				(ssqu[i+1][(j+k)%3] += sum[i][j]*d%mod*d%mod + 2ll*slin[i][j]*d%mod + ssqu[i][j]) %= mod;
				(val[i+1][(j+k)%3] += val[i][j]) %= mod;
				(lin[i+1][(j+k)%3] += val[i][j]*d%mod + lin[i][j]) %= mod;
				(squ[i+1][(j+k)%3] += val[i][j]*d%mod*d%mod + 2ll*lin[i][j]*d%mod + squ[i][j]) %= mod;
			}
		}
		(p *= 10) %= mod;
	}
}

#define info array<ll, 3>
//sum, slin, ssqu

info operator + (info a, info b){
	return info{(a[0]+b[0])%mod, (a[1]+b[1])%mod, (a[2]+b[2])%mod};
}

info comb(int c, ll d, info a, info b){
	//a is sum/slin/ssqu 
	//b is val/lin/squ
	info r = {0ll, 0ll, 0ll};
	r[0] = (a[0]+c*b[0]%mod)%mod;
	r[1] = (a[1] + 1ll*c*b[1] + 1ll*d*a[0]%mod + 1ll*b[0]*d%mod*c%mod)%mod;
	r[2] = (1ll*c*(b[2] + 2ll*d*b[1]%mod + d*d%mod*b[0]%mod)%mod + a[2] + 2ll*d*a[1]%mod + d*d%mod*a[0]%mod)%mod;
	return r;
}

void pr(info& a){
	for(auto x : a) cerr << x << " "; cerr << "\n";
}

info eval(string s){
	ll d = 0;
	int c = 0;
	int m3 = 0;
	info ret = {0ll, 0ll, 0ll};
	cerr << "eval " << s << "\n";
	for(int i = sz(s); i>=1; i--){
		cerr << d << " " << c << " " << m3 << "\n";
		for(int j = 0; j<s[sz(s)-i]-'0'; j++){
			int nc = c + (j == 3);
			ll nd = d + 1ll*j*ip10[i-1]%mod;
			int nm3 = (m3 + j)%3;
			cerr << i << " " << (char)(j + '0')  << "\n";
			info a = {sum[i-1][(3 - nm3)%3], slin[i-1][(3 - nm3)%3], ssqu[i-1][(3 - nm3)%3]};
			info b = {val[i-1][(3 - nm3)%3], lin[i-1][(3 - nm3)%3], squ[i-1][(3 - nm3)%3]};
			pr(a); pr(b);
			auto tmp = comb(nc, nd, a, b);
			pr(tmp);
			ret = ret + tmp;
		}
		if(s[sz(s)-i] == '3') c++;
		(m3 += (s[sz(s)-i] - '0')) %= 3;
		(d += 1ll*(s[sz(s)-i] - '0')*ip10[i-1]) %= mod;
		cerr << "\n";
	}
	return ret;
}

ll conv(string s){
	ll ans = 0;
	for(int i = sz(s)-1; i>=0; i--){
		cerr << s[sz(s) - i-1] << " " << i << "\n";
		ans += 1ll*(s[sz(s) - i-1]-'0')*ip10[i]%mod;
	} cerr << "\n";
	return ans%mod;
}



string add(string l){
	for(int i = sz(l)-1; i>=0; i--){
		if(l[i] == '9'){
			l[i] = '0';
		}else{
			l[i]++;
			break ;
		}
	}
	if(l == string(l.size(), '0')){
		l.pb('1');
		reverse(all(l));
	}
	return l;
}

ll binpow(ll a, ll b = mod - 2){
	ll ans = 1;
	for(ll i = 1; i<=b; i*=2ll){
		if(i&b) (ans *= a) %= mod;
		(a *= a) %= mod;
	}
	return ans;
}

void solve(){
	string l = (string) in;
	string r = (string) in;
	auto sl = eval(l);
	auto sr = eval(add(r));
	ll L = conv(l), R = conv(r);
	//(r+1)(-l+1)sum[i] + (-(-l+1) + r+1)*i*sum[i] + -i^2*sum[i]
	pr(sl);
	pr(sr);
	ll ans = 1ll*(R + 1)*(mod-L+1)%mod*(sr[0] + mod - sl[0])%mod + \
					 1ll*(L + mod - 1 + R + 1)*(sr[1] + mod - sl[1])%mod + \
					 1ll*(mod - 1)*(sr[2] + mod - sl[2])%mod;
	ans %= mod;
	ll len = (R + mod - L + 1)%mod;
	cerr << ans << "\n";
	cerr << L << " " << R << " " << len << "\n";
	cout << ans%mod << "\n";
}

signed main(){
  cin.tie(0) -> sync_with_stdio(0);
	precomp(100010);
  int T = 1;
  cin >> T;
  for(int i = 1; i<=T; i++){
		//cout << "Case #" << i << ": ";
		solve();
	}
  return 0;
}

Full text and comments »

Tutorial of Teamscode Spring 2024 (Novice Division)

Announcement of Teamscode Spring 2024 (Advanced Division)

willy108
2 weeks ago
1

Teamscode Spring 2023 Editorial

By willy108, history, 13 months ago, In English

This is the editorial for a recent contest Teamscode. The problems are open for upsolving on this gym. Problems were prepared by oursaco, dutin, thehunterjames, Bossologist, Esomer, and me.

A. What do you do when the contest starts? Are you busy? Will you solve Bingo?

Editorial

Code

B. Mountain Climbing Easy

Solution

Code

#include <iostream>
#include <fstream>
using namespace std;

int main() {
	int N;
	cin >> N;

	int cnt = 0;
	int prev = -1;
	int ans = 0;
	for (int i = 0; i < N; i++)
	{
		int a;
		cin >> a;

		if (a > prev && i) cnt++;
		else if (a <= prev) cnt = 0;
		if (cnt == 2) ans++;
		prev = a;
	}

	cout << ans << "\n";
	return 0;
}

C. No Sweep

Solution

Code

n,k=input().split()
print((int(k) + 1) ** int(n) - 1)

D. Multiplication Table

Solution

Code

#include <cstdio>

int isp(int x){
    for(int i = 2; i*i <= x; i++){
        if(x%i == 0) return 0;
    }
    return 1;
}

int main(){
    int n;
    scanf("%d", &n);
    do{
        n++;  
    }while(isp(n) == 0);
    printf("%d\n", n);
    return 0;
}

E. Cyclic Shifts

Hint

Solution

Code

#include <bits/stdc++.h>
 
long long calculate_cost(int n, const std::vector<long long> &a, const std::vector<long long> &b) {
	long long ret = 0;
	for (int i = 0; i < n; i++)
		ret += llabs(a[i] - b[i]);
	return ret;
}
 
template<typename I>
void rotate_left(I l, I r) { std::rotate(l, std::next(l), r); }
 
int main() {
	using namespace std;
 
	int TC;
	cin >> TC;
	while (TC--) {
		int N, K;
		cin >> N >> K;
		vector<long long> A(N), B(N);
		for (auto &a : A)
			cin >> a;
		for (auto &b : B)
			cin >> b;
		long long ans = calculate_cost(N, A, B);
		rotate_left(A.begin(), A.begin() + K);
		long long cur = calculate_cost(N, A, B);
		ans = min(ans, cur + 1);
		for (int i = 1; i + K - 1 < N; i++) {
			cur -= llabs(A[i - 1] - B[i - 1]) + 
				llabs(A[i + K - 2] - B[i + K - 2]) + 
				llabs(A[i + K - 1] - B[i + K - 1]);
			auto tem = A[i - 1];
			A[i - 1] = A[i + K - 2];
			A[i + K - 2] = A[i + K - 1];
			A[i + K - 1] = tem;
			cur += llabs(A[i - 1] - B[i - 1]) + 
				llabs(A[i + K - 2] - B[i + K - 2]) + 
				llabs(A[i + K - 1] - B[i + K - 1]); 
			ans = min(ans, cur + 1);
		}
		cout << ans << '\n';
	}
}

F. Great Common Multiple

Solution

Code

#include <iostream>
#include <cmath>
using ll = long long;
using namespace std;
ll gcd(ll a, ll b){
	if(b == 0) return a;
	return gcd(b, a%b);
}

int main(){
	cin.tie(0) -> sync_with_stdio(0);
	int T;
	cin >> T;
	while(T--){
		ll a, b, c;
		cin >> a >> b >> c;
		ll lcm = a*b/gcd(a, b);
		ll step = gcd(lcm, c);
		cout << c - step << "\n";
	}
}

G. Daggers

Hint 1

Hint 2

Solution

Code

#include <bits\stdc++.h>
 
using namespace std;
 
int main(){
	ios_base::sync_with_stdio(0);
	cin.tie(0);
	
	int n, q; cin >> n >> q;
	set<int> shields;
	for(int t = 1; t <= q; t++){
		int x; cin >> x;
		shields.insert(x);
		long long ans = 0;
		int curr = 0;
		bool done = 0;
		while(!done){
			if(n - curr <= t){
				cout << ans + n - curr << "\n";
				done = 1;
			}else{
				auto it = shields.upper_bound(curr + t);
				if(it == shields.begin() || *(--it) == curr){
					cout << -1 << "\n";
					done = 1;
				}else{
					curr = *it;
					ans += t;
				}
			}
		}
	}
}

H. A Certain Scientific Tree Problem

There are many solutions to this problem, some simpler than others, but I'll present the intended solution which involves the distance formula between two nodes.

Hint 1

Hint 2

Solution

Code

#include <iostream>

using ll = long long;

const ll mod = 1e9 + 7;
const int MX = 2e5 +10;

using namespace std;

int two[MX];

void solve(){
	int d; cin >> d;
	ll ans = 0;
	ll n = two[d] - 1;
	for(int i = 0; i<d; i++){
		ll ch = (i == d-1) ? 0 : 2;
		ll ch_sub = two[d-1 - i]-1;
		ll sub = ch*ch_sub + 1;
		ll cnt = two[i];
		ans += cnt*((n*i%mod + n*i%mod + (mod - 2)*i%mod*(sub + ch*ch_sub%mod*(sub - ch_sub)%mod))%mod)%mod;
		ans %= mod;
	}
	cout << ans << "\n";
}

signed main(){
    cin.tie(0) -> sync_with_stdio(0);
	two[0] = 1;
	for(int i = 1; i<=1e5; i++){
		two[i] = 2*two[i-1]%mod;
	}
    int T = 1;
	cin >> T;
    for(int i = 1; i<=T; i++){
		solve();
	}
    return 0;
}

I. Mountain Climbing Hard

Solution

Code

#include <iostream>
#include <vector>
#include <algorithm>
#include <cassert>
using namespace std;
#define MAXN 1000001
#define MAXQ 100001
vector<pair<int, int> > points;
vector<pair<pair<int, int>, int> > qs;
int N, Q, a[MAXN], BIT[MAXN], r[MAXN], l[MAXN], sols[MAXQ];

int getSum(int index)
{
    int sum = 0;
    index = index + 1;
    while (index > 0)
    {
        sum += BIT[index];
        index -= index & (-index);
    }
    return sum;
}

void updateBIT(int index)
{
    index = index + 1;

    while (index <= N)
    {
        BIT[index] += 1;
        index += index & (-index);
    }
}

int main()
{
    ios_base::sync_with_stdio(0);
    cin.tie(0);
    cin >> N >> Q;

    for (int i = 0; i < N; i++)
    {
        cin >> a[i];
        points.push_back({ a[i], i }); // used to iterate in increasing altitude
    }

    for (int i = 0; i < Q; i++)
    {
        int p, f;
        cin >> p >> f;
        qs.push_back({ {f, p - 1}, i }); //offline queries
    }

    for (int i = 0; i < N; i++) r[i] = N, l[i] = -1;
    vector<pair<int, int> > sr, sl;
    for (int i = 0; i < N; i++) {
        int alt = a[i];

        while (sr.size() && sr.back().first <= alt)
        {
            r[sr.back().second] = i;
            sr.pop_back();
        }
        sr.push_back(points[i]);

        int ind = N - i - 1;
        alt = a[ind];

        while (sl.size() && sl.back().first <= alt)
        {
            l[sl.back().second] = ind;
            sl.pop_back();
        }
        sl.push_back(points[ind]);
    }

    sort(qs.begin(), qs.end());
    sort(points.begin(), points.end());

    int ind = 0;
    for (int i = 0; i < Q; i++)
    {
        int fog = qs[i].first.first;
        while (ind < N && points[ind].first < fog) {
            updateBIT(points[ind].second);
            ind++;
        }

        //point index of query
        int qp = qs[i].first.second;

        //no fog
        int ans = r[qp] - l[qp] - 1;

        //amt can't see cuz fog
        int sub = getSum(r[qp] - 1) - getSum(l[qp]);

        if (a[qp] >= fog) ans -= sub;

        sols[qs[i].second] = ans;
    }

    for (int i = 0; i < Q; i++) cout << sols[i] << "\n";

    return 0;
}

J. Two and Three

Editorial

Many solutions for this problem invoke Sprague Grundy, but I will present a solution that does not.

Let us first solve the subtask for $$$n = 1$$$.

n = 1

So now to solve for an array of integers, we will have to generalize our approach quite a bit.

First off

Secondly

Lastly

Full solution

As a side note. This is actually the exact same resulting solution if you used Sprague Grundy (SG) to solve.

Relationship between this solution and Sprague Grundy

Code

#include <iostream>
#include <vector>
#include <array>
using namespace std;

int dig(int x){
	while(x >= 6){
		x /= 6;
	}
	return x;
}

void solve(){
	int n;
	cin >> n;
	array<int, 6> cnt; cnt.fill(0);
	for(int i = 0; i<n; i++){
		int x; cin >> x;
		cnt[dig(x)]++;
	}
	int x = (cnt[2] + cnt[3])%2;
	int y = (cnt[4] + cnt[5])%2;
	if((x%2)|(y%2)) cout << "Nino\n";
	else cout << "Miku\n";
}

signed main(){
    cin.tie(0) -> sync_with_stdio(0);
    int T = 1;
    cin >> T;
    for(int i = 1; i<=T; i++){
		solve();
	}
    return 0;
}

K. That Time I Got Reincarnated As A String Problem

Hint 1

Solution

We will ignore the expected value for now and compute the sum of unique strings over all ways to fill in question marks.

The Math

The Algorithm

Code

//hina best girl

#include <iostream>
#include <vector>
#include <cassert>
#include <array>
#include <string>

#define ll long long
#define sz(x) ((int)(x.size()))
const int mod = 1e9 + 7;
const int MX = 1e3 +10;
using namespace std;

ll fac[MX], ifac[MX];


ll binpow(ll a, ll b = mod - 2){
	ll ans = 1;
	for(int i = 1; i<=b; i*=2){
		if(i&b) (ans *= a) %= mod;
		(a *= a) %= mod;
	}
	return ans;
}

void precomp(int n){
	fac[0] = 1;
	for(int i = 1; i<=n; i++){
		fac[i] = 1ll*i*fac[i-1]%mod;
	}
	ifac[n] = binpow(fac[n]);
	for(int i = n; i>=1; i--){
		ifac[i-1] = 1ll*i*ifac[i]%mod;
	}
	assert(ifac[0] == 1);
}

vector<ll> mult(vector<ll> a, vector<ll> b){
	vector<ll> c(sz(a) + sz(b) - 1, 0ll);
	for(int i = 0; i<sz(a); i++){
		for(int j = 0; j<sz(b); j++){
			c[i + j] += a[i]*b[j]%mod;
		}
	}
	for(int i = 0; i<sz(c); i++) c[i] %= mod;
	return c;
}

void solve(){
	string s; cin >> s;
	int n = sz(s);
	array<int, 26> cnt = {0};
	int q = 0;
	for(char c : s){
		if(c != '?'){
			cnt[c - 'a']++;
		}else{
			q++;
		}
	}
	vector<ll> ans = {1};
	for(int i = 0; i<26; i++){
		vector<ll> cur;
		for(int j = 0; j<=cnt[i] + q; j++){
			if(j < cnt[i]) cur.push_back(0);
			else cur.push_back(ifac[j] * ifac[j - cnt[i]]%mod);
		}
		ans = mult(ans, cur);
		if(sz(ans) > n+1) ans.erase(ans.begin() + n + 1, ans.end());
	}
	assert(sz(ans) == n+1);
	ll oup = ans[n] * fac[n]%mod *fac[q]%mod;
	oup *= binpow(binpow(26, q));
	oup %= mod;
	cout << oup << "\n";
}

int main(){
	cin.tie(0) -> sync_with_stdio(0);
	precomp(1000);
	int T; cin >> T;
	for(int i = 0; i<T; i++){
		solve();
	}

	return 0;
}

L. Stuck on Bricks

Solution

Draw the line from $$$(0, 0)$$$ to $$$(x_1, y_1)$$$. Notice that any time that this line touches the boundary between two bricks our answer increases by one.

Let's count the number of times we jump from a brick to a brick that is above it. This happens $$$y_1-1$$$ times since we always move to a new brick whenever we cross some line $$$y = a$$$ for $$$1 \le a \le y_1-1$$$.

Now count the number of times we jump from a brick to a brick that is to the right. To do this, write the equation for our line. It is $$$y_1x - x_1y = 0$$$. We check if this line crosses a boundary between two bricks at $$$x = b$$$. We find the intersection that these lines have with each other, $$$(c, d)$$$. If both $$$c$$$ and $$$d$$$ are integers, we do not count the movement to the right since we already counted the movement upwards to the next brick. Now we check if $$$(c, d)$$$ is a point between two horizontally adjacent bricks or in the space inside a brick. To do this, we notice that for any odd $$$x$$$ value, the point brings us to a new brick if it's $$$y$$$ coordinate is in any range $$$[1, 2], [3, 4], \dots$$$ while for even values of $$$x$$$ the point brings us to a new brick if it's $$$y$$$ coordinate is any range $$$[0, 1], [2, 3], \dots$$$. My code checks this by looking at the parity of the x coordinate and the floor of the y coordinate of this point. If their parity is the same, it means that we move to a new brick to the right at that point. This gives an $$$O(x_1)$$$ solution.

For the complete solution, we have to deal with cases when $$$x_1$$$ is large. To do this, notice that if it is then for every range $$$y_1, y_2$$$ we cross right boundary lines multiple times. You can solve this by calculations based on the boundary points for each consecutive pairs of $$$y$$$, or by scaling down $$$x_1$$$ when you notice that if $$$x > 2y_1$$$ we are guaranteed to pass through a range of $$$(2y_1)$$$ when we move to a point 1 coordinate upwards, so we can calculate the answer by adding $$$y_1$$$ with the answer to $$$(x_1-2y_1, y_1)$$$. Through this we can make use of mods to bring the $$$x$$$ coordinate down to $$$2y$$$. Then our time complexity is $$$O(\min(x, y))$$$.

Code

#include <bits/stdc++.h>
using namespace std;
void solve() {
	long long x, y; cin>>x>>y;
	{
		long long ans = y;
		if (x > 2 * y) {
			long long c = (x-1) / (2*y);
			ans += c * (y);
			x = ((x-1) % (2 * y)) + 1;
		}
		for (int i = 1; i < x; i++) {
			long long y1 = (y * i)/x;
			if (y1*x==y*i) continue;
			if (i%2==1 && y1%2==1) {
				ans++;
			}
			else if (i%2==0 && y1%2==0) {
				ans++;
			}
		}
		cout<<ans<<endl;
	}
}
int main() {
	ios_base::sync_with_stdio(0); cin.tie(0); cout.sync_with_stdio(0);
	int t = 1;
	cin>>t;
	while (t--)
		solve();
	return 0;
}

M. Magic labyrinth

Hint 1

Hint 2

Hint 3

Solution

Code for the first method

#include<bits/stdc++.h>
 
using namespace std;
 
typedef long long int ll;
 
const int MOD = 1e9 + 7;

void mult(vector<vector<ll>>& a, vector<vector<ll>>& b){
	int n = (int)a.size();
	vector<vector<ll>> nw(n, vector<ll>(n));
	ll mx = 1e18;
	for(int i = 0; i < n; i++){
		for(int j = 0; j < n; j++){
			for(int q = 0; q < n; q++){
				if(q == 0) nw[i][j] = min(a[i][q] + b[q][j], mx);
				else nw[i][j] = min(nw[i][j], min(a[i][q] + b[q][j], mx));
			}
		}
	}
	a = nw;
}

vector<vector<ll>> exp(vector<vector<ll>> dp, int e){
	if(e == 1) return dp;
	if(e % 2 == 0){
		vector<vector<ll>> dp2 = exp(dp, e / 2);
		mult(dp2, dp2);
		return dp2;
	}else{
		vector<vector<ll>> dp2 = exp(dp, e / 2);
		mult(dp2, dp2); mult(dp2, dp);
		return dp2;
	}
}

void solve(){
	int n, m, k; cin >> n >> m >> k;
	vector<int> a(n);
	for(auto &i : a) cin >> i;
	vector<vector<int>> adj(n);
	for(int i = 0; i < m; i++){
		int u, v; cin >> u >> v; u--; v--;
		adj[u].push_back(v);
	}
	int additional = k % n;
	k /= n;
	vector<vector<ll>> ad(n);
	vector<vector<ll>> dp(n);
	for(int i = 0; i < n; i++){
		vector<ll> curr(n, 1e18);
		curr[i] = 0;
		for(int t = 1; t <= n; t++){
			vector<ll> lst = curr;
			curr.assign(n, 1e18);
			for(int j = 0; j < n; j++){
				curr[j] = min(curr[j], lst[j] + a[(j + (t - 1)) % n]);
				for(int x : adj[j]){
					curr[x] = min(curr[x], lst[j] + a[(j + (t - 1)) % n]);
				}
			}
			if(t == additional){
				ad[i] = curr;
			}
		}
		dp[i] = curr;
	}
	if(k == 0){
		vector<vector<ll>> ans = ad;
		ll res = 1e18;
		for(int i = 0; i < n; i++) res = min(res, ans[0][i]);
		cout << res << endl;
		return;
	}
	vector<vector<ll>> ans = exp(dp, k);
	if(additional > 0) mult(ans, ad);
	ll res = 1e18;
	for(int i = 0; i < n; i++) res = min(res, ans[0][i]);
	cout << res << endl;
}

signed main(){
    ios_base::sync_with_stdio(0);
    cin.tie(0);

    //~ int tt; cin >> tt;
    int tt = 1;
    for(int t = 1; t <= tt; t++){
        solve();
    }
}

Code for the second method

#include<bits/stdc++.h>
 
using namespace std;
 
typedef long long int ll;
 
const int MOD = 1e9 + 7;

void mult(vector<vector<ll>>& a, vector<vector<ll>>& b){
	int n = (int)a.size();
	vector<vector<ll>> nw(n, vector<ll>(n));
	ll mx = 1e18;
	for(int i = 0; i < n; i++){
		for(int j = 0; j < n; j++){
			for(int q = 0; q < n; q++){
				if(q == 0) nw[i][j] = min(a[i][q] + b[q][j], mx);
				else nw[i][j] = min(nw[i][j], min(a[i][q] + b[q][j], mx));
			}
		}
	}
	a = nw;
}

void solve(){
	int n, m, k; cin >> n >> m >> k;
	vector<int> a(n);
	for(auto &i : a) cin >> i;
	vector<vector<int>> adj(n);
	for(int i = 0; i < m; i++){
		int u, v; cin >> u >> v; u--; v--;
		adj[u].push_back(v);
	}
	int additional = k % n;
	k /= n;
	vector<vector<ll>> ad(n);
	vector<vector<ll>> dp(n);
	for(int i = 0; i < n; i++){
		vector<ll> curr(n, 1e18);
		curr[i] = 0;
		for(int t = 1; t <= n; t++){
			vector<ll> lst = curr;
			curr.assign(n, 1e18);
			for(int j = 0; j < n; j++){
				curr[j] = min(curr[j], lst[j] + a[(j + (t - 1)) % n]);
				for(int x : adj[j]){
					curr[x] = min(curr[x], lst[j] + a[(j + (t - 1)) % n]);
				}
			}
			if(t == additional){
				ad[i] = curr;
			}
		}
		dp[i] = curr;
	}
	if(k == 0){
		vector<vector<ll>> ans = ad;
		ll res = 1e18;
		for(int i = 0; i < n; i++) res = min(res, ans[0][i]);
		cout << res << endl;
		return;
	}
	vector<vector<ll>> ans = dp;
	k--;
	for(int b = 0; b < 30; b++){
		if((1 << b) > k) break;
		if((1<<b) & k){
			mult(ans, dp);
		}
		mult(dp, dp);
	}
	if(additional > 0) mult(ans, ad);
	ll res = 1e18;
	for(int i = 0; i < n; i++) res = min(res, ans[0][i]);
	cout << res << endl;
}

signed main(){
    ios_base::sync_with_stdio(0);
    cin.tie(0);

    //~ int tt; cin >> tt;
    int tt = 1;
    for(int t = 1; t <= tt; t++){
        solve();
    }
}

N. This Tree Problem Is Done For

Hint 1

Hint 2

Solution

It is easy to see that all possible splitting of the tree can be obtained by removing an edge and looking at the remaining subtrees. This leads us to an $$$O(N^2)$$$ solution where we try splitting the tree over every edge, then run a dp in each of the two remaining subtrees.

We can define $$$dp[x][0] = \text{maximum path that contains node x}$$$ and $$$dp[x][1] = \text{maximum path in the subtree of x}$$$. $$$dp[x][0]$$$ can be calculated by using the maximum $$$dp[i][0]$$$, where $$$i$$$ is a child of $$$x$$$. Meanwhile, $$$dp[x][1]$$$ can be calculated by using the two maximum $$$dp[i][0]$$$ and maximum $$$dp[i][1]$$$. With these dp states, we can easily update the values when attaching or removing children from a node. If we maintain a multiset storing all of the $$$dp[i][0]$$$ and $$$dp[i][1]$$$, then attaching a child becomes inserting a value into the multiset, and removing a child becomes removing a value from the multiset. $$$dp[x][0]$$$ then transitions to the largest value in the multiset of $$$dp[i][0]$$$, while $$$dp[x][1]$$$ transitions to the two largest values of $$$dp[i][0]$$$ and the largest value of the multiset of $$$dp[i][1]$$$.

Now, if our tree is rooted at $$$x$$$, we can effectively split the tree over every edge attached to $$$x$$$ by removing and adding children. We can also use this method to efficiently reroot the tree, thus allowing us to be able to split the tree over every edge. Lets say we are rerooting our tree from node $$$a$$$ to node $$$b$$$. To do this, we can remove $$$b$$$ from being a child of $$$a$$$, then attach $$$a$$$ to be a child of $$$b$$$ using the values computed after the first removal. Using this described method yields a solution of $$$O(N \text{ log } N)$$$, which if well implemented, will pass. However, we can actually optimize this further by only storing the three maximum values for each multiset instead of all of them. It is easy to see that those are all we need to support our operations.

There also exists other solutions such as binary searching on the answer for $$$O(N \text{ log } N)$$$ complexity and a greedy solution involving diameters for $$$O(N)$$$.

Code

#pragma GCC optimize("O3")
#pragma GCC optimization ("unroll-loops")
#pragma GCC target("avx,avx2,fma")
#pragma GCC target("sse,sse2,sse3,ssse3,sse4,popcnt,abm,mmx,tune=native")
#include <bits/stdc++.h>
using namespace std;

#define pb push_back
#define ff first
#define ss second

typedef long long ll;
typedef pair<int, int> pii;
typedef pair<ll, ll> pll;

const int INF = 1e9;
const ll LLINF = 1e18;
const int MOD = 1e9 + 7;

vector<pii> g[500005];

ll dp[500005][2];
multiset<ll, greater<ll>> deg[500005][2];

void dfs1(int x, int p = -1){
    deg[x][0].insert(0), deg[x][0].insert(0);
    for(pii i : g[x]){
        if(i.ff == p) continue;
        dfs1(i.ff, x);
        deg[x][0].insert(dp[i.ff][0] + i.ss);
        deg[x][1].insert(dp[i.ff][1]);
    }
    deg[x][1].insert(*deg[x][0].begin() + *next(deg[x][0].begin()));
    dp[x][0] = *deg[x][0].begin();
    dp[x][1] = *deg[x][1].begin();
    while(deg[x][0].size() > 3) deg[x][0].erase(prev(deg[x][0].end()));
    while(deg[x][1].size() > 3) deg[x][1].erase(prev(deg[x][1].end()));
}

ll ans;

void rem(int x, int t, ll v){
    multiset<ll, greater<ll>>::iterator it = deg[x][t].find(v);
    if(it != deg[x][t].end()) deg[x][t].erase(it);
}

void ins(int x, int t, ll v){
    deg[x][t].insert(v);
    while(deg[x][t].size() > 3) deg[x][t].erase(prev(deg[x][t].end()));
}

void move(int a, int b, int c){
    rem(a, 1, dp[b][1]);
    rem(a, 1, *deg[a][0].begin() + *next(deg[a][0].begin()));
    rem(a, 0, dp[b][0] + c);
    ins(a, 1, *deg[a][0].begin() + *next(deg[a][0].begin()));
    dp[a][0] = *deg[a][0].begin();
    dp[a][1] = *deg[a][1].begin();
    ans = max(ans, min(dp[a][1], dp[b][1]));
    rem(b, 1, *deg[b][0].begin() + *next(deg[b][0].begin()));
    ins(b, 0, dp[a][0] + c);
    ins(b, 1, *deg[b][0].begin() + *next(deg[b][0].begin()));
    ins(b, 1, dp[a][1]);
    dp[b][0] = *deg[b][0].begin();
    dp[b][1] = *deg[b][1].begin();
}

void dfs2(int x, int p = - 1){ 
    for(pii i : g[x]){
        if(i.ff == p) continue;
        move(x, i.ff, i.ss);
        dfs2(i.ff, x);
        move(i.ff, x, i.ss);
    }
}

const int BUFSIZE = 20 << 21;
char Buf[BUFSIZE + 1], *buf = Buf;

template<class T>
void scan(T &x){
    int neg = 1;
    for(x = 0; *buf < '0' || *buf > '9'; buf++) if(*buf == '-') neg = -1;
    while(*buf >= '0' && *buf <= '9') x = x*10 + (*buf - '0'), buf++;
    x *= neg;
}

void setIO(){
    fread(Buf, 1, BUFSIZE, stdin);
}

int main(){
    setIO();
    int t;
    scan(t);
    for(int tt = 1; tt <= t; tt++){
        int n;
        scan(n);
        for(int i = 0; i < n - 1; i++){
            int a, b, c;
            scan(a), scan(b), scan(c);
            g[a].pb({b, c});
            g[b].pb({a, c});
        }
        ans = 0;
        dfs1(1);
        dfs2(1);
        cout << ans << endl;
        for(int i = 1; i <= n; i++){
            g[i].clear();
            deg[i][0].clear();
            deg[i][1].clear();
        }
    }
}

O. Prefix queries

Hint 1

Hint 2

Hint 3

Solution

Code

#include<bits/stdc++.h>
 
using namespace std;

struct segTree{
    vector<long long> v;
    vector<long long> upd;
    int size;
    void init(int n){
        size = 1;
        while(size < n) size *= 2;
        v.assign(2 * size, 0);
        upd.assign(2 * size, 0);
    }
    void set(int l, int r, int x, int lx, int rx, long long u){
        if(lx >= l && rx <= r){
            v[x] += u * (rx - lx);
            upd[x] += u;
            return;
        }
        if(lx >= r || l >= rx) return;
        int m = (lx + rx) / 2;
        set(l, r, 2 * x + 1, lx, m, u);
        set(l, r, 2 * x + 2, m, rx, u);
        v[x] = v[2 * x + 1] + v[2 * x + 2] + upd[x] * (rx - lx);
    }
    void set(int l, int r, long long u){
        return set(l, r, 0, 0, size, u);
    }

    void build(vector<int>& a, int x, int lx, int rx){
        if (rx - lx == 1){
            if (lx < (int)a.size()){
                v[x] = a[lx];
            }
            return;
        }
        int m = (lx + rx) / 2;
        build(a, 2 * x + 1, lx, m);
        build(a, 2 * x + 2, m, rx);
        v[x] = v[2 * x + 1] + v[2 * x + 2];
    }
    void build(vector<int>& a){
        build(a, 0, 0, size);
    }

    pair<long long, int> sum(int l, int r, int x, int lx, int rx){
        if(lx >= l && rx <= r) return {v[x], rx - lx};
        else if(lx >= r || rx <= l) return {0, 0};
        int m = (lx + rx) / 2;
        pair<long long, int> s1 = sum(l, r, 2 * x + 1, lx, m);
        pair<long long, int> s2 = sum(l, r, 2 * x + 2, m, rx);
        return {s1.first + s2.first + upd[x] * (s1.second + s2.second), (s1.second + s2.second)};
    }

    long long sum(int l, int r){
        pair<long long, int> p = sum(l, r, 0, 0, size);
        return p.first;
    }
};


int main(){
    ios_base::sync_with_stdio(0);
    cin.tie(0);
 
	int n, q; cin >> n >> q;
	vector<int> a(n);
	set<int> positive; //Contains all the indices which could be potential answers.
	long long sum = 0;
	for(int i = 0; i < n; i++){
		int x; cin >> x;
		a[i] = x;
		if(i > 0 && x - sum >= 0) positive.insert(i);
		sum += x;
	}
	segTree st; st.init(n); st.build(a);
	while(q--){
		int l, r, x; cin >> l >> r >> x; l--; r--;
		st.set(l, r + 1, (long long)x);
		if(l > 0 && st.sum(l, l + 1) - st.sum(0, l) >= 0) positive.insert(l);
		bool done = 0;
		while((int)positive.size() > 0 && done == 0){
			int ind = *positive.begin();
			if(st.sum(ind, ind + 1) - st.sum(0, ind) >= 0){
				done = 1;
				cout << ind + 1 << "\n";
			}else{
				positive.erase(positive.begin());
			}
		}
		if(!done) cout << -1 << "\n";
	}
}

P. In Another World With My Range Query Problems

Hint 1

Hint 2

Solution

Code

#pragma GCC optimize("O3,unroll-loops")
#pragma GCC target("avx,avx2,fma")
#pragma GCC target("sse4,popcnt,abm,mmx,tune=native")
#include <bits/stdc++.h>
using namespace std;

#define pb push_back
#define ff first
#define ss second

typedef long long ll;
typedef pair<int, int> pii;
typedef pair<ll, ll> pll;

const int MOD = 1e9 + 7;

void setIO() {
    ios_base::sync_with_stdio(0); cin.tie(0);
}

int n, q;
int arr[200005];

struct node {

    int iia, ia, a, ii, i, sz;

    node(){
        iia = ia = a = sz = 0;
    }
};

node seg[800005];
int tag[800005];

void push_down(int x){
    if(!tag[x]) return;
    for(int i = x*2 + 1; i <= x*2 + 2; i++){
        seg[i].a = (seg[i].a + (ll)seg[i].sz*tag[x]%MOD)%MOD;
        seg[i].ia = (seg[i].ia + (ll)seg[i].i*tag[x]%MOD)%MOD;
        seg[i].iia = (seg[i].iia + (ll)seg[i].ii*tag[x]%MOD)%MOD;
        tag[i] = (tag[i] + tag[x])%MOD;
    }
    tag[x] = 0;
}

node pull(node a, node b){
    node ret;
    ret.iia = (a.iia + b.iia)%MOD;
    ret.ia = (a.ia + b.ia)%MOD;
    ret.ii = (a.ii + b.ii)%MOD;
    ret.a = (a.a + b.a)%MOD;
    ret.i = (a.i + b.i)%MOD;
    ret.sz = (a.sz + b.sz)%MOD;
    return ret;
}

void build(int l = 1, int r = n, int cur = 0){
    if(l == r){
        seg[cur].sz = 1;
        seg[cur].i = l;
        seg[cur].a = arr[l];
        seg[cur].ii = (ll)l*l%MOD;
        seg[cur].ia = (ll)l*arr[l]%MOD;
        seg[cur].iia = (ll)l*l%MOD*arr[l]%MOD;
        return;
    }
    int mid = (l + r)/2;
    build(l, mid, cur*2 + 1);
    build(mid + 1, r, cur*2 + 2);
    seg[cur] = pull(seg[cur*2 + 1], seg[cur*2 + 2]);
}

int get(node x, int l, int r){
    int ret = MOD - x.iia;
    (ret += (ll)x.ia*l%MOD) %= MOD;
    (ret += (ll)x.ia*r%MOD) %= MOD;
    (ret += MOD - (ll)x.a*l%MOD*r%MOD) %= MOD;
    (ret += MOD - (ll)x.a*l%MOD) %= MOD;
    (ret += (ll)x.a*r%MOD) %= MOD;
    (ret += x.a) %= MOD;
    return ret;
}

int query(int l, int r, int ul = 1, int ur = n, int cur = 0){
    if(l <= ul && ur <= r){
        return get(seg[cur], l, r);
    }
    if(ur < l || ul > r) return 0;
    push_down(cur);
    int mid = (ul + ur)/2;
    return (query(l, r, ul, mid, cur*2 + 1) + query(l, r, mid + 1, ur, cur*2 + 2))%MOD;
}

void update(int l, int r, int v, int ul = 1, int ur = n, int cur = 0){
    if(l <= ul && ur <= r){
        seg[cur].a = (seg[cur].a + (ll)seg[cur].sz*v%MOD)%MOD;
        seg[cur].ia = (seg[cur].ia + (ll)seg[cur].i*v%MOD)%MOD;
        seg[cur].iia = (seg[cur].iia + (ll)seg[cur].ii*v%MOD)%MOD;
        tag[cur] = (tag[cur] + v)%MOD;
        return;
    }
    push_down(cur);
    int mid = (ul + ur)/2;
    if(l <= mid) update(l, r, v, ul, mid, cur*2 + 1);
    if(r > mid) update(l, r, v, mid + 1, ur, cur*2 + 2);
    seg[cur] = pull(seg[cur*2 + 1], seg[cur*2 + 2]);
}

int main(){
    setIO();
    cin >> n >> q;
    for(int i = 1; i <= n; i++) cin >> arr[i];
    build();
    while(q--){
        int t, l, r;
        cin >> t >> l >> r;
        if(t == 1){
            cout << query(l, r) << endl;
        } else {
            int v;
            cin >> v;
            update(l, r, v);
        }
    }
}

Q. Another Floors Problem

A solution for this problem is not published yet. For now, please refer to this tester solution.

Code

# O(N*log(precision + MAXA*log(MAXA))

# ANALYZING WHY WE CAN'T EXPRESS ALL VALUES:
#
# The sum changes at x = b/z if for some i, z | a[i].
# However, there may be multiple such i, and so the sum "skips" a few values
# since multiple a transition (floor(ax) increases). This is why we can't express all integers.
#
# IDEA:
#
# The number of expressible integers = the number of x such that the sum increases.
#
# SOLUTION:
#
# Realize that for a fixed max x, we can do a dp on divisors to compute:
# transition_points[i] = # of x such that x in simplest form = b/i
#
# Then, the sum is increased to a new value at transition_points[i] x's if there exists an
# a that transitions at those points x = b/i => i | a.
#
# Thus, we can find # of expressible numbers below r and l-1 by binary searching on the maximum x
# (be careful about precision!).
# We can binary search on the integer part and then the fractional part.
# Subtract the values for the answer.


from math import floor

MAXA = 10**5


def expressible_numbers_below_bound(a, right_bound):
    # Binary search to find max_x

    # First binary search on the integer part of max_x
    l = 0
    r = 10**18

    while l != r:
        m = (l + r + 1) // 2

        tot_sum = sum(floor(m*val) for val in a)

        if tot_sum <= right_bound:
            l = m
        else:
            r = m-1

    # Now binary search on the fractional part of max_x
    fractional_l = 0
    fractional_r = 1
    # We can stop at <= 2e-10 actually
    while fractional_r - fractional_l > 1e-12:
        m = (fractional_l + fractional_r) / 2

        # This fails if abs(m - b/val) < 1e-15 and we have nlog(precision) calculations.
        # Thus, there is a 1e-9 chance of occurring over all calculations
        tot_sum = sum(l*val + floor(m*val) for val in a)

        if tot_sum <= right_bound:
            fractional_l = m
        else:
            fractional_r = m

    max_x_integer = l
    max_x_fractional = fractional_l

    # Now we find the number of expressible integers using 0 <= x <= max_x

    cnt = [0] * (MAXA + 1)

    for i in a:
        cnt[i] += 1

    divisors = [[] for _ in range(MAXA+1)]
    number_of_a_that_transition = [0] * (MAXA + 1)

    for i in range(1, MAXA+1):
        for j in range(i, MAXA+1, i):
            divisors[j].append(i)

            number_of_a_that_transition[i] += cnt[j]

    transition_points = [0] * (MAXA + 1)

    for i in range(1, MAXA + 1):
        for div in divisors[i]:
            if div != i:
                transition_points[i] -= transition_points[div]

        transition_points[i] += i*max_x_integer + floor(i*max_x_fractional)

    return sum((number_of_a_that_transition[i] > 0) * transition_points[i] for i in range(1, MAXA + 1))


n, l, r = map(int, input().split())
a = list(map(int, input().split()))

ans = expressible_numbers_below_bound(a, r) &mdash; expressible_numbers_below_bound(a, l-1)

print(ans)

R. Bingo

Solution for k = 20 that also happens to cheese and ac

Intended solution. Can be used to solve k = 27

Code

//misaka, hitori, and elaina will carry me to red
#include <iostream>
#include <cmath>
#include <utility>
#include <cassert>
#include <algorithm>
#include <vector>
#include <array>
#include <cstdio>
#include <cstring>
#include <functional>
#include <numeric>
#include <set>
#include <queue>
#include <map>
#include <chrono>
#include <random>

#define sz(x) ((int)(x.size()))
#define all(x) x.begin(), x.end()
#define pb push_back
#define eb emplace_back
#define kill(x, s) {if(x){ cout << s << "\n"; return ; }}
#define lsb(x) ((x)&(-(x)))
#define lg2(x) (31 &mdash; __builtin_clz(x))
#define pcnt(x) __builtin_popcount(x)


#ifndef LOCAL
#define cerr while(0) cerr
#endif

using ll = long long;
using lb = long double;

const lb eps = 1e-9;
const ll mod = 1e9 + 7, ll_max = 1e18;
//const ll mod = (1 << (23)) * 119 +1, ll_max = 1e18;
const int MX = 2e5 +10, int_max = 0x3f3f3f3f;

struct {
  template<class T>
  operator T() {
    T x; std::cin >> x; return x;
  }
} in;

using namespace std;

const int k = 5;
const int p = 5;
const int A = 25;

vector<int> mem[40];

array<int, A*A*A*A*A> val;
int cond(int x, int mask){
	int ans = 0, b = 1;
	for(int i = 0; i<k; i++){
		if(mask&(1 << i)){
			ans += ((x&(((1 << p)-1) << (i*p))) >> (i*p)) * b;
			b *= (1 << p);
		}
	}
	return ans;
}

int check(int x, int mask){
	for(int i = 0; i<k; i++){
		if(!(mask&(1 << i))){
			if(x&(((1 << p)-1) << (i*p))) return 0;
		}
	}
	return 1;
}
vector<int> sos(vector<int> a){
	int n = lg2(sz(a));
	for(int i = 0; i<n; i++){
		for(int j = 0; j<(1 << n); j++){
			if(j&(1 << i)){
				a[j] = min(a[j], a[j &mdash; (1 << i)]);
			}
		}
	}
	return a;
}
void solve(){
	int n = in;
	int mx = in;
	vector<pair<int, int>> small;
	val.fill(int_max);
	for(int i = 1; i<=n; i++){
		array<array<int, k>, k> board;
		for(int j = 0; j<k; j++){
			for(int h = 0; h<k; h++){
				board[j][h] = in;
				board[j][h]--;
			}
		}
		for(int j = 0; j<k; j++){
			unsigned int r = 0, c = 0;
			array<int, k> rr, cc;
			for(int h = 0; h<k; h++){
				r |= (1 << board[j][h]);
				c |= (1 << board[h][j]);
				rr[h] = board[j][h];
				cc[h] = board[h][j];
			}
			sort(all(rr));
			sort(all(cc));
			int r1 = 0, c1 = 0;
			int b = 1;
			for(int h = 0; h<k; h++){
				r1 += b*rr[h];
				c1 += b*cc[h];
				b *= A;
			}
			if(val[c1] == int_max){
				small.pb({c, i});
				val[c1] = i;
			}
			if(val[r1] == int_max){
				small.pb({r, i});
				val[r1] = i;
			}			
		}
	}
	for(int mask = 1; mask<(1 << k)-1; mask++){
		vector<int> a(cond((1 << (k*p))-1, mask)+1, int_max);
		for(auto [m, id] : small){
			if(check(m, mask)){
				a[cond(m, mask)] = min(a[cond(m, mask)], id);
			}
		}
		mem[mask] = sos(a);
	}	
	int q = in;
	for(int qaq = 1; qaq<=q; qaq++){
		array<int, A> perm, inv = perm;
		iota(all(perm), 0);
		for(int i = 0; i<mx; i++){
			perm[i] = in;
			perm[i]--;
		}
		for(int i = 0; i<A; i++){
			inv[perm[i]] = i;
		}
		int glob = 0;
		pair<int, int> ans = {int_max, int_max};
		for(int i = 0, wo = 0; i<A && wo == 0; i++){
			if(perm[i] < p*k)
				glob |= (1 << perm[i]);
			for(int mask = 1; mask<(1 << k)-1; mask++){
				int v = mem[mask][cond(glob, mask)];
				if(v != int_max){
					ans = min(ans, pair(i, v));
					wo = 1;
				}
			}
		}
		for(int i = 0; i<p; i++){
			for(int j = p; j<p*2; j++){
				for(int h = p*2; h<p*3; h++){
					for(int l = p*3; l<p*4; l++){
						for(int m = p*4; m<p*5; m++){
							int hsh = i + A*j + A*A*h + A*A*A*l + A*A*A*A*m;
							int t = max({inv[i], inv[j], inv[h], inv[l], inv[m]});
							if(val[hsh] != int_max) ans = min(ans, pair(t, val[hsh]));
						}
					}
				}
			}
		}
		cout << ans.second << " " << perm[ans.first]+1 << "\n";
	}
}

signed main(){
  cin.tie(0) -> sync_with_stdio(0);

  int T = 1;
  //cin >> T;
  for(int i = 1; i<=T; i++){
		//cout << "Case #" << i << ": ";
		solve();
	}
  return 0;
}

Full text and comments »

Tutorial of Teamscode Spring 2023 Contest

teamscode

willy108
13 months ago
2

The AI speaks for itself

By willy108, history, 17 months ago, In English

Full text and comments »

+202

willy108
17 months ago
5

Teamscode Summer 2021 Summary

By willy108, history, 3 years ago, In English

The long awaited editorial and CF gym for the TeamsCode Summer 2021 Contest is finally out! The CF gym is here with all 25 problems sorted in difficulty. In each problem at the bottom (after the sample explanation) are credits for each problem as well as in which divisions they appeared in. The editorial is linked in the form of a pdf in the CF gym and can also be found here.

The problem difficulties range from less than $$$800$$$ to well over $$$2500$$$ in terms of CF ratings. I challenge you to upsolve them. I know that the problemsetting team, codicon, Bossologist, Mantlemoose, Spark, and me, put a lot of work into making 25 quality problems this time around.

We also have a github with relevant materials as well as a Discord.

Special thanks to BucketPotato, lunchbox, Daveeed, and jli505 for testing the Advanced Division and Shreybob, Nikhil Chatterjee (nikhilc1527), and Ryan Chou for testing the Intermediate Division. Also massive props to PurpleCrayon for coordinating the round! We could not have done it without him. If there are any problems that you do not like, I guarantee you that Purple played a part in making it :).

Also thanks if you took the round! I know that a few of the problems were scuffed and harder than previous years, but I still hope you enjoyed! Now go upsolve the problems :)

Full text and comments »

Announcement of Teamscode Summer 2021

teamscode, purplecrayonorz

+117

willy108
3 years ago
12

[Tutorial] a few strange lca algorithms with a few strange time complexities pt 2 revised

By willy108, history, 3 years ago, In English

disclaimer: yet again i do not pretend to claim that this algorithm is useful. bin lifting is probably better in all aspects.

======================================================================================

intro

if you havent alr, consider reading this since most of my terminology will be from there.

cube root decomp

before i start, this algorithm is entirely useless. bin lifting has both a shorter impl and it has a better time complexity. but being able to understand this algorithm will help with the generalized algorithm later in this article.

so i first came up with this idea when i doing the CSES Distance Queries with my sqrt lca and it tle'd. so what i was thinking was "why on earth is sqrt lca so slow", then it hit me, sqrt per query is horrible (and i should learn bin lifting, but i would rather brainstorm useless algs like this instead of learning bin lifting tho). but then i thought, what if i used cube root instead of square root? then, i thought, the complexity would go from O(n^(1/2)) to O(n^(2/3)) as i had to loop over n^(2/3) segments of length n^1/3. but thankfully we can do better than that.

so lets do some defining of terms:

CUBE is a constant such that CUBE^3 >= n and CUBE is minimal (a fancy way of saying the cube root of n)

par[u] is the parent directly up from u

super[u] is redefined as the parent CUBE steps up from u

duper[u] is defined as the parent CUBE^2 steps up from u (i have great naming skills btw)

we'll get onto how to compute super and duper fast is a second, but first i'll show you why they help.

so first is the k_up function

int k_up(int u, int k){ //returns the k'th parent up from node u
   for(; k >= CUBE*CUBE; k -= CUBE*CUBE) u = duper[u];
   for(; k >= CUBE; k -= CUBE) u = super[u];
   for(;k--;) u = par[u];
   return u;
}

so what is the complexity of the above code? well, you will iterate the first loop at most CUBE times since there are at most n/(CUBE*CUBE) <= CUBE since k <= n and you go up CUBE*CUBE steps each time, its similar to how sqrt lca works. then you iterate the second loop also CUBE times at most, since after you finish the first loop k will be < CUBE*CUBE, and they are only CUBE CUBE's in CUBE*CUBE. the third loop will also run in CUBE time since k < CUBE after the second loop. and so this k_up implementation runs in O(CUBE) (hahah CUBE is a constant so its O(1) hahahh ahahah big O abuse hahaha).

now the important thing is the actual lca finding, so for two nodes on the same level, you can also use the duper/super/par array to find the lca of the two in O(CUBE) (if they are on different levels, just use the k_up function to move the lower one up). so lets say two nodes u and v (on the same level) have the same duper value, their lca will not be further from u (and v) than duper[u] is. since if it was further, you can take duper and it would be closer (this is more or less the same thing as the proof of correctness of the sqrt lca). if they are different, you set u = duper[u] and v = duper[v] and try again. this will happen at most CUBE times (just like the k_up complexity). then you can do the same thing with the super array. since the distance from u to duper[u] is exactly CUBE^2 and we know the lca is at least as close as duper[u], the problem just becomes the same thing with a tree size CUBE^2 (instead of CUBE^3 as it was previously), and then the tree becomes size CUBE with the par array, and you have an lca! this is very similar to the sqrt lca idea, its just that i used 2 arrays (duper and super) instead of 1 (super).

below is an implementation of the code.

int lca(int u, int v){
  if(dep[u] < dep[v]) swap(u, v); //im just yoinking this
  u = k_up(u, dep[u] - dep[v]);   //from my sqrt lca code
  while(duper[u] != duper[v]) u = duper[u], v = duper[v]; //you can just duper CUBE times before it becomes the root
  while(super[u] != super[v]) u = super[u], v = super[v]; //you can just super CUBE times before you actually just wouldve jumped duper again
  while(u != v) u = par[u], v = par[v]; //you can jump par CUBE times before you would've just jumped super
  return u; //or v since they should be equal
}

and this is O(CUBE) per lca query since k_up runs in O(CUBE) and each loop runs in O(CUBE). since each duper[u] is CUBE^2 nodes up and super[u] is CUBE up, you can just loop over super CUBE times and it'll work. below is some code since this'll come up later

void precomp(){
  //assume dep and par are computed elsewhere, if you dont know how to compute those, you shouldnt be reading abt lca :/
  for(int i = 1; i<=n; i++){ //assume n is global and there are n nodes in the tree
    super[i] = i;
    for(int i = 0; i < CUBE && super[i] != 0; i++) //optimization to stop if super goes out of the tree
      super[i] = par[super[i]]; //just looping par up CUBE times, like the sqrt lca but with CUBE
  }
  for(int i = 1; i<=n; i++){
    duper[i] = i;
    for(int i = 0; i<CUBE && duper[i]; i++)
     duper[i] = super[duper[i]]; //the same thing but jumping super up to save time

  }
}

the precomp complexity is O(n*CUBE) as the nested loops are, and queries and O(CUBE). yet again. you can do precomp in O(n) but im too lazy to cover it. you figured out how to do O(n) for sqrt precomp, its the same thing but with 2 arrays to maintain. this finally ac'ed the cses problem :D. since CUBE < SQRT this algorithm runs better (even if barely and more scuffed).

nth root lca

well, can we generalize it? what if you used 3 arrays super, duper, and juper (haha great naming) and did O(n^(1/4)) per query and O(n * n^(1/4)) for precomp, or 4 arrays for n^(1/5)? you can and i dont want to implement each one so.... the idea is that you can use R arrays (including the par array) to handle queries in O(R * n^(1/R)) with O(n * R * n^(1/R)) just note if you make R too big, nothing happens since you're jumping up by 1 or 0 each time. actually, if you set R to be log2(n) you end up with bin lifting. so imagine if i actually implemented decomp with n^(1/4) and then i realized i should make it a 2d array where super[u][j] stores the n^(j/4) parent up from u. then if i decided to not limit myself my 4 and i picked a constant R and super[u][j] stores to parent n^(j/R) up from u. you can actually just set the par array to be super[][0] since n^(0/R) is 1 and thats' exactly what the parent array stores. below is an implementation of the functions needed for lca (namely, k_up, lca, and precomp).

i left RT and LOG blank, that's for the reader to play with :), LOG is the exponent and RT is the "root"

super[u][j] is the parent LOG^j times up

base[i] = RT^i

par[u] is the parent

dep[u] is the distance from the root, dep[root] is arbitrary (0 or 1, your choice)

const int max_v = ;
const int RT = , LOG = ; //RT^LOG approx max_v
vector<int> adj[max_v];
int super[max_v][LOG * 2], par[max_v], dep[max_v], base[max_v], n, q; 
 
void dfs(int u, int p, int d){ //general util dfs, this O(n)
  par[u] = super[u][0] = p;
  dep[u] = d;
  for(int v : adj[u])
    if(v != p)
        dfs(v, u, d + 1);

}
 
void precomp(){ //three nested for loops so its just O(n * RT * LOG)
  base[0] = 1;
  for(int k = 1; k<=LOG; k++){
    base[k] = base[k - 1] * RT;
    for(int i = 1, j; i<=n; i++){
      for(j = 0, super[i][k] = i; j < RT && super[i][k]; j++){
        super[i][k] = super[super[i][k]][k - 1];
      }
    }
  }
}
 
int k_up(int u, int k){          //O(LOG*RT)
  for(int i = LOG; i >= 0; i--){ //similar proof of complexity as the cube root decomp
    while(k >= base[i])k -= base[i], u = super[u][i];
  }
  return u;
}
 
int LCA(int u, int v){
  if(dep[u] < dep[v]) swap(u, v);
  u = k_up(u, dep[u] - dep[v]);
  if(u == v) return u;
  for(int i = LOG; i >= 0; i--){ //this is always O(LOG*RT), just think abt the proof for cube root but then realizing the "root" we're using isnt constant.
    while(super[u][i] != super[v][i]) u = super[u][i], v = super[v][i];
  }
  return (par[u]) ? par[u] : u; //cant return 0
}

hopefully, it makes sense, it's just compressing the idea described above with some nested for loops and 2d arrays. so it is O(n * RT * LOG) for precomp and O(RT * LOG) per query. just note we were playing with small values of LOG (2 and 3) so we didnt really care abt it, but when you use anything more, it's no longer "constant" if you see what i mean.

resolution?

thank you for reading this scuffed blog post and please do in fact learn bin lifting, it cleaner than my "nth root decomp" and it runs faster too (unless you set RT to 2 and LOG to log2(n) >:) ). the advantages of choosing this method only lies is you can trade memory for time easily. if you choose RT to be larger, you'll use less memory, and if you set RT to be small, you'll use more. the memory complexity is always O(n * LOG) since that's the size of the super array. yet again, please do learn bin lifting, this article is what came out of someone who was too lazy to learn it. and after doing all of this, i always write bin lifting for lca. hahah

thanks for reading and i apologize for any typoes, unclearness, or over scuffedness.

Full text and comments »

lca, #trees, #implementaion, #c++, useless, cube root

willy108
3 years ago
4

[Tutorial] a few strange lca algorithms with a few strange time complexities pt 1

By willy108, history, 3 years ago, In English

Disclaimer: I will not promise that this blog will make you code lca better. binary lifting is generally better than the following algorithm and i am only sharing it since i find it very interesting.

===================================================================================

intro (skip this if you know what lca is)

if you didnt know, lca stands for least common ancestor (and implies a rooted tree). so any ancestor of a node u. is any node on u's path to the root node (including the root itself). in the diagram below nodes 1 and 2 are both ancestors of node 4. so common ancestors of nodes u and v are the nodes that are both ancestors of u and ancestors of v. the least common ancestor of nodes u and v is first node that u and v share as an ancestor (first meaning the ancestor with the largest depth). and you can see in the picture below the lca of 4 and 6 is 2, since that's the node with the furthest depth from the root that is both an ancestor of u and an ancestor of v. 1 does not count as the lca since 2 is further down and 5 does not count since it is not an ancestor of 4 (or 6 for that matter). for any pair of nodes on a rooted tree there is only one lca (hopefully this is intuitive), and this blog post describes ways to find that lca.

here is an image (from google search) of a tree. remember lca only works on a rooted tree since you have a sense of "up" and "down" only if there is a root

Sqrt LCA

imagine if we had a function k_up where k_up(u, k) returns the k'th node up from u. so from the diagram above k_up(2, 1) is 1 and k_up(8, 2) is also 1. this will be very helpful to do lca as we will see later. the array par[] stores for each u the direct parent of u (the parent of the root node is an imaginary node, 0 or -1 depending upon your implementation). in the diagram above par[2] = 1, par[5] = 2, and par[8] = 3.

so in all of the following code assume the par array is already calcutated, as for how to calculate it.... go google it.

int k_up(int u, int k){
   for(int i = 0; i<k; i++){
      u = par[u];
   }
   return u;
}

so what is the complexity of the above code? its O(k) since you loop over k to find par[u] k times. darn that's slow. i really wish we could do that faster. well that's the point of this blog.

so now lets pick a define a constant R, all we have to know abt R is that it's a constant <= the number of nodes on the tree. now for each u we define super[u] as the parent of u R times up (super for superparent, i love that word "superparent"). in the case that going k times from u takes us higher than the tree allows supor[u] = -1. so how does this help? so now in k_up(u, k) we can first loop over floor(k/R) times the superparent then we loop over k%R times on the parent array. so in total we move up floor(k/R)*R + k%R times (or k times :OOO). now the complexity is reduced to O(k/R + R) since the first half can only take k/R turns at most and the second half can take R steps at most. below is some code of the idea

int k_up(int u, int k){
   while(k >= R) k = k-R, u = super[u];
   for(int i = 0; i<k; i++) u = par[u];
   return u;
}

now there are a few problems, namely how to find super[] and what is R, If we set R to be sqrt(n), O(k/R + R) is minimized. (hopefully the intuition makes sense), in fact picking R like this is so common its even got a name: "SQRT decomp". and to find super, you can for each u, loop up R times to find the parent R steps up. you can do this even faster, but im too lazy to cover that.

be sure you understand all of this since the concept of a k_up function will come up a lot later in this blog.

now onto the actual lca part. so consider a rooted tree and any two nodes u and v that are on the same level or have the same distance from the root. if we just marched from each node taking 1 step from each at the same time, the first node where they are the same is their lca. (note this only works if u and v start on the same level). so below is an implementation of the idea

int lca(int u, int v){ //remember that they have the same depth
  while(u != v){ 
    u = par[u], v = par[v];
  }
  return u;
}

so whats the complexity of this code? its O(d) where d is the difference of depth from the lca to node u (or v). this at worst case can be O(n) where n is the number of nodes in the tree (imagine a chain). so what can we do to speed it up? let us refer to the super array again. so if super[u] == super[v] then we know that the lca of u and v has to be super[u] or further down the tree. since if it was further up, we'd just take super[u] instead since super[u] is an ancestor of u and super[v] is an ancestor of v (and they are the same :O). so now (remember nodes u and v have the same depth) we can just loop over the super[u] and super[v] while they are different, and when they are the same, we'll loop over the parent array. below is the code for this idea.

int lca(int u, int v){ //remember that they have the same depth
  while(super[u] != super[v]){ 
    u = super[u], v = super[v];
  }
  while(u != v){
    u = par[u], v = par[v];
  }
  return u;
}

what is the complexity of the above code? its O(n/R + n%R) worst case. which is also O(sqrt(n)) since R is sqrt(n). sadly this only find the lca when the two nodes have the same depth from the root. luckily this is where our k_up function comes in handy. so if we define dep[u] as the depth of node u from the root and dep[root] = 1, then we can just set u to be the further down node out of u and v and then make u = k_up(u, dep[u] — depv]). and now it becomes lca on the same depth. below is the implementation of the idea.

int k_up(int u, int k){
   while(k >= R) k = k/R, u = super[u];
   for(int i = 0; i<k; i++) u = par[u];
   return u;
}

int lca(int u, int v){
  if(dep[u] < dep[v]) swap(u, v); //setting u to be the node with greater depth
  u = k_up(u, dep[u] - dep[v]);   //moving u up to the same level at v
  while(super[u] != super[v]){    //iterating over super
    u = super[u], v = super[v];
  }
  while(u != v){                  //ieterating over par
    u = par[u], v = par[v];
  }
  return u;                       //u and v will be the same, so returnv works too
}

since k_up is also O(root(n)) worst case, the. overall query is still O(root(n)) in time complexity.

and our lca implemention is complete! its O(n sqrt(n)) precomp (or O(n) if you are smart abt it, try figuring out how later :D) and its O(sqrt(n)) per query. a more complete implementaion can be found here (along with calculating the par, super, and dep arrays).

Conclusion

the overall time complexity is O((n+q)sqrt(n)) and the memory is O(n) since we just have to store par, super, and dep arrays. but if you squish the code, it becomes a pretty short impl (and slow) and you can make the compleixty O(n + q*sqrt(n)) if you want.

please remember O(sqrt(n)) for lca queries is really slow. reaaallllly slow. there are better lca algorithms but this is cool one i wanted to introduce. also note the actually fun lca algorithm (that's not bin lifiting) will be on the next blog post since this one got too long. rip.

thank you reading and i apologize for any typos, instances of unclearness, and bugs in the code.

Full text and comments »

#lca, sqrt decomposition, #trees, #algorithms, #implementaion, #c++

willy108
3 years ago
2

std::stable_sort vs std::sort

By willy108, history, 3 years ago, In English

This is my first blog post, so it probably will end up being scuffed.

==============================

The problem

So I was working on CF 472D, Design Tutorial: Inverse the Problem and it requires an MST (sorry for spoiling) and I chose to use Kruskals MST to do this (just note that I could've avoided this issue by using any other MST alg, but that's not the point here). So I just coded vanilla Kruskals where I std::sort'ed the edges and used a DSU with path compression and union by size. And I submitted the code and lo and behold, it was TLE on tc 39! I entered into a state of depression and decided to change my std::sort to std::stable_sort and wow, it ac'ed (with 1934ms on a 2 second TL)! Well I was talking some people on Discord later and I this up and one of them told me that the only reason std::sort was slow was since I had used c++11 (which I did) instead of c++17 where std::sort was upgraded. So I submitted it again with std::sort and c++17 and yay it passed (with 1466ms)! and ~470ms faster than my last submission! But to satisfy my curiosity I submitted it again with c++17 and std::stable_sort and woah, it passed with 1154ms, some 310ms faster than the last one.

Please do not judge my template/coding style as that is not the point here, but if you look at my code, the only differences between the submissions are the submission settings and a different sort on line 65 (or the second line of the kruskals function).

the submissions from each correlate to:

1154ms, c++17 with stable_sort
1466ms, c++17 with sort
1934ms, c++11 with stable_sort
TLE tc 39, c++11 with sort

also note I did not benchmark memory since that was not something that bothered me in all of this

===============================

The resolution?

So here is one (of probably very few) situations where std::stable_sort outperformed std::sort. The problem that I have right now is that I do not want to miss a submission in a future contest over which sort I chose, since there are definitely problems out here where this problem cannot be avoided by something just as simple as using Prim instead of Kruskal.

If anyone has a good suggestion of which to use (std::stable_sort or std::sort) or a simple impl of a sorting alg that I can write up a little more time for similar results, please link it. I will probably just end up using stable_sort from now on since that was what made a difference here unless there is a really convincing argument or implementation that'll make me switch. No upvoting is needed (unless you want to :D), I just need the help. Thanks for reading and I apologize for any typos, unclear sections, and overall scuffedness.

Full text and comments »

sorting algorithms, c++11, c++17

willy108
3 years ago
9