#	User	Rating
1	tourist	3985
2	jiangly	3814
3	jqdai0815	3682
4	Benq	3529
5	orzdevinwang	3526
6	ksun48	3517
7	Radewoosh	3410
8	hos.lyric	3399
9	ecnerwala	3392
9	Um_nik	3392

#	User	Contrib.
1	cry	169
2	maomao90	162
2	Um_nik	162
4	atcoder_official	161
5	djm03178	158
6	-is-this-fft-	157
7	adamant	155
8	awoo	154
8	Dominater069	154
10	luogu_official	150

After 21 days and 56 submissions on IOI 2010 Maze, I finally broke the 100 point barrier and achieved a score of 100.081 / 100.

Score distribution Page 3 of submissions

Page 2 of submissions

Page 1 of submissions

Methodology

It's just simulated annealing + a lot a lot of time.

The neighbour function to generate a new state was just randomly choosing one cell to change from '$$$\text{#}$$$' to '$$$\text{.}$$$' or from '$$$\text{.}$$$' to '$$$\text{#}$$$'. Remember to take care that there must be exactly one '$$$\text{.}$$$' at the edge of the maze at all times.

The energy function that we are optimizing is the question itself, which is the maximum length of the shortest path.

The acceptance probability function is the classic exponential function based on the Boltzmann probability distribution.

Finally, the initial temperature used was $$$t_0 = 2.5$$$ with geometric temperature reduction $$$t' = t\cdot \alpha$$$ where $$$\alpha = 0.999999999$$$.

I did not do any optimisation for the energy function, so each iteration takes $$$O(RC)$$$, which is quite slow considering the extremely big $$$\alpha$$$ used. This is why I spent 21 days on this question as each run takes around 1 week to converge on the final answer 🤡.

Code

#include <bits/stdc++.h>
using namespace std;

// Ascending half-open loop: i takes the values j, j + 1, ..., k - 1.
#define REP(i, j, k) for (int i = (j); i < (k); i++)
// Descending inclusive loop: i takes the values j, j - 1, ..., k.
#define RREP(i, j, k) for (int i = (j); i >= (k); i--)

// "Min-to": lowers `a` to `b` when `b` is strictly smaller.
// Returns true if `a` was changed, false otherwise.
template <class T>
inline bool mnto(T &a, const T b) {
	if (!(a > b)) {
		return false;
	}
	a = b;
	return true;
}
// "Max-to": raises `a` to `b` when `b` is strictly larger.
// Returns true if `a` was changed, false otherwise.
template <class T>
inline bool mxto(T &a, const T b) {
	if (!(a < b)) {
		return false;
	}
	a = b;
	return true;
}

// Short aliases for common numeric types.
typedef long long ll;
typedef long double ld;
// Shorthand for pair members: p.FI is p.first, p.SE is p.second.
#define FI first
#define SE second
// Pair aliases; `ii` is used throughout this file as a (row, column) cell.
typedef pair<int, int> ii;
typedef pair<ll, ll> pll;
// ALL(x) expands to the begin/end iterator pair of x.
#define ALL(x) x.begin(), x.end()
// SZ(x) is x.size() cast to int, so it can be compared with int indices.
#define SZ(x) (int) x.size()
#define pb push_back
// Vector and tuple aliases.
typedef vector<int> vi;
typedef vector<ll> vll;
typedef vector<ii> vii;
typedef tuple<int, int, int> iii;
typedef vector<iii> viii;

// Sentinel distance; calcEnergy() uses it to mark cells not yet reached by the BFS.
const int INF = 1000000005;
// 64-bit counterpart of INF (not referenced by the code in this file).
const ll LINF = 1000000000000000005;
// Side length of the static distance array d[][]; the grid must fit inside it.
const int MAXN = 205;
// T is the initial temperature; A is the factor the temperature is multiplied
// by after every annealing iteration.
const ld T = 2.5, A = 0.999999999;
// Row/column offsets of the four orthogonal neighbours of a cell.
const int diri[] = {1, 0, -1, 0}, dirj[] = {0, 1, 0, -1};

// Random generator seeded from the clock, so every run differs.
mt19937 rnd(chrono::high_resolution_clock::now().time_since_epoch().count());

// Grid dimensions: n rows, m columns.
int n, m;
// The maze: '.' is open, '#' is a changeable wall, 'X' cells are never modified.
vector<string> g;
// sides: non-corner border cells that are not 'X'.
// all:   every non-corner cell that is not 'X' (candidates for a move).
vii sides, all;
// The single open border cell; calcEnergy() starts its BFS here.
ii src;
// Current annealing temperature.
ld t;

// BFS distance of each cell from src (the source itself has distance 1).
int d[MAXN][MAXN];
// BFS work queue; it is always empty again when calcEnergy() returns.
queue<ii> bfs;
int calcEnergy() {
	REP (i, 0, n) {
		REP (j, 0, m) {
			d[i][j] = INF;
		}
	}
	d[src.FI][src.SE] = 1;
	bfs.push(src);
	int res = 1;
	while (!bfs.empty()) {
		auto [i, j] = bfs.front(); bfs.pop();
		REP (k, 0, 4) {
			int ni = i + diri[k], nj = j + dirj[k];
			if (ni < 0 || ni >= n || nj < 0 || nj >= m) {
				continue;
			}
			if (g[ni][nj] != '.') {
				continue;
			}
			if (d[ni][nj] == INF) {
				d[ni][nj] = d[i][j] + 1;
				res = d[ni][nj];
				bfs.push({ni, nj});
			}
		}
	}
	return res;
}
bool accept(int newEnergy, int oldEnergy) {
	if (newEnergy >= oldEnergy) {
		return 1;
	}
	uniform_real_distribution<ld> dist;
	return dist(rnd) < exp((newEnergy - oldEnergy) / t);
}

int main(int argc, char* argv[]) {
	char tc = argv[1][0];
	char inname[20];
	sprintf(inname, "field%c.txt", tc);
	ifstream fin(inname);
	string tmp;
	while (fin >> tmp) {
		g.pb(tmp);
	}
	fin.close();
	n = SZ(g), m = SZ(g[0]);
	REP (i, 1, n - 1) {
		for (int j : {0, m - 1}) {
			if (g[i][j] == 'X') {
				continue;
			}
			sides.pb({i, j});
		}
	}
	REP (j, 1, m - 1) {
		for (int i : {0, n - 1}) {
			if (g[i][j] == 'X') {
				continue;
			}
			sides.pb({i, j});
		}
	}
	REP (i, 0, n) {
		REP (j, 0, m) {
			if ((i == 0 && j == 0) || (i == 0 && j == m - 1) || 
					(i == n - 1 && j == 0) || (i == n - 1 && j == m - 1)) {
				continue;
			}
			if (g[i][j] == 'X') {
				continue;
			}
			all.pb({i, j});
		}
	}
	src = {-1, -1};
	for (auto [i, j] : sides) {
		if (g[i][j] == '.') {
			src = {i, j};
			break;
		}
	}
	if (src.FI == -1) {
		int r = rnd() % SZ(sides);
		src = sides[r];
		g[sides[r].FI][sides[r].SE] = '.';
		REP (i, 1, n - 1) {
			REP (j, 1, m - 1) {
				if (g[i][j] == 'X') {
					continue;
				}
				if (rnd() % 10 < 7) {
					g[i][j] = '.';
				}
			}
		}
	}
	t = T;
	int curEnergy = calcEnergy();
	int bestEnergy = curEnergy;
	vector<string> bestg = g;
	unsigned int cnt = 0;
	while (1) {
		if ((cnt & ((1 << 23) - 1)) == 0) {
			cerr << t << ' ' << curEnergy << '\n';
			char outname[20];
			sprintf(outname, "maze%c.txt", tc);
			ofstream fout(outname);
			REP (i, 0, n) {
				fout << bestg[i] << '\n';
			}
			fout.close();
		}
		cnt++;
		int id = rnd() % SZ(all);
		int r = -1;
		ii osrc = src;
		if (all[id].FI == 0 || all[id].FI == n - 1 || 
				all[id].SE == 0 || all[id].SE == m - 1) {
			g[osrc.FI][osrc.SE] = '#';
			if (osrc == all[id]) {
				r = rnd() % SZ(sides);
				src = sides[r];
			} else {
				src = all[id];
			}
			g[src.FI][src.SE] = '.';
		} else {
			if (g[all[id].FI][all[id].SE] == '#') {
				g[all[id].FI][all[id].SE] = '.';
			} else {
				g[all[id].FI][all[id].SE] = '#';
			}
		}
		int newEnergy = calcEnergy();
		if (newEnergy >= bestEnergy) {
			bestEnergy = newEnergy;
			bestg = g;
		}
		if (accept(newEnergy, curEnergy)) {
			curEnergy = newEnergy;
		} else {
			if (all[id].FI == 0 || all[id].FI == n - 1 || 
					all[id].SE == 0 || all[id].SE == m - 1) {
				g[src.FI][src.SE] = '#';
				g[osrc.FI][osrc.SE] = '.';
				src = osrc;
			} else {
				if (g[all[id].FI][all[id].SE] == '#') {
					g[all[id].FI][all[id].SE] = '.';
				} else {
					g[all[id].FI][all[id].SE] = '#';
				}
			}
		}
		t *= A;
	}
	return 0;
}

Takeaways

For such a brain-dead solution, I actually learnt quite a lot of things about simulated annealing. Below is a short list of items to take note of while doing simulated annealing.

As the wise SGP IOI trainer bensonlzl told me: "Always write your intermediate solution to a file so that you can still get partial scores if it doesn't finish running before the contest ends". Writing to file can be quite time-consuming, so I only do it every ~8 million iterations ($$$2^{23}$$$ in the code above).
To choose a good $$$t_0$$$ and $$$\alpha$$$, I normally start with a high $$$t_0$$$ and a low $$$\alpha$$$, then print the temperature and the energy function after each iteration. Then, I try to choose a $$$t_0$$$ where the energy is not completely random but at the same time there are significant jumps in energy to ensure that enough exploration takes place. I binary search on the $$$\alpha$$$ to use based on how slowly the temperature decreases over time and try to pick the one that is neither too slow nor too fast.
Most of the time running the simulated annealing for a longer time with bigger $$$\alpha$$$ is better than trying to improve a previous solution by letting the initial state be the previous solution and starting with a lower $$$t_0$$$. This is probably because the latter has a higher chance to be stuck in a local minimum.
In a real 5-hour contest scenario, do not spend too much time on the output-only problem. Spend a short time coding the simulated annealing and work on the remaining problems while the code is running in the background. Do not be like me and spend the majority of the contest trying to increase my score from ~80 to ~90 and end up having a low score on the other problems.

Special Thanks

Of course, this could not have been done without the help of the following people:

bensonlzl, the SGP IOI trainer, for teaching me simulated annealing and including this problem in one of the training contests.
rainboy for giving me the motivation to get higher than him as he was the first place before I beat him.
jamessngg for helping me to solve test case 8 by hand and buying purple candy for the SGP IOI team.
pavement for giving moral support and suggestions as part of the SGP IOI team.
NUS for supplying electricity so that I can keep the NUS computer on for 3 consecutive weeks while running the simulated annealing.

Multiple terminals running simulated annealing

Conclusion

Feel free to try to beat my score or tell me about any possible optimizations in the comments.

Comments (11)

Show archived | Write comment?

joyfullife

17 months ago, # |

orz

(I am familiar with the recent blogs and stuff but I couldn't bear it lol)

→ Reply

eternal_happiness

wtf this is wild

vitosevskich

You must be Chuck Norris

jonathanirvings

← Rev. 2 →

+217

Headlines of similar feel:

358 years after its formulation, a mathematician proved Fermat's Last Theorem, costing years of research.
36 years after its release, a speedrunner finished Super Mario Bros faster than 4 minutes 55 seconds, costing countless hours of attempts.
13 years after IOI 2010, a competitive programmer broke the 100 point barrier for Maze, costing 3 consecutive weeks of NUS computational power.

NeoYL

If you were in IOI 2010, you might be the first to get >600 pointssss xd

maomao90

17 months ago, # ^ |

+47

If IOI 2010 was three weeks long maybe

+58

Also, Tourist got 778 points at IOI 2010, ~~he is that good~~ IOI 2010 was the last IOI (to date) to have 8 tasks.

bIeah

6 months ago, # ^ |

-33

Let's keep it that way.

drdilyor

Is it possible to recalculate the score function after the change in O((R + C) log (R+C)), or even in O(R + C)? that would improve efficiency by a lot. But probably using different score function, that better fits simulated annealing and is easier to optimize, is better.

Also, I ran my own simulated annealing overnight and it found a better solution to the 9th test, other runs got corrupted smh and the output was gibberish :,(

https://oj.uz/submission/805436
code: https://pastebin.com/0iFixk2p

Hmm do you have a suggestion for the different score function?

Thanks for telling me that there is a better solution for the 9th test. I thought that it was already the optimal, so I stopped running the simulated annealing for the 9th test. Maybe I'll try to rerun it to see whether I can get a better result.

I have no idea tbh :)

maomao90's blog

Methodology

Takeaways

Special Thanks

Conclusion