№	Пользователь	Рейтинг
1	tourist	4009
2	jiangly	3821
3	Benq	3736
4	Radewoosh	3631
5	jqdai0815	3620
6	orzdevinwang	3529
7	ecnerwala	3446
8	Um_nik	3396
9	ksun48	3388
10	gamegame	3386

№	Пользователь	Вклад
1	cry	164
1	maomao90	164
3	Um_nik	163
4	atcoder_official	161
5	-is-this-fft-	158
6	awoo	157
7	adamant	156
8	TheScrasse	154
8	nor	154
10	Dominater069	153

After 21 days and 56 submissions on IOI 2010 Maze, I finally broke the 100 point barrier and achieved a score of 100.081 / 100.

Score distribution Page 3 of submissions

Page 2 of submissions

Page 1 of submissions

Methodology

It's just simulated annealing + a lot a lot of time.

The neighbour function to generate a new state was just randomly choosing one cell to change from '$$$\text{#}$$$' to '$$$\text{.}$$$' or from '$$$\text{.}$$$' to '$$$\text{#}$$$'. Remember to take care that there must be exactly one '$$$\text{.}$$$' at the edge of the maze at all times.

The energy function that we are optimizing is the problem's own objective: the length of the longest shortest path from the entrance to any reachable cell.

The acceptance probability function is the classic exponential function based on the Boltzmann probability distribution.

Finally, the initial temperature used was $$$t_0 = 2.5$$$ with geometric temperature reduction $$$t' = t\cdot \alpha$$$ where $$$\alpha = 0.999999999$$$.

I did not do any optimisation for the energy function, so each iteration takes $$$O(RC)$$$, which is quite slow considering the extremely big $$$\alpha$$$ used. This is why I spent 21 days on this question as each run takes around 1 week to converge on the final answer 🤡.

Code

#include <bits/stdc++.h>
using namespace std;

// Loop shorthands used throughout this file.
// REP(i, j, k): i ascends over the half-open range [j, k).
#define REP(i, j, k) for (int i = (j); i < (k); i++)
// RREP(i, j, k): i descends from j down to k, both ends inclusive.
#define RREP(i, j, k) for (int i = (j); i >= (k); i--)

// Lowers `a` to `b` when `b` is strictly smaller.
// Returns true exactly when `a` was overwritten.
template <class T>
inline bool mnto(T &a, const T b) {
	if (!(a > b)) {
		return false;
	}
	a = b;
	return true;
}
// Raises `a` to `b` when `b` is strictly larger.
// Returns true exactly when `a` was overwritten.
template <class T>
inline bool mxto(T &a, const T b) {
	if (!(a < b)) {
		return false;
	}
	a = b;
	return true;
}

// Short aliases for the numeric types used in this file.
typedef long long ll;
typedef long double ld;
// FI / SE abbreviate the two members of a pair.
#define FI first
#define SE second
// ii is used below for (row, column) grid coordinates.
typedef pair<int, int> ii;
typedef pair<ll, ll> pll;
// ALL(x) expands to the begin/end iterator pair of container x.
#define ALL(x) x.begin(), x.end()
// SZ(x) is the container size cast to int, so it can be mixed with signed indices.
#define SZ(x) (int) x.size()
#define pb push_back
// Vector and tuple aliases built on the types above.
typedef vector<int> vi;
typedef vector<ll> vll;
typedef vector<ii> vii;
typedef tuple<int, int, int> iii;
typedef vector<iii> viii;

// Sentinel stored in the BFS distance table for cells that have not been reached.
const int INF = 1000000005;
// 64-bit counterpart of INF; not referenced by the code visible in this file.
const ll LINF = 1000000000000000005;
// Side length of the static distance table d[][]; the grid has to fit inside it.
const int MAXN = 205;
// Annealing schedule: T is the starting temperature, A is the factor the
// temperature is multiplied by after every iteration.
const ld T = 2.5, A = 0.999999999;
// Row / column offsets of the four orthogonal neighbours of a cell.
const int diri[] = {1, 0, -1, 0}, dirj[] = {0, 1, 0, -1};

// Random source for every stochastic decision; seeded from the clock, so runs are not reproducible.
mt19937 rnd(chrono::high_resolution_clock::now().time_since_epoch().count());

// n = number of grid rows read from the input, m = length of the first row.
int n, m;
// Current maze state: main flips cells between '#' and '.', and never modifies 'X' cells.
vector<string> g;
// sides: non-corner border cells that are not 'X' (candidate entrances).
// all: every non-corner cell that is not 'X' (candidate cells for a move).
vii sides, all;
// The border cell that is currently open ('.'); calcEnergy starts its BFS here.
ii src;
// Current annealing temperature.
ld t;

int d[MAXN][MAXN];
queue<ii> bfs;
int calcEnergy() {
	REP (i, 0, n) {
		REP (j, 0, m) {
			d[i][j] = INF;
		}
	}
	d[src.FI][src.SE] = 1;
	bfs.push(src);
	int res = 1;
	while (!bfs.empty()) {
		auto [i, j] = bfs.front(); bfs.pop();
		REP (k, 0, 4) {
			int ni = i + diri[k], nj = j + dirj[k];
			if (ni < 0 || ni >= n || nj < 0 || nj >= m) {
				continue;
			}
			if (g[ni][nj] != '.') {
				continue;
			}
			if (d[ni][nj] == INF) {
				d[ni][nj] = d[i][j] + 1;
				res = d[ni][nj];
				bfs.push({ni, nj});
			}
		}
	}
	return res;
}
bool accept(int newEnergy, int oldEnergy) {
	if (newEnergy >= oldEnergy) {
		return 1;
	}
	uniform_real_distribution<ld> dist;
	return dist(rnd) < exp((newEnergy - oldEnergy) / t);
}

int main(int argc, char* argv[]) {
	char tc = argv[1][0];
	char inname[20];
	sprintf(inname, "field%c.txt", tc);
	ifstream fin(inname);
	string tmp;
	while (fin >> tmp) {
		g.pb(tmp);
	}
	fin.close();
	n = SZ(g), m = SZ(g[0]);
	REP (i, 1, n - 1) {
		for (int j : {0, m - 1}) {
			if (g[i][j] == 'X') {
				continue;
			}
			sides.pb({i, j});
		}
	}
	REP (j, 1, m - 1) {
		for (int i : {0, n - 1}) {
			if (g[i][j] == 'X') {
				continue;
			}
			sides.pb({i, j});
		}
	}
	REP (i, 0, n) {
		REP (j, 0, m) {
			if ((i == 0 && j == 0) || (i == 0 && j == m - 1) || 
					(i == n - 1 && j == 0) || (i == n - 1 && j == m - 1)) {
				continue;
			}
			if (g[i][j] == 'X') {
				continue;
			}
			all.pb({i, j});
		}
	}
	src = {-1, -1};
	for (auto [i, j] : sides) {
		if (g[i][j] == '.') {
			src = {i, j};
			break;
		}
	}
	if (src.FI == -1) {
		int r = rnd() % SZ(sides);
		src = sides[r];
		g[sides[r].FI][sides[r].SE] = '.';
		REP (i, 1, n - 1) {
			REP (j, 1, m - 1) {
				if (g[i][j] == 'X') {
					continue;
				}
				if (rnd() % 10 < 7) {
					g[i][j] = '.';
				}
			}
		}
	}
	t = T;
	int curEnergy = calcEnergy();
	int bestEnergy = curEnergy;
	vector<string> bestg = g;
	unsigned int cnt = 0;
	while (1) {
		if ((cnt & ((1 << 23) - 1)) == 0) {
			cerr << t << ' ' << curEnergy << '\n';
			char outname[20];
			sprintf(outname, "maze%c.txt", tc);
			ofstream fout(outname);
			REP (i, 0, n) {
				fout << bestg[i] << '\n';
			}
			fout.close();
		}
		cnt++;
		int id = rnd() % SZ(all);
		int r = -1;
		ii osrc = src;
		if (all[id].FI == 0 || all[id].FI == n - 1 || 
				all[id].SE == 0 || all[id].SE == m - 1) {
			g[osrc.FI][osrc.SE] = '#';
			if (osrc == all[id]) {
				r = rnd() % SZ(sides);
				src = sides[r];
			} else {
				src = all[id];
			}
			g[src.FI][src.SE] = '.';
		} else {
			if (g[all[id].FI][all[id].SE] == '#') {
				g[all[id].FI][all[id].SE] = '.';
			} else {
				g[all[id].FI][all[id].SE] = '#';
			}
		}
		int newEnergy = calcEnergy();
		if (newEnergy >= bestEnergy) {
			bestEnergy = newEnergy;
			bestg = g;
		}
		if (accept(newEnergy, curEnergy)) {
			curEnergy = newEnergy;
		} else {
			if (all[id].FI == 0 || all[id].FI == n - 1 || 
					all[id].SE == 0 || all[id].SE == m - 1) {
				g[src.FI][src.SE] = '#';
				g[osrc.FI][osrc.SE] = '.';
				src = osrc;
			} else {
				if (g[all[id].FI][all[id].SE] == '#') {
					g[all[id].FI][all[id].SE] = '.';
				} else {
					g[all[id].FI][all[id].SE] = '#';
				}
			}
		}
		t *= A;
	}
	return 0;
}

Takeaways

For such a brain-dead solution, I actually learnt quite a lot of things about simulated annealing. Below is a short list of items to take note of while doing simulated annealing.

As the wise SGP IOI trainer bensonlzl told me: "Always write your intermediate solution to a file so that you can still get partial scores if it doesn't finish running before the contest ends". Writing to file can be quite time-consuming, so I only do it every $$$2^{23}$$$ (~8 million) iterations.
To choose a good $$$t_0$$$ and $$$\alpha$$$, I normally start with a high $$$t_0$$$ and a low $$$\alpha$$$, then print the temperature and the energy function after each iteration. Then, I try to choose a $$$t_0$$$ where the energy is not completely random but at the same time there are significant jumps in energy to ensure that enough exploration takes place. I binary search on the $$$\alpha$$$ to use based on how slowly the temperature decreases over time and try to pick the one that is neither too slow nor too fast.
Most of the time running the simulated annealing for a longer time with bigger $$$\alpha$$$ is better than trying to improve a previous solution by letting the initial state be the previous solution and starting with a lower $$$t_0$$$. This is probably because the latter has a higher chance to be stuck in a local minimum.
In a real 5-hour contest scenario, do not spend too much time on the output-only problem. Spend a short time coding the simulated annealing and work on the remaining problems while the code is running in the background. Do not be like me: I spent the majority of the contest trying to increase my score from ~80 to ~90 and ended up with a low score on the other problems.

Special Thanks

Of course, this could not have been done without the help of the following people:

bensonlzl, the SGP IOI trainer, for teaching me simulated annealing and including this problem in one of the training contests.
rainboy for giving me the motivation to get higher than him as he was the first place before I beat him.
jamessngg for helping me to solve test case 8 by hand and buying purple candy for the SGP IOI team.
pavement for giving moral support and suggestions as part of the SGP IOI team.
NUS for supplying electricity so that I can keep the NUS computer on for 3 consecutive weeks while running the simulated annealing.

Multiple terminals running simulated annealing

Conclusion

Feel free to try to beat my score or tell me about any possible optimizations in the comments.

Комментарии (11)

Показать архивные | Написать комментарий?

joyfullife

15 месяцев назад, # |

orz

(I am familiar with the recent blogs and stuff but I couldn't bare it lol)

→ Ответить

eternal_happiness

wtf this is wild

vitosevskich

You must be Chuck Norris

jonathanirvings

← Rev. 2 →

+217

Headlines of similar feel:

358 years after its formulation, a mathematician proved Fermat Last Theorem, costing years of research.
36 years after its release, a speedrunner finished Super Mario Bros faster than 4 minute 55 seconds, costing countless hours of attempts.
13 years after IOI 2010, a competitive programmer broke the 100 point barrier for Maze, costing 3 consecutive weeks of NUS computational power.

NeoYL

If you were in IOI 2010, you might be the first to get >600 pointssss xd

maomao90

15 месяцев назад, # ^ |

+47

If IOI 2010 was three weeks long maybe

+58

Also, Tourist got 778 points at IOI 2010, ~~he is that good~~ IOI 2010 was the last IOI (to date) to have 8 tasks.

kozliklekarsky

5 месяцев назад, # ^ |

-33

Let's keep it that way.

drdilyor

Is it possible to recalculate the score function after the change in O((R + C) log (R+C)), or even in O(R + C)? that would improve efficiency by a lot. But probably using different score function, that better fits simulated annealing and is easier to optimize, is better.

Also, I ran my own simulated annealing overnight and it found a better solution to the 9th test, other runs got corrupted smh and the output was gibberish :,(

https://oj.uz/submission/805436
code: https://pastebin.com/0iFixk2p

Hmm do you have a suggestion for the different score function?

Thanks for telling me that there is a better solution for the 9th test. I thought that it was already the optimal, so I stopped running the simulated annealing for the 9th test. Maybe I'll try to rerun it to see whether I can get a better result.

I have no idea tbh :)

Блог пользователя maomao90

Methodology

Takeaways

Special Thanks

Conclusion