Skip to content

Commit 270a960

Browse files
committed
feat: v5 leaderboard fixes and r1
1 parent 33505c0 commit 270a960

7 files changed

+50548 -29405 lines changed

build/asset-manifest.json

+3-3
Original file line numberDiff line numberDiff line change
@@ -1,13 +1,13 @@
11
{
22
"files": {
33
"main.css": "./static/css/main.be588df3.css",
4-
"main.js": "./static/js/main.34fef9d7.js",
4+
"main.js": "./static/js/main.e52d421e.js",
55
"index.html": "./index.html",
66
"main.be588df3.css.map": "./static/css/main.be588df3.css.map",
7-
"main.34fef9d7.js.map": "./static/js/main.34fef9d7.js.map"
7+
"main.e52d421e.js.map": "./static/js/main.e52d421e.js.map"
88
},
99
"entrypoints": [
1010
"static/css/main.be588df3.css",
11-
"static/js/main.34fef9d7.js"
11+
"static/js/main.e52d421e.js"
1212
]
1313
}

build/leaderboard.html

+1-1
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
<!doctype html><html lang="en"><head><title>LiveCodeBench Leaderboard</title><meta charset="UTF-8"/><meta name="viewport" content="width=device-width,initial-scale=1"/><meta name="theme-color" content="#000000"/><meta name="description" content="LiveCodeBench Leaderboard"/><link rel="stylesheet" href="bootstrap.min.css"/><link rel="stylesheet" href="./css/bulma.min.css"/><link rel="stylesheet" href="./css/bulma-carousel.min.css"/><link rel="stylesheet" href="./css/bulma-slider.min.css"/><link rel="stylesheet" href="./css/fontawesome.all.min.css"/><link rel="stylesheet" href="https://cdn.jsdelivr.net/gh/jpswalsh/academicons@1/css/academicons.min.css"/><link rel="stylesheet" href="./css/index.css"/><link rel="icon" href="./images/favicon.svg"/><script src="https://ajax.googleapis.com/ajax/libs/jquery/3.5.1/jquery.min.js"></script><script defer="defer" src="./js/fontawesome.all.min.js"></script><script src="./js/bulma-carousel.min.js"></script><script src="./js/bulma-slider.min.js"></script><script src="./js/index.js"></script><script defer="defer" src="./static/js/main.34fef9d7.js"></script><link href="./static/css/main.be588df3.css" rel="stylesheet"></head><body><noscript>You need to enable JavaScript to run this app.</noscript><div id="root"></div></body></html>
1+
<!doctype html><html lang="en"><head><title>LiveCodeBench Leaderboard</title><meta charset="UTF-8"/><meta name="viewport" content="width=device-width,initial-scale=1"/><meta name="theme-color" content="#000000"/><meta name="description" content="LiveCodeBench Leaderboard"/><link rel="stylesheet" href="bootstrap.min.css"/><link rel="stylesheet" href="./css/bulma.min.css"/><link rel="stylesheet" href="./css/bulma-carousel.min.css"/><link rel="stylesheet" href="./css/bulma-slider.min.css"/><link rel="stylesheet" href="./css/fontawesome.all.min.css"/><link rel="stylesheet" href="https://cdn.jsdelivr.net/gh/jpswalsh/academicons@1/css/academicons.min.css"/><link rel="stylesheet" href="./css/index.css"/><link rel="icon" href="./images/favicon.svg"/><script src="https://ajax.googleapis.com/ajax/libs/jquery/3.5.1/jquery.min.js"></script><script defer="defer" src="./js/fontawesome.all.min.js"></script><script src="./js/bulma-carousel.min.js"></script><script src="./js/bulma-slider.min.js"></script><script src="./js/index.js"></script><script defer="defer" src="./static/js/main.e52d421e.js"></script><link href="./static/css/main.be588df3.css" rel="stylesheet"></head><body><noscript>You need to enable JavaScript to run this app.</noscript><div id="root"></div></body></html>

build/static/js/main.34fef9d7.js renamed to build/static/js/main.e52d421e.js

+3-3
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

build/static/js/main.34fef9d7.js.map renamed to build/static/js/main.e52d421e.js.map

+1-1
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

src/LeaderboardComp.tsx

+2
Original file line numberDiff line numberDiff line change
@@ -237,6 +237,8 @@ const Leaderboard = React.memo(function LeaderboardComponent(props: any) {
237237

238238
message += "<br><br>We estimate cutoff dates based on release date and performance variation. Models highlighted in red are likely contaminated on some fraction of the problems in the given time-window. Feel free to adjust the slider to see the leaderboard at different time windows. Please offer feedback if you find any issues!"
239239

240+
message += "<br><br>Announcements: 1. We have made revisions to our official autograder. In case you are performing local evaluations, please use the latest codebase. 2. We have been updating the problem difficulty distribution making it more challenging aligned with the model capability improvements. A drop in performance towards later months is expected."
241+
240242

241243

242244
return (

0 commit comments

Comments (0)