Skip to content

Commit 957ef04

Browse files
committed
add codemmlu leaderboard
1 parent ee2968c commit 957ef04

File tree

2 files changed

+16
-16
lines changed

2 files changed

+16
-16
lines changed

leaderboards/codemmlu/index.html

Lines changed: 15 additions & 15 deletions
Original file line number | Diff line number | Diff line change
@@ -9,12 +9,12 @@
99

1010
<head>
1111
<meta charset="UTF-8" />
12-
<meta name="description" content="RepoExec: Evaluate Code Generation with a Repository-Level Executable Benchmark">
13-
<meta property="og:title" content="RepoExec: Evaluate Code Generation with a Repository-Level Executable Benchmark"/>
14-
<meta property="og:description" content="Benchmark for Repository-Level Code Generation, focus on Executability, Correctness from Test Cases and Usage of Contexts from Cross-file Dependencies"/>
12+
<meta name="description" content="CodeMMLU: A Multi-Task Benchmark for Assessing Code Understanding Capabilities of CodeLLMs">
13+
<meta property="og:title" content="CodeMMLU: A Multi-Task Benchmark for Assessing Code Understanding Capabilities of CodeLLMs"/>
14+
<meta property="og:description" content="A Multi-Task Benchmark for Assessing Code Understanding Capabilities"/>
1515
<meta property="og:url" content="https://fsoft-ai4code.github.io/leaderboards/codemmlu"/>
1616

17-
<title>RepoExec Leaderboard</title>
17+
<title>CodeMMLU Leaderboard</title>
1818
<script src="https://cdnjs.cloudflare.com/ajax/libs/PapaParse/5.3.0/papaparse.min.js"></script>
1919
<script src="https://cdn.jsdelivr.net/npm/echarts@5.3.3/dist/echarts.min.js"></script>
2020
<link
@@ -111,7 +111,7 @@ <h3 class="fw-light text-nowrap">
111111
<br/></small>
112112
</h3>
113113
<div class="d-flex flex-row justify-content-center gap-3">
114-
<a href="https://fsoft-ai4code.github.io/repoexec/"
114+
<a href="https://fsoft-ai4code.github.io/codemmlu/"
115115
><img
116116
src="https://custom-icon-badges.demolab.com/badge/WebPage-1a4f76?style=for-the-badge&logo=web"
117117
alt="blog"
@@ -153,8 +153,8 @@ <h3 class="fw-light text-nowrap">
153153
checked
154154
/>
155155
<label class="btn btn-outline-primary" for="Complete">Complete</label>
156-
<input type="radio" class="btn-check" name="btnradio" id="Instruct" />
157-
<label class="btn btn-outline-primary" for="Instruct">Instruct</label>
156+
<!-- <input type="radio" class="btn-check" name="btnradio" id="Instruct" />
157+
<label class="btn btn-outline-primary" for="Instruct">Instruct</label> -->
158158
</div>
159159
<div class="form-check form-switch mt-3">
160160
<input class="form-check-input" type="checkbox" id="toggleUnknownSize">
@@ -473,7 +473,7 @@ <h3>🙏 Acknowledgements</h3>
473473
],
474474
};
475475

476-
const theaders = ["Model", "Pass@1"];
476+
const theaders = ["Model", "Accuracy"];
477477

478478
// score: 'complete', 'instruct'
479479
const displayTable = (table, score) => {
@@ -670,7 +670,7 @@ <h3>🙏 Acknowledgements</h3>
670670
};
671671

672672
const completeRadio = document.getElementById("Complete");
673-
const instructRadio = document.getElementById("Instruct");
673+
//const instructRadio = document.getElementById("Instruct");
674674

675675
completeRadio.addEventListener("click", function () {
676676
clearTable();
@@ -679,12 +679,12 @@ <h3>🙏 Acknowledgements</h3>
679679
displayChart("complete", toggleUnknownSize.checked);
680680
});
681681

682-
instructRadio.addEventListener("click", function () {
683-
clearTable();
684-
displayTable(originTable, "instruct");
685-
clearChart();
686-
displayChart("instruct", toggleUnknownSize.checked);
687-
});
682+
// instructRadio.addEventListener("click", function () {
683+
// clearTable();
684+
// displayTable(originTable, "instruct");
685+
// clearChart();
686+
// displayChart("instruct", toggleUnknownSize.checked);
687+
// });
688688

689689
toggleUnknownSize.addEventListener("change", function () {
690690
const score = completeRadio.checked ? "complete" : "instruct";

leaderboards/codemmlu/results.json

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,5 @@
11
{
2-
"CodeLlama-34B-Python": {
2+
"CodeLlama-34B-Instruct": {
33
"link": "https://huggingface.co/codellama/CodeLlama-34b-hf",
44
"open-data": "None",
55
"pass@1": {

0 commit comments

Comments
 (0)