Skip to content

Commit 5fe541d

Browse files
committed
Minor update
1 parent 02bfe4b commit 5fe541d

File tree

2 files changed

+6
-6
lines changed

2 files changed

+6
-6
lines changed

leaderboards/codemmlu/index.html

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -141,7 +141,7 @@
141 141   <h1 class="text-nowrap mt-5">CodeMMLU Leaderboard</h1>
142 142   <h3 class="fw-light text-nowrap">
143 143   <small id="warning">
144     - <p>CodeMMLU: A Multi-Task Benchmark for Assessing Code Understanding Capabilities of CodeLLMs</p>
    144 + <p>A Multi-Task Benchmark for Assessing Code Understanding Capabilities of CodeLLMs</p>
145 145   <br/></small>
146 146   </h3>
147 147   <div class="d-flex flex-row justify-content-center gap-3">
@@ -151,7 +151,7 @@ <h3 class="fw-light text-nowrap">
151 151   alt="blog"
152 152   class="img-fluid"
153 153   /></a>
154     - <a href="https://arxiv.org/abs/2410.01999v1#:~:text=View%20a%20PDF%20of%20the%20paper%20titled%20CodeMMLU:%20A%20Multi-Task"
    154 + <a href="https://arxiv.org/abs/2410.01999"
155 155   ><img
156 156   src="https://img.shields.io/badge/2410.01999-red?style=for-the-badge&label=arXiv"
157 157   alt="leaderboard"
@@ -186,7 +186,7 @@ <h3 class="fw-light text-nowrap">
186 186   id="Complete"
187 187   checked
188 188   />
189     - <label class="btn btn-outline-primary" for="Complete">Complete</label>
    189 + <!-- <label class="btn btn-outline-primary" for="Complete">Complete</label> -->
190 190   <!-- <input type="radio" class="btn-check" name="btnradio" id="Instruct" />
191 191   <label class="btn btn-outline-primary" for="Instruct">Instruct</label> -->
192 192   </div>

leaderboards/codemmlu/results.json

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -9,7 +9,7 @@
  9   9   "realtask_accuracy": 38.26,
 10  10   "syntactic_accuracy": 67.22,
 11  11   "semantic_accuracy": 66.08,
 12     - "prompted": false,
     12 + "prompted": true,
 13  13   "size": null,
 14  14   "direct_complete": false,
 15  15   "lazy": false,
@@ -25,7 +25,7 @@
 25  25   "realtask_accuracy": 77.18,
 26  26   "syntactic_accuracy": 60.41,
 27  27   "semantic_accuracy": 57.81,
 28     - "prompted": false,
     28 + "prompted": true,
 29  29   "size": null,
 30  30   "direct_complete": false,
 31  31   "lazy": false,
@@ -41,7 +41,7 @@
 41  41   "realtask_accuracy": 45.26,
 42  42   "syntactic_accuracy": 61.68,
 43  43   "semantic_accuracy": 53.65,
 44     - "prompted": false,
     44 + "prompted": true,
 45  45   "size": null,
 46  46   "direct_complete": false,
 47  47   "lazy": false,

0 commit comments

Comments (0)