File tree Expand file tree Collapse file tree 2 files changed +6
-6
lines changed Expand file tree Collapse file tree 2 files changed +6
-6
lines changed Original file line number Diff line number Diff line change 141141 < h1 class ="text-nowrap mt-5 "> CodeMMLU Leaderboard</ h1 >
142142 < h3 class ="fw-light text-nowrap ">
143143 < small id ="warning ">
144- < p > CodeMMLU: A Multi-Task Benchmark for Assessing Code Understanding Capabilities of CodeLLMs</ p >
144+ < p > A Multi-Task Benchmark for Assessing Code Understanding Capabilities of CodeLLMs</ p >
145145 < br /> </ small >
146146 </ h3 >
147147 < div class ="d-flex flex-row justify-content-center gap-3 ">
@@ -151,7 +151,7 @@ <h3 class="fw-light text-nowrap">
151151 alt ="blog "
152152 class ="img-fluid "
153153 /> </ a >
154- < a href ="https://arxiv.org/abs/2410.01999v1#:~:text=View%20a%20PDF%20of%20the%20paper%20titled%20CodeMMLU:%20A%20Multi-Task "
154+ <a href="https://arxiv.org/abs/2410.01999"
155155 > < img
156156 src ="https://img.shields.io/badge/2410.01999-red?style=for-the-badge&label=arXiv "
157157 alt ="leaderboard "
@@ -186,7 +186,7 @@ <h3 class="fw-light text-nowrap">
186186 id ="Complete "
187187 checked
188188 />
189- < label class ="btn btn-outline-primary " for ="Complete "> Complete</ label >
189+ <!-- <label class="btn btn-outline-primary" for="Complete">Complete</label> -->
190190 <!-- <input type="radio" class="btn-check" name="btnradio" id="Instruct" />
191191 <label class="btn btn-outline-primary" for="Instruct">Instruct</label> -->
192192 </ div >
Original file line number Diff line number Diff line change 99 "realtask_accuracy" : 38.26 ,
1010 "syntactic_accuracy" : 67.22 ,
1111 "semantic_accuracy" : 66.08 ,
12- "prompted" : false ,
12+ "prompted" : true ,
1313 "size" : null ,
1414 "direct_complete" : false ,
1515 "lazy" : false ,
2525 "realtask_accuracy" : 77.18 ,
2626 "syntactic_accuracy" : 60.41 ,
2727 "semantic_accuracy" : 57.81 ,
28- "prompted" : false ,
28+ "prompted" : true ,
2929 "size" : null ,
3030 "direct_complete" : false ,
3131 "lazy" : false ,
4141 "realtask_accuracy" : 45.26 ,
4242 "syntactic_accuracy" : 61.68 ,
4343 "semantic_accuracy" : 53.65 ,
44- "prompted" : false ,
44+ "prompted" : true ,
4545 "size" : null ,
4646 "direct_complete" : false ,
4747 "lazy" : false ,
You can’t perform that action at this time.
0 commit comments