File tree Expand file tree Collapse file tree 2 files changed +6
-6
lines changed Expand file tree Collapse file tree 2 files changed +6
-6
lines changed Original file line number Diff line number Diff line change 141141      < h1  class ="text-nowrap mt-5 "> CodeMMLU Leaderboard</ h1 > 
142142      < h3  class ="fw-light text-nowrap "> 
143143        < small  id ="warning ">  
144-           < p > CodeMMLU:  A Multi-Task Benchmark for Assessing Code Understanding Capabilities of CodeLLMs</ p > 
144+           < p > A Multi-Task Benchmark for Assessing Code Understanding Capabilities of CodeLLMs</ p > 
145145        < br /> </ small > 
146146      </ h3 > 
147147      < div  class ="d-flex flex-row justify-content-center gap-3 "> 
@@ -151,7 +151,7 @@ <h3 class="fw-light text-nowrap">
151151            alt ="blog "
152152            class ="img-fluid "
153153        /> </ a > 
154-         < a  href ="https://arxiv.org/abs/2410.01999v1#:~:text=View%20a%20PDF%20of%20the%20paper%20titled%20CodeMMLU:%20A%20Multi-Task  "
154+         < a  href ="https://arxiv.org/abs/2410.01999  "
155155          > < img 
156156            src ="https://img.shields.io/badge/2410.01999-red?style=for-the-badge&label=arXiv "
157157            alt ="leaderboard "
@@ -186,7 +186,7 @@ <h3 class="fw-light text-nowrap">
186186          id ="Complete "
187187          checked 
188188        /> 
189-         < label  class ="btn btn-outline-primary " for ="Complete "> Complete</ label > 
189+         <!-- < label class="btn btn-outline-primary" for="Complete">Complete</label> -- > 
190190        <!-- <input type="radio" class="btn-check" name="btnradio" id="Instruct" /> 
191191        <label class="btn btn-outline-primary" for="Instruct">Instruct</label> --> 
192192      </ div > 
Original file line number Diff line number Diff line change 99        "realtask_accuracy" : 38.26 ,
1010        "syntactic_accuracy" : 67.22 ,
1111        "semantic_accuracy" : 66.08 ,
12-         "prompted" : false ,
12+         "prompted" : true ,
1313        "size" : null ,
1414        "direct_complete" : false ,
1515        "lazy" : false ,
2525        "realtask_accuracy" : 77.18 ,
2626        "syntactic_accuracy" : 60.41 ,
2727        "semantic_accuracy" : 57.81 ,
28-         "prompted" : false ,
28+         "prompted" : true ,
2929        "size" : null ,
3030        "direct_complete" : false ,
3131        "lazy" : false ,
4141        "realtask_accuracy" : 45.26 ,
4242        "syntactic_accuracy" : 61.68 ,
4343        "semantic_accuracy" : 53.65 ,
44-         "prompted" : false ,
44+         "prompted" : true ,
4545        "size" : null ,
4646        "direct_complete" : false ,
4747        "lazy" : false ,
 
 
   
 
     
   
   
          
    
    
     
    
      
     
     
    You can’t perform that action at this time.
  
 
    
  
    
      
        
     
       
      
     
   
 
    
    
  
 
  
 
     
    
0 commit comments