evalplus
diff --git a/‎evalperf.html‎
Lines changed: 5 additions & 9 deletions b/‎evalperf.html‎
Lines changed: 5 additions & 9 deletions
diff --git a/‎leaderboard.html‎
Lines changed: 0 additions & 1 deletion b/‎leaderboard.html‎
Lines changed: 0 additions & 1 deletion
@@ -126,6 +126,9 @@ <h1 class="text-nowrap mt-5" style="font-size: xx-large;">
 
         <div class="container d-flex flex-column align-items-center gap-3 mt-5">
           <h3>Win-rate Leaderboard</h3>
+          <p>📝 Notes: the default prompt does not emphasize efficiency requirements, as our work shows that such
+            emphasis might degrade both efficiency and correctness for some weaker models. However, "(🔥)" marks models
+            evaluated with performance-encouraging prompts, as they may be able to accurately understand such needs.</p>
           <table id="leaderboard"
             class="table table-responsive table-striped table-bordered flex-shrink-1 border border-5">
           </table>
@@ -233,15 +236,10 @@ <h2 id="sponsor" class="text-nowrap mt-5">🤗 Acknowledgment</h2>
             modelId = modelId[1];
             url = hfLinkPrefix + modelOrg + "/" + modelId;
             linkMapping.set(modelId, url);
-          } else if (modelId.startsWith("gpt-4-")) {
+          } else if (modelId.startsWith("o1-") || modelId.startsWith("gpt-")) {
             linkMapping.set(
               modelId,
-              "https://platform.openai.com/docs/models/gpt-4-turbo-and-gpt-4",
-            );
-          } else if (modelId.startsWith("gpt-3.5-")) {
-            linkMapping.set(
-              modelId,
-              "https://platform.openai.com/docs/models/gpt-3-5-turbo",
+              "https://platform.openai.com/docs/models",
             );
           } else if (modelId.startsWith("claude-3-")) {
             linkMapping.set(
@@ -258,8 +256,6 @@ <h2 id="sponsor" class="text-nowrap mt-5">🤗 Acknowledgment</h2>
               modelId,
               "https://deepmind.google/technologies/gemini/flash/",
             );
-          } else if (modelId.startsWith("gpt-4o-")) {
-            linkMapping.set(modelId, "https://openai.com/index/hello-gpt-4o/");
           } else if (modelId.startsWith("deepseek-chat")) {
             linkMapping.set(modelId, "https://chat.deepseek.com/")
           } else if (modelId == "heatmap_data") {
 
@@ -170,7 +170,6 @@ <h3>📝 Notes</h3>
       </div>
     </div>
     <div id="notes">
-      <h3 id="sponsor" class="text-nowrap mt-5">🖊️ Citation</h3>
       <h3>🤗 More Leaderboards</h3>
       In addition to EvalPlus leaderboards, it is recommended to
       comprehensively understand LLM coding ability through a diverse set of