galb-dai committed on
Commit
d565019
·
1 Parent(s): e717fbe

Updated results.

Browse files
Files changed (1) hide show
  1. app.py +9 -34
app.py CHANGED
@@ -210,31 +210,6 @@ def _select_example_tab(choice: str):
210
 
211
 
212
  # === Static, made-up results for the landing chart (not tied to leaderboard) ===
213
- TIER_TOTALS = {"Warmup": 100, "Tier 1": 100, "Tier 2": 20} # dataset sizes
214
- MODELS_ORDER = ["GPT-5", "Gemini 2.5 Pro", "Grok 4", "Claude Opus 4", "o3 Pro"]
215
- STATIC_RESULTS = {
216
- "Warmup": {
217
- "GPT-5": 95,
218
- "Gemini 2.5 Pro": 90,
219
- "Grok 4": 84,
220
- "Claude Opus 4": 92,
221
- "o3 Pro": 88,
222
- },
223
- "Tier 1": {
224
- "GPT-5": 38,
225
- "Gemini 2.5 Pro": 30,
226
- "Grok 4": 24,
227
- "Claude Opus 4": 35,
228
- "o3 Pro": 28,
229
- },
230
- "Tier 2": {
231
- "GPT-5": 1,
232
- "Gemini 2.5 Pro": 0,
233
- "Grok 4": 0,
234
- "Claude Opus 4": 0,
235
- "o3 Pro": 0,
236
- },
237
- }
238
 
239
  MODEL_RELEASES = {
240
  "GPT-5": "2025-08-07",
@@ -249,18 +224,18 @@ MODELS_ORDER = ["GPT-5", "Gemini 2.5 Pro", "Grok 4", "Claude Opus 4", "o3 Pro"]
249
 
250
  ACCURACY_PCT = {
251
  "Warmup": {
252
- "GPT-5": 38,
253
- "Gemini 2.5 Pro": 35,
254
  "Grok 4": 28,
255
- "Claude Opus 4": 32,
256
- "o3 Pro": 30,
257
  },
258
  "Tier 1": {
259
- "GPT-5": 3,
260
- "Gemini 2.5 Pro": 2,
261
- "Grok 4": 1,
262
- "Claude Opus 4": 2,
263
- "o3 Pro": 2,
264
  },
265
  "Tier 2": {
266
  "GPT-5": 0,
 
210
 
211
 
212
  # === Static, made-up results for the landing chart (not tied to leaderboard) ===
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
213
 
214
  MODEL_RELEASES = {
215
  "GPT-5": "2025-08-07",
 
224
 
225
  ACCURACY_PCT = {
226
  "Warmup": {
227
+ "GPT-5": 49,
228
+ "Gemini 2.5 Pro": 30,
229
  "Grok 4": 28,
230
+ "Claude Opus 4": 30,
231
+ "o3 Pro": 24,
232
  },
233
  "Tier 1": {
234
+ "GPT-5": 4,
235
+ "Gemini 2.5 Pro": 0,
236
+ "Grok 4": 0,
237
+ "Claude Opus 4": 0,
238
+ "o3 Pro": 0,
239
  },
240
  "Tier 2": {
241
  "GPT-5": 0,