Commit
·
fffbe5d
1
Parent(s):
d7502bf
- src/lib/benchmarks/index.ts +3 -1
- src/lib/benchmarks/qwen.ts +84 -0
src/lib/benchmarks/index.ts
CHANGED
@@ -4,11 +4,13 @@ import { googleBenchmarks } from "./google";
|
|
4 |
import { anthropicBenchmarks } from "./anthropic";
|
5 |
import { openaiBenchmarks } from "./openai";
|
6 |
import { deepseekBenchmarks } from "./deepseek";
|
|
|
7 |
|
8 |
export const benchmarkData: Benchmark[] = [
|
9 |
...xaiBenchmarks,
|
10 |
...googleBenchmarks,
|
11 |
...anthropicBenchmarks,
|
12 |
...openaiBenchmarks,
|
13 |
-
...deepseekBenchmarks
|
|
|
14 |
];
|
|
|
4 |
import { anthropicBenchmarks } from "./anthropic";
|
5 |
import { openaiBenchmarks } from "./openai";
|
6 |
import { deepseekBenchmarks } from "./deepseek";
|
7 |
+
import { qwenBenchmarks } from "./qwen";
|
8 |
|
9 |
export const benchmarkData: Benchmark[] = [
|
10 |
...xaiBenchmarks,
|
11 |
...googleBenchmarks,
|
12 |
...anthropicBenchmarks,
|
13 |
...openaiBenchmarks,
|
14 |
+
...deepseekBenchmarks,
|
15 |
+
...qwenBenchmarks
|
16 |
];
|
src/lib/benchmarks/qwen.ts
ADDED
@@ -0,0 +1,84 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import { Benchmark } from "./types";
|
2 |
+
|
3 |
+
export const qwenBenchmarks: Benchmark[] = [
|
4 |
+
{
|
5 |
+
model: "Qwen3-235B-A22B",
|
6 |
+
provider: "Qwen",
|
7 |
+
inputPrice: 0.0,
|
8 |
+
outputPrice: 0.0,
|
9 |
+
benchmark: {
|
10 |
+
aime_24: 85.7,
|
11 |
+
aime_2025: 81.5,
|
12 |
+
gpqa_diamond: 44.06,
|
13 |
+
// livecodebench_v6: 70.7,
|
14 |
+
mmlu_pro: 68.18,
|
15 |
+
mmlu: 87.81,
|
16 |
+
mmmu: 71.84,
|
17 |
+
// gsm8k: 47.47,
|
18 |
+
// math: 71.84,
|
19 |
+
// bigbench_extra_hard: 59.54,
|
20 |
+
// global_mmlu_lite: 87.40,
|
21 |
+
// evalplus: 77.60,
|
22 |
+
// humaneval: 79.00,
|
23 |
+
// mbpp: 81.40,
|
24 |
+
// cruxeval_c: 79.00,
|
25 |
+
simpleqa: 85.8,
|
26 |
+
egoschema: 81.1,
|
27 |
+
},
|
28 |
+
source: "https://qwenlm.github.io/blog/qwen3/",
|
29 |
+
},
|
30 |
+
{
|
31 |
+
model: "Qwen3-32B",
|
32 |
+
provider: "Qwen",
|
33 |
+
inputPrice: 0.0,
|
34 |
+
outputPrice: 0.0,
|
35 |
+
benchmark: {
|
36 |
+
aime_24: 81.4,
|
37 |
+
aime_2025: 72.9,
|
38 |
+
// livecodebench_v6: 65.7,
|
39 |
+
//: 1977,
|
40 |
+
//aider_polyglot: 50.2,
|
41 |
+
// livebench: 74.9,
|
42 |
+
// bfcl: 70.3,
|
43 |
+
// multillm: 73.0,
|
44 |
+
},
|
45 |
+
source: "https://qwenlm.github.io/blog/qwe,n3/ (image table)",
|
46 |
+
},
|
47 |
+
|
48 |
+
{
|
49 |
+
model: "Qwen3-30B-A3B",
|
50 |
+
provider: "Qwen",
|
51 |
+
inputPrice: 0.0,
|
52 |
+
outputPrice: 0.0,
|
53 |
+
benchmark: {
|
54 |
+
aime_24: 80.4,
|
55 |
+
aime_2025: 70.9,
|
56 |
+
//livecodebench_v6: 62.6,
|
57 |
+
//codeforces: 1974,
|
58 |
+
gpqa: 65.8,
|
59 |
+
// livebench: 74.3,
|
60 |
+
// bfcl: 69.1,
|
61 |
+
// multillm: 72.2,
|
62 |
+
},
|
63 |
+
source: "https://qwenlm.github.io/blog/qwen3/ (image table)",
|
64 |
+
},
|
65 |
+
{
|
66 |
+
model: "Qwen3-4B",
|
67 |
+
provider: "Qwen",
|
68 |
+
inputPrice: 0.0,
|
69 |
+
outputPrice: 0.0,
|
70 |
+
benchmark: {
|
71 |
+
aime_24: 73.8,
|
72 |
+
aime_2025: 65.6,
|
73 |
+
//livecodebench_v6: 54.2,
|
74 |
+
// codeforces: 1671,
|
75 |
+
gpqa: 55.9,
|
76 |
+
|
77 |
+
// bfcl: 65.9,
|
78 |
+
// math: 62.12,
|
79 |
+
//multillm: 66.3,
|
80 |
+
},
|
81 |
+
source: "https://qwenlm.github.io/blog/qwen3/ (image table)",
|
82 |
+
}
|
83 |
+
|
84 |
+
];
|