File size: 2,216 Bytes
fffbe5d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
import { Benchmark } from "./types";

/**
 * Benchmark entries for the Qwen3 model family.
 *
 * Each entry records the model name, its provider, input/output prices
 * (all 0.0 in this list), a map of benchmark scores, and the source the
 * scores were taken from.
 *
 * Commented-out metrics are kept for reference only and are not part of the
 * exported data.
 * NOTE(review): presumably they are disabled because `Benchmark` does not
 * declare those keys — confirm against `./types` before re-enabling.
 */
export const qwenBenchmarks: Benchmark[] = [
    {
        model: "Qwen3-235B-A22B",
        provider: "Qwen",
        inputPrice: 0.0,
        outputPrice: 0.0,
        benchmark: {
            aime_24: 85.7,
            aime_2025: 81.5,
            // NOTE(review): the smaller models below use the key `gpqa`;
            // confirm whether `gpqa_diamond` is intentionally different.
            gpqa_diamond: 44.06,
            // livecodebench_v6: 70.7,
            mmlu_pro: 68.18,
            mmlu: 87.81,
            mmmu: 71.84,
            // gsm8k: 47.47,
            // math: 71.84,
            // bigbench_extra_hard: 59.54,
            // global_mmlu_lite: 87.40,
            // evalplus: 77.60,
            // humaneval: 79.00,
            // mbpp: 81.40,
            // cruxeval_c: 79.00,
            simpleqa: 85.8,
            egoschema: 81.1,
        },
        source: "https://qwenlm.github.io/blog/qwen3/",
    },
    {
        model: "Qwen3-32B",
        provider: "Qwen",
        inputPrice: 0.0,
        outputPrice: 0.0,
        benchmark: {
            aime_24: 81.4,
            aime_2025: 72.9,
            // livecodebench_v6: 65.7,
            // codeforces: 1977,
            // aider_polyglot: 50.2,
            // livebench: 74.9,
            // bfcl: 70.3,
            // multillm: 73.0,
        },
        // Same blog post as the sibling entries; the URL previously
        // contained a stray comma that made the link invalid.
        source: "https://qwenlm.github.io/blog/qwen3/ (image table)",
    },
    {
        model: "Qwen3-30B-A3B",
        provider: "Qwen",
        inputPrice: 0.0,
        outputPrice: 0.0,
        benchmark: {
            aime_24: 80.4,
            aime_2025: 70.9,
            // livecodebench_v6: 62.6,
            // codeforces: 1974,
            gpqa: 65.8,
            // livebench: 74.3,
            // bfcl: 69.1,
            // multillm: 72.2,
        },
        source: "https://qwenlm.github.io/blog/qwen3/ (image table)",
    },
    {
        model: "Qwen3-4B",
        provider: "Qwen",
        inputPrice: 0.0,
        outputPrice: 0.0,
        benchmark: {
            aime_24: 73.8,
            aime_2025: 65.6,
            // livecodebench_v6: 54.2,
            // codeforces: 1671,
            gpqa: 55.9,
            // bfcl: 65.9,
            // math: 62.12,
            // multillm: 66.3,
        },
        source: "https://qwenlm.github.io/blog/qwen3/ (image table)",
    },
];