llm-pricing-calculator

Running

File size: 2,216 Bytes

fffbe5d

import { Benchmark } from "./types";

/**
 * Benchmark records for the Qwen3 model family.
 *
 * Each record carries the model name, its provider, input/output prices
 * (all currently `0.0`), a map of benchmark scores, and the `source` the
 * scores were taken from.
 *
 * Commented-out scores are retained for reference only and are not part of
 * the exported data.
 *
 * NOTE(review): the first entry uses the key `gpqa_diamond` while the smaller
 * models use `gpqa` — confirm against the `Benchmark` type which key consumers
 * actually read.
 */
export const qwenBenchmarks: Benchmark[] = [
    {
        model: "Qwen3-235B-A22B",
        provider: "Qwen",
        inputPrice: 0.0,
        outputPrice: 0.0,
        benchmark: {
            aime_24: 85.7,
            aime_2025: 81.5,
            gpqa_diamond: 44.06,
            // livecodebench_v6: 70.7,
            mmlu_pro: 68.18,
            mmlu: 87.81,
            // NOTE(review): `mmmu` has the same value as the commented-out
            // `math` entry below (71.84) — verify the label against the source.
            mmmu: 71.84,
            // gsm8k: 47.47,
            // math: 71.84,
            // bigbench_extra_hard: 59.54,
            // global_mmlu_lite: 87.40,
            // evalplus: 77.60,
            // humaneval: 79.00,
            // mbpp: 81.40,
            // cruxeval_c: 79.00,
            simpleqa: 85.8,
            egoschema: 81.1,
        },
        source: "https://qwenlm.github.io/blog/qwen3/",
    },
    {
        model: "Qwen3-32B",
        provider: "Qwen",
        inputPrice: 0.0,
        outputPrice: 0.0,
        benchmark: {
            aime_24: 81.4,
            aime_2025: 72.9,
            // livecodebench_v6: 65.7,
            // codeforces: 1977,
            // aider_polyglot: 50.2,
            // livebench: 74.9,
            // bfcl: 70.3,
            // multillm: 73.0,
        },
        // Fixed: the URL previously contained a stray comma ("qwe,n3").
        source: "https://qwenlm.github.io/blog/qwen3/ (image table)",
    },
    {
        model: "Qwen3-30B-A3B",
        provider: "Qwen",
        inputPrice: 0.0,
        outputPrice: 0.0,
        benchmark: {
            aime_24: 80.4,
            aime_2025: 70.9,
            // livecodebench_v6: 62.6,
            // codeforces: 1974,
            gpqa: 65.8,
            // livebench: 74.3,
            // bfcl: 69.1,
            // multillm: 72.2,
        },
        source: "https://qwenlm.github.io/blog/qwen3/ (image table)",
    },
    {
        model: "Qwen3-4B",
        provider: "Qwen",
        inputPrice: 0.0,
        outputPrice: 0.0,
        benchmark: {
            aime_24: 73.8,
            aime_2025: 65.6,
            // livecodebench_v6: 54.2,
            // codeforces: 1671,
            gpqa: 55.9,
            // bfcl: 65.9,
            // math: 62.12,
            // multillm: 66.3,
        },
        source: "https://qwenlm.github.io/blog/qwen3/ (image table)",
    },
];