import { Benchmark } from "./types";


// Strings shared by several entries below, hoisted so each is spelled once.
const GOOGLE_PROVIDER = "Google";
const GEMINI_DIFFUSION_URL = "https://deepmind.google/models/gemini-diffusion/";
const GEMINI_THINKING_DOCS_URL = "https://ai.google.dev/gemini-api/docs/thinking";

/**
 * Benchmark records for Google's Gemini models.
 *
 * Each record carries the model name, provider, an input/output price pair,
 * a map of benchmark id to score, and the URL the numbers were taken from.
 * A model only lists the benchmarks that its source reports, so the key set
 * differs between entries.
 *
 * NOTE(review): prices are presumably USD per 1M tokens and scores presumably
 * percentages — confirm against the `Benchmark` type in `./types`.
 */
export const googleBenchmarks: Benchmark[] = [
    // Gemini Diffusion: both prices are recorded as 0.
    {
        model: "Gemini Diffusion",
        provider: GOOGLE_PROVIDER,
        inputPrice: 0,
        outputPrice: 0,
        benchmark: {
            livecodebench_v6: 30.9,
            bigcodebench: 45.4,
            lbpp_v2: 56.8,
            swe_bench_verified: 22.9,
            humaneval: 89.6,
            mbpp: 76,
            gpqa_diamond: 40.4,
            aime_2025: 23.3,
            bigbench_extra_hard: 15,
            global_mmlu_lite: 69.1,
        },
        source: GEMINI_DIFFUSION_URL,
    },
    // Gemini 2.0 Flash-Lite: cites the same source page as Gemini Diffusion.
    {
        model: "Gemini 2.0 Flash-Lite",
        provider: GOOGLE_PROVIDER,
        inputPrice: 0.1,
        outputPrice: 0.4,
        benchmark: {
            livecodebench_v6: 28.5,
            bigcodebench: 45.8,
            lbpp_v2: 56,
            swe_bench_verified: 28.5,
            humaneval: 90.2,
            mbpp: 75.8,
            gpqa_diamond: 56.5,
            aime_2025: 20,
            bigbench_extra_hard: 21,
            global_mmlu_lite: 79,
        },
        source: GEMINI_DIFFUSION_URL,
    },
    // Gemini 2.5 Flash Preview, 05-20 snapshot.
    {
        model: "Gemini 2.5 Flash Preview (05-20)",
        provider: GOOGLE_PROVIDER,
        inputPrice: 0.15,
        outputPrice: 3.5,
        source: GEMINI_THINKING_DOCS_URL,
        benchmark: {
            aime_2025: 72,
            gpqa_diamond: 82.8,
            simpleqa: 26.9,
            global_mmlu_lite: 88.4,
            swe_bench_verified: 60.4,
            livecodebench_v6: 63.9,
            mmmu: 79.7,
            lbpp_v2: 61.9,
            bigcodebench: 56.7,
            facts_grounding: 85.3,
            humanitys_last_exam: 11,
            mrcr_v2_avg_128k: 74,
            mrcr_v2_pointwise_1m: 32,
        },
    },
    // Gemini 2.5 Flash Preview, 04-17 snapshot (thinking variant).
    {
        model: "Gemini 2.5 Flash Preview (04-17) Thinking",
        provider: GOOGLE_PROVIDER,
        inputPrice: 0.15,
        outputPrice: 3.5,
        source: GEMINI_THINKING_DOCS_URL,
        benchmark: {
            aime_2025: 78,
            gpqa_diamond: 78.3,
            simpleqa: 29.7,
            global_mmlu_lite: 88.4,
            livecodebench_v6: 63.5,
            lbpp_v2: 51.1,
            bigcodebench: 44.2,
            mmmu: 76.7,
            humanitys_last_exam: 12.1,
        },
    },
    // Gemini 2.0 Flash.
    {
        model: "Gemini 2.0 Flash",
        provider: GOOGLE_PROVIDER,
        inputPrice: 0.1,
        outputPrice: 0.4,
        source: GEMINI_THINKING_DOCS_URL,
        benchmark: {
            aime_2025: 27.5,
            gpqa_diamond: 60.1,
            simpleqa: 29.9,
            global_mmlu_lite: 83.4,
            livecodebench_v6: 34.5,
            lbpp_v2: 22.2,
            mmmu: 71.7,
            facts_grounding: 84.6,
            humanitys_last_exam: 5.1,
            mrcr_v2_avg_128k: 36,
            mrcr_v2_pointwise_1m: 6,
        },
    },
    // Gemini 2.5 Pro Preview, 05-06 snapshot.
    {
        model: "Gemini 2.5 Pro Preview (05-06)",
        provider: GOOGLE_PROVIDER,
        inputPrice: 2.5,
        outputPrice: 15,
        source: "https://blog.google/products/gemini/gemini-2-5-pro-updates/",
        benchmark: {
            humanitys_last_exam: 17.8,
            gpqa_diamond: 83,
            aime_2025: 83,
            livecodebench_v6: 75.6,
            lbpp_v2: 76.5,
            bigcodebench: 72.7,
            swe_bench_verified: 63.2,
            simpleqa: 50.8,
            mmmu: 79.6,
            video_mme: 84.8,
            mrcr_v2_avg_128k: 93,
            mrcr_v2_pointwise_1m: 82.9,
            global_mmlu_lite: 88.6,
        },
    },
    // Gemini 2.5 Pro Experimental, 03-25 snapshot.
    {
        model: "Gemini 2.5 Pro Experimental (03-25)",
        provider: GOOGLE_PROVIDER,
        inputPrice: 2.5,
        outputPrice: 15,
        source: "https://blog.google/technology/google-deepmind/gemini-model-thinking-updates-march-2025/",
        benchmark: {
            humanitys_last_exam: 18.8,
            gpqa_diamond: 84,
            aime_2025: 86.7,
            livecodebench_v6: 70.4,
            lbpp_v2: 74,
            bigcodebench: 68.6,
            swe_bench_verified: 63.8,
            simpleqa: 52.9,
            mmmu: 81.7,
            mrcr_v2_avg_128k: 94.5,
            mrcr_v2_pointwise_1m: 83.1,
            global_mmlu_lite: 89.8,
        },
    },
];