Baselight
Loading...Loading chart...
-- CHART 1: Model Performance - Diminishing Returns
-- Returns one row per model that has both a parameter count and an MMLU score,
-- combining two source tables and ordering by year, then by model size.
-- No year filter is applied here: whatever year range appears in the output
-- (2019-2025 at the time of writing) comes from the data itself.
--
-- NOTE(review): training_cost_pflops may not use the same unit in both sources.
--   PaLM-2 shows up twice in the result with values roughly 1000x apart,
--   presumably one row per source -- confirm before plotting on a shared axis.
-- NOTE(review): UNION ALL keeps a model listed in both sources as two rows;
--   confirm whether de-duplication is wanted for the chart.

WITH epoch_models AS (
    -- Parameter and token counts are divided by 1e9 so they are expressed in
    -- billions, matching the *_billion columns of the second source.
    SELECT
        architecture AS model_name,
        year,
        model_size_parameters / 1000000000.0 AS params_billions,
        mmlu_avg AS mmlu_score,
        dataset_size_tokens / 1000000000.0 AS training_tokens_billions,
        training_computation_petaflop AS training_cost_pflops,
        organisation AS organization
    FROM "@owid.epoch_llms.owid_epoch_llms_2"
    WHERE model_size_parameters IS NOT NULL
      AND mmlu_avg IS NOT NULL
),

recent_models AS (
    -- Second source: only the two size/token columns need renaming.
    SELECT
        model_name,
        year,
        parameters_billion AS params_billions,
        mmlu_score,
        training_tokens_billion AS training_tokens_billions,
        training_cost_pflops,
        organization
    FROM "@adlrocha.llm_stats.llm_performance2425"
    WHERE parameters_billion IS NOT NULL
      AND mmlu_score IS NOT NULL
)

SELECT
    model_name,
    year,
    params_billions,
    mmlu_score,
    training_tokens_billions,
    training_cost_pflops,
    organization
FROM epoch_models

UNION ALL

SELECT
    model_name,
    year,
    params_billions,
    mmlu_score,
    training_tokens_billions,
    training_cost_pflops,
    organization
FROM recent_models

-- model_name and organization break ties between models that share a year and
-- a parameter count, so the row order is stable from run to run.
ORDER BY year, params_billions, model_name, organization
model_name | year | params_billions | mmlu_score | training_tokens_billions | training_cost_pflops | organization
GPT-2 (finetuned)20191.532.400001525878906436000OpenAI
GPT-3 (davinci)202017543.900001525878906374393000000OpenAI
Gopher (0.4B)20210.41725.700000762939453300751000Google DeepMind
Gopher (1.4B)20211.427.2999992370605473002520000Google DeepMind
Gopher (7B)20217.129.530012800000Google DeepMind
Gopher (280B)202128060300504000000Google DeepMind
PaLM (8B)2022825.29999923706054778037400000Google Research
GPT-NeoX-20B20222033.59999847412109417721200000Eleuther
PaLM (62B)20226253.70000076293945795296000000Google Research
PaLM (62B+)20226262.799999237060551330493000000Google Research
OPT20226635.9900016784668434172000000Meta AI
Chinchilla20227067.51400588000000Google DeepMind
GLM-130B202213044.79999923706055400312000000Tsinghua KEG
BLOOM202217639.130001068115234390412000000HuggingFace, BigScience
PaLM (540B)202254069.300003051757817802530000000Google Research
LLaMA (7B)20236.735.099998474121094100040200000Meta AI
LLaMA (13B)20231346.900001525878906100078000000Meta AI
LLaMA (33B)202332.557.799999237060551400273000000Meta AI
BloombergGPT20235039.18000030517578708212000000Bloomberg
LLaMA (65B)202365.263.4000015258789061400548000000Meta AI
PaLM-2202334078.340008160000Google
PaLM-2202334078.3000030517578140008160000000Google Research
Gemini Ultra2023156083.961300079999000Google
GPT-42023176086.41300021000000OpenAI
DeepSeek-V320243781.2148005300DeepSeek
Gemini 2.0 Flash202415077.6nullnullGoogle
Llama 4 Maverick20251780.52200022000Meta
Llama 4 Scout20251787.34000040200Meta
DeepSeek-R1-052820253785null6500DeepSeek
DeepSeek-R120253781.2148006300DeepSeek
Claude Sonnet 4.5202520082nullnullAnthropic
Claude Opus 4.1202540088nullnullAnthropic
GPT-5202517009011400021000000OpenAI

Share link

Anyone who has the link will be able to view this.