-- Long-format variant of the query below (one row per system, with domain kept
-- as a column instead of pivoted); left commented out for reference.
-- SELECT
-- system,
-- publication_date,
-- domain,
-- CAST(REPLACE(training_dataset_size_datapoints, ',', '') AS BIGINT) as training_datapoints
-- FROM "@owid.epoch.owid_epoch_1"
-- WHERE training_dataset_size_datapoints IS NOT NULL
-- AND training_dataset_size_datapoints != ''
-- ORDER BY publication_date, system
-- Training dataset size per system, pivoted into one column per domain.
--
-- Returns one row for every source row whose training_dataset_size_datapoints
-- is neither NULL nor '', ordered by publication_date and then system.
-- A domain column carries the row's size as BIGINT when the row's domain
-- equals that column's label, and NULL otherwise.
--
-- NOTE(review): rows whose domain matches none of the labels below are still
-- returned, with every domain column NULL. Confirm whether they should be
-- filtered out or given a column of their own.
WITH sized AS (
    -- Parse the size once here instead of repeating the cast in every pivot
    -- column. The cast runs on every row that passes the filter.
    SELECT
        system,
        publication_date,
        domain,
        -- The value is handled as text; commas (presumably thousands
        -- separators) are stripped so it can be cast to an integer.
        CAST(REPLACE(training_dataset_size_datapoints, ',', '') AS BIGINT) AS training_datapoints
    FROM @owid.epoch.owid_epoch_1
    WHERE training_dataset_size_datapoints IS NOT NULL
        AND training_dataset_size_datapoints <> ''
)
SELECT
    system,
    publication_date,
    CASE WHEN domain = 'Language' THEN training_datapoints END AS Language,
    CASE WHEN domain = 'Vision' THEN training_datapoints END AS Vision,
    CASE WHEN domain = 'Games' THEN training_datapoints END AS Games,
    CASE WHEN domain = 'Biology' THEN training_datapoints END AS Biology,
    CASE WHEN domain = 'Image generation' THEN training_datapoints END AS Image_generation,
    CASE WHEN domain = 'Speech' THEN training_datapoints END AS Speech,
    CASE WHEN domain = 'Multiple domains' THEN training_datapoints END AS Multiple_domains,
    CASE WHEN domain = 'Other' THEN training_datapoints END AS Other,
    CASE WHEN domain = 'Robotics' THEN training_datapoints END AS Robotics,
    CASE WHEN domain = 'Drawing' THEN training_datapoints END AS Drawing,
    CASE WHEN domain = 'Text-to-Video' THEN training_datapoints END AS Text_to_Video
FROM sized
ORDER BY publication_date, system
system | publication_date | Language | Vision | Games | Biology | Image_generation | Speech | Multiple_domains | Other | Robotics | Drawing | Text_to_Video |
---|---|---|---|---|---|---|---|---|---|---|---|---|
Theseus | 1950-07-02 00:00:00 | null | null | null | null | null | null | null | 40 | null | null | null |
Self Organizing System | 1955-03-01 00:00:00 | null | 256 | null | null | null | null | null | null | null | null | null |
Perceptron Mark I | 1957-01-01 00:00:00 | null | 6 | null | null | null | null | null | null | null | null | null |
Samuel Neural Checkers | 1959-07-01 00:00:00 | null | null | 53000 | null | null | null | null | null | null | null | null |
ADALINE | 1960-06-30 00:00:00 | null | 100 | null | null | null | null | null | null | null | null | null |
Neocognitron | 1980-04-01 00:00:00 | null | 5 | null | null | null | null | null | null | null | null | null |
Back-propagation | 1986-10-01 00:00:00 | null | null | null | null | null | null | null | 144 | null | null | null |
NetTalk | 1987-06-06 00:00:00 | null | null | null | null | null | 21000 | null | null | null | null | null |
Motion-Driven 3D Feature Tracking | 1988-07-01 00:00:00 | null | 1500 | null | null | null | null | null | null | null | null | null |
Innervator | 1989-01-01 00:00:00 | null | null | null | null | null | null | null | 4 | null | null | null |
ALVINN | 1989-12-01 00:00:00 | null | null | null | null | null | null | null | null | null | null | null |
Zip CNN | 1989-12-01 00:00:00 | null | 7290 | null | null | null | null | null | null | null | null | null |
SRN-Encoded Grammatical Structures | 1991-09-01 00:00:00 | 178000 | null | null | null | null | null | null | null | null | null | null |
TD-Gammon | 1992-05-01 00:00:00 | null | null | 6300000 | null | null | null | null | null | null | null | null |
Fuzzy NN | 1992-09-01 00:00:00 | null | null | null | null | null | 436 | null | null | null | null | null |
IBM-5 | 1993-06-15 00:00:00 | 53400000 | null | null | null | null | null | null | null | null | null | null |
GroupLens | 1994-10-22 00:00:00 | null | null | null | null | null | null | null | null | null | null | null |
Iterative Bootstrapping WSD | 1995-06-26 00:00:00 | 460000000 | null | null | null | null | null | null | null | null | null | null |
Random Decision Forests | 1995-08-14 00:00:00 | null | null | null | null | null | null | null | null | null | null | null |
Support Vector Machines | 1995-09-01 00:00:00 | null | null | null | null | null | null | null | null | null | null | null |
System 11 | 1996-06-18 00:00:00 | null | 9050 | null | null | null | null | null | null | null | null | null |
HMM Word Alignment | 1996-08-05 00:00:00 | 442000 | null | null | null | null | null | null | null | null | null | null |
SVM for face detection | 1997-06-17 00:00:00 | null | 50000 | null | null | null | null | null | null | null | null | null |
Bidirectional RNN | 1997-11-01 00:00:00 | null | null | null | null | null | 73900 | null | null | null | null | null |
LSTM | 1997-11-15 00:00:00 | 1270000 | null | null | null | null | null | null | null | null | null | null |
Sparse coding model for V1 receptive fields | 1997-12-01 00:00:00 | null | null | null | null | null | null | null | null | null | null | null |
Social and content-based classification | 1998-07-01 00:00:00 | null | null | null | null | null | null | null | 45000 | null | null | null |
LeNet-5 | 1998-11-01 00:00:00 | null | 60000 | null | null | null | null | null | null | null | null | null |
LSTM with forget gates | 1999-01-02 00:00:00 | null | null | null | null | null | null | null | null | null | null | null |
IBM Model 4 | 1999-07-02 00:00:00 | 800000 | null | null | null | null | null | null | null | null | null | null |
Perceptron for Large Margin Classification | 1999-12-01 00:00:00 | null | 60000 | null | null | null | null | null | null | null | null | null |
FrameNet role labeling | 2000-09-01 00:00:00 | 50000 | null | null | null | null | null | null | null | null | null | null |
Decision tree (classification) | 2001-12-08 00:00:00 | null | 14500 | null | null | null | null | null | null | null | null | null |
Thumbs Up? | 2002-05-28 00:00:00 | 2050 | null | null | null | null | null | null | null | null | null | null |
Maximum Entropy Models for machine translation | 2002-07-06 00:00:00 | 520000 | null | null | null | null | null | null | null | null | null | null |
NPLM | 2003-03-15 00:00:00 | 1000000 | null | null | null | null | null | null | null | null | null | null |
Phrase-based translation | 2003-05-01 00:00:00 | 20000000 | null | null | null | null | null | null | null | null | null | null |
Unsupervised Scale-Invariant Learning | 2003-06-18 00:00:00 | null | 3500 | null | null | null | null | null | null | null | null | null |
CNN Best Practices | 2003-08-06 00:00:00 | null | 50000 | null | null | null | null | null | null | null | null | null |
Max-Margin Markov Networks | 2004-03-01 00:00:00 | null | null | null | null | null | null | null | null | null | null | null |
SACHS | 2005-04-22 00:00:00 | null | null | null | null | null | null | null | 5400 | null | null | null |
Hiero | 2005-06-01 00:00:00 | 171000000 | null | null | null | null | null | null | null | null | null | null |
ConvNet similarity metric | 2005-06-20 00:00:00 | null | 140000 | null | null | null | null | null | null | null | null | null |
Histograms of Oriented Gradients | 2005-06-25 00:00:00 | null | 1810 | null | null | null | null | null | null | null | null | null |
BiLSTM for Speech | 2005-08-01 00:00:00 | null | null | null | null | null | 37000 | null | null | null | null | null |
DrLIM | 2006-06-17 00:00:00 | null | 217000 | null | null | null | null | null | null | null | null | null |
CTC-Trained LSTM | 2006-06-25 00:00:00 | null | null | null | null | null | 41600 | null | null | null | null | null |
DImensionality Reduction | 2006-07-18 00:00:00 | null | 70000 | null | null | null | null | null | null | null | null | null |
Deep Belief Nets | 2006-07-18 00:00:00 | null | 60000 | null | null | null | null | null | null | null | null | null |
Sparse Energy-Based Model | 2006-12-04 00:00:00 | null | 60000 | null | null | null | null | null | null | null | null | null |
Regularized SVD for Collaborative Filtering | 2007-08-12 00:00:00 | null | null | null | null | null | null | null | null | null | null | null |
Deep Multitask NLP Network | 2008-07-05 00:00:00 | 633000000 | null | null | null | null | null | null | null | null | null | null |
Multitask DNNs for NLP | 2008-07-05 00:00:00 | 631000000 | null | null | null | null | null | null | null | null | null | null |
BigChaos 2008 | 2008-11-25 00:00:00 | null | null | null | null | null | null | null | null | null | null | null |
Semantic Hashing | 2008-12-10 00:00:00 | null | null | null | null | null | null | null | 311000 | null | null | null |
BellKor 2009 | 2009-08-01 00:00:00 | null | null | null | null | null | null | null | null | null | null | null |
MatrixFac for Recommenders | 2009-08-07 00:00:00 | null | null | null | null | null | null | null | null | null | null | null |
6-layer MLP (MNIST) | 2010-03-01 00:00:00 | null | 60000 | null | null | null | null | null | null | null | null | null |
Word Representations | 2010-06-01 00:00:00 | 37000000 | null | null | null | null | null | null | null | null | null | null |
ReLU (NORB) | 2010-06-15 00:00:00 | null | 292000 | null | null | null | null | null | null | null | null | null |
KN5 LM + RNN 400/10 (WSJ) | 2010-09-26 00:00:00 | null | null | null | null | null | 6400000 | null | null | null | null | null |
RNN 500/10 + RT09 LM (NIST RT05) | 2010-09-26 00:00:00 | null | null | null | null | null | 5400000 | null | null | null | null | null |
YouTube Video Recommendation System | 2010-09-26 00:00:00 | null | null | null | null | null | null | null | null | null | null | null |
RNN-SpeedUp | 2011-05-22 00:00:00 | 698000 | null | null | null | null | null | null | null | null | null | null |
Domain Adaptation | 2011-11-06 00:00:00 | null | 4650 | null | null | null | null | null | null | null | null | null |
NLP from scratch | 2011-11-08 00:00:00 | 852000000 | null | null | null | null | null | null | null | null | null | null |
MCDNN (MNIST) | 2012-02-13 00:00:00 | null | 60000 | null | null | null | null | null | null | null | null | null |
Dropout (ImageNet) | 2012-06-03 00:00:00 | null | 1000000 | null | null | null | null | null | null | null | null | null |
Dropout (MNIST) | 2012-06-03 00:00:00 | null | 60000 | null | null | null | null | null | null | null | null | null |
Dropout (TIMIT) | 2012-06-03 00:00:00 | null | null | null | null | null | 41600 | null | null | null | null | null |
Unsupervised High-level Feature Learner | 2012-07-12 00:00:00 | null | 10000000 | null | null | null | null | null | null | null | null | null |
AlexNet | 2012-09-30 00:00:00 | null | 1200000 | null | null | null | null | null | null | null | null | null |
Mitosis | 2013-09-22 00:00:00 | null | 1000000 | null | null | null | null | null | null | null | null | null |
Word2Vec (large) | 2013-10-16 00:00:00 | 33000000000 | null | null | null | null | null | null | null | null | null | null |
Word2Vec (small) | 2013-10-16 00:00:00 | 692000 | null | null | null | null | null | null | null | null | null | null |
TransE | 2013-12-05 00:00:00 | null | null | null | null | null | null | null | 17000000 | null | null | null |
Image generation | 2013-12-20 00:00:00 | null | 60000 | null | null | null | null | null | null | null | null | null |
GloVe (32B) | 2014-01-01 00:00:00 | 42000000000 | null | null | null | null | null | null | null | null | null | null |
GloVe (6B) | 2014-01-01 00:00:00 | 6000000000 | null | null | null | null | null | null | null | null | null | null |
GANs | 2014-06-10 00:00:00 | null | null | null | null | null | null | null | null | null | 60000 | null |
SPPNet | 2014-06-18 00:00:00 | null | 1280000 | null | null | null | null | null | null | null | null | null |
Multiresolution CNN | 2014-06-23 00:00:00 | null | null | null | null | null | null | null | null | null | null | null |
SmooCT | 2014-07-01 00:00:00 | null | null | 12000000000 | null | null | null | null | null | null | null | null |
RNNsearch-50* | 2014-09-01 00:00:00 | 348000000 | null | null | null | null | null | null | null | null | null | null |
VGG16 | 2014-09-04 00:00:00 | null | 1300000 | null | null | null | null | null | null | null | null | null |
VGG19 | 2014-09-04 00:00:00 | null | 1300000 | null | null | null | null | null | null | null | null | null |
Seq2Seq LSTM | 2014-09-10 00:00:00 | 652000000 | null | null | null | null | null | null | null | null | null | null |
DSN | 2014-09-18 00:00:00 | null | 870000 | null | null | null | null | null | null | null | null | null |
Deeply-supervised nets | 2014-09-18 00:00:00 | null | 870000 | null | null | null | null | null | null | null | null | null |
LRCN | 2014-11-07 00:00:00 | null | 40000 | null | null | null | null | null | null | null | null | null |
MSRA (C, PReLU) | 2015-02-06 00:00:00 | null | 1280000 | null | null | null | null | null | null | null | null | null |
DQN-2015 | 2015-02-25 00:00:00 | null | null | 50000000 | null | null | null | null | null | null | null | null |
GoogLeNet / InceptionV1 | 2015-06-07 00:00:00 | null | 1200000 | null | null | null | null | null | null | null | null | null |
BPE | 2015-08-31 00:00:00 | 37500000 | null | null | null | null | null | null | null | null | null | null |
Inception v3 | 2015-12-02 00:00:00 | null | 1200000 | null | null | null | null | null | null | null | null | null |
DeepSpeech2 (English) | 2015-12-08 00:00:00 | null | null | null | null | null | 163000000 | null | null | null | null | null |
ResNet-152 (ImageNet) | 2015-12-10 00:00:00 | null | 1280000 | null | null | null | null | null | null | null | null | null |
AlphaGo Lee | 2016-01-27 00:00:00 | null | null | 29400000 | null | null | null | null | null | null | null | null |
Spatiotemporal fusion ConvNet | 2016-06-01 00:00:00 | null | 97200 | null | null | null | null | null | null | null | null | null |
R-FCN | 2016-06-21 00:00:00 | null | 94400 | null | null | null | null | null | null | null | null | null |
GNMT | 2016-09-26 00:00:00 | 360000000 | null | null | null | null | null | null | null | null | null | null |
PolyNet | 2016-11-17 00:00:00 | null | 1280000 | null | null | null | null | null | null | null | null | null |
Transformer | 2017-06-12 00:00:00 | 360000000 | null | null | null | null | null | null | null | null | null | null |
JFT | 2017-08-04 00:00:00 | null | 300000000 | null | null | null | null | null | null | null | null | null |
RetinaNet-R101 | 2017-08-07 00:00:00 | null | 135000 | null | null | null | null | null | null | null | null | null |
AlphaGo Zero | 2017-10-18 00:00:00 | null | null | 5800000000 | null | null | null | null | null | null | null | null |
CapsNet (MNIST) | 2017-10-26 00:00:00 | null | 60000 | null | null | null | null | null | null | null | null | null |
PNASNet-5 | 2017-12-02 00:00:00 | null | null | null | null | null | null | null | null | null | null | null |
AlphaZero | 2017-12-05 00:00:00 | null | null | 700000 | null | null | null | null | null | null | null | null |
AmoebaNet-A (F=448) | 2018-02-05 00:00:00 | null | 1280000 | null | null | null | null | null | null | null | null | null |
YOLOv3 | 2018-04-08 00:00:00 | null | 1280000 | null | null | null | null | null | null | null | null | null |
GPT | 2018-06-01 00:00:00 | 1000000000 | null | null | null | null | null | null | null | null | null | null |
BigGAN-deep 512x512 | 2018-09-28 00:00:00 | null | null | null | null | null | null | null | null | null | 292000000 | null |
BERT-Large | 2018-10-11 00:00:00 | 3300000000 | null | null | null | null | null | null | null | null | null | null |
Decoupled weight decay regularization | 2019-01-04 00:00:00 | null | 50000 | null | null | null | null | null | null | null | null | null |
GPT-2 (1542M) | 2019-02-14 00:00:00 | 3000000000 | null | null | null | null | null | null | null | null | null | null |
KataGo | 2019-02-27 00:00:00 | null | null | 241000000 | null | null | null | null | null | null | null | null |
MnasNet-A1 + SSDLite | 2019-05-29 00:00:00 | null | 118000 | null | null | null | null | null | null | null | null | null |
MnasNet-A3 | 2019-05-29 00:00:00 | null | 1280000 | null | null | null | null | null | null | null | null | null |
RoBERTa Large | 2019-07-01 00:00:00 | 32000000000 | null | null | null | null | null | null | null | null | null | null |
ObjectNet | 2019-09-06 00:00:00 | null | 50000 | null | null | null | null | null | null | null | null | null |
ALBERT | 2019-09-26 00:00:00 | 3300000000 | null | null | null | null | null | null | null | null | null | null |
T5-11B | 2019-10-23 00:00:00 | 150000000000 | null | null | null | null | null | null | null | null | null | null |
T5-3B | 2019-10-23 00:00:00 | 150000000000 | null | null | null | null | null | null | null | null | null | null |
MuZero | 2019-11-19 00:00:00 | null | null | 20000000000 | null | null | null | null | null | null | null | null |
OpenAI Five | 2019-12-13 00:00:00 | null | null | 454000000000 | null | null | null | null | null | null | null | null |
OpenAI Five Rerun | 2019-12-13 00:00:00 | null | null | 53100000000 | null | null | null | null | null | null | null | null |
ALBERT-xxlarge | 2020-02-09 00:00:00 | 3300000000 | null | null | null | null | null | null | null | null | null | null |
GPT-3 175B (davinci) | 2020-05-28 00:00:00 | 374000000000 | null | null | null | null | null | null | null | null | null | null |
ViT-H/14 | 2020-09-28 00:00:00 | null | 1280000 | null | null | null | null | null | null | null | null | null |
wave2vec 2.0 LARGE | 2020-10-22 00:00:00 | null | null | null | null | null | 728000000 | null | null | null | null | null |
CLIP (ResNet-50) | 2021-01-05 00:00:00 | null | null | null | null | null | null | null | null | null | null | null |
CLIP (ViT L/14@336px) | 2021-01-05 00:00:00 | null | null | null | null | null | null | null | null | null | null | null |
DALL-E | 2021-01-05 00:00:00 | null | null | null | null | null | null | null | null | null | 250000000 | null |
Meta Pseudo Labels | 2021-03-01 00:00:00 | null | 130000000 | null | null | null | null | null | null | null | null | null |
M6-T | 2021-03-05 00:00:00 | null | null | null | null | null | null | null | null | null | null | null |
Transformer local-attention (NesT-B) | 2021-05-26 00:00:00 | null | 1280000 | null | null | null | null | null | null | null | null | null |
Denoising Diffusion Probabilistic Models (LSUN Bedroom) | 2021-06-11 00:00:00 | null | null | null | null | null | null | null | null | null | 3030000 | null |
EfficientNetV2 | 2021-06-23 00:00:00 | null | 14200000 | null | null | null | null | null | null | null | null | null |
Codex | 2021-07-07 00:00:00 | 31800000000 | null | null | null | null | null | null | null | null | null | null |
HuBERT | 2021-07-27 00:00:00 | 821000000 | null | null | null | null | null | null | null | null | null | null |
XLMR-XXL | 2021-08-17 00:00:00 | 125000000000 | null | null | null | null | null | null | null | null | null | null |
FLAN | 2021-09-03 00:00:00 | 1870000000000 | null | null | null | null | null | null | null | null | null | null |
Megatron-Turing NLG 530B | 2021-10-11 00:00:00 | 203000000000 | null | null | null | null | null | null | null | null | null | null |
XGLM | 2021-12-20 00:00:00 | 1740000000 | null | null | null | null | null | null | null | null | null | null |
data2vec (language) | 2022-01-20 00:00:00 | 3300000000 | null | null | null | null | null | null | null | null | null | null |
data2vec (speech) | 2022-01-20 00:00:00 | null | null | null | null | null | 13100000 | null | null | null | null | null |
data2vec (vision) | 2022-01-20 00:00:00 | null | 1280000 | null | null | null | null | null | null | null | null | null |
InstructGPT | 2022-01-27 00:00:00 | 1310000 | null | null | null | null | null | null | null | null | null | null |
GPT-NeoX-20B | 2022-02-09 00:00:00 | 177000000000 | null | null | null | null | null | null | null | null | null | null |
LaMDA | 2022-02-10 00:00:00 | 1560000000000 | null | null | null | null | null | null | null | null | null | null |
Chinchilla | 2022-03-29 00:00:00 | 1050000000000 | null | null | null | null | null | null | null | null | null | null |
PaLM (540B) | 2022-04-04 00:00:00 | 585000000000 | null | null | null | null | null | null | null | null | null | null |
DALL·E 2 | 2022-04-06 00:00:00 | null | null | null | null | null | null | null | null | null | 650000000 | null |
Stable Diffusion (LDM-KL-8-G) | 2022-04-13 00:00:00 | null | null | null | null | null | null | null | null | null | 400000000 | null |
Sparse all-MLP | 2022-04-14 00:00:00 | 75000000000 | null | null | null | null | null | null | null | null | null | null |
Parti | 2022-06-22 00:00:00 | null | null | null | null | null | null | null | null | null | 4800000000 | null |
Minerva (540B) | 2022-06-29 00:00:00 | 614000000000 | null | null | null | null | null | null | null | null | null | null |
NLLB | 2022-07-06 00:00:00 | 360000000000 | null | null | null | null | null | null | null | null | null | null |
Whisper | 2022-09-21 00:00:00 | null | null | null | null | null | 9300000000 | null | null | null | null | null |
BLOOM | 2022-11-08 00:00:00 | 263000000000 | null | null | null | null | null | null | null | null | null | null |
LLaMA-65B | 2023-02-24 00:00:00 | 1050000000000 | null | null | null | null | null | null | null | null | null | null |
Falcon-40B | 2023-03-15 00:00:00 | 750000000000 | null | null | null | null | null | null | null | null | null | null |
PaLM 2 | 2023-05-10 00:00:00 | 2700000000000 | null | null | null | null | null | null | null | null | null | null |
InternLM | 2023-07-06 00:00:00 | 750000000000 | null | null | null | null | null | null | null | null | null | null |
Llama 2 | 2023-07-18 00:00:00 | 1500000000000 | null | null | null | null | null | null | null | null | null | null |
Jais | 2023-08-29 00:00:00 | 300000000000 | null | null | null | null | null | null | null | null | null | null |
Falcon 180B | 2023-09-06 00:00:00 | 2625000000000 | null | null | null | null | null | null | null | null | null | null |