Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Reduce the metadata we track per preset #1991

Merged
merged 1 commit into from
Dec 2, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
8 changes: 0 additions & 8 deletions keras_hub/src/models/albert/albert_presets.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,9 +8,7 @@
"Trained on English Wikipedia + BooksCorpus."
),
"params": 11683584,
"official_name": "ALBERT",
"path": "albert",
"model_card": "https://github.com/google-research/albert/blob/master/README.md",
},
"kaggle_handle": "kaggle://keras/albert/keras/albert_base_en_uncased/2",
},
Expand All @@ -21,9 +19,7 @@
"Trained on English Wikipedia + BooksCorpus."
),
"params": 17683968,
"official_name": "ALBERT",
"path": "albert",
"model_card": "https://github.com/google-research/albert/blob/master/README.md",
},
"kaggle_handle": "kaggle://keras/albert/keras/albert_large_en_uncased/2",
},
Expand All @@ -34,9 +30,7 @@
"Trained on English Wikipedia + BooksCorpus."
),
"params": 58724864,
"official_name": "ALBERT",
"path": "albert",
"model_card": "https://github.com/google-research/albert/blob/master/README.md",
},
"kaggle_handle": "kaggle://keras/albert/keras/albert_extra_large_en_uncased/2",
},
Expand All @@ -47,9 +41,7 @@
"Trained on English Wikipedia + BooksCorpus."
),
"params": 222595584,
"official_name": "ALBERT",
"path": "albert",
"model_card": "https://github.com/google-research/albert/blob/master/README.md",
},
"kaggle_handle": "kaggle://keras/albert/keras/albert_extra_extra_large_en_uncased/2",
},
Expand Down
6 changes: 0 additions & 6 deletions keras_hub/src/models/bart/bart_presets.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,9 +8,7 @@
"Trained on BookCorpus, English Wikipedia and CommonCrawl."
),
"params": 139417344,
"official_name": "BART",
"path": "bart",
"model_card": "https://github.com/facebookresearch/fairseq/blob/main/examples/bart/README.md",
},
"kaggle_handle": "kaggle://keras/bart/keras/bart_base_en/2",
},
Expand All @@ -21,9 +19,7 @@
"Trained on BookCorpus, English Wikipedia and CommonCrawl."
),
"params": 406287360,
"official_name": "BART",
"path": "bart",
"model_card": "https://github.com/facebookresearch/fairseq/blob/main/examples/bart/README.md",
},
"config": {
"vocabulary_size": 50265,
Expand All @@ -43,9 +39,7 @@
"summarization dataset."
),
"params": 406287360,
"official_name": "BART",
"path": "bart",
"model_card": "https://github.com/facebookresearch/fairseq/blob/main/examples/bart/README.md",
},
"config": {
"vocabulary_size": 50264,
Expand Down
20 changes: 0 additions & 20 deletions keras_hub/src/models/bert/bert_presets.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,9 +8,7 @@
"Trained on English Wikipedia + BooksCorpus."
),
"params": 4385920,
"official_name": "BERT",
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "kaggle://keras/bert/keras/bert_tiny_en_uncased/2",
},
Expand All @@ -21,9 +19,7 @@
"Trained on English Wikipedia + BooksCorpus."
),
"params": 28763648,
"official_name": "BERT",
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "kaggle://keras/bert/keras/bert_small_en_uncased/2",
},
Expand All @@ -34,9 +30,7 @@
"Trained on English Wikipedia + BooksCorpus."
),
"params": 41373184,
"official_name": "BERT",
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "kaggle://keras/bert/keras/bert_medium_en_uncased/2",
},
Expand All @@ -47,9 +41,7 @@
"Trained on English Wikipedia + BooksCorpus."
),
"params": 109482240,
"official_name": "BERT",
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "kaggle://keras/bert/keras/bert_base_en_uncased/2",
},
Expand All @@ -60,9 +52,7 @@
"Trained on English Wikipedia + BooksCorpus."
),
"params": 108310272,
"official_name": "BERT",
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "kaggle://keras/bert/keras/bert_base_en/2",
},
Expand All @@ -72,9 +62,7 @@
"12-layer BERT model. Trained on Chinese Wikipedia."
),
"params": 102267648,
"official_name": "BERT",
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "kaggle://keras/bert/keras/bert_base_zh/2",
},
Expand All @@ -84,9 +72,7 @@
"12-layer BERT model where case is maintained. Trained on Wikipedias of 104 languages"
),
"params": 177853440,
"official_name": "BERT",
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "kaggle://keras/bert/keras/bert_base_multi/2",
},
Expand All @@ -97,9 +83,7 @@
"Trained on English Wikipedia + BooksCorpus."
),
"params": 335141888,
"official_name": "BERT",
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "kaggle://keras/bert/keras/bert_large_en_uncased/2",
},
Expand All @@ -110,9 +94,7 @@
"Trained on English Wikipedia + BooksCorpus."
),
"params": 333579264,
"official_name": "BERT",
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "kaggle://keras/bert/keras/bert_large_en/2",
},
Expand All @@ -122,9 +104,7 @@
"The bert_tiny_en_uncased backbone model fine-tuned on the SST-2 sentiment analysis dataset."
),
"params": 4385920,
"official_name": "BERT",
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "kaggle://keras/bert/keras/bert_tiny_en_uncased_sst2/4",
},
Expand Down
16 changes: 0 additions & 16 deletions keras_hub/src/models/bloom/bloom_presets.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,9 +8,7 @@
"trained on 45 natural languages and 12 programming languages."
),
"params": 559214592,
"official_name": "BLOOM",
"path": "bloom",
"model_card": "https://huggingface.co/bigscience/bloom-560m",
},
"kaggle_handle": "kaggle://keras/bloom/keras/bloom_560m_multi/3",
},
Expand All @@ -21,9 +19,7 @@
"trained on 45 natural languages and 12 programming languages."
),
"params": 1065314304,
"official_name": "BLOOM",
"path": "bloom",
"model_card": "https://huggingface.co/bigscience/bloom-1b1",
},
"kaggle_handle": "kaggle://keras/bloom/keras/bloom_1.1b_multi/1",
},
Expand All @@ -34,9 +30,7 @@
"trained on 45 natural languages and 12 programming languages."
),
"params": 1722408960,
"official_name": "BLOOM",
"path": "bloom",
"model_card": "https://huggingface.co/bigscience/bloom-1b7",
},
"kaggle_handle": "kaggle://keras/bloom/keras/bloom_1.7b_multi/1",
},
Expand All @@ -47,9 +41,7 @@
"trained on 45 natural languages and 12 programming languages."
),
"params": 3002557440,
"official_name": "BLOOM",
"path": "bloom",
"model_card": "https://huggingface.co/bigscience/bloom-3b",
},
"kaggle_handle": "kaggle://keras/bloom/keras/bloom_3b_multi/1",
},
Expand All @@ -60,9 +52,7 @@
"finetuned on crosslingual task mixture (xP3) dataset."
),
"params": 559214592,
"official_name": "BLOOMZ",
"path": "bloom",
"model_card": "https://huggingface.co/bigscience/bloomz-560m",
},
"kaggle_handle": "kaggle://keras/bloom/keras/bloomz_560m_multi/1",
},
Expand All @@ -73,9 +63,7 @@
"finetuned on crosslingual task mixture (xP3) dataset."
),
"params": 1065314304,
"official_name": "BLOOMZ",
"path": "bloom",
"model_card": "https://huggingface.co/bigscience/bloomz-1b1",
},
"kaggle_handle": "kaggle://keras/bloom/keras/bloomz_1.1b_multi/1",
},
Expand All @@ -86,9 +74,7 @@
"finetuned on crosslingual task mixture (xP3) dataset."
),
"params": 1722408960,
"official_name": "BLOOMZ",
"path": "bloom",
"model_card": "https://huggingface.co/bigscience/bloomz-1b7",
},
"kaggle_handle": "kaggle://keras/bloom/keras/bloomz_1.7b_multi/1",
},
Expand All @@ -99,9 +85,7 @@
"finetuned on crosslingual task mixture (xP3) dataset."
),
"params": 3002557440,
"official_name": "BLOOMZ",
"path": "bloom",
"model_card": "https://huggingface.co/bigscience/bloomz-3b",
},
"kaggle_handle": "kaggle://keras/bloom/keras/bloomz_3b_multi/1",
},
Expand Down
16 changes: 0 additions & 16 deletions keras_hub/src/models/clip/clip_presets.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,9 +9,7 @@
"text, patch size of 16, CLIP model."
),
"params": 149620934,
"official_name": "CLIP",
"path": "clip",
"model_card": "https://github.com/openai/CLIP/blob/main/model-card.md",
},
"kaggle_handle": "kaggle://keras/clip/keras/clip_vit_base_patch16/1",
},
Expand All @@ -22,9 +20,7 @@
"text, patch size of 32, CLIP model."
),
"params": 151277363,
"official_name": "CLIP",
"path": "clip",
"model_card": "https://github.com/openai/CLIP/blob/main/model-card.md",
},
"kaggle_handle": "kaggle://keras/clip/keras/clip_vit_base_patch32/1",
},
Expand All @@ -35,9 +31,7 @@
"text, patch size of 14, CLIP model."
),
"params": 427616770,
"official_name": "CLIP",
"path": "clip",
"model_card": "https://github.com/openai/CLIP/blob/main/model-card.md",
},
"kaggle_handle": "kaggle://keras/clip/keras/clip_vit_large_patch14/1",
},
Expand All @@ -48,9 +42,7 @@
"text, patch size of 14, image size of 336, CLIP model."
),
"params": 427944770,
"official_name": "CLIP",
"path": "clip",
"model_card": "https://github.com/openai/CLIP/blob/main/model-card.md",
},
"kaggle_handle": "kaggle://keras/clip/keras/clip_vit_large_patch14_336/1",
},
Expand All @@ -61,9 +53,7 @@
"text, patch size of 32, Open CLIP model."
),
"params": 151277363,
"official_name": "Open CLIP",
"path": "clip",
"model_card": "https://github.com/mlfoundations/open_clip",
},
"kaggle_handle": "kaggle://keras/clip/keras/clip_vit_b_32_laion2b_s34b_b79k/1",
},
Expand All @@ -74,9 +64,7 @@
"text, patch size of 14, Open CLIP model."
),
"params": 986109698,
"official_name": "Open CLIP",
"path": "clip",
"model_card": "https://github.com/mlfoundations/open_clip",
},
"kaggle_handle": "kaggle://keras/clip/keras/clip_vit_h_14_laion2b_s32b_b79k/1",
},
Expand All @@ -87,9 +75,7 @@
"text, patch size of 14, Open CLIP model."
),
"params": 1366678530,
"official_name": "Open CLIP",
"path": "clip",
"model_card": "https://github.com/mlfoundations/open_clip",
},
"kaggle_handle": "kaggle://keras/clip/keras/clip_vit_g_14_laion2b_s12b_b42k/1",
},
Expand All @@ -100,9 +86,7 @@
"text, patch size of 14, Open CLIP model."
),
"params": 2539567362,
"official_name": "Open CLIP",
"path": "clip",
"model_card": "https://github.com/mlfoundations/open_clip",
},
"kaggle_handle": "kaggle://keras/clip/keras/clip_vit_bigg_14_laion2b_39b_b160k/1",
},
Expand Down
10 changes: 0 additions & 10 deletions keras_hub/src/models/deberta_v3/deberta_v3_presets.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,9 +8,7 @@
"Trained on English Wikipedia, BookCorpus and OpenWebText."
),
"params": 70682112,
"official_name": "DeBERTaV3",
"path": "deberta_v3",
"model_card": "https://huggingface.co/microsoft/deberta-v3-xsmall",
},
"kaggle_handle": "kaggle://keras/deberta_v3/keras/deberta_v3_extra_small_en/2",
},
Expand All @@ -21,9 +19,7 @@
"Trained on English Wikipedia, BookCorpus and OpenWebText."
),
"params": 141304320,
"official_name": "DeBERTaV3",
"path": "deberta_v3",
"model_card": "https://huggingface.co/microsoft/deberta-v3-small",
},
"kaggle_handle": "kaggle://keras/deberta_v3/keras/deberta_v3_small_en/2",
},
Expand All @@ -34,9 +30,7 @@
"Trained on English Wikipedia, BookCorpus and OpenWebText."
),
"params": 183831552,
"official_name": "DeBERTaV3",
"path": "deberta_v3",
"model_card": "https://huggingface.co/microsoft/deberta-v3-base",
},
"kaggle_handle": "kaggle://keras/deberta_v3/keras/deberta_v3_base_en/2",
},
Expand All @@ -47,9 +41,7 @@
"Trained on English Wikipedia, BookCorpus and OpenWebText."
),
"params": 434012160,
"official_name": "DeBERTaV3",
"path": "deberta_v3",
"model_card": "https://huggingface.co/microsoft/deberta-v3-large",
},
"kaggle_handle": "kaggle://keras/deberta_v3/keras/deberta_v3_large_en/2",
},
Expand All @@ -60,9 +52,7 @@
"Trained on the 2.5TB multilingual CC100 dataset."
),
"params": 278218752,
"official_name": "DeBERTaV3",
"path": "deberta_v3",
"model_card": "https://huggingface.co/microsoft/mdeberta-v3-base",
},
"kaggle_handle": "kaggle://keras/deberta_v3/keras/deberta_v3_base_multi/2",
},
Expand Down
2 changes: 0 additions & 2 deletions keras_hub/src/models/deeplab_v3/deeplab_v3_presets.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,9 +9,7 @@
"which is having categorical accuracy of 90.01 and 0.63 Mean IoU."
),
"params": 39190656,
"official_name": "DeepLabV3",
"path": "deeplab_v3",
"model_card": "https://arxiv.org/abs/1802.02611",
},
"kaggle_handle": "kaggle://keras/deeplabv3plus/keras/deeplab_v3_plus_resnet50_pascalvoc/3",
},
Expand Down
Loading
Loading