Skip to content

Commit

Permalink
Add bloom presets (#1501)
Browse files (browse the repository at this point in the history)
  • Loading branch information
abuelnasr0 authored Mar 11, 2024
1 parent c5a37bc commit 465ce7b
Showing 1 changed file with 95 additions and 4 deletions.
99 changes: 95 additions & 4 deletions keras_nlp/models/bloom/bloom_presets.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -17,14 +17,105 @@
"bloom_560m_multi": {
"metadata": {
"description": (
"24-layer Bloom model. trained on 45 natural languages and "
"12 programming languages."
"24-layer Bloom model with hidden dimension of 1024. "
"trained on 45 natural languages and 12 programming languages."
),
"params": 816115712,
"params": 559214592,
"official_name": "BLOOM",
"path": "bloom",
"model_card": "https://huggingface.co/bigscience/bloom",
"model_card": "https://huggingface.co/bigscience/bloom-560m",
},
"kaggle_handle": "kaggle://keras/bloom/keras/bloom_560m_multi/3",
},
"bloom_1.1b_multi": {
"metadata": {
"description": (
"24-layer Bloom model with hidden dimension of 1536. "
"trained on 45 natural languages and 12 programming languages."
),
"params": 1065314304,
"official_name": "BLOOM",
"path": "bloom",
"model_card": "https://huggingface.co/bigscience/bloom-1b1",
},
"kaggle_handle": "kaggle://keras/bloom/keras/bloom_1.1b_multi/1",
},
"bloom_1.7b_multi": {
"metadata": {
"description": (
"24-layer Bloom model with hidden dimension of 2048. "
"trained on 45 natural languages and 12 programming languages."
),
"params": 1722408960,
"official_name": "BLOOM",
"path": "bloom",
"model_card": "https://huggingface.co/bigscience/bloom-1b7",
},
"kaggle_handle": "kaggle://keras/bloom/keras/bloom_1.7b_multi/1",
},
"bloom_3b_multi": {
"metadata": {
"description": (
"30-layer Bloom model with hidden dimension of 2560. "
"trained on 45 natural languages and 12 programming languages."
),
"params": 3002557440,
"official_name": "BLOOM",
"path": "bloom",
"model_card": "https://huggingface.co/bigscience/bloom-3b",
},
"kaggle_handle": "kaggle://keras/bloom/keras/bloom_3b_multi/1",
},
"bloomz_560m_multi": {
"metadata": {
"description": (
"24-layer Bloom model with hidden dimension of 1024. "
"finetuned on crosslingual task mixture (xP3) dataset."
),
"params": 559214592,
"official_name": "BLOOMZ",
"path": "bloom",
"model_card": "https://huggingface.co/bigscience/bloomz-560m",
},
"kaggle_handle": "kaggle://keras/bloom/keras/bloomz_560m_multi/1",
},
"bloomz_1.1b_multi": {
"metadata": {
"description": (
"24-layer Bloom model with hidden dimension of 1536. "
"finetuned on crosslingual task mixture (xP3) dataset."
),
"params": 1065314304,
"official_name": "BLOOMZ",
"path": "bloom",
"model_card": "https://huggingface.co/bigscience/bloomz-1b1",
},
"kaggle_handle": "kaggle://keras/bloom/keras/bloomz_1.1b_multi/1",
},
"bloomz_1.7b_multi": {
"metadata": {
"description": (
"24-layer Bloom model with hidden dimension of 2048. "
"finetuned on crosslingual task mixture (xP3) dataset."
),
"params": 1722408960,
"official_name": "BLOOMZ",
"path": "bloom",
"model_card": "https://huggingface.co/bigscience/bloomz-1b7",
},
"kaggle_handle": "kaggle://keras/bloom/keras/bloomz_1.7b_multi/1",
},
"bloomz_3b_multi": {
"metadata": {
"description": (
"30-layer Bloom model with hidden dimension of 2560. "
"finetuned on crosslingual task mixture (xP3) dataset."
),
"params": 3002557440,
"official_name": "BLOOMZ",
"path": "bloom",
"model_card": "https://huggingface.co/bigscience/bloomz-3b",
},
"kaggle_handle": "kaggle://keras/bloom/keras/bloomz_3b_multi/1",
},
}

0 comments on commit 465ce7b

Please sign in to comment.