From 026c6ed38a925507a549319e68aea43493a52f5f Mon Sep 17 00:00:00 2001 From: Gabriel Rasskin <43894452+grasskin@users.noreply.github.com> Date: Fri, 3 May 2024 10:14:37 -0400 Subject: [PATCH] Add CodeGemma 1.1 presets. (#1617) --- keras_nlp/src/models/gemma/gemma_presets.py | 28 +++++++++++++++++++++ 1 file changed, 28 insertions(+) diff --git a/keras_nlp/src/models/gemma/gemma_presets.py b/keras_nlp/src/models/gemma/gemma_presets.py index a65a6da43a..a79e3c47a8 100644 --- a/keras_nlp/src/models/gemma/gemma_presets.py +++ b/keras_nlp/src/models/gemma/gemma_presets.py @@ -50,6 +50,20 @@ }, "kaggle_handle": "kaggle://keras/gemma/keras/gemma_1.1_instruct_2b_en/3", }, + "code_gemma_1.1_2b_en": { + "metadata": { + "description": ( + "2 billion parameter, 18-layer, CodeGemma model. This model " + "has been trained on a fill-in-the-middle (FIM) task for code " + "completion. The 1.1 update improves model quality." + ), + "params": 2506172416, + "official_name": "Gemma", + "path": "gemma", + "model_card": "https://www.kaggle.com/models/google/gemma", + }, + "kaggle_handle": "kaggle://keras/codegemma/keras/code_gemma_1.1_2b_en/1", + }, "code_gemma_2b_en": { "metadata": { "description": ( @@ -127,4 +141,18 @@ }, "kaggle_handle": "kaggle://keras/codegemma/keras/code_gemma_instruct_7b_en/1", }, + "code_gemma_1.1_instruct_7b_en": { + "metadata": { + "description": ( + "7 billion parameter, 28-layer, instruction tuned CodeGemma " + "model. This model has been trained for chat use cases related " + "to code. The 1.1 update improves model quality." + ), + "params": 8537680896, + "official_name": "Gemma", + "path": "gemma", + "model_card": "https://www.kaggle.com/models/google/gemma", + }, + "kaggle_handle": "kaggle://keras/codegemma/keras/code_gemma_1.1_instruct_7b_en/1", + }, }