Skip to content

Commit 5d2102b

Browse files
The gemma.cpp Authors, copybara-github
The gemma.cpp Authors
authored and committed
naming scheme between gemma and gemma2 variants on the command line was not consistent
PiperOrigin-RevId: 728409104
1 parent d854471 commit 5d2102b

File tree

3 files changed

+34
-6
lines changed

3 files changed

+34
-6
lines changed

compression/compress_weights.cc

Lines changed: 11 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -110,9 +110,17 @@ struct Args : public ArgsBase<Args> {
110110
"Path to model weights (.bin) file.\n"
111111
" Required argument.");
112112
visitor(model_type_str, "model", std::string(),
113-
"Model type\n 2b-it = 2B parameters, instruction-tuned\n "
114-
"2b-pt = 2B parameters, pretrained\n 7b-it = 7B parameters "
115-
"instruction-tuned\n 7b-pt = 7B parameters, pretrained\n "
113+
"Model type\n "
114+
"gemma-2b-it = Gemma 2B parameters, instruction-tuned\n "
115+
"gemma-2b-pt = Gemma 2B parameters, pretrained\n "
116+
"gemma-7b-it = Gemma 7B parameters, instruction-tuned\n "
117+
"gemma-7b-pt = Gemma 7B parameters, pretrained\n "
118+
"gemma2-2b-it = Gemma2 2B parameters, instruction-tuned\n "
119+
"gemma2-2b-pt = Gemma2 2B parameters, pretrained\n "
120+
"gemma2-9b-it = Gemma2 9B parameters, instruction-tuned\n "
121+
"gemma2-9b-pt = Gemma2 9B parameters, pretrained\n "
122+
"gemma2-27b-it = Gemma2 27B parameters, instruction-tuned\n "
123+
"gemma2-27b-pt = Gemma2 27B parameters, pretrained\n "
116124
"gr2b-it = griffin 2B parameters, instruction-tuned\n "
117125
"gr2b-pt = griffin 2B parameters, pretrained\n "
118126
" Required argument.");

gemma/common.cc

Lines changed: 12 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -44,6 +44,10 @@ constexpr const char* kModelFlags[] = {
4444
"paligemma2-3b-448", // PaliGemma2 3B 448
4545
"paligemma2-10b-224", // PaliGemma2 10B 224
4646
"paligemma2-10b-448", // PaliGemma2 10B 448
47+
"gemma-2b-pt", "gemma-2b-it",
48+
"gemma-7b-pt", "gemma-7b-it",
49+
"gemma2-9b-pt", "gemma2-9b-it",
50+
"gemma2-27b-pt", "gemma2-27b-it",
4751
};
4852
constexpr Model kModelTypes[] = {
4953
Model::GEMMA_2B, Model::GEMMA_2B, // Gemma 2B
@@ -59,6 +63,10 @@ constexpr Model kModelTypes[] = {
5963
Model::PALIGEMMA2_3B_448, // PaliGemma2 3B 448
6064
Model::PALIGEMMA2_10B_224, // PaliGemma2 10B 224
6165
Model::PALIGEMMA2_10B_448, // PaliGemma2 10B 448
66+
Model::GEMMA_2B, Model::GEMMA_2B, // Gemma 2B
67+
Model::GEMMA_7B, Model::GEMMA_7B, // Gemma 7B
68+
Model::GEMMA2_9B, Model::GEMMA2_9B, // Gemma2 9B
69+
Model::GEMMA2_27B, Model::GEMMA2_27B, // Gemma2 27B
6270
};
6371
constexpr PromptWrapping kPromptWrapping[] = {
6472
PromptWrapping::GEMMA_PT, PromptWrapping::GEMMA_IT, // Gemma 2B
@@ -71,6 +79,10 @@ constexpr PromptWrapping kPromptWrapping[] = {
7179
PromptWrapping::PALIGEMMA, PromptWrapping::PALIGEMMA, // PaliGemma 224/448
7280
PromptWrapping::PALIGEMMA, PromptWrapping::PALIGEMMA, // PG2 3B 224/448
7381
PromptWrapping::PALIGEMMA, PromptWrapping::PALIGEMMA, // PG2 10B 224/448
82+
PromptWrapping::GEMMA_PT, PromptWrapping::GEMMA_IT, // Gemma 2B
83+
PromptWrapping::GEMMA_PT, PromptWrapping::GEMMA_IT, // Gemma 7B
84+
PromptWrapping::GEMMA_PT, PromptWrapping::GEMMA_IT, // Gemma2 9B
85+
PromptWrapping::GEMMA_PT, PromptWrapping::GEMMA_IT, // Gemma2 27B
7486
};
7587

7688
constexpr size_t kNumModelFlags = std::size(kModelFlags);

util/app.h

Lines changed: 11 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -206,9 +206,17 @@ struct LoaderArgs : public ArgsBase<LoaderArgs> {
206206
visitor(compressed_weights, "compressed_weights", Path(),
207207
"Alias for --weights.");
208208
visitor(model_type_str, "model", std::string(),
209-
"Model type\n 2b-it = 2B parameters, instruction-tuned\n "
210-
"2b-pt = 2B parameters, pretrained\n 7b-it = 7B parameters "
211-
"instruction-tuned\n 7b-pt = 7B parameters, pretrained\n "
209+
"Model type\n "
210+
"gemma-2b-it = Gemma 2B parameters, instruction-tuned\n "
211+
"gemma-2b-pt = Gemma 2B parameters, pretrained\n "
212+
"gemma-7b-it = Gemma 7B parameters, instruction-tuned\n "
213+
"gemma-7b-pt = Gemma 7B parameters, pretrained\n "
214+
"gemma2-2b-it = Gemma2 2B parameters, instruction-tuned\n "
215+
"gemma2-2b-pt = Gemma2 2B parameters, pretrained\n "
216+
"gemma2-9b-it = Gemma2 9B parameters, instruction-tuned\n "
217+
"gemma2-9b-pt = Gemma2 9B parameters, pretrained\n "
218+
"gemma2-27b-it = Gemma2 27B parameters, instruction-tuned\n "
219+
"gemma2-27b-pt = Gemma2 27B parameters, pretrained\n "
212220
"gr2b-it = griffin 2B parameters, instruction-tuned\n "
213221
"gr2b-pt = griffin 2B parameters, pretrained.");
214222
visitor(weight_type_str, "weight_type", std::string("sfp"),

0 commit comments

Comments
 (0)