Skip to content

Commit

Permalink
add gemma-2 quantized models
Browse files Browse the repository at this point in the history
  • Loading branch information
Judd committed Jun 30, 2024
1 parent 7bfe2e0 commit becf17c
Showing 1 changed file with 33 additions and 0 deletions.
33 changes: 33 additions & 0 deletions scripts/models.json
Original file line number Diff line number Diff line change
Expand Up @@ -274,6 +274,39 @@
}
}
},
"gemma2": {
"brief": "Gemma is a family of lightweight, state-of-the-art open models built by Google DeepMind. Updated to version 2.",
"default": "9b",
"license": "https://ai.google.dev/gemma/terms",
"variants": {
"9b": {
"default": "q4_1",
"quantized": {
"q4_1": {
"size": 5781867888,
"url": "chatllm_quantized_gemma-2/gemma-2-9b_q4_1.bin"
},
"q8": {
"size": 9824849264,
"url": "chatllm_quantized_gemma-2/gemma-2-9b.bin"
}
}
},
"27b": {
"default": "q4_1",
"quantized": {
"q4_1": {
"size": 17023592624,
"url": "chatllm_quantized_gemma-2/gemma-2-27b_q4_1.bin"
},
"q8": {
"size": 28935088304,
"url": "chatllm_quantized_gemma-2/gemma-2-27b.bin"
}
}
}
}
},
"llama3": {
"brief": "Meta Llama 3: The most capable openly available LLM to date.",
"default": "8b",
Expand Down

0 comments on commit becf17c

Please sign in to comment.