Skip to content

Commit 0900710

Browse files
committed
Added the Gemma 2 2B instruct GGUF model (bartowski/gemma-2-2b-it-GGUF).
1 parent 705e878 commit 0900710

File tree

2 files changed

+14
-0
lines changed

2 files changed

+14
-0
lines changed

doc_generator/types.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,6 +24,7 @@ class LLMModels(str, Enum):
2424
GOOGLE_GEMMA_7B_INSTRUCT = "google/gemma-7b-it"
2525
GOOGLE_CODEGEMMA_2B_INSTRUCT = "google/codegemma-2b-it"
2626
GOOGLE_CODEGEMMA_7B_INSTRUCT = "google/codegemma-7b-it"
27+
GOOGLE_GEMMA_2B_INSTRUCT_GGUF = "bartowski/gemma-2-2b-it-GGUF"
2728

2829

2930
class Priority(str, Enum):

doc_generator/utils/llm_utils.py

Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -310,6 +310,19 @@ def get_tokenizer(model_name: str, gguf_file=None):
310310
failed=0,
311311
total=0,
312312
),
313+
LLMModels.GOOGLE_GEMMA_2B_INSTRUCT_GGUF: LLMModelDetails(
314+
name=LLMModels.GOOGLE_GEMMA_2B_INSTRUCT_GGUF,
315+
input_cost_per_1k_tokens=0,
316+
output_cost_per_1k_tokens=0,
317+
max_length=8192,
318+
llm=None,
319+
input_tokens=0,
320+
output_tokens=0,
321+
succeeded=0,
322+
failed=0,
323+
total=0,
324+
gguf_file="gemma-2-2b-it-IQ3_M.gguf"
325+
),
313326
}
314327

315328

0 commit comments

Comments
 (0)