thuannh committed on
Commit
776e891
·
1 Parent(s): 46e87d2

init model gemma 2 2b

Browse files
Files changed (2) hide show
  1. model.gguf +2 -2
  2. model.yml +3 -3
model.gguf CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd87fc03fe3d651ac419ae35f4a0e6d861167db156572b6c4b90fb81822a3547
3
- size 5127231648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af92b6a034fd095807bd339ae9268ceba1a951201994063d5eea15e564f0a42f
3
+ size 1708582496
model.yml CHANGED
@@ -1,5 +1,5 @@
1
- name: gemma
2
- model: gemma:7B
3
  version: 1
4
 
5
  # Results Preferences
@@ -14,7 +14,7 @@ max_tokens: 4096 # Infer from base config.json -> max_position_embeddings
14
  stream: true # true | false
15
 
16
  # Engine / Model Settings
17
- ngl: 33 # Infer from base config.json -> num_attention_heads
18
  ctx_len: 4096 # Infer from base config.json -> max_position_embeddings
19
  engine: cortex.llamacpp
20
  prompt_template: "<start_of_turn>user\n{prompt}<end_of_turn>\n<start_of_turn>model"
 
1
+ name: gemma2
2
+ model: gemma2:2B
3
  version: 1
4
 
5
  # Results Preferences
 
14
  stream: true # true | false
15
 
16
  # Engine / Model Settings
17
+ ngl: 300 # Number of layers to offload to GPU; bounded by base config.json -> num_hidden_layers, not num_attention_heads
18
  ctx_len: 4096 # Infer from base config.json -> max_position_embeddings
19
  engine: cortex.llamacpp
20
  prompt_template: "<start_of_turn>user\n{prompt}<end_of_turn>\n<start_of_turn>model"