jan-hq committed on
Commit
b400690
·
verified ·
1 Parent(s): 8d9d1ae

Create model.yml

Browse files
Files changed (1) hide show
  1. model.yml +21 -0
model.yml ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: granite
2
+ model: granite:8B
3
+ version: 1
4
+
5
+ # Results Preferences
6
+ stop:
7
+ - </s>
8
+ - <|end_of_text|>
9
+ - <|end_of_role|>
10
+ top_p: 0.95
11
+ temperature: 0.7
12
+ frequency_penalty: 0
13
+ presence_penalty: 0
14
+ max_tokens: 4096 # Infer from base config.json -> max_position_embeddings
15
+ stream: true # true | false
16
+
17
+ # Engine / Model Settings
18
+ ngl: 33 # Number of layers to offload to GPU; infer from base config.json -> num_hidden_layers (not num_attention_heads) - TODO verify 33 for this model
19
+ ctx_len: 4096 # Infer from base config.json -> max_position_embeddings
20
+ engine: llama-cpp
21
+ prompt_template: "<|start_of_role|>system<|end_of_role|>{system_message}<|end_of_text|>\n<|start_of_role|>user<|end_of_role|>{prompt}<|end_of_text|>\n<|start_of_role|>assistant<|end_of_role|>"