van-qa committed on
Commit
ecffaa8
·
verified ·
1 Parent(s): 3ea8103

Update model.yml

Browse files
Files changed (1) hide show
  1. model.yml +1 -0
model.yml CHANGED
@@ -16,6 +16,7 @@ max_tokens: 4096 # Infer from base config.json -> max_position_embeddings
16
  stream: true # true | false
17
 
18
  # Engine / Model Settings
 
19
  ctx_len: 4096 # Infer from base config.json -> max_position_embeddings
20
  engine: cortex.llamacpp
21
  prompt_template: "{system_message} [INST] {prompt} [/INST]"
 
16
  stream: true # true | false
17
 
18
  # Engine / Model Settings
19
+ ngl: 33 # Number of layers offloaded to GPU. Infer from base config.json -> num_hidden_layers + 1
20
  ctx_len: 4096 # Infer from base config.json -> max_position_embeddings
21
  engine: cortex.llamacpp
22
  prompt_template: "{system_message} [INST] {prompt} [/INST]"