We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 3837366 commit a938550 Copy full SHA for a938550
config.yml
@@ -24,6 +24,8 @@ data:
24
# Model Definition -------------------
25
model:
26
hf_model_ckpt: "NousResearch/Llama-2-7b-hf"
27
+ torch_dtype: "bfloat16"
28
+ attn_implementation: "flash_attention_2"
29
quantize: true
30
bitsandbytes:
31
load_in_4bit: true
@@ -80,4 +82,4 @@ qa:
80
82
- verb_percent
81
83
- adjective_percent
84
- noun_percent
- - summary_length
85
+ - summary_length
0 commit comments