# llama-7b.yaml: ROME editing hyperparameters for LLaMA-2-7B
alg_name: "ROME"                                    # editing algorithm to apply
model_name: "./hugging_cache/llama-2-7b"            # local path to the LLaMA-2-7B checkpoint
stats_dir: "./data/stats"                           # cache directory for precomputed layer statistics
device: 0                                           # CUDA device index
layers: [5]                                         # transformer layer(s) whose MLP weights are rewritten
fact_token: "subject_last"                          # key the fact on the last token of the subject
v_num_grad_steps: 25                                # optimization steps when solving for the value vector v
v_lr: 5e-1                                          # learning rate for the v optimization
v_loss_layer: 31                                    # layer at which the target-token loss is read out (final layer of the 32-layer model)
v_weight_decay: 1e-3                                # weight decay during the v optimization
clamp_norm_factor: 4                                # clamp on the update norm relative to the original activation
kl_factor: 0.0625                                   # weight of the KL term that limits drift on unrelated text
mom2_adjustment: false                              # if true, whiten keys with the second-moment statistics below
context_template_length_params: [[5, 10], [10, 10]] # [length, count] pairs for sampled context prefixes
# Module name templates for the LLaMA architecture ("{}" is filled with the layer index):
rewrite_module_tmp: "model.layers.{}.mlp.down_proj"
layer_module_tmp: "model.layers.{}"
mlp_module_tmp: "model.layers.{}.mlp"
attn_module_tmp: "model.layers.{}.self_attn"
ln_f_module: "model.norm"
lm_head_module: "lm_head"
# Second-moment (covariance) statistics, used when mom2_adjustment is true:
mom2_dataset: "wikipedia"
mom2_n_samples: 100000
mom2_dtype: "float32"
model_parallel: false                               # spread the model across multiple GPUs
# fp16: true
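# Minimal usage sketch (an assumption: this file is an EasyEdit hparams file,
# loaded through ROMEHyperParams.from_hparams / BaseEditor.from_hparams; adjust
# the path and the example prompt to your setup):
#
#   from easyeditor import BaseEditor, ROMEHyperParams
#
#   hparams = ROMEHyperParams.from_hparams("./hparams/ROME/llama-7b.yaml")
#   editor = BaseEditor.from_hparams(hparams)
#   metrics, edited_model, _ = editor.edit(
#       prompts=["The capital of France is"],
#       target_new=["Rome"],
#       subject=["France"],   # ROME needs the subject string inside the prompt
#   )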
# Alternative hyperparameters for the original LLaMA-7B checkpoint (uncomment to use):
#alg_name: "ROME"
#model_name: "./hugging_cache/llama-7b"
#device: 0
#layers: [5]
#fact_token: "subject_last"
#v_num_grad_steps: 20
#v_lr: 1e-1
#v_loss_layer: 31
#v_weight_decay: 1e-3
#clamp_norm_factor: 4
#kl_factor: 0.0625
#mom2_adjustment: false
#context_template_length_params: [[5, 10], [10, 10]]
#rewrite_module_tmp: "model.layers.{}.mlp.down_proj"
#layer_module_tmp: "model.layers.{}"
#mlp_module_tmp: "model.layers.{}.mlp"
#attn_module_tmp: "model.layers.{}.self_attn"
#ln_f_module: "model.norm"
#lm_head_module: "lm_head"
#mom2_dataset: "wikipedia"
#mom2_n_samples: 100000
#mom2_dtype: "float32"