File size: 597 Bytes
d6682b6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
# Which editing algorithm to run, which model to load, and where to run it.
alg_name: 'WISE'
# Looks like a local checkpoint directory; confirm against the loader.
model_name: './hugging_cache/gpt2'
device: cpu

# Hyperparameters for the editing run. Exact semantics are defined by the
# consuming implementation, not by this file.
mask_ratio: 0.2
edit_lr: 1.0
n_iter: 40
norm_constraint: 1.0
# Margins, listed in the order alpha, beta, gamma.
act_margin:
  - 15.0  # alpha
  - 40.0  # beta
  - 20.0  # gamma
act_ratio: 0.7
save_freq: 1
merge_freq: 1
merge_alg: ties
objective_optimization: only_label
# Parameter names selected for editing (presumably model weight paths; verify).
inner_params:
  - 'transformer.h[8].mlp.c_fc.weight'


# Two alternative modes: WISE-Merge and WISE-Retrieve.

# Merge settings (used when merging).
densities: 0.53
weights: 1.0

# Retrieve settings (set `retrieve` to true when using retrieval).
retrieve: true
# When true, past editing instances are replayed; see
# https://arxiv.org/abs/2405.14768, Appendix B.3.
replay: false