# File size: 597 Bytes
# d6682b6
# Hyperparameters for the WISE algorithm; the model is loaded from the
# path given in `model_name`.
alg_name: 'WISE'
model_name: './hugging_cache/gpt2'
device: cpu

# Editing / optimisation settings. Exact semantics are defined by the code
# that consumes this file -- NOTE(review): confirm against the consumer.
mask_ratio: 0.2
edit_lr: 1.0
n_iter: 40
norm_constraint: 1.0
act_margin: [15.0, 40.0, 20.0]  # alpha, beta, gamma
act_ratio: 0.7
save_freq: 1
merge_freq: 1
merge_alg: 'ties'
objective_optimization: 'only_label'

# Presumably the model parameter(s) the edit is applied to -- TODO confirm.
# Quoted so the brackets are never read as YAML flow syntax.
inner_params:
  - 'transformer.h[8].mlp.c_fc.weight'

# Two alternative modes: WISE-Merge and WISE-Retrieve.

# Merge settings (used when merging).
densities: 0.53
weights: 1.0

# Retrieve settings (to use retrieve, set `retrieve` to true).
retrieve: true
# true --> will replay the past editing instances;
# see https://arxiv.org/abs/2405.14768, Appendix B.3.
replay: false