---
# Hyperparameters for the WISE editing algorithm applied to a locally cached
# GPT-2 checkpoint. Keys and values are consumed by the loader that reads this
# file; the notes below restate only what this file itself shows.

alg_name: "WISE"
model_name: "./hugging_cache/gpt2"
device: cpu

# Editing / optimisation settings.
# NOTE(review): exact semantics of each knob are defined by the consuming
# code, not by this file -- confirm there before tuning.
mask_ratio: 0.2
edit_lr: 1.0
n_iter: 40
norm_constraint: 1.0
act_margin: [15.0, 40.0, 20.0]  # alpha, beta, gamma
act_ratio: 0.7
save_freq: 1
merge_freq: 1
merge_alg: 'ties'
objective_optimization: 'only_label'

# Parameters listed here are the ones targeted inside the model
# (here: the c_fc weight of the MLP in transformer block index 8).
inner_params:
  - transformer.h[8].mlp.c_fc.weight

# Two alternative variants: WISE-Merge and WISE-Retrieve.

# Used for merge (only relevant when running the merge variant).
densities: 0.53
weights: 1.0

# Used for retrieve (set to true when running the retrieve variant).
retrieve: true
# true --> will replay the past editing instances:
# see https://arxiv.org/abs/2405.14768 Appendix B.3
replay: false