| alg_name: "WISE" | |
| model_name: "./hugging_cache/gpt2" | |
| device: cpu | |
| mask_ratio: 0.2 | |
| edit_lr: 1.0 | |
| n_iter: 40 | |
| norm_constraint: 1.0 | |
| act_margin: [15.0, 40.0, 20.0] # three margins, in order: alpha, beta, gamma | |
| act_ratio: 0.7 | |
| save_freq: 1 | |
| merge_freq: 1 | |
| merge_alg: 'ties' | |
| objective_optimization: 'only_label' | |
| inner_params: | |
| - transformer.h[8].mlp.c_fc.weight | |
| ## Two alternative modes: WISE-Merge or WISE-Retrieve | |
| # Settings for WISE-Merge (apply only when merging) | |
| densities: 0.53 | |
| weights: 1.0 | |
| # Setting for WISE-Retrieve (set to True to use retrieval) | |
| retrieve: True | |
| replay: False # set to True to replay past editing instances; see https://arxiv.org/abs/2405.14768, Appendix B.3 |