---
# Experiment configuration.
#
# `default` holds the shared settings and is anchored as `&default`; each
# entry of `run_configs` merges it via `<<: *default` and then overrides
# individual keys. The merge is shallow: a key written explicitly in a run
# config (e.g. `peft_params`) replaces the merged-in value as a whole.
#
# NOTE(review): the original indentation was lost. Nesting `hot_modules`,
# `best_finder` and `tasks` under `default` (rather than at top level) is a
# reconstruction -- confirm against the config loader.
default: &default
  use_tqdm: true
  random_seed: 42
  base_save_path: /home/msadraei/trained_final
  model_name: google/t5-small-lm-adapt
  project_name_prefix: iclr_softmax_effect
  experiment_name_suffix: null
  train_batch_size: 32
  valid_batch_size: 32
  remove_dropout: true
  learning_rate: 0.01
  weight_decay: 0.01
  num_epochs: 20
  peft_params: null  # no mutation
  hot_modules:
    - sadcl
  best_finder:
    save: true
    metric: valid_mean
    higher_better: true
  # Only the uncommented entries are active; the rest are kept for quick
  # toggling.
  tasks:
    # - superglue:rte
    # - superglue:cb
    # - superglue:wic
    # - superglue:copa
    # - glue:cola
    # - glue:mrpc
    # - superglue:boolq
    # - glue:stsb
    # - glue:qqp
    # - glue:qnli
    # - glue:mnli
    # - glue:sst2
    - superglue:multirc

# One entry per run; each starts from `default` and overrides selected keys.
run_configs:
  - <<: *default
    peft_params:
      kind: combine
      n_tokens: 10
      n_comb_tokens: 128
      softmax: true
  # - <<: *default
  #   learning_rate: 0.3
  #   peft_params:
  #     kind: residual
  #     n_tokens: 10
  #     mlp_size: 128