{
  "attn_matrices": null,
  "batch_norm_affine": true,
  "batch_norm_non_linearity": "relu",
  "clip_range": 10000,
  "config_id": "default",
  "down_sample_size": 128,
  "efficient_tuning": true,
  "inv_adapter": null,
  "ln_after": false,
  "ln_before": false,
  "non_linearity": "relu",
  "original_ln_after": true,
  "original_ln_before": true,
  "output_adapter": true,
  "reduction_factor": 2,
  "residual_before_ln": true,
  "residual_in_bottleneck": true,
  "train_bias": "none",
  "train_lora": false,
  "train_moe_gate": false,
  "train_moe_params": false,
  "train_params": false,
  "train_prefix_tuning": false,
  "train_task_adapter": false,
  "up_sample_size": null
}