| { | |
| "alora_invocation_tokens": null, | |
| "alpha_pattern": {}, | |
| "arrow_config": null, | |
| "auto_mapping": null, | |
| "base_model_name_or_path": null, | |
| "bias": "none", | |
| "corda_config": null, | |
| "ensure_weight_tying": false, | |
| "eva_config": null, | |
| "exclude_modules": null, | |
| "fan_in_fan_out": false, | |
| "inference_mode": false, | |
| "init_lora_weights": true, | |
| "layer_replication": null, | |
| "layers_pattern": null, | |
| "layers_to_transform": null, | |
| "loftq_config": {}, | |
| "lora_alpha": 32, | |
| "lora_bias": false, | |
| "lora_dropout": 0.0, | |
| "megatron_config": null, | |
| "megatron_core": "megatron.core", | |
| "modules_to_save": null, | |
| "peft_type": "LORA", | |
| "peft_version": "0.18.1", | |
| "qalora_group_size": 16, | |
| "r": 32, | |
| "rank_pattern": {}, | |
| "revision": null, | |
| "target_modules": [ | |
| "4.adaLN_modulation.0", | |
| "15.adaLN_modulation.0", | |
| "20.adaLN_modulation.0", | |
| "16.adaLN_modulation.0", | |
| "10.adaLN_modulation.0", | |
| "26.adaLN_modulation.0", | |
| "27.adaLN_modulation.0", | |
| "18.adaLN_modulation.0", | |
| "23.adaLN_modulation.0", | |
| "29.adaLN_modulation.0", | |
| "13.adaLN_modulation.0", | |
| "14.adaLN_modulation.0", | |
| "7.adaLN_modulation.0", | |
| "w1", | |
| "2.adaLN_modulation.0", | |
| "22.adaLN_modulation.0", | |
| "8.adaLN_modulation.0", | |
| "qkv", | |
| "17.adaLN_modulation.0", | |
| "19.adaLN_modulation.0", | |
| "w2", | |
| "0.adaLN_modulation.0", | |
| "out", | |
| "28.adaLN_modulation.0", | |
| "3.adaLN_modulation.0", | |
| "25.adaLN_modulation.0", | |
| "9.adaLN_modulation.0", | |
| "11.adaLN_modulation.0", | |
| "24.adaLN_modulation.0", | |
| "5.adaLN_modulation.0", | |
| "12.adaLN_modulation.0", | |
| "21.adaLN_modulation.0", | |
| "1.adaLN_modulation.0", | |
| "w3", | |
| "6.adaLN_modulation.0" | |
| ], | |
| "target_parameters": null, | |
| "task_type": null, | |
| "trainable_token_indices": null, | |
| "use_dora": false, | |
| "use_qalora": false, | |
| "use_rslora": false | |
| } |