MIS0630T1 / adapter_config.json
{
"adapter_emb_size": 512,
"adaptive_ratio": 0.01,
"adaptive_ratio_decay": 1.001,
"allow_empty_lora": true,
"allow_negative_weights": false,
"auto_mapping": null,
"base_model_name_or_path": "mistralai/Mistral-7B-v0.1",
"bias": "none",
"dynamic_adapter_pool": true,
"enable_lora": null,
"fan_in_fan_out": false,
"inference_mode": true,
"input_based_adapter_selection": true,
"insert_zero_lora": false,
"layer_to_lora": [],
"lora_alpha": 16,
"lora_dropout": 0.05,
"lora_lm_head": true,
"merge_weights": false,
"modules_to_save": null,
"number_of_adapter_pre_layer": 3,
"ot_diversified_dispatcher": false,
"peft_type": "FORZEN_MA_LORA",
"pool_selective_inference": true,
"pool_selective_training": true,
"pretrain_adapter_list": "./trained_adapter_mis2.txt",
"r": 16,
"random_ratio": 1.0,
"random_ratio_decay": 0.999,
"random_routing": false,
"random_routing_inference": false,
"scaling_ratio": 0.01,
"scaling_ratio_decay": 1.001,
"selective_num": 3,
"simple_hidden_matching": true,
"simple_instance_matching": true,
"target_modules": [
"up_proj",
"v_proj",
"down_proj",
"gate_proj",
"q_proj",
"o_proj",
"k_proj",
"lm_head"
],
"task_type": "CAUSAL_LM",
"train_lm_head": true
}
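A minimal sketch of how this adapter_config.json could be inspected in Python, assuming only the json and transformers packages. Note that "FORZEN_MA_LORA" is a custom peft_type, so the stock peft library will not recognize it; attaching the adapter itself would require the custom PEFT fork that defines that type, which is outside this file.

import json

# Read the raw config and pull out the LoRA-style fields it declares.
with open("adapter_config.json") as f:
    cfg = json.load(f)

print(cfg["base_model_name_or_path"])   # mistralai/Mistral-7B-v0.1
print(cfg["r"], cfg["lora_alpha"])      # rank 16, scaling alpha 16
print(cfg["target_modules"])            # attention + MLP projections + lm_head

# Loading the base model is standard transformers usage; the MA-LoRA
# adapter weights themselves are not loaded here (assumption: the custom
# PEFT code for "FORZEN_MA_LORA" is needed for that step).
from transformers import AutoModelForCausalLM

base = AutoModelForCausalLM.from_pretrained(cfg["base_model_name_or_path"])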