V0224O1 / adapter_config.json
Litzy619's picture
End of training
8e55e67 verified
raw
history blame contribute delete
907 Bytes
{
"adaptive_ratio": 1.0,
"adaptive_ratio_decay": 1.0,
"auto_mapping": null,
"base_model_name_or_path": "yahma/llama-7b-hf",
"bias": "none",
"dynamic_adapter_pool": false,
"enable_lora": null,
"encoder_hidden_size": 4096,
"fan_in_fan_out": false,
"inference_mode": true,
"input_based_adapter_selection": true,
"lora_alpha": 16,
"lora_dropout": 0.05,
"merge_weights": false,
"modules_to_save": null,
"num_attention_heads": 32,
"num_layers": 32,
"num_prefix_set": 8,
"num_transformer_submodules": 1,
"num_virtual_tokens": 30,
"number_of_adapter_pre_layer": 8,
"ot_diversified_dispatcher": false,
"peft_type": "PREFIX_MA_LORA",
"pool_selective_inference": true,
"pool_selective_training": true,
"prefix_projection": false,
"r": 16,
"selective_num": 8,
"target_modules": [
"q_proj",
"v_proj"
],
"task_type": "CAUSAL_LM",
"token_dim": 4096
}