Text Generation
Adapters
llama
llama-2
calpt's picture
Upload LlamaForCausalLM
65505ef verified
raw
history blame contribute delete
No virus
1.07 kB
{
"config": {
"adapter_residual_before_ln": false,
"cross_adapter": false,
"dropout": 0.0,
"factorized_phm_W": true,
"factorized_phm_rule": false,
"hypercomplex_nonlinearity": "glorot-uniform",
"init_weights": "bert",
"inv_adapter": null,
"inv_adapter_reduction_factor": null,
"is_parallel": false,
"learn_phm": true,
"leave_out": [],
"ln_after": false,
"ln_before": false,
"mh_adapter": true,
"non_linearity": "swish",
"original_ln_after": true,
"original_ln_before": false,
"output_adapter": true,
"phm_bias": true,
"phm_c_init": "normal",
"phm_dim": 4,
"phm_init_range": 0.0001,
"phm_layer": false,
"phm_rank": 1,
"reduction_factor": 16,
"residual_before_ln": true,
"scaling": 1.0,
"shared_W_phm": false,
"shared_phm_rule": true,
"use_gating": false
},
"hidden_size": 4096,
"model_class": "LlamaForCausalLM",
"model_name": "meta-llama/Llama-2-7b-hf",
"model_type": "llama",
"name": "assistant_adapter",
"version": "0.1.2"
}