File size: 1,066 Bytes
355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 355f9e9 78b2927 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 |
{
"architectures": [
"T5ForConditionalGeneration"
],
"d_ff": 3072,
"d_kv": 64,
"d_model": 768,
"decoder_start_token_id": 0,
"dropout_rate": 0.1,
"eos_token_id": 1,
"initializer_factor": 1.0,
"is_encoder_decoder": true,
"layer_norm_epsilon": 1e-06,
"model_type": "t5",
"n_positions": 512,
"num_heads": 12,
"num_layers": 12,
"output_past": true,
"pad_token_id": 0,
"relative_attention_num_buckets": 32,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"max_length": 32,
"num_beams": 4,
"prefix": ""
},
"translation_en_to_fr": {
"early_stopping": true,
"max_length": 32,
"num_beams": 4,
"prefix": ""
},
"translation_en_to_de": {
"early_stopping": true,
"max_length": 32,
"num_beams": 4,
"prefix": ""
},
"translation_en_to_ro": {
"early_stopping": true,
"max_length": 32,
"num_beams": 4,
"prefix": ""
}
},
"vocab_size": 32101
}
|