File size: 1,066 Bytes
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
 
 
 
 
 
 
 
 
 
 
 
 
355f9e9
78b2927
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
355f9e9
78b2927
 
 
355f9e9
78b2927
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
{

  "architectures": [

    "T5ForConditionalGeneration"

  ],

  "d_ff": 3072,

  "d_kv": 64,

  "d_model": 768,

  "decoder_start_token_id": 0,

  "dropout_rate": 0.1,

  "eos_token_id": 1,

  "initializer_factor": 1.0,

  "is_encoder_decoder": true,

  "layer_norm_epsilon": 1e-06,

  "model_type": "t5",

  "n_positions": 512,

  "num_heads": 12,

  "num_layers": 12,

  "output_past": true,

  "pad_token_id": 0,

  "relative_attention_num_buckets": 32,

  "task_specific_params": {

    "summarization": {

      "early_stopping": true,

      "max_length": 32,

      "num_beams": 4,

      "prefix": ""

    },

    "translation_en_to_fr": {

      "early_stopping": true,

      "max_length": 32,

      "num_beams": 4,

      "prefix": ""

    },

    "translation_en_to_de": {

      "early_stopping": true,

      "max_length": 32,

      "num_beams": 4,

      "prefix": ""

    },

    "translation_en_to_ro": {

      "early_stopping": true,

      "max_length": 32,

      "num_beams": 4,

      "prefix": ""

    }

  },

  "vocab_size": 32101

}