File size: 329 Bytes
035cb20
fb9f7d6
035cb20
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
# Model configuration entry named `distilbert_lm`: config_type is `model`
# and the declared task is `language_modeling`.
# NOTE(review): the hyperparameter keys below look like the fields of
# Hugging Face's DistilBertConfig -- confirm against the loader that
# actually consumes this file.
name: distilbert_lm
config_type: model
task: language_modeling
# Hyperparameters (flat, same level as the identification keys above).
activation: gelu
attention_dropout: 0.1
# hidden_dim below (3072) is exactly 4 x dim (768).
dim: 768
dropout: 0.1
hidden_dim: 3072
initializer_range: 0.02
max_position_embeddings: 512
model_type: distilbert
# dim / n_heads = 768 / 12 = 64 (presumably the per-head width -- confirm).
n_heads: 12
n_layers: 6
output_past: true
# NOTE(review): presumably has to match the tokenizer's padding id -- verify.
pad_token_id: 0
# NOTE(review): the key name suggests a question-answering setting while
# `task` is language_modeling; confirm whether the consumer reads it.
qa_dropout: 0.1
# The trailing underscore is part of the key name; do not "fix" it without
# checking what the consumer expects.
tie_weights_: true
# NOTE(review): presumably has to equal the tokenizer's vocabulary size --
# verify before changing.
vocab_size: 42000