arxyzan committed
Commit b265e9e
1 Parent(s): 657b4dd

Hezar: Upload model and config

Files changed (1)
  1. model_config.yaml +21 -0
model_config.yaml ADDED
@@ -0,0 +1,21 @@
+ name: roberta_lm
+ config_type: model
+ task: language_modeling
+ attention_probs_dropout_prob: 0.1
+ bos_token_id: 0
+ eos_token_id: 2
+ gradient_checkpointing: false
+ hidden_act: gelu
+ hidden_dropout_prob: 0.1
+ hidden_size: 768
+ initializer_range: 0.02
+ intermediate_size: 3072
+ layer_norm_eps: 1.0e-12
+ max_position_embeddings: 514
+ num_attention_heads: 12
+ num_hidden_layers: 12
+ pad_token_id: 1
+ position_embedding_type: absolute
+ type_vocab_size: 1
+ use_cache: true
+ vocab_size: 42000
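
The uploaded config describes a 12-layer, 768-hidden, 12-head RoBERTa masked language model with a 42,000-token vocabulary. As a minimal sketch (not Hezar's own loading code), the hyperparameters above map directly onto a standard RoBERTa model built with Hugging Face transformers; the local file path below is assumed for illustration only.

# Sketch: build an equivalent RoBERTa masked-LM from model_config.yaml.
# Not Hezar's loader; the file path is a hypothetical local copy.
import yaml
from transformers import RobertaConfig, RobertaForMaskedLM

with open("model_config.yaml") as f:
    cfg = yaml.safe_load(f)

# "name", "config_type" and "task" are Hezar bookkeeping fields; the remaining
# keys are ordinary RoBERTa hyperparameters accepted by RobertaConfig.
for key in ("name", "config_type", "task"):
    cfg.pop(key, None)

config = RobertaConfig(**cfg)
model = RobertaForMaskedLM(config)
print(f"{model.num_parameters():,} parameters")

In Hezar itself this mapping is not done by hand: the config and weights pushed in this commit are read back together when the model is loaded from the Hub, typically via Model.load from hezar.models pointed at the repository the commit belongs to.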