DylanonWic committed on
Commit
1e4e4b3
1 Parent(s): c72dd3f

Training in progress, step 1000

Browse files
Files changed (3) hide show
  1. config.json +3 -3
  2. pytorch_model.bin +2 -2
  3. training_args.bin +1 -1
config.json CHANGED
@@ -54,12 +54,12 @@
54
  "final_dropout": 0.0,
55
  "gradient_checkpointing": false,
56
  "hidden_act": "gelu",
57
- "hidden_dropout": 0.08,
58
  "hidden_size": 1024,
59
  "initializer_range": 0.02,
60
  "intermediate_size": 4096,
61
  "layer_norm_eps": 1e-05,
62
- "layerdrop": 0.3,
63
  "mask_channel_length": 10,
64
  "mask_channel_min_space": 1,
65
  "mask_channel_other": 0.0,
@@ -82,7 +82,7 @@
82
  "num_conv_pos_embedding_groups": 16,
83
  "num_conv_pos_embeddings": 128,
84
  "num_feat_extract_layers": 7,
85
- "num_hidden_layers": 32,
86
  "num_negatives": 100,
87
  "output_hidden_size": 1024,
88
  "pad_token_id": 69,
 
54
  "final_dropout": 0.0,
55
  "gradient_checkpointing": false,
56
  "hidden_act": "gelu",
57
+ "hidden_dropout": 0.05,
58
  "hidden_size": 1024,
59
  "initializer_range": 0.02,
60
  "intermediate_size": 4096,
61
  "layer_norm_eps": 1e-05,
62
+ "layerdrop": 0.25,
63
  "mask_channel_length": 10,
64
  "mask_channel_min_space": 1,
65
  "mask_channel_other": 0.0,
 
82
  "num_conv_pos_embedding_groups": 16,
83
  "num_conv_pos_embeddings": 128,
84
  "num_feat_extract_layers": 7,
85
+ "num_hidden_layers": 24,
86
  "num_negatives": 100,
87
  "output_hidden_size": 1024,
88
  "pad_token_id": 69,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d9e53a707a0c12bd3bb5f63cde3aa57ed1a345070dad78003250db99a94388c
3
- size 1665320813
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:561a654b417c3744ec5b46c40fe86535fe717c3c86a483f91291e8a3dc0e8aa2
3
+ size 1262197037
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd38da3854fe738a469da4e3feb290654e3235a80d62e8093d9b52b8df640ae5
3
  size 3579
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b887c852210af941b93e4bb319b1ec7b70c0ccd532c4f5bf434a6311fa295a0
3
  size 3579