Training in progress, step 300
Browse files
- config.json +1 -1
- pytorch_model.bin +1 -1
- run.sh +1 -1
- run_speech_recognition_seq2seq_streaming.py +1 -0
- runs/Dec14_09-09-02_129-213-22-31/1671009068.9843225/events.out.tfevents.1671009068.129-213-22-31.76517.1 +3 -0
- runs/Dec14_09-09-02_129-213-22-31/events.out.tfevents.1671009068.129-213-22-31.76517.0 +3 -0
- training_args.bin +1 -1
config.json
CHANGED
@@ -17,7 +17,7 @@
|
|
17 |
"decoder_layerdrop": 0.0,
|
18 |
"decoder_layers": 24,
|
19 |
"decoder_start_token_id": 50258,
|
20 |
-
"dropout": 0.0,
|
21 |
"encoder_attention_heads": 16,
|
22 |
"encoder_ffn_dim": 4096,
|
23 |
"encoder_layerdrop": 0.0,
|
|
|
17 |
"decoder_layerdrop": 0.0,
|
18 |
"decoder_layers": 24,
|
19 |
"decoder_start_token_id": 50258,
|
20 |
+
"dropout": 0.1,
|
21 |
"encoder_attention_heads": 16,
|
22 |
"encoder_ffn_dim": 4096,
|
23 |
"encoder_layerdrop": 0.0,
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3055754841
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7636e3d95bfeff32e8b2bd10d0996660c605ffd61c13facfde26c8e2b5599938
|
3 |
size 3055754841
|
run.sh
CHANGED
@@ -29,7 +29,7 @@ python run_speech_recognition_seq2seq_streaming.py \
|
|
29 |
--load_best_model_at_end \
|
30 |
--gradient_checkpointing \
|
31 |
--fp16 \
|
32 |
-
--overwrite_output_dir="
|
33 |
--do_train \
|
34 |
--do_eval \
|
35 |
--predict_with_generate \
|
|
|
29 |
--load_best_model_at_end \
|
30 |
--gradient_checkpointing \
|
31 |
--fp16 \
|
32 |
+
--overwrite_output_dir="False" \
|
33 |
--do_train \
|
34 |
--do_eval \
|
35 |
--predict_with_generate \
|
run_speech_recognition_seq2seq_streaming.py
CHANGED
@@ -556,6 +556,7 @@ def main():
|
|
556 |
elif isinstance(train_dataloader.dataset, IterableDataset):
|
557 |
train_dataloader.dataset.set_epoch(train_dataloader.dataset._epoch + 1)
|
558 |
|
|
|
559 |
# Initialize Trainer
|
560 |
trainer = Seq2SeqTrainer(
|
561 |
model=model,
|
|
|
556 |
elif isinstance(train_dataloader.dataset, IterableDataset):
|
557 |
train_dataloader.dataset.set_epoch(train_dataloader.dataset._epoch + 1)
|
558 |
|
559 |
+
model.config.dropout=0.1
|
560 |
# Initialize Trainer
|
561 |
trainer = Seq2SeqTrainer(
|
562 |
model=model,
|
runs/Dec14_09-09-02_129-213-22-31/1671009068.9843225/events.out.tfevents.1671009068.129-213-22-31.76517.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78cc986e73b2a39d30783ce62e763818707dbb5a8526f805a7b55958b29b7b3b
|
3 |
+
size 5869
|
runs/Dec14_09-09-02_129-213-22-31/events.out.tfevents.1671009068.129-213-22-31.76517.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d74cebc2feab7a04ab7fde962da8d39c21532b57ef537c4a6242c1f298ea2d9
|
3 |
+
size 5211
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3579
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c533f7abd990d9ef06c67fc5110076fffbb3d083bf1fbae49a66b54b16fd23b
|
3 |
size 3579
|