elsayedissa commited on
Commit
8f31d06
1 Parent(s): 49e97d5

Training in progress, step 7000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:577ecc5f3164ed1f8764ca8bcc0923b04a67d26eb58b25b5bbfd3a6671922b0c
3
  size 2524414853
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8b93e7897bc3f43ea6b1a664fc0daee99a1df27feebf5e9743f2a0bbfb65f30
3
  size 2524414853
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca12f11ddd482d1635bc0d81ed113f4ea1e018a2f62477116cfcc83538540b81
3
  size 1262229869
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4c04132f7025e27d9cf890f119fc19b9fbfc35fa926c5345bb77dcfcf19e918
3
  size 1262229869
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e610a7a1ab34f2269d078954a068657d20de039358e571630da376d40a0a0adb
3
  size 14639
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aebbece3849c4ea65c57e14ac7218389ce4023006361ce66491299183a563542
3
  size 14639
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:508ae3fa47b1fb7e443f3373117b2addb3ea1903f0b754d943fc68d31b332e19
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e97f75ec4a68ce2d88e985bf5af3c9d9064b2fdb2fc3093a5ded26ae274c6de
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.06791821116824107,
3
  "best_model_checkpoint": "./wav2vec2-xls-r-300m-ar/checkpoint-6000",
4
- "epoch": 53.097345132743364,
5
- "global_step": 6000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1500,11 +1500,260 @@
1500
  "eval_steps_per_second": 1.209,
1501
  "eval_wer": 0.06791821116824107,
1502
  "step": 6000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1503
  }
1504
  ],
1505
  "max_steps": 10000,
1506
  "num_train_epochs": 89,
1507
- "total_flos": 2.3640957156336247e+19,
1508
  "trial_name": null,
1509
  "trial_params": null
1510
  }
 
1
  {
2
  "best_metric": 0.06791821116824107,
3
  "best_model_checkpoint": "./wav2vec2-xls-r-300m-ar/checkpoint-6000",
4
+ "epoch": 61.94690265486726,
5
+ "global_step": 7000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1500
  "eval_steps_per_second": 1.209,
1501
  "eval_wer": 0.06791821116824107,
1502
  "step": 6000
1503
+ },
1504
+ {
1505
+ "epoch": 53.32,
1506
+ "learning_rate": 0.0001255263157894737,
1507
+ "loss": 0.0153,
1508
+ "step": 6025
1509
+ },
1510
+ {
1511
+ "epoch": 53.54,
1512
+ "learning_rate": 0.00012473684210526315,
1513
+ "loss": 0.013,
1514
+ "step": 6050
1515
+ },
1516
+ {
1517
+ "epoch": 53.76,
1518
+ "learning_rate": 0.00012394736842105263,
1519
+ "loss": 0.0093,
1520
+ "step": 6075
1521
+ },
1522
+ {
1523
+ "epoch": 53.98,
1524
+ "learning_rate": 0.00012315789473684208,
1525
+ "loss": 0.0125,
1526
+ "step": 6100
1527
+ },
1528
+ {
1529
+ "epoch": 54.2,
1530
+ "learning_rate": 0.00012236842105263157,
1531
+ "loss": 0.0122,
1532
+ "step": 6125
1533
+ },
1534
+ {
1535
+ "epoch": 54.42,
1536
+ "learning_rate": 0.00012157894736842104,
1537
+ "loss": 0.0131,
1538
+ "step": 6150
1539
+ },
1540
+ {
1541
+ "epoch": 54.65,
1542
+ "learning_rate": 0.0001207894736842105,
1543
+ "loss": 0.0129,
1544
+ "step": 6175
1545
+ },
1546
+ {
1547
+ "epoch": 54.87,
1548
+ "learning_rate": 0.00011999999999999999,
1549
+ "loss": 0.0119,
1550
+ "step": 6200
1551
+ },
1552
+ {
1553
+ "epoch": 55.09,
1554
+ "learning_rate": 0.00011921052631578947,
1555
+ "loss": 0.012,
1556
+ "step": 6225
1557
+ },
1558
+ {
1559
+ "epoch": 55.31,
1560
+ "learning_rate": 0.00011842105263157894,
1561
+ "loss": 0.0106,
1562
+ "step": 6250
1563
+ },
1564
+ {
1565
+ "epoch": 55.53,
1566
+ "learning_rate": 0.00011763157894736841,
1567
+ "loss": 0.0077,
1568
+ "step": 6275
1569
+ },
1570
+ {
1571
+ "epoch": 55.75,
1572
+ "learning_rate": 0.00011684210526315788,
1573
+ "loss": 0.0093,
1574
+ "step": 6300
1575
+ },
1576
+ {
1577
+ "epoch": 55.97,
1578
+ "learning_rate": 0.00011605263157894735,
1579
+ "loss": 0.0103,
1580
+ "step": 6325
1581
+ },
1582
+ {
1583
+ "epoch": 56.19,
1584
+ "learning_rate": 0.00011526315789473682,
1585
+ "loss": 0.0148,
1586
+ "step": 6350
1587
+ },
1588
+ {
1589
+ "epoch": 56.42,
1590
+ "learning_rate": 0.00011447368421052632,
1591
+ "loss": 0.0158,
1592
+ "step": 6375
1593
+ },
1594
+ {
1595
+ "epoch": 56.64,
1596
+ "learning_rate": 0.00011368421052631579,
1597
+ "loss": 0.0108,
1598
+ "step": 6400
1599
+ },
1600
+ {
1601
+ "epoch": 56.86,
1602
+ "learning_rate": 0.00011289473684210526,
1603
+ "loss": 0.0135,
1604
+ "step": 6425
1605
+ },
1606
+ {
1607
+ "epoch": 57.08,
1608
+ "learning_rate": 0.00011210526315789472,
1609
+ "loss": 0.0116,
1610
+ "step": 6450
1611
+ },
1612
+ {
1613
+ "epoch": 57.3,
1614
+ "learning_rate": 0.0001113157894736842,
1615
+ "loss": 0.0105,
1616
+ "step": 6475
1617
+ },
1618
+ {
1619
+ "epoch": 57.52,
1620
+ "learning_rate": 0.00011052631578947366,
1621
+ "loss": 0.0101,
1622
+ "step": 6500
1623
+ },
1624
+ {
1625
+ "epoch": 57.74,
1626
+ "learning_rate": 0.00010973684210526316,
1627
+ "loss": 0.0089,
1628
+ "step": 6525
1629
+ },
1630
+ {
1631
+ "epoch": 57.96,
1632
+ "learning_rate": 0.00010894736842105263,
1633
+ "loss": 0.0098,
1634
+ "step": 6550
1635
+ },
1636
+ {
1637
+ "epoch": 58.19,
1638
+ "learning_rate": 0.0001081578947368421,
1639
+ "loss": 0.0121,
1640
+ "step": 6575
1641
+ },
1642
+ {
1643
+ "epoch": 58.41,
1644
+ "learning_rate": 0.00010736842105263157,
1645
+ "loss": 0.013,
1646
+ "step": 6600
1647
+ },
1648
+ {
1649
+ "epoch": 58.63,
1650
+ "learning_rate": 0.00010657894736842104,
1651
+ "loss": 0.012,
1652
+ "step": 6625
1653
+ },
1654
+ {
1655
+ "epoch": 58.85,
1656
+ "learning_rate": 0.00010578947368421051,
1657
+ "loss": 0.0089,
1658
+ "step": 6650
1659
+ },
1660
+ {
1661
+ "epoch": 59.07,
1662
+ "learning_rate": 0.00010499999999999999,
1663
+ "loss": 0.0111,
1664
+ "step": 6675
1665
+ },
1666
+ {
1667
+ "epoch": 59.29,
1668
+ "learning_rate": 0.00010421052631578947,
1669
+ "loss": 0.0085,
1670
+ "step": 6700
1671
+ },
1672
+ {
1673
+ "epoch": 59.51,
1674
+ "learning_rate": 0.00010342105263157894,
1675
+ "loss": 0.0094,
1676
+ "step": 6725
1677
+ },
1678
+ {
1679
+ "epoch": 59.73,
1680
+ "learning_rate": 0.00010263157894736841,
1681
+ "loss": 0.0098,
1682
+ "step": 6750
1683
+ },
1684
+ {
1685
+ "epoch": 59.96,
1686
+ "learning_rate": 0.00010184210526315788,
1687
+ "loss": 0.0109,
1688
+ "step": 6775
1689
+ },
1690
+ {
1691
+ "epoch": 60.18,
1692
+ "learning_rate": 0.00010105263157894735,
1693
+ "loss": 0.0129,
1694
+ "step": 6800
1695
+ },
1696
+ {
1697
+ "epoch": 60.4,
1698
+ "learning_rate": 0.00010026315789473683,
1699
+ "loss": 0.01,
1700
+ "step": 6825
1701
+ },
1702
+ {
1703
+ "epoch": 60.62,
1704
+ "learning_rate": 9.94736842105263e-05,
1705
+ "loss": 0.0089,
1706
+ "step": 6850
1707
+ },
1708
+ {
1709
+ "epoch": 60.84,
1710
+ "learning_rate": 9.868421052631579e-05,
1711
+ "loss": 0.0122,
1712
+ "step": 6875
1713
+ },
1714
+ {
1715
+ "epoch": 61.06,
1716
+ "learning_rate": 9.789473684210526e-05,
1717
+ "loss": 0.0167,
1718
+ "step": 6900
1719
+ },
1720
+ {
1721
+ "epoch": 61.28,
1722
+ "learning_rate": 9.710526315789473e-05,
1723
+ "loss": 0.0105,
1724
+ "step": 6925
1725
+ },
1726
+ {
1727
+ "epoch": 61.5,
1728
+ "learning_rate": 9.63157894736842e-05,
1729
+ "loss": 0.0089,
1730
+ "step": 6950
1731
+ },
1732
+ {
1733
+ "epoch": 61.73,
1734
+ "learning_rate": 9.552631578947368e-05,
1735
+ "loss": 0.0102,
1736
+ "step": 6975
1737
+ },
1738
+ {
1739
+ "epoch": 61.95,
1740
+ "learning_rate": 9.473684210526315e-05,
1741
+ "loss": 0.0149,
1742
+ "step": 7000
1743
+ },
1744
+ {
1745
+ "epoch": 61.95,
1746
+ "eval_loss": 0.2759546935558319,
1747
+ "eval_runtime": 10.7835,
1748
+ "eval_samples_per_second": 9.273,
1749
+ "eval_steps_per_second": 1.206,
1750
+ "eval_wer": 0.07174458926222647,
1751
+ "step": 7000
1752
  }
1753
  ],
1754
  "max_steps": 10000,
1755
  "num_train_epochs": 89,
1756
+ "total_flos": 2.756451071078706e+19,
1757
  "trial_name": null,
1758
  "trial_params": null
1759
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca12f11ddd482d1635bc0d81ed113f4ea1e018a2f62477116cfcc83538540b81
3
  size 1262229869
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4c04132f7025e27d9cf890f119fc19b9fbfc35fa926c5345bb77dcfcf19e918
3
  size 1262229869
runs/Apr09_14-45-21_gpu07.cyverse.org/events.out.tfevents.1681076808.gpu07.cyverse.org.48142.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5fa0c2b70002f87a44d106c5be0907e96fc3567270c9387d4e18c661e3204a4b
3
- size 44970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17afcb646f4bffba0651ee2b2d287faa8b2e8e9a98dac1f49fdb1210b9df2b8a
3
+ size 51568