elsayedissa
committed on
Commit
·
49e97d5
1
Parent(s):
e2327c2
Training in progress, step 6000
Browse files
- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state.pth +2 -2
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +254 -5
- pytorch_model.bin +1 -1
- runs/Apr09_14-45-21_gpu07.cyverse.org/events.out.tfevents.1681076808.gpu07.cyverse.org.48142.0 +2 -2
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2524414853
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:577ecc5f3164ed1f8764ca8bcc0923b04a67d26eb58b25b5bbfd3a6671922b0c
|
3 |
size 2524414853
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1262229869
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca12f11ddd482d1635bc0d81ed113f4ea1e018a2f62477116cfcc83538540b81
|
3 |
size 1262229869
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e610a7a1ab34f2269d078954a068657d20de039358e571630da376d40a0a0adb
|
3 |
+
size 14639
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:508ae3fa47b1fb7e443f3373117b2addb3ea1903f0b754d943fc68d31b332e19
|
3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "./wav2vec2-xls-r-300m-ar/checkpoint-
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -1251,11 +1251,260 @@
|
|
1251 |
"eval_steps_per_second": 1.211,
|
1252 |
"eval_wer": 0.07437522420184145,
|
1253 |
"step": 5000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1254 |
}
|
1255 |
],
|
1256 |
"max_steps": 10000,
|
1257 |
"num_train_epochs": 89,
|
1258 |
-
"total_flos":
|
1259 |
"trial_name": null,
|
1260 |
"trial_params": null
|
1261 |
}
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.06791821116824107,
|
3 |
+
"best_model_checkpoint": "./wav2vec2-xls-r-300m-ar/checkpoint-6000",
|
4 |
+
"epoch": 53.097345132743364,
|
5 |
+
"global_step": 6000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
1251 |
"eval_steps_per_second": 1.211,
|
1252 |
"eval_wer": 0.07437522420184145,
|
1253 |
"step": 5000
|
1254 |
+
},
|
1255 |
+
{
|
1256 |
+
"epoch": 44.47,
|
1257 |
+
"learning_rate": 0.00015710526315789472,
|
1258 |
+
"loss": 0.0163,
|
1259 |
+
"step": 5025
|
1260 |
+
},
|
1261 |
+
{
|
1262 |
+
"epoch": 44.69,
|
1263 |
+
"learning_rate": 0.00015631578947368418,
|
1264 |
+
"loss": 0.0196,
|
1265 |
+
"step": 5050
|
1266 |
+
},
|
1267 |
+
{
|
1268 |
+
"epoch": 44.91,
|
1269 |
+
"learning_rate": 0.00015552631578947366,
|
1270 |
+
"loss": 0.0161,
|
1271 |
+
"step": 5075
|
1272 |
+
},
|
1273 |
+
{
|
1274 |
+
"epoch": 45.13,
|
1275 |
+
"learning_rate": 0.00015473684210526317,
|
1276 |
+
"loss": 0.0158,
|
1277 |
+
"step": 5100
|
1278 |
+
},
|
1279 |
+
{
|
1280 |
+
"epoch": 45.35,
|
1281 |
+
"learning_rate": 0.00015394736842105263,
|
1282 |
+
"loss": 0.0159,
|
1283 |
+
"step": 5125
|
1284 |
+
},
|
1285 |
+
{
|
1286 |
+
"epoch": 45.58,
|
1287 |
+
"learning_rate": 0.0001531578947368421,
|
1288 |
+
"loss": 0.0163,
|
1289 |
+
"step": 5150
|
1290 |
+
},
|
1291 |
+
{
|
1292 |
+
"epoch": 45.8,
|
1293 |
+
"learning_rate": 0.00015236842105263156,
|
1294 |
+
"loss": 0.0137,
|
1295 |
+
"step": 5175
|
1296 |
+
},
|
1297 |
+
{
|
1298 |
+
"epoch": 46.02,
|
1299 |
+
"learning_rate": 0.00015157894736842105,
|
1300 |
+
"loss": 0.0131,
|
1301 |
+
"step": 5200
|
1302 |
+
},
|
1303 |
+
{
|
1304 |
+
"epoch": 46.24,
|
1305 |
+
"learning_rate": 0.0001507894736842105,
|
1306 |
+
"loss": 0.0125,
|
1307 |
+
"step": 5225
|
1308 |
+
},
|
1309 |
+
{
|
1310 |
+
"epoch": 46.46,
|
1311 |
+
"learning_rate": 0.00015,
|
1312 |
+
"loss": 0.0138,
|
1313 |
+
"step": 5250
|
1314 |
+
},
|
1315 |
+
{
|
1316 |
+
"epoch": 46.68,
|
1317 |
+
"learning_rate": 0.00014921052631578947,
|
1318 |
+
"loss": 0.0179,
|
1319 |
+
"step": 5275
|
1320 |
+
},
|
1321 |
+
{
|
1322 |
+
"epoch": 46.9,
|
1323 |
+
"learning_rate": 0.00014842105263157893,
|
1324 |
+
"loss": 0.0169,
|
1325 |
+
"step": 5300
|
1326 |
+
},
|
1327 |
+
{
|
1328 |
+
"epoch": 47.12,
|
1329 |
+
"learning_rate": 0.0001476315789473684,
|
1330 |
+
"loss": 0.0152,
|
1331 |
+
"step": 5325
|
1332 |
+
},
|
1333 |
+
{
|
1334 |
+
"epoch": 47.35,
|
1335 |
+
"learning_rate": 0.0001468421052631579,
|
1336 |
+
"loss": 0.0146,
|
1337 |
+
"step": 5350
|
1338 |
+
},
|
1339 |
+
{
|
1340 |
+
"epoch": 47.57,
|
1341 |
+
"learning_rate": 0.00014605263157894735,
|
1342 |
+
"loss": 0.0143,
|
1343 |
+
"step": 5375
|
1344 |
+
},
|
1345 |
+
{
|
1346 |
+
"epoch": 47.79,
|
1347 |
+
"learning_rate": 0.00014526315789473683,
|
1348 |
+
"loss": 0.0116,
|
1349 |
+
"step": 5400
|
1350 |
+
},
|
1351 |
+
{
|
1352 |
+
"epoch": 48.01,
|
1353 |
+
"learning_rate": 0.00014447368421052631,
|
1354 |
+
"loss": 0.0162,
|
1355 |
+
"step": 5425
|
1356 |
+
},
|
1357 |
+
{
|
1358 |
+
"epoch": 48.23,
|
1359 |
+
"learning_rate": 0.00014368421052631577,
|
1360 |
+
"loss": 0.0115,
|
1361 |
+
"step": 5450
|
1362 |
+
},
|
1363 |
+
{
|
1364 |
+
"epoch": 48.45,
|
1365 |
+
"learning_rate": 0.00014289473684210525,
|
1366 |
+
"loss": 0.0156,
|
1367 |
+
"step": 5475
|
1368 |
+
},
|
1369 |
+
{
|
1370 |
+
"epoch": 48.67,
|
1371 |
+
"learning_rate": 0.0001421052631578947,
|
1372 |
+
"loss": 0.0144,
|
1373 |
+
"step": 5500
|
1374 |
+
},
|
1375 |
+
{
|
1376 |
+
"epoch": 48.89,
|
1377 |
+
"learning_rate": 0.0001413157894736842,
|
1378 |
+
"loss": 0.0155,
|
1379 |
+
"step": 5525
|
1380 |
+
},
|
1381 |
+
{
|
1382 |
+
"epoch": 49.12,
|
1383 |
+
"learning_rate": 0.00014052631578947367,
|
1384 |
+
"loss": 0.0146,
|
1385 |
+
"step": 5550
|
1386 |
+
},
|
1387 |
+
{
|
1388 |
+
"epoch": 49.34,
|
1389 |
+
"learning_rate": 0.00013973684210526316,
|
1390 |
+
"loss": 0.0164,
|
1391 |
+
"step": 5575
|
1392 |
+
},
|
1393 |
+
{
|
1394 |
+
"epoch": 49.56,
|
1395 |
+
"learning_rate": 0.00013894736842105261,
|
1396 |
+
"loss": 0.0128,
|
1397 |
+
"step": 5600
|
1398 |
+
},
|
1399 |
+
{
|
1400 |
+
"epoch": 49.78,
|
1401 |
+
"learning_rate": 0.0001381578947368421,
|
1402 |
+
"loss": 0.0133,
|
1403 |
+
"step": 5625
|
1404 |
+
},
|
1405 |
+
{
|
1406 |
+
"epoch": 50.0,
|
1407 |
+
"learning_rate": 0.00013736842105263155,
|
1408 |
+
"loss": 0.0126,
|
1409 |
+
"step": 5650
|
1410 |
+
},
|
1411 |
+
{
|
1412 |
+
"epoch": 50.22,
|
1413 |
+
"learning_rate": 0.00013657894736842104,
|
1414 |
+
"loss": 0.011,
|
1415 |
+
"step": 5675
|
1416 |
+
},
|
1417 |
+
{
|
1418 |
+
"epoch": 50.44,
|
1419 |
+
"learning_rate": 0.00013578947368421052,
|
1420 |
+
"loss": 0.0154,
|
1421 |
+
"step": 5700
|
1422 |
+
},
|
1423 |
+
{
|
1424 |
+
"epoch": 50.66,
|
1425 |
+
"learning_rate": 0.000135,
|
1426 |
+
"loss": 0.0154,
|
1427 |
+
"step": 5725
|
1428 |
+
},
|
1429 |
+
{
|
1430 |
+
"epoch": 50.88,
|
1431 |
+
"learning_rate": 0.00013421052631578946,
|
1432 |
+
"loss": 0.0131,
|
1433 |
+
"step": 5750
|
1434 |
+
},
|
1435 |
+
{
|
1436 |
+
"epoch": 51.11,
|
1437 |
+
"learning_rate": 0.00013342105263157894,
|
1438 |
+
"loss": 0.0161,
|
1439 |
+
"step": 5775
|
1440 |
+
},
|
1441 |
+
{
|
1442 |
+
"epoch": 51.33,
|
1443 |
+
"learning_rate": 0.0001326315789473684,
|
1444 |
+
"loss": 0.0135,
|
1445 |
+
"step": 5800
|
1446 |
+
},
|
1447 |
+
{
|
1448 |
+
"epoch": 51.55,
|
1449 |
+
"learning_rate": 0.00013184210526315788,
|
1450 |
+
"loss": 0.0125,
|
1451 |
+
"step": 5825
|
1452 |
+
},
|
1453 |
+
{
|
1454 |
+
"epoch": 51.77,
|
1455 |
+
"learning_rate": 0.00013105263157894736,
|
1456 |
+
"loss": 0.0114,
|
1457 |
+
"step": 5850
|
1458 |
+
},
|
1459 |
+
{
|
1460 |
+
"epoch": 51.99,
|
1461 |
+
"learning_rate": 0.00013026315789473685,
|
1462 |
+
"loss": 0.0106,
|
1463 |
+
"step": 5875
|
1464 |
+
},
|
1465 |
+
{
|
1466 |
+
"epoch": 52.21,
|
1467 |
+
"learning_rate": 0.0001294736842105263,
|
1468 |
+
"loss": 0.0119,
|
1469 |
+
"step": 5900
|
1470 |
+
},
|
1471 |
+
{
|
1472 |
+
"epoch": 52.43,
|
1473 |
+
"learning_rate": 0.00012868421052631578,
|
1474 |
+
"loss": 0.0123,
|
1475 |
+
"step": 5925
|
1476 |
+
},
|
1477 |
+
{
|
1478 |
+
"epoch": 52.65,
|
1479 |
+
"learning_rate": 0.00012789473684210524,
|
1480 |
+
"loss": 0.0111,
|
1481 |
+
"step": 5950
|
1482 |
+
},
|
1483 |
+
{
|
1484 |
+
"epoch": 52.88,
|
1485 |
+
"learning_rate": 0.00012710526315789472,
|
1486 |
+
"loss": 0.0139,
|
1487 |
+
"step": 5975
|
1488 |
+
},
|
1489 |
+
{
|
1490 |
+
"epoch": 53.1,
|
1491 |
+
"learning_rate": 0.00012631578947368418,
|
1492 |
+
"loss": 0.0155,
|
1493 |
+
"step": 6000
|
1494 |
+
},
|
1495 |
+
{
|
1496 |
+
"epoch": 53.1,
|
1497 |
+
"eval_loss": 0.2688598036766052,
|
1498 |
+
"eval_runtime": 10.7568,
|
1499 |
+
"eval_samples_per_second": 9.296,
|
1500 |
+
"eval_steps_per_second": 1.209,
|
1501 |
+
"eval_wer": 0.06791821116824107,
|
1502 |
+
"step": 6000
|
1503 |
}
|
1504 |
],
|
1505 |
"max_steps": 10000,
|
1506 |
"num_train_epochs": 89,
|
1507 |
+
"total_flos": 2.3640957156336247e+19,
|
1508 |
"trial_name": null,
|
1509 |
"trial_params": null
|
1510 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1262229869
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca12f11ddd482d1635bc0d81ed113f4ea1e018a2f62477116cfcc83538540b81
|
3 |
size 1262229869
|
runs/Apr09_14-45-21_gpu07.cyverse.org/events.out.tfevents.1681076808.gpu07.cyverse.org.48142.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5fa0c2b70002f87a44d106c5be0907e96fc3567270c9387d4e18c661e3204a4b
|
3 |
+
size 44970
|