arshsin commited on
Commit
6bf1f81
1 Parent(s): 61969c2

Training in progress, epoch 10, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d8c4bc197ae6609e636c1acebdecb4450fae4cfd794e2f8bc9b54c75e3ce752e
3
  size 344814656
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1cfd92e5b02b8ff66c36c2a61b8d216af20f9b464d495fc9268d634fc57e174
3
  size 344814656
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbb5b73e896c076b7857396e5c3157c071638b325ea0b1351b027ca98c90c9fa
3
  size 689741690
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb4bd2222fc55ea760e270b7a90df63003a9adbfcb8051634a05548fa377517c
3
  size 689741690
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3bd3cafcd141485c5526689e7070ba65dab1e4639fbae44141ae41439003c1f
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c94c375fe5ad2903d244ca6b5cc2a1a6cba4c0c26196f3b9cbd9ddd170bb0b8
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1bb119f3746a9da47b87642d601b53ab62f9c42621fd5116cb0fdc3c05776476
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56251b046e7a9d0ca44cd9a61d2356bc2bfc323d763eb05420cc0c6f1e732d28
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.89,
3
- "best_model_checkpoint": "ast-finetuned-audioset-10-10-0.4593-finetuned-gtzan/checkpoint-339",
4
- "epoch": 9.0,
5
  "eval_steps": 500,
6
- "global_step": 1017,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1306,13 +1306,160 @@
1306
  "eval_samples_per_second": 6.682,
1307
  "eval_steps_per_second": 0.869,
1308
  "step": 1017
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1309
  }
1310
  ],
1311
  "logging_steps": 5,
1312
  "max_steps": 1130,
1313
  "num_train_epochs": 10,
1314
  "save_steps": 500,
1315
- "total_flos": 5.484701028895949e+17,
1316
  "trial_name": null,
1317
  "trial_params": null
1318
  }
 
1
  {
2
+ "best_metric": 0.9,
3
+ "best_model_checkpoint": "ast-finetuned-audioset-10-10-0.4593-finetuned-gtzan/checkpoint-1130",
4
+ "epoch": 10.0,
5
  "eval_steps": 500,
6
+ "global_step": 1130,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1306
  "eval_samples_per_second": 6.682,
1307
  "eval_steps_per_second": 0.869,
1308
  "step": 1017
1309
+ },
1310
+ {
1311
+ "epoch": 9.03,
1312
+ "learning_rate": 5.408062930186824e-06,
1313
+ "loss": 0.0,
1314
+ "step": 1020
1315
+ },
1316
+ {
1317
+ "epoch": 9.07,
1318
+ "learning_rate": 5.162241887905605e-06,
1319
+ "loss": 0.0,
1320
+ "step": 1025
1321
+ },
1322
+ {
1323
+ "epoch": 9.12,
1324
+ "learning_rate": 4.9164208456243854e-06,
1325
+ "loss": 0.0,
1326
+ "step": 1030
1327
+ },
1328
+ {
1329
+ "epoch": 9.16,
1330
+ "learning_rate": 4.670599803343166e-06,
1331
+ "loss": 0.0,
1332
+ "step": 1035
1333
+ },
1334
+ {
1335
+ "epoch": 9.2,
1336
+ "learning_rate": 4.424778761061947e-06,
1337
+ "loss": 0.0,
1338
+ "step": 1040
1339
+ },
1340
+ {
1341
+ "epoch": 9.25,
1342
+ "learning_rate": 4.178957718780728e-06,
1343
+ "loss": 0.0,
1344
+ "step": 1045
1345
+ },
1346
+ {
1347
+ "epoch": 9.29,
1348
+ "learning_rate": 3.933136676499508e-06,
1349
+ "loss": 0.0,
1350
+ "step": 1050
1351
+ },
1352
+ {
1353
+ "epoch": 9.34,
1354
+ "learning_rate": 3.6873156342182893e-06,
1355
+ "loss": 0.0,
1356
+ "step": 1055
1357
+ },
1358
+ {
1359
+ "epoch": 9.38,
1360
+ "learning_rate": 3.44149459193707e-06,
1361
+ "loss": 0.0,
1362
+ "step": 1060
1363
+ },
1364
+ {
1365
+ "epoch": 9.42,
1366
+ "learning_rate": 3.1956735496558502e-06,
1367
+ "loss": 0.0,
1368
+ "step": 1065
1369
+ },
1370
+ {
1371
+ "epoch": 9.47,
1372
+ "learning_rate": 2.9498525073746313e-06,
1373
+ "loss": 0.0,
1374
+ "step": 1070
1375
+ },
1376
+ {
1377
+ "epoch": 9.51,
1378
+ "learning_rate": 2.704031465093412e-06,
1379
+ "loss": 0.0332,
1380
+ "step": 1075
1381
+ },
1382
+ {
1383
+ "epoch": 9.56,
1384
+ "learning_rate": 2.4582104228121927e-06,
1385
+ "loss": 0.0,
1386
+ "step": 1080
1387
+ },
1388
+ {
1389
+ "epoch": 9.6,
1390
+ "learning_rate": 2.2123893805309734e-06,
1391
+ "loss": 0.0,
1392
+ "step": 1085
1393
+ },
1394
+ {
1395
+ "epoch": 9.65,
1396
+ "learning_rate": 1.966568338249754e-06,
1397
+ "loss": 0.0,
1398
+ "step": 1090
1399
+ },
1400
+ {
1401
+ "epoch": 9.69,
1402
+ "learning_rate": 1.720747295968535e-06,
1403
+ "loss": 0.3838,
1404
+ "step": 1095
1405
+ },
1406
+ {
1407
+ "epoch": 9.73,
1408
+ "learning_rate": 1.4749262536873157e-06,
1409
+ "loss": 0.0,
1410
+ "step": 1100
1411
+ },
1412
+ {
1413
+ "epoch": 9.78,
1414
+ "learning_rate": 1.2291052114060964e-06,
1415
+ "loss": 0.0,
1416
+ "step": 1105
1417
+ },
1418
+ {
1419
+ "epoch": 9.82,
1420
+ "learning_rate": 9.83284169124877e-07,
1421
+ "loss": 0.0,
1422
+ "step": 1110
1423
+ },
1424
+ {
1425
+ "epoch": 9.87,
1426
+ "learning_rate": 7.374631268436578e-07,
1427
+ "loss": 0.0,
1428
+ "step": 1115
1429
+ },
1430
+ {
1431
+ "epoch": 9.91,
1432
+ "learning_rate": 4.916420845624385e-07,
1433
+ "loss": 0.0,
1434
+ "step": 1120
1435
+ },
1436
+ {
1437
+ "epoch": 9.96,
1438
+ "learning_rate": 2.4582104228121926e-07,
1439
+ "loss": 0.0,
1440
+ "step": 1125
1441
+ },
1442
+ {
1443
+ "epoch": 10.0,
1444
+ "learning_rate": 0.0,
1445
+ "loss": 0.0,
1446
+ "step": 1130
1447
+ },
1448
+ {
1449
+ "epoch": 10.0,
1450
+ "eval_accuracy": 0.9,
1451
+ "eval_loss": 0.7291831970214844,
1452
+ "eval_runtime": 15.0581,
1453
+ "eval_samples_per_second": 6.641,
1454
+ "eval_steps_per_second": 0.863,
1455
+ "step": 1130
1456
  }
1457
  ],
1458
  "logging_steps": 5,
1459
  "max_steps": 1130,
1460
  "num_train_epochs": 10,
1461
  "save_steps": 500,
1462
+ "total_flos": 6.094112254328832e+17,
1463
  "trial_name": null,
1464
  "trial_params": null
1465
  }