elsayedissa commited on
Commit
105cfec
1 Parent(s): 54db0be

Training in progress, step 10000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e0c2be3452d8137d689d35c0df6e890c78020bf9843bc1e5ee746f483f22d91d
3
  size 2524414853
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91a8bc4af41578250a3b744334e77d523696c897dbeb1f992605c463a67991ec
3
  size 2524414853
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c2f9145d655487602d0119001d797a278a1eb42e4a3b0bd88e042a0adbe3136
3
  size 1262229869
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:611a34e0242d2ec649f0d1a86165d8423ae4a1d7e81641c0d56c2019e5ef6450
3
  size 1262229869
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70a396db9e5798714b943d735d77ab7ab39ac707fd4daa400a37b45acbc4d16e
3
- size 14639
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a300d66a0192b31de2f7c8bff794f15d013787aa64770ba8b66b59e79dd7ee3
3
+ size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6e7b0809e95e7bb66d8269d06cf0ed6189035774c3ca188b731868d7c85cab50
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a8805627ff330405ad609ba9ab7315667856758f8bf2f6a02771e64b1ec5ccb
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.065048427597752,
3
- "best_model_checkpoint": "./wav2vec2-xls-r-300m-ar/checkpoint-9000",
4
- "epoch": 79.64601769911505,
5
- "global_step": 9000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -2247,11 +2247,260 @@
2247
  "eval_steps_per_second": 1.201,
2248
  "eval_wer": 0.065048427597752,
2249
  "step": 9000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2250
  }
2251
  ],
2252
  "max_steps": 10000,
2253
  "num_train_epochs": 89,
2254
- "total_flos": 3.5456385787518284e+19,
2255
  "trial_name": null,
2256
  "trial_params": null
2257
  }
 
1
  {
2
+ "best_metric": 0.06361353581250748,
3
+ "best_model_checkpoint": "./wav2vec2-xls-r-300m-ar/checkpoint-10000",
4
+ "epoch": 88.49557522123894,
5
+ "global_step": 10000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
2247
  "eval_steps_per_second": 1.201,
2248
  "eval_wer": 0.065048427597752,
2249
  "step": 9000
2250
+ },
2251
+ {
2252
+ "epoch": 79.87,
2253
+ "learning_rate": 3.078947368421052e-05,
2254
+ "loss": 0.0052,
2255
+ "step": 9025
2256
+ },
2257
+ {
2258
+ "epoch": 80.09,
2259
+ "learning_rate": 2.9999999999999997e-05,
2260
+ "loss": 0.0053,
2261
+ "step": 9050
2262
+ },
2263
+ {
2264
+ "epoch": 80.31,
2265
+ "learning_rate": 2.921052631578947e-05,
2266
+ "loss": 0.0049,
2267
+ "step": 9075
2268
+ },
2269
+ {
2270
+ "epoch": 80.53,
2271
+ "learning_rate": 2.8421052631578946e-05,
2272
+ "loss": 0.0049,
2273
+ "step": 9100
2274
+ },
2275
+ {
2276
+ "epoch": 80.75,
2277
+ "learning_rate": 2.7631578947368416e-05,
2278
+ "loss": 0.0045,
2279
+ "step": 9125
2280
+ },
2281
+ {
2282
+ "epoch": 80.97,
2283
+ "learning_rate": 2.6842105263157892e-05,
2284
+ "loss": 0.0053,
2285
+ "step": 9150
2286
+ },
2287
+ {
2288
+ "epoch": 81.19,
2289
+ "learning_rate": 2.605263157894737e-05,
2290
+ "loss": 0.0051,
2291
+ "step": 9175
2292
+ },
2293
+ {
2294
+ "epoch": 81.42,
2295
+ "learning_rate": 2.5263157894736838e-05,
2296
+ "loss": 0.0056,
2297
+ "step": 9200
2298
+ },
2299
+ {
2300
+ "epoch": 81.64,
2301
+ "learning_rate": 2.4473684210526314e-05,
2302
+ "loss": 0.0056,
2303
+ "step": 9225
2304
+ },
2305
+ {
2306
+ "epoch": 81.86,
2307
+ "learning_rate": 2.3684210526315787e-05,
2308
+ "loss": 0.0047,
2309
+ "step": 9250
2310
+ },
2311
+ {
2312
+ "epoch": 82.08,
2313
+ "learning_rate": 2.289473684210526e-05,
2314
+ "loss": 0.0072,
2315
+ "step": 9275
2316
+ },
2317
+ {
2318
+ "epoch": 82.3,
2319
+ "learning_rate": 2.2105263157894733e-05,
2320
+ "loss": 0.0055,
2321
+ "step": 9300
2322
+ },
2323
+ {
2324
+ "epoch": 82.52,
2325
+ "learning_rate": 2.131578947368421e-05,
2326
+ "loss": 0.005,
2327
+ "step": 9325
2328
+ },
2329
+ {
2330
+ "epoch": 82.74,
2331
+ "learning_rate": 2.0526315789473685e-05,
2332
+ "loss": 0.0035,
2333
+ "step": 9350
2334
+ },
2335
+ {
2336
+ "epoch": 82.96,
2337
+ "learning_rate": 1.9736842105263155e-05,
2338
+ "loss": 0.0052,
2339
+ "step": 9375
2340
+ },
2341
+ {
2342
+ "epoch": 83.19,
2343
+ "learning_rate": 1.894736842105263e-05,
2344
+ "loss": 0.0046,
2345
+ "step": 9400
2346
+ },
2347
+ {
2348
+ "epoch": 83.41,
2349
+ "learning_rate": 1.8157894736842104e-05,
2350
+ "loss": 0.0056,
2351
+ "step": 9425
2352
+ },
2353
+ {
2354
+ "epoch": 83.63,
2355
+ "learning_rate": 1.7368421052631577e-05,
2356
+ "loss": 0.005,
2357
+ "step": 9450
2358
+ },
2359
+ {
2360
+ "epoch": 83.85,
2361
+ "learning_rate": 1.657894736842105e-05,
2362
+ "loss": 0.0046,
2363
+ "step": 9475
2364
+ },
2365
+ {
2366
+ "epoch": 84.07,
2367
+ "learning_rate": 1.5789473684210522e-05,
2368
+ "loss": 0.0061,
2369
+ "step": 9500
2370
+ },
2371
+ {
2372
+ "epoch": 84.29,
2373
+ "learning_rate": 1.4999999999999999e-05,
2374
+ "loss": 0.0051,
2375
+ "step": 9525
2376
+ },
2377
+ {
2378
+ "epoch": 84.51,
2379
+ "learning_rate": 1.4210526315789473e-05,
2380
+ "loss": 0.0033,
2381
+ "step": 9550
2382
+ },
2383
+ {
2384
+ "epoch": 84.73,
2385
+ "learning_rate": 1.3421052631578946e-05,
2386
+ "loss": 0.0035,
2387
+ "step": 9575
2388
+ },
2389
+ {
2390
+ "epoch": 84.96,
2391
+ "learning_rate": 1.2631578947368419e-05,
2392
+ "loss": 0.0054,
2393
+ "step": 9600
2394
+ },
2395
+ {
2396
+ "epoch": 85.18,
2397
+ "learning_rate": 1.1842105263157894e-05,
2398
+ "loss": 0.005,
2399
+ "step": 9625
2400
+ },
2401
+ {
2402
+ "epoch": 85.4,
2403
+ "learning_rate": 1.1052631578947366e-05,
2404
+ "loss": 0.0039,
2405
+ "step": 9650
2406
+ },
2407
+ {
2408
+ "epoch": 85.62,
2409
+ "learning_rate": 1.0263157894736843e-05,
2410
+ "loss": 0.0044,
2411
+ "step": 9675
2412
+ },
2413
+ {
2414
+ "epoch": 85.84,
2415
+ "learning_rate": 9.473684210526315e-06,
2416
+ "loss": 0.0049,
2417
+ "step": 9700
2418
+ },
2419
+ {
2420
+ "epoch": 86.06,
2421
+ "learning_rate": 8.684210526315788e-06,
2422
+ "loss": 0.0042,
2423
+ "step": 9725
2424
+ },
2425
+ {
2426
+ "epoch": 86.28,
2427
+ "learning_rate": 7.894736842105261e-06,
2428
+ "loss": 0.0041,
2429
+ "step": 9750
2430
+ },
2431
+ {
2432
+ "epoch": 86.5,
2433
+ "learning_rate": 7.105263157894737e-06,
2434
+ "loss": 0.0036,
2435
+ "step": 9775
2436
+ },
2437
+ {
2438
+ "epoch": 86.73,
2439
+ "learning_rate": 6.3157894736842095e-06,
2440
+ "loss": 0.0037,
2441
+ "step": 9800
2442
+ },
2443
+ {
2444
+ "epoch": 86.95,
2445
+ "learning_rate": 5.526315789473683e-06,
2446
+ "loss": 0.005,
2447
+ "step": 9825
2448
+ },
2449
+ {
2450
+ "epoch": 87.17,
2451
+ "learning_rate": 4.736842105263158e-06,
2452
+ "loss": 0.0047,
2453
+ "step": 9850
2454
+ },
2455
+ {
2456
+ "epoch": 87.39,
2457
+ "learning_rate": 3.947368421052631e-06,
2458
+ "loss": 0.0039,
2459
+ "step": 9875
2460
+ },
2461
+ {
2462
+ "epoch": 87.61,
2463
+ "learning_rate": 3.1578947368421047e-06,
2464
+ "loss": 0.0041,
2465
+ "step": 9900
2466
+ },
2467
+ {
2468
+ "epoch": 87.83,
2469
+ "learning_rate": 2.368421052631579e-06,
2470
+ "loss": 0.0052,
2471
+ "step": 9925
2472
+ },
2473
+ {
2474
+ "epoch": 88.05,
2475
+ "learning_rate": 1.5789473684210524e-06,
2476
+ "loss": 0.0041,
2477
+ "step": 9950
2478
+ },
2479
+ {
2480
+ "epoch": 88.27,
2481
+ "learning_rate": 7.894736842105262e-07,
2482
+ "loss": 0.004,
2483
+ "step": 9975
2484
+ },
2485
+ {
2486
+ "epoch": 88.5,
2487
+ "learning_rate": 0.0,
2488
+ "loss": 0.0033,
2489
+ "step": 10000
2490
+ },
2491
+ {
2492
+ "epoch": 88.5,
2493
+ "eval_loss": 0.32122763991355896,
2494
+ "eval_runtime": 10.9251,
2495
+ "eval_samples_per_second": 9.153,
2496
+ "eval_steps_per_second": 1.19,
2497
+ "eval_wer": 0.06361353581250748,
2498
+ "step": 10000
2499
  }
2500
  ],
2501
  "max_steps": 10000,
2502
  "num_train_epochs": 89,
2503
+ "total_flos": 3.937659402470073e+19,
2504
  "trial_name": null,
2505
  "trial_params": null
2506
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c2f9145d655487602d0119001d797a278a1eb42e4a3b0bd88e042a0adbe3136
3
  size 1262229869
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:611a34e0242d2ec649f0d1a86165d8423ae4a1d7e81641c0d56c2019e5ef6450
3
  size 1262229869
runs/Apr09_14-45-21_gpu07.cyverse.org/events.out.tfevents.1681076808.gpu07.cyverse.org.48142.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d5ae4f462216938e728a8fba4681e7f5455b3d2c2795cb02eb92e4c0cd05237
3
- size 64764
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6406d5a68ae370ad6e03e2fd256a904caa05f4dcec974cccfa689cc8778c1dde
3
+ size 71362