File size: 2,354 Bytes
e859a16
 
 
3e00e68
e859a16
3e00e68
e859a16
 
 
 
 
 
07e2ba1
e859a16
 
 
 
 
 
 
07e2ba1
 
 
e859a16
 
 
 
07e2ba1
e859a16
 
 
 
 
 
07e2ba1
e859a16
07e2ba1
e859a16
 
 
 
07e2ba1
 
 
 
e859a16
82af8c7
 
 
07e2ba1
82af8c7
07e2ba1
82af8c7
 
 
 
07e2ba1
82af8c7
 
 
 
 
 
07e2ba1
82af8c7
07e2ba1
82af8c7
 
 
 
07e2ba1
 
 
 
82af8c7
e859a16
 
 
 
 
 
 
 
 
 
 
 
 
 
3e00e68
e859a16
 
 
 
3e00e68
e859a16
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 0.0011276075925577898,
  "eval_steps": 3,
  "global_step": 6,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.00018793459875963165,
      "grad_norm": 0.40805867314338684,
      "learning_rate": 2e-05,
      "loss": 2.0097,
      "step": 1
    },
    {
      "epoch": 0.00018793459875963165,
      "eval_loss": 2.225860595703125,
      "eval_runtime": 104.7616,
      "eval_samples_per_second": 10.7,
      "eval_steps_per_second": 10.7,
      "step": 1
    },
    {
      "epoch": 0.0003758691975192633,
      "grad_norm": 0.3363264501094818,
      "learning_rate": 4e-05,
      "loss": 2.0424,
      "step": 2
    },
    {
      "epoch": 0.0005638037962788949,
      "grad_norm": 0.4387308359146118,
      "learning_rate": 6e-05,
      "loss": 2.2437,
      "step": 3
    },
    {
      "epoch": 0.0005638037962788949,
      "eval_loss": 2.223356246948242,
      "eval_runtime": 105.324,
      "eval_samples_per_second": 10.643,
      "eval_steps_per_second": 10.643,
      "step": 3
    },
    {
      "epoch": 0.0007517383950385266,
      "grad_norm": 0.30487483739852905,
      "learning_rate": 8e-05,
      "loss": 2.1183,
      "step": 4
    },
    {
      "epoch": 0.0009396729937981583,
      "grad_norm": 0.44409823417663574,
      "learning_rate": 0.0001,
      "loss": 2.2092,
      "step": 5
    },
    {
      "epoch": 0.0011276075925577898,
      "grad_norm": 0.31591424345970154,
      "learning_rate": 0.00012,
      "loss": 2.223,
      "step": 6
    },
    {
      "epoch": 0.0011276075925577898,
      "eval_loss": 2.2032065391540527,
      "eval_runtime": 104.9365,
      "eval_samples_per_second": 10.683,
      "eval_steps_per_second": 10.683,
      "step": 6
    }
  ],
  "logging_steps": 1,
  "max_steps": 10,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 1,
  "save_steps": 3,
  "stateful_callbacks": {
    "TrainerControl": {
      "args": {
        "should_epoch_stop": false,
        "should_evaluate": false,
        "should_log": false,
        "should_save": true,
        "should_training_stop": false
      },
      "attributes": {}
    }
  },
  "total_flos": 417433827409920.0,
  "train_batch_size": 1,
  "trial_name": null,
  "trial_params": null
}