lapp0 committed on
Commit
f8cd216
1 Parent(s): 86f60e4

Training in progress, step 5000

Browse files
logs/dataset_max_seq_length=1024, dataset_sample_size=1000000, dataset_subset=sample-10BT, dataset_uri=HuggingFaceFW_fineweb, logits_loss_fn=liger_kl, per_device_train_batch_size=8/events.out.tfevents.1727261283.1c1a426a2fee ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51ea11e0b109f95ccb929a99315a09da1f4c0333c8fd4dbc07e83a17fd4d4f6c
3
+ size 140509
logs/dataset_max_seq_length=1024, dataset_sample_size=1000000, dataset_subset=sample-10BT, dataset_uri=HuggingFaceFW_fineweb, per_device_train_batch_size=8/completed.flag ADDED
File without changes
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7027dade237cc34c1fe1e5665a672c949815fca8bbc0df8d3bbdec24cc732533
3
  size 325669528
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04ccde75028f60080bfc4be957bbd2c788df78c233244c1120c479eb9dff963d
3
  size 325669528
tokenizer.json CHANGED
@@ -1,7 +1,19 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
4
- "padding": null,
 
 
 
 
 
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 0,
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 1023,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
+ "padding": {
10
+ "strategy": "BatchLongest",
11
+ "direction": "Right",
12
+ "pad_to_multiple_of": null,
13
+ "pad_id": 0,
14
+ "pad_type_id": 0,
15
+ "pad_token": "<|endoftext|>"
16
+ },
17
  "added_tokens": [
18
  {
19
  "id": 0,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:66494727ec03541c5c991424dd80273f96b4325bc02006dd5123394dcf73c030
3
- size 5624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:489ac1c599f8c23dd19af80387679fc021366579b87b8a776b5ebb68da3da2a3
3
+ size 5688