Training in progress, step 45
Browse files
- .gitignore +1 -0
- config.json +39 -0
- merges.txt +0 -0
- pytorch_model.bin +3 -0
- runs/May18_18-49-00_molly-dl/1684461034.0884118/events.out.tfevents.1684461034.molly-dl.445636.1 +3 -0
- runs/May18_18-49-00_molly-dl/events.out.tfevents.1684461034.molly-dl.445636.0 +3 -0
- runs/May18_19-01-20_molly-dl/1684461685.2734933/events.out.tfevents.1684461685.molly-dl.445636.3 +3 -0
- runs/May18_19-01-20_molly-dl/events.out.tfevents.1684461685.molly-dl.445636.2 +3 -0
- runs/May18_19-02-15_molly-dl/1684461740.4800537/events.out.tfevents.1684461740.molly-dl.450457.1 +3 -0
- runs/May18_19-02-15_molly-dl/events.out.tfevents.1684461740.molly-dl.450457.0 +3 -0
- runs/May18_19-04-12_molly-dl/1684461857.993086/events.out.tfevents.1684461857.molly-dl.450711.1 +3 -0
- runs/May18_19-04-12_molly-dl/events.out.tfevents.1684461857.molly-dl.450711.0 +3 -0
- runs/May18_19-06-27_molly-dl/1684461992.6714196/events.out.tfevents.1684461992.molly-dl.450962.1 +3 -0
- runs/May18_19-06-27_molly-dl/events.out.tfevents.1684461992.molly-dl.450962.0 +3 -0
- runs/May18_19-07-20_molly-dl/1684462045.1422544/events.out.tfevents.1684462045.molly-dl.451147.1 +3 -0
- runs/May18_19-07-20_molly-dl/events.out.tfevents.1684462045.molly-dl.451147.0 +3 -0
- runs/May18_19-08-21_molly-dl/1684462105.7766871/events.out.tfevents.1684462105.molly-dl.451339.1 +3 -0
- runs/May18_19-08-21_molly-dl/events.out.tfevents.1684462105.molly-dl.451339.0 +3 -0
- runs/May18_19-09-07_molly-dl/1684462152.2975395/events.out.tfevents.1684462152.molly-dl.451518.1 +3 -0
- runs/May18_19-09-07_molly-dl/events.out.tfevents.1684462152.molly-dl.451518.0 +3 -0
- runs/May18_19-09-58_molly-dl/1684462202.481355/events.out.tfevents.1684462202.molly-dl.451702.1 +3 -0
- runs/May18_19-09-58_molly-dl/events.out.tfevents.1684462202.molly-dl.451702.0 +3 -0
- runs/May18_20-11-45_molly-dl/1684465909.682996/events.out.tfevents.1684465909.molly-dl.454431.1 +3 -0
- runs/May18_20-11-45_molly-dl/events.out.tfevents.1684465909.molly-dl.454431.0 +3 -0
- special_tokens_map.json +6 -0
- tokenizer.json +0 -0
- tokenizer_config.json +10 -0
- training_args.bin +3 -0
- vocab.json +0 -0
.gitignore
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
checkpoint-*/
|
config.json
ADDED
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "gpt2",
|
3 |
+
"activation_function": "gelu_new",
|
4 |
+
"architectures": [
|
5 |
+
"GPT2LMHeadModel"
|
6 |
+
],
|
7 |
+
"attn_pdrop": 0.1,
|
8 |
+
"bos_token_id": 0,
|
9 |
+
"embd_pdrop": 0.1,
|
10 |
+
"eos_token_id": 0,
|
11 |
+
"initializer_range": 0.02,
|
12 |
+
"layer_norm_epsilon": 1e-05,
|
13 |
+
"model_type": "gpt2",
|
14 |
+
"n_ctx": 128,
|
15 |
+
"n_embd": 768,
|
16 |
+
"n_head": 12,
|
17 |
+
"n_inner": null,
|
18 |
+
"n_layer": 12,
|
19 |
+
"n_positions": 1024,
|
20 |
+
"reorder_and_upcast_attn": false,
|
21 |
+
"resid_pdrop": 0.1,
|
22 |
+
"scale_attn_by_inverse_layer_idx": false,
|
23 |
+
"scale_attn_weights": true,
|
24 |
+
"summary_activation": null,
|
25 |
+
"summary_first_dropout": 0.1,
|
26 |
+
"summary_proj_to_labels": true,
|
27 |
+
"summary_type": "cls_index",
|
28 |
+
"summary_use_proj": true,
|
29 |
+
"task_specific_params": {
|
30 |
+
"text-generation": {
|
31 |
+
"do_sample": true,
|
32 |
+
"max_length": 50
|
33 |
+
}
|
34 |
+
},
|
35 |
+
"torch_dtype": "float32",
|
36 |
+
"transformers_version": "4.23.1",
|
37 |
+
"use_cache": true,
|
38 |
+
"vocab_size": 50000
|
39 |
+
}
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b1d759dc5c25f3eaaba2eeae418d2421bfed7ca3f3770da402570087013d6a0
|
3 |
+
size 509607017
|
runs/May18_18-49-00_molly-dl/1684461034.0884118/events.out.tfevents.1684461034.molly-dl.445636.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:863e87d60b08e969d212ffbc014ddd502a4526e0f55d43e82dd6ec493a0d8085
|
3 |
+
size 5473
|
runs/May18_18-49-00_molly-dl/events.out.tfevents.1684461034.molly-dl.445636.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5808ede2bf505b2fc96d896ebb3881c31b08b8d425db4dfea240988b5110b652
|
3 |
+
size 4293
|
runs/May18_19-01-20_molly-dl/1684461685.2734933/events.out.tfevents.1684461685.molly-dl.445636.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19e61d7413a3d0cea1e31e931255c63429d49890eb8dda8e497dee6612eeeebe
|
3 |
+
size 5473
|
runs/May18_19-01-20_molly-dl/events.out.tfevents.1684461685.molly-dl.445636.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:186dd8360b90d0dfee14e84b6d1e84ec679bdcf2f0445bf470ca368dc1d6f1b1
|
3 |
+
size 40
|
runs/May18_19-02-15_molly-dl/1684461740.4800537/events.out.tfevents.1684461740.molly-dl.450457.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a92d9c33c5f7813b2ca725c4d4074bbfabf7fe7c8240e49d26e0818c7f00ca9c
|
3 |
+
size 5473
|
runs/May18_19-02-15_molly-dl/events.out.tfevents.1684461740.molly-dl.450457.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9062b87547024f541025efb4b404b16216f0da8bd3d656dfc1a5c7f5a87c5eb
|
3 |
+
size 40
|
runs/May18_19-04-12_molly-dl/1684461857.993086/events.out.tfevents.1684461857.molly-dl.450711.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0317a1075c1ab8bcf63d252afdb56f889d95110ab748239b44a121ddaa933489
|
3 |
+
size 5473
|
runs/May18_19-04-12_molly-dl/events.out.tfevents.1684461857.molly-dl.450711.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12fe16347584dc63fff066994dfa68db70629b777fcf50cccf0df2b93f81a981
|
3 |
+
size 40
|
runs/May18_19-06-27_molly-dl/1684461992.6714196/events.out.tfevents.1684461992.molly-dl.450962.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7dab91465892794aa19107eb6c3d0526498df3e2b13a2201f5ca4978f7df39ac
|
3 |
+
size 5473
|
runs/May18_19-06-27_molly-dl/events.out.tfevents.1684461992.molly-dl.450962.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f35bac49ce1d030f36b396c739bb64e38f509727eefd945e14b8c1971f5410d9
|
3 |
+
size 40
|
runs/May18_19-07-20_molly-dl/1684462045.1422544/events.out.tfevents.1684462045.molly-dl.451147.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5e6e59f8e31a643b5382063a542dbc2f4a111e742477a06b1b2e68a5f12b331
|
3 |
+
size 5473
|
runs/May18_19-07-20_molly-dl/events.out.tfevents.1684462045.molly-dl.451147.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d28a84d86ac8ceb918fbfa323d755d2c9e192a61ed6f91aadb733a597c554df
|
3 |
+
size 40
|
runs/May18_19-08-21_molly-dl/1684462105.7766871/events.out.tfevents.1684462105.molly-dl.451339.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e82383c1e31e22f71f4a62a6eefc25dad770b9e84ebc171181f927e4b61ba8d8
|
3 |
+
size 5473
|
runs/May18_19-08-21_molly-dl/events.out.tfevents.1684462105.molly-dl.451339.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca710ba8955be50840f93d3742efecb1fcee0e1ef3ba59c2a3520f3e9f99823a
|
3 |
+
size 40
|
runs/May18_19-09-07_molly-dl/1684462152.2975395/events.out.tfevents.1684462152.molly-dl.451518.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:572edecd48661c8323b1f1ad043d9dc448fbd106a800e570aa5c26b0b9d952a4
|
3 |
+
size 5473
|
runs/May18_19-09-07_molly-dl/events.out.tfevents.1684462152.molly-dl.451518.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:657c35cf8e4e7a2c96b628e312408a96b0b34bf9863462ebaf6d41c281a2ca82
|
3 |
+
size 40
|
runs/May18_19-09-58_molly-dl/1684462202.481355/events.out.tfevents.1684462202.molly-dl.451702.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3564a04154c442420f18462fe3ea682e414591cea89682d7fce7f5474523c352
|
3 |
+
size 5473
|
runs/May18_19-09-58_molly-dl/events.out.tfevents.1684462202.molly-dl.451702.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b65bd10d85dae087b3b1a66a574755cbb8834b45a2dc55d8357d01a38e9a6202
|
3 |
+
size 3946
|
runs/May18_20-11-45_molly-dl/1684465909.682996/events.out.tfevents.1684465909.molly-dl.454431.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e0bd0ecd72e8b426083a9edecbad4e4f2de154b0f56cc977929a7f75251c84a
|
3 |
+
size 5473
|
runs/May18_20-11-45_molly-dl/events.out.tfevents.1684465909.molly-dl.454431.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa7b6862056d16ed8e18fbc0600a8a388507f4571674b1ee8f67c6ca5570f0f3
|
3 |
+
size 6037
|
special_tokens_map.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": "<|endoftext|>",
|
3 |
+
"eos_token": "<|endoftext|>",
|
4 |
+
"pad_token": "<|endoftext|>",
|
5 |
+
"unk_token": "<|endoftext|>"
|
6 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_prefix_space": false,
|
3 |
+
"bos_token": "<|endoftext|>",
|
4 |
+
"eos_token": "<|endoftext|>",
|
5 |
+
"model_max_length": 1024,
|
6 |
+
"name_or_path": "huggingface-course/code-search-net-tokenizer",
|
7 |
+
"special_tokens_map_file": null,
|
8 |
+
"tokenizer_class": "GPT2Tokenizer",
|
9 |
+
"unk_token": "<|endoftext|>"
|
10 |
+
}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73042d6b54b294a74b197ad7d304fde51a509a27d0c1ca8d27861a9677096304
|
3 |
+
size 3375
|
vocab.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|