Training in progress, step 500
Browse files- config.json +31 -0
- model.safetensors +3 -0
- runs/Nov03_00-43-35_cd4dc85877da/events.out.tfevents.1698972222.cd4dc85877da.180.0 +3 -0
- runs/Nov03_00-45-56_cd4dc85877da/events.out.tfevents.1698972362.cd4dc85877da.180.1 +3 -0
- runs/Nov03_00-50-05_cd4dc85877da/events.out.tfevents.1698972616.cd4dc85877da.180.2 +3 -0
- runs/Nov03_00-54-06_cd4dc85877da/events.out.tfevents.1698972852.cd4dc85877da.180.3 +3 -0
- runs/Nov03_01-02-11_cd4dc85877da/events.out.tfevents.1698973337.cd4dc85877da.11422.0 +3 -0
- runs/Nov03_01-07-50_cd4dc85877da/events.out.tfevents.1698973679.cd4dc85877da.12957.0 +3 -0
- runs/Nov03_01-34-17_cd4dc85877da/events.out.tfevents.1698975261.cd4dc85877da.12957.1 +3 -0
- runs/Nov03_01-37-30_cd4dc85877da/events.out.tfevents.1698975457.cd4dc85877da.20433.0 +3 -0
- runs/Nov03_01-44-38_cd4dc85877da/events.out.tfevents.1698975885.cd4dc85877da.22555.0 +3 -0
- training_args.bin +3 -0
config.json
ADDED
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "facebook/opt-125m",
|
3 |
+
"_remove_final_layer_norm": false,
|
4 |
+
"activation_dropout": 0.0,
|
5 |
+
"activation_function": "relu",
|
6 |
+
"architectures": [
|
7 |
+
"OPTForCausalLM"
|
8 |
+
],
|
9 |
+
"attention_dropout": 0.0,
|
10 |
+
"bos_token_id": 2,
|
11 |
+
"do_layer_norm_before": true,
|
12 |
+
"dropout": 0.1,
|
13 |
+
"enable_bias": true,
|
14 |
+
"eos_token_id": 2,
|
15 |
+
"ffn_dim": 3072,
|
16 |
+
"hidden_size": 768,
|
17 |
+
"init_std": 0.02,
|
18 |
+
"layer_norm_elementwise_affine": true,
|
19 |
+
"layerdrop": 0.0,
|
20 |
+
"max_position_embeddings": 2048,
|
21 |
+
"model_type": "opt",
|
22 |
+
"num_attention_heads": 12,
|
23 |
+
"num_hidden_layers": 12,
|
24 |
+
"pad_token_id": 1,
|
25 |
+
"prefix": "</s>",
|
26 |
+
"torch_dtype": "float32",
|
27 |
+
"transformers_version": "4.35.0",
|
28 |
+
"use_cache": true,
|
29 |
+
"vocab_size": 50272,
|
30 |
+
"word_embed_proj_dim": 768
|
31 |
+
}
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:743031bd5648f9c2832ee8ce1100f25c23fe1ae3b581048c169bc40653938ea4
|
3 |
+
size 500979600
|
runs/Nov03_00-43-35_cd4dc85877da/events.out.tfevents.1698972222.cd4dc85877da.180.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9a6654cee75c8fcca7acdb363c7d4ceaf52f1fcdba095c9267b785b1a218a40
|
3 |
+
size 4350
|
runs/Nov03_00-45-56_cd4dc85877da/events.out.tfevents.1698972362.cd4dc85877da.180.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8dee985829033a7ba94205be1495c54e6a87f753706b4532252d4b0c236a26d
|
3 |
+
size 4350
|
runs/Nov03_00-50-05_cd4dc85877da/events.out.tfevents.1698972616.cd4dc85877da.180.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f9b14b2cc305ae55a19e8508fef59154c556454ff340a4bb3ce379af836a29d
|
3 |
+
size 4350
|
runs/Nov03_00-54-06_cd4dc85877da/events.out.tfevents.1698972852.cd4dc85877da.180.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af6d6394236e7e65e1ac673b02207cceee0669ba8a69981bf6bfcbc0acec5583
|
3 |
+
size 4350
|
runs/Nov03_01-02-11_cd4dc85877da/events.out.tfevents.1698973337.cd4dc85877da.11422.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d802f16cfa079c51662ad258109685c1428ebc7236486e017acc25826334f7be
|
3 |
+
size 4350
|
runs/Nov03_01-07-50_cd4dc85877da/events.out.tfevents.1698973679.cd4dc85877da.12957.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eef9d695f2d926c0b3d221e31dc8b8139a16c404bd18eaa351ef19bcd64595fd
|
3 |
+
size 4350
|
runs/Nov03_01-34-17_cd4dc85877da/events.out.tfevents.1698975261.cd4dc85877da.12957.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bdad6a6d04a24c08f8c487b619f160f7aa9d5c1278315e076bf7188431fc8143
|
3 |
+
size 4184
|
runs/Nov03_01-37-30_cd4dc85877da/events.out.tfevents.1698975457.cd4dc85877da.20433.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8af754437dd17c4cde64230ee6a5308be5e2b2ad5f338127ebbb19cbcabdf1ff
|
3 |
+
size 4350
|
runs/Nov03_01-44-38_cd4dc85877da/events.out.tfevents.1698975885.cd4dc85877da.22555.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6164e75aebc766f6721cd9e52e88f929ef0e0289991767ab2dd2070eeb936778
|
3 |
+
size 4507
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac81429579793b8a566f442c775a7961f63636e0ac785121b7d672b94927e515
|
3 |
+
size 4600
|