Herocat committed on
Commit
1ac5a3c
·
1 Parent(s): f09b6ea

Training in progress, step 500

Browse files
config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "facebook/opt-125m",
3
+ "_remove_final_layer_norm": false,
4
+ "activation_dropout": 0.0,
5
+ "activation_function": "relu",
6
+ "architectures": [
7
+ "OPTForCausalLM"
8
+ ],
9
+ "attention_dropout": 0.0,
10
+ "bos_token_id": 2,
11
+ "do_layer_norm_before": true,
12
+ "dropout": 0.1,
13
+ "enable_bias": true,
14
+ "eos_token_id": 2,
15
+ "ffn_dim": 3072,
16
+ "hidden_size": 768,
17
+ "init_std": 0.02,
18
+ "layer_norm_elementwise_affine": true,
19
+ "layerdrop": 0.0,
20
+ "max_position_embeddings": 2048,
21
+ "model_type": "opt",
22
+ "num_attention_heads": 12,
23
+ "num_hidden_layers": 12,
24
+ "pad_token_id": 1,
25
+ "prefix": "</s>",
26
+ "torch_dtype": "float32",
27
+ "transformers_version": "4.35.0",
28
+ "use_cache": true,
29
+ "vocab_size": 50272,
30
+ "word_embed_proj_dim": 768
31
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:743031bd5648f9c2832ee8ce1100f25c23fe1ae3b581048c169bc40653938ea4
3
+ size 500979600
runs/Nov03_00-43-35_cd4dc85877da/events.out.tfevents.1698972222.cd4dc85877da.180.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9a6654cee75c8fcca7acdb363c7d4ceaf52f1fcdba095c9267b785b1a218a40
3
+ size 4350
runs/Nov03_00-45-56_cd4dc85877da/events.out.tfevents.1698972362.cd4dc85877da.180.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8dee985829033a7ba94205be1495c54e6a87f753706b4532252d4b0c236a26d
3
+ size 4350
runs/Nov03_00-50-05_cd4dc85877da/events.out.tfevents.1698972616.cd4dc85877da.180.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f9b14b2cc305ae55a19e8508fef59154c556454ff340a4bb3ce379af836a29d
3
+ size 4350
runs/Nov03_00-54-06_cd4dc85877da/events.out.tfevents.1698972852.cd4dc85877da.180.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af6d6394236e7e65e1ac673b02207cceee0669ba8a69981bf6bfcbc0acec5583
3
+ size 4350
runs/Nov03_01-02-11_cd4dc85877da/events.out.tfevents.1698973337.cd4dc85877da.11422.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d802f16cfa079c51662ad258109685c1428ebc7236486e017acc25826334f7be
3
+ size 4350
runs/Nov03_01-07-50_cd4dc85877da/events.out.tfevents.1698973679.cd4dc85877da.12957.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eef9d695f2d926c0b3d221e31dc8b8139a16c404bd18eaa351ef19bcd64595fd
3
+ size 4350
runs/Nov03_01-34-17_cd4dc85877da/events.out.tfevents.1698975261.cd4dc85877da.12957.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdad6a6d04a24c08f8c487b619f160f7aa9d5c1278315e076bf7188431fc8143
3
+ size 4184
runs/Nov03_01-37-30_cd4dc85877da/events.out.tfevents.1698975457.cd4dc85877da.20433.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8af754437dd17c4cde64230ee6a5308be5e2b2ad5f338127ebbb19cbcabdf1ff
3
+ size 4350
runs/Nov03_01-44-38_cd4dc85877da/events.out.tfevents.1698975885.cd4dc85877da.22555.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6164e75aebc766f6721cd9e52e88f929ef0e0289991767ab2dd2070eeb936778
3
+ size 4507
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac81429579793b8a566f442c775a7961f63636e0ac785121b7d672b94927e515
3
+ size 4600