tm21cy committed on
Commit
05ed9ef
·
verified ·
1 Parent(s): 5ec4d2a

Training in progress, step 500

Browse files
config.json CHANGED
@@ -1,27 +1,50 @@
1
  {
2
- "_name_or_path": "bert-base-uncased",
3
  "architectures": [
4
- "BertForSequenceClassification"
5
  ],
6
- "attention_probs_dropout_prob": 0.1,
7
- "classifier_dropout": null,
8
- "gradient_checkpointing": false,
9
- "hidden_act": "gelu",
10
- "hidden_dropout_prob": 0.1,
 
 
 
 
11
  "hidden_size": 768,
 
 
 
 
 
 
 
 
12
  "initializer_range": 0.02,
 
13
  "intermediate_size": 3072,
 
 
 
 
 
 
 
 
14
  "layer_norm_eps": 1e-12,
15
  "max_position_embeddings": 512,
16
- "model_type": "bert",
 
17
  "num_attention_heads": 12,
 
18
  "num_hidden_layers": 12,
 
19
  "pad_token_id": 0,
20
  "position_embedding_type": "absolute",
21
  "problem_type": "single_label_classification",
22
  "torch_dtype": "float32",
23
  "transformers_version": "4.38.2",
24
  "type_vocab_size": 2,
25
- "use_cache": true,
26
- "vocab_size": 30522
27
  }
 
1
  {
2
+ "_name_or_path": "albert-base-v2",
3
  "architectures": [
4
+ "AlbertForSequenceClassification"
5
  ],
6
+ "attention_probs_dropout_prob": 0,
7
+ "bos_token_id": 2,
8
+ "classifier_dropout_prob": 0.1,
9
+ "down_scale_factor": 1,
10
+ "embedding_size": 128,
11
+ "eos_token_id": 3,
12
+ "gap_size": 0,
13
+ "hidden_act": "gelu_new",
14
+ "hidden_dropout_prob": 0,
15
  "hidden_size": 768,
16
+ "id2label": {
17
+ "0": "LABEL_0",
18
+ "1": "LABEL_1",
19
+ "2": "LABEL_2",
20
+ "3": "LABEL_3",
21
+ "4": "LABEL_4",
22
+ "5": "LABEL_5"
23
+ },
24
  "initializer_range": 0.02,
25
+ "inner_group_num": 1,
26
  "intermediate_size": 3072,
27
+ "label2id": {
28
+ "LABEL_0": 0,
29
+ "LABEL_1": 1,
30
+ "LABEL_2": 2,
31
+ "LABEL_3": 3,
32
+ "LABEL_4": 4,
33
+ "LABEL_5": 5
34
+ },
35
  "layer_norm_eps": 1e-12,
36
  "max_position_embeddings": 512,
37
+ "model_type": "albert",
38
+ "net_structure_type": 0,
39
  "num_attention_heads": 12,
40
+ "num_hidden_groups": 1,
41
  "num_hidden_layers": 12,
42
+ "num_memory_blocks": 0,
43
  "pad_token_id": 0,
44
  "position_embedding_type": "absolute",
45
  "problem_type": "single_label_classification",
46
  "torch_dtype": "float32",
47
  "transformers_version": "4.38.2",
48
  "type_vocab_size": 2,
49
+ "vocab_size": 30000
 
50
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8f17c71dd49cec310a5b2255e6b38707197411daca82c3bfef08befb8d318668
3
- size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52c245304e83aee3ce4b087797393147ee7781cc59432e34ce7c452e555871dd
3
+ size 46756216
runs/Mar11_02-17-04_ebad219a5e6d/events.out.tfevents.1710123443.ebad219a5e6d.2185.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ef3cc0b274be9ab556cd8ed82ee7e319893c48cff491bc5153a3f5f015155b0
3
+ size 5527
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:112da97fdd0597e69cd1ea2408bcdf4be1810c253eaa73d63864d4320a2349bf
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba4bbca5104c96f3eae07ce3d8729ffd7a2b1a0217fd343ee805bf0bda4cc182
3
  size 4920