ekohrt committed on
Commit
fbfb6a8
·
1 Parent(s): 871dfaf

add model weights and config

Browse files
config.json ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilbert-base-uncased",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertForSequenceClassification"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "hidden_dim": 3072,
11
+ "id2label": {
12
+ "0": "correlation",
13
+ "1": "causal_explanation",
14
+ "2": "boolean_and",
15
+ "3": "mode",
16
+ "4": "superlative",
17
+ "5": "opinion",
18
+ "6": "set_difference",
19
+ "7": "set_retrieval",
20
+ "8": "datetime_retrieval",
21
+ "9": "datetime_comparison",
22
+ "10": "median",
23
+ "11": "definitional",
24
+ "12": "boolean_retrieval",
25
+ "13": "qualitative_property_retrieval",
26
+ "14": "qualitative_property_multihop_retrieval",
27
+ "15": "range",
28
+ "16": "numeric_comparison",
29
+ "17": "numeric_retrieval",
30
+ "18": "arithmetic",
31
+ "19": "mathematical_comparison",
32
+ "20": "set_property_satisfaction",
33
+ "21": "counting",
34
+ "22": "average",
35
+ "23": "set_intersection",
36
+ "24": "qualitative_comparison",
37
+ "25": "standard_deviation",
38
+ "26": "set_union",
39
+ "27": "boolean_or"
40
+ },
41
+ "initializer_range": 0.02,
42
+ "label2id": {
43
+ "arithmetic": 18,
44
+ "average": 22,
45
+ "boolean_and": 2,
46
+ "boolean_or": 27,
47
+ "boolean_retrieval": 12,
48
+ "causal_explanation": 1,
49
+ "correlation": 0,
50
+ "counting": 21,
51
+ "datetime_comparison": 9,
52
+ "datetime_retrieval": 8,
53
+ "definitional": 11,
54
+ "mathematical_comparison": 19,
55
+ "median": 10,
56
+ "mode": 3,
57
+ "numeric_comparison": 16,
58
+ "numeric_retrieval": 17,
59
+ "opinion": 5,
60
+ "qualitative_comparison": 24,
61
+ "qualitative_property_multihop_retrieval": 14,
62
+ "qualitative_property_retrieval": 13,
63
+ "range": 15,
64
+ "set_difference": 6,
65
+ "set_intersection": 23,
66
+ "set_property_satisfaction": 20,
67
+ "set_retrieval": 7,
68
+ "set_union": 26,
69
+ "standard_deviation": 25,
70
+ "superlative": 4
71
+ },
72
+ "max_position_embeddings": 512,
73
+ "model_type": "distilbert",
74
+ "n_heads": 12,
75
+ "n_layers": 6,
76
+ "pad_token_id": 0,
77
+ "problem_type": "single_label_classification",
78
+ "qa_dropout": 0.1,
79
+ "seq_classif_dropout": 0.2,
80
+ "sinusoidal_pos_embds": false,
81
+ "tie_weights_": true,
82
+ "torch_dtype": "float32",
83
+ "transformers_version": "4.17.0",
84
+ "vocab_size": 30522
85
+ }
pretrained_model/config.json DELETED
@@ -1,85 +0,0 @@
1
- {
2
- "_name_or_path": "distilbert-base-uncased",
3
- "activation": "gelu",
4
- "architectures": [
5
- "DistilBertForSequenceClassification"
6
- ],
7
- "attention_dropout": 0.1,
8
- "dim": 768,
9
- "dropout": 0.1,
10
- "hidden_dim": 3072,
11
- "id2label": {
12
- "0": "LABEL_0",
13
- "1": "LABEL_1",
14
- "2": "LABEL_2",
15
- "3": "LABEL_3",
16
- "4": "LABEL_4",
17
- "5": "LABEL_5",
18
- "6": "LABEL_6",
19
- "7": "LABEL_7",
20
- "8": "LABEL_8",
21
- "9": "LABEL_9",
22
- "10": "LABEL_10",
23
- "11": "LABEL_11",
24
- "12": "LABEL_12",
25
- "13": "LABEL_13",
26
- "14": "LABEL_14",
27
- "15": "LABEL_15",
28
- "16": "LABEL_16",
29
- "17": "LABEL_17",
30
- "18": "LABEL_18",
31
- "19": "LABEL_19",
32
- "20": "LABEL_20",
33
- "21": "LABEL_21",
34
- "22": "LABEL_22",
35
- "23": "LABEL_23",
36
- "24": "LABEL_24",
37
- "25": "LABEL_25",
38
- "26": "LABEL_26",
39
- "27": "LABEL_27"
40
- },
41
- "initializer_range": 0.02,
42
- "label2id": {
43
- "LABEL_0": 0,
44
- "LABEL_1": 1,
45
- "LABEL_10": 10,
46
- "LABEL_11": 11,
47
- "LABEL_12": 12,
48
- "LABEL_13": 13,
49
- "LABEL_14": 14,
50
- "LABEL_15": 15,
51
- "LABEL_16": 16,
52
- "LABEL_17": 17,
53
- "LABEL_18": 18,
54
- "LABEL_19": 19,
55
- "LABEL_2": 2,
56
- "LABEL_20": 20,
57
- "LABEL_21": 21,
58
- "LABEL_22": 22,
59
- "LABEL_23": 23,
60
- "LABEL_24": 24,
61
- "LABEL_25": 25,
62
- "LABEL_26": 26,
63
- "LABEL_27": 27,
64
- "LABEL_3": 3,
65
- "LABEL_4": 4,
66
- "LABEL_5": 5,
67
- "LABEL_6": 6,
68
- "LABEL_7": 7,
69
- "LABEL_8": 8,
70
- "LABEL_9": 9
71
- },
72
- "max_position_embeddings": 512,
73
- "model_type": "distilbert",
74
- "n_heads": 12,
75
- "n_layers": 6,
76
- "pad_token_id": 0,
77
- "problem_type": "single_label_classification",
78
- "qa_dropout": 0.1,
79
- "seq_classif_dropout": 0.2,
80
- "sinusoidal_pos_embds": false,
81
- "tie_weights_": true,
82
- "torch_dtype": "float32",
83
- "transformers_version": "4.17.0",
84
- "vocab_size": 30522
85
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
pretrained_model/pytorch_model.bin → pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8537e381cc4d36e9bdb0a8ccc710ae45663c7c98193b8db1297c0c4a5b2aa05a
3
  size 267940465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32b323f57d8047ec8a5c413b6c25ec482cecf2930884adf0a52c366001d4564a
3
  size 267940465