qcat / config.json
ekohrt's picture
add model weights and config
fbfb6a8
{
"_name_or_path": "distilbert-base-uncased",
"activation": "gelu",
"architectures": [
"DistilBertForSequenceClassification"
],
"attention_dropout": 0.1,
"dim": 768,
"dropout": 0.1,
"hidden_dim": 3072,
"id2label": {
"0": "correlation",
"1": "causal_explanation",
"2": "boolean_and",
"3": "mode",
"4": "superlative",
"5": "opinion",
"6": "set_difference",
"7": "set_retrieval",
"8": "datetime_retrieval",
"9": "datetime_comparison",
"10": "median",
"11": "definitional",
"12": "boolean_retrieval",
"13": "qualitative_property_retrieval",
"14": "qualitative_property_multihop_retrieval",
"15": "range",
"16": "numeric_comparison",
"17": "numeric_retrieval",
"18": "arithmetic",
"19": "mathematical_comparison",
"20": "set_property_satisfaction",
"21": "counting",
"22": "average",
"23": "set_intersection",
"24": "qualitative_comparison",
"25": "standard_deviation",
"26": "set_union",
"27": "boolean_or"
},
"initializer_range": 0.02,
"label2id": {
"arithmetic": 18,
"average": 22,
"boolean_and": 2,
"boolean_or": 27,
"boolean_retrieval": 12,
"causal_explanation": 1,
"correlation": 0,
"counting": 21,
"datetime_comparison": 9,
"datetime_retrieval": 8,
"definitional": 11,
"mathematical_comparison": 19,
"median": 10,
"mode": 3,
"numeric_comparison": 16,
"numeric_retrieval": 17,
"opinion": 5,
"qualitative_comparison": 24,
"qualitative_property_multihop_retrieval": 14,
"qualitative_property_retrieval": 13,
"range": 15,
"set_difference": 6,
"set_intersection": 23,
"set_property_satisfaction": 20,
"set_retrieval": 7,
"set_union": 26,
"standard_deviation": 25,
"superlative": 4
},
"max_position_embeddings": 512,
"model_type": "distilbert",
"n_heads": 12,
"n_layers": 6,
"pad_token_id": 0,
"problem_type": "single_label_classification",
"qa_dropout": 0.1,
"seq_classif_dropout": 0.2,
"sinusoidal_pos_embds": false,
"tie_weights_": true,
"torch_dtype": "float32",
"transformers_version": "4.17.0",
"vocab_size": 30522
}