stochastic's picture
Training in progress, epoch 1
3f610ee
raw
history blame
2.43 kB
{
"_name_or_path": "google/vit-base-patch16-224-in21k",
"architectures": [
"ViTForImageClassification"
],
"attention_probs_dropout_prob": 0.0,
"encoder_stride": 16,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.0,
"hidden_size": 768,
"id2label": {
"0": "SK",
"1": "HK",
"10": "KR",
"11": "SI",
"12": "BD",
"13": "PE",
"14": "US",
"15": "AU",
"16": "ZA",
"17": "LT",
"18": "FI",
"19": "KH",
"2": "JP",
"20": "SE",
"21": "MY",
"22": "HU",
"23": "CH",
"24": "CO",
"25": "IL",
"26": "IS",
"27": "UA",
"28": "TW",
"29": "PL",
"3": "GB",
"30": "ES",
"31": "CL",
"32": "BW",
"33": "RU",
"34": "LV",
"35": "NL",
"36": "BE",
"37": "AD",
"38": "BT",
"39": "AR",
"4": "IE",
"40": "NO",
"41": "GR",
"42": "IT",
"43": "HR",
"44": "ID",
"45": "SZ",
"46": "CZ",
"47": "AE",
"48": "EE",
"49": "TH",
"5": "FR",
"50": "MX",
"51": "DE",
"52": "BR",
"53": "DK",
"54": "RO",
"55": "PT",
"6": "CA",
"7": "BG",
"8": "SG",
"9": "NZ"
},
"image_size": 224,
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"AD": "37",
"AE": "47",
"AR": "39",
"AU": "15",
"BD": "12",
"BE": "36",
"BG": "7",
"BR": "52",
"BT": "38",
"BW": "32",
"CA": "6",
"CH": "23",
"CL": "31",
"CO": "24",
"CZ": "46",
"DE": "51",
"DK": "53",
"EE": "48",
"ES": "30",
"FI": "18",
"FR": "5",
"GB": "3",
"GR": "41",
"HK": "1",
"HR": "43",
"HU": "22",
"ID": "44",
"IE": "4",
"IL": "25",
"IS": "26",
"IT": "42",
"JP": "2",
"KH": "19",
"KR": "10",
"LT": "17",
"LV": "34",
"MX": "50",
"MY": "21",
"NL": "35",
"NO": "40",
"NZ": "9",
"PE": "13",
"PL": "29",
"PT": "55",
"RO": "54",
"RU": "33",
"SE": "20",
"SG": "8",
"SI": "11",
"SK": "0",
"SZ": "45",
"TH": "49",
"TW": "28",
"UA": "27",
"US": "14",
"ZA": "16"
},
"layer_norm_eps": 1e-12,
"model_type": "vit",
"num_attention_heads": 12,
"num_channels": 3,
"num_hidden_layers": 12,
"patch_size": 16,
"problem_type": "single_label_classification",
"qkv_bias": true,
"torch_dtype": "float32",
"transformers_version": "4.21.2"
}