Training in progress, step 500

Files changed (6) hide show

config.json CHANGED Viewed

@@ -2,17 +2,12 @@
   "_name_or_path": "HooshvareLab/distilbert-fa-zwnj-base",
   "activation": "gelu",
   "architectures": [
-    "BertForTokenClassification"
   ],
   "attention_dropout": 0.1,
-  "attention_probs_dropout_prob": 0.1,
-  "classifier_dropout": null,
   "dim": 768,
   "dropout": 0.1,
-  "hidden_act": "gelu",
   "hidden_dim": 3072,
-  "hidden_dropout_prob": 0.1,
-  "hidden_size": 768,
   "id2label": {
     "0": "O",
     "1": "B-DAT",
@@ -37,7 +32,6 @@
     "20": "I-TIM"
   },
   "initializer_range": 0.02,
-  "intermediate_size": 3072,
   "label2id": {
     "B-DAT": 1,
     "B-EVE": 3,
@@ -61,23 +55,17 @@
     "I-TIM": 20,
     "O": 0
   },
-  "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
-  "model_type": "bert",
   "n_heads": 12,
   "n_layers": 6,
-  "num_attention_heads": 12,
-  "num_hidden_layers": 12,
   "output_past": true,
   "pad_token_id": 0,
-  "position_embedding_type": "absolute",
   "qa_dropout": 0.1,
   "seq_classif_dropout": 0.2,
   "sinusoidal_pos_embds": false,
   "tie_weights_": true,
   "torch_dtype": "float32",
   "transformers_version": "4.21.2",
-  "type_vocab_size": 2,
-  "use_cache": true,
   "vocab_size": 42000
 }

   "_name_or_path": "HooshvareLab/distilbert-fa-zwnj-base",
   "activation": "gelu",
   "architectures": [
+    "DistilBertForTokenClassification"
   ],
   "attention_dropout": 0.1,
   "dim": 768,
   "dropout": 0.1,
   "hidden_dim": 3072,
   "id2label": {
     "0": "O",
     "1": "B-DAT",
     "20": "I-TIM"
   },
   "initializer_range": 0.02,
   "label2id": {
     "B-DAT": 1,
     "B-EVE": 3,
     "I-TIM": 20,
     "O": 0
   },
   "max_position_embeddings": 512,
+  "model_type": "distilbert",
   "n_heads": 12,
   "n_layers": 6,
   "output_past": true,
   "pad_token_id": 0,
   "qa_dropout": 0.1,
   "seq_classif_dropout": 0.2,
   "sinusoidal_pos_embds": false,
   "tie_weights_": true,
   "torch_dtype": "float32",
   "transformers_version": "4.21.2",
   "vocab_size": 42000
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3050e769fbc091222d642cd1655f6ac9f67d68147ab0723929e347b36693613a
-size 470962033

 version https://git-lfs.github.com/spec/v1
+oid sha256:08c698b7122d80715ba4f59f06542d3fd744ef37722489c9083475d67c3e151c
+size 300810165

runs/Sep03_01-14-34_330500caa281/1662167876.3330314/events.out.tfevents.1662167876.330500caa281.70.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:5137e7da004cb45023726c417725539fe0d68d80478765b7c45aa4195f0afb1c
+size 5472

runs/Sep03_01-14-34_330500caa281/events.out.tfevents.1662167876.330500caa281.70.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:25131c33e10214dc90e5fae01d5ae444ac6d481abde86e2b3e83afd141d3e710
+size 4136

tokenizer.json CHANGED Viewed

@@ -1,6 +1,11 @@
 {
   "version": "1.0",
-  "truncation": null,
   "padding": null,
   "added_tokens": [
     {

 {
   "version": "1.0",
+  "truncation": {
+    "direction": "Right",
+    "max_length": 512,
+    "strategy": "LongestFirst",
+    "stride": 0
+  },
   "padding": null,
   "added_tokens": [
     {

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:40da26b2ebfe93efae0fcf147d289e0404ea51cf1947b0e2cfb2a9c5ba8bd99c
 size 3375

 version https://git-lfs.github.com/spec/v1
+oid sha256:6ff19d2172b2b834a2fa8c121f158c3ff46938c64ed0e9917814bc4b8efe7d8e
 size 3375