End of training

Files changed (7)

README.md CHANGED Viewed

@@ -1,4 +1,6 @@
 ---
 tags:
 - generated_from_trainer
 datasets:
@@ -13,9 +15,9 @@ should probably proofread and complete it, then remove this comment. -->
 # dialogue_Summary
-This model was trained from scratch on the samsum dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.1356
 ## Model description
@@ -46,7 +48,7 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
-| 0.08          | 1.0   | 148  | 0.1356          |
 ### Framework versions

 ---
+license: mit
+base_model: facebook/bart-large-cnn
 tags:
 - generated_from_trainer
 datasets:
 # dialogue_Summary
+This model is a fine-tuned version of [facebook/bart-large-cnn](https://huggingface.co/facebook/bart-large-cnn) on the samsum dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.1338
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
+| 0.0825        | 1.0   | 148  | 0.1338          |
 ### Framework versions

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "./bart-cnn-samsum-finetuned/tuned_model_1697080968.4021988",
   "_num_labels": 3,
   "activation_dropout": 0.0,
   "activation_function": "gelu",

 {
+  "_name_or_path": "facebook/bart-large-cnn",
   "_num_labels": 3,
   "activation_dropout": 0.0,
   "activation_function": "gelu",

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:15ae918b67473f15b3efaf3d7c9330ca455203d04198a2dfbde3779c4e490e69
 size 1625537293

 version https://git-lfs.github.com/spec/v1
+oid sha256:374eb589c3e85134ab5e5f1d29af77eead992d5bbeff35a0da0d068a4a9cb191
 size 1625537293

special_tokens_map.json CHANGED Viewed

@@ -1,11 +1,4 @@
 {
-  "additional_special_tokens": [
-    "<s>",
-    "<pad>",
-    "</s>",
-    "<unk>",
-    "<mask>"
-  ],
   "bos_token": "<s>",
   "cls_token": "<s>",
   "eos_token": "</s>",

 {
   "bos_token": "<s>",
   "cls_token": "<s>",
   "eos_token": "</s>",

tokenizer.json CHANGED Viewed

@@ -1,7 +1,21 @@
 {
   "version": "1.0",
-  "truncation": null,
-  "padding": null,
   "added_tokens": [
     {
       "id": 0,

 {
   "version": "1.0",
+  "truncation": {
+    "direction": "Right",
+    "max_length": 1024,
+    "strategy": "LongestFirst",
+    "stride": 0
+  },
+  "padding": {
+    "strategy": {
+      "Fixed": 1024
+    },
+    "direction": "Right",
+    "pad_to_multiple_of": null,
+    "pad_id": 2,
+    "pad_type_id": 0,
+    "pad_token": "</s>"
+  },
   "added_tokens": [
     {
       "id": 0,

tokenizer_config.json CHANGED Viewed

@@ -42,30 +42,17 @@
       "special": true
     }
   },
-  "additional_special_tokens": [
-    "<s>",
-    "<pad>",
-    "</s>",
-    "<unk>",
-    "<mask>"
-  ],
   "bos_token": "<s>",
   "clean_up_tokenization_spaces": true,
   "cls_token": "<s>",
   "eos_token": "</s>",
   "errors": "replace",
   "mask_token": "<mask>",
-  "max_length": 1024,
   "model_max_length": 1024,
-  "pad_to_multiple_of": null,
   "pad_token": "</s>",
-  "pad_token_type_id": 0,
-  "padding_side": "right",
   "sep_token": "</s>",
-  "stride": 0,
   "tokenizer_class": "BartTokenizer",
   "trim_offsets": true,
-  "truncation_side": "right",
-  "truncation_strategy": "longest_first",
   "unk_token": "<unk>"
 }

       "special": true
     }
   },
+  "additional_special_tokens": [],
   "bos_token": "<s>",
   "clean_up_tokenization_spaces": true,
   "cls_token": "<s>",
   "eos_token": "</s>",
   "errors": "replace",
   "mask_token": "<mask>",
   "model_max_length": 1024,
   "pad_token": "</s>",
   "sep_token": "</s>",
   "tokenizer_class": "BartTokenizer",
   "trim_offsets": true,
   "unk_token": "<unk>"
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b95b6c2c8d77931c46b8fec94cce415934ad1469df2fc23fc22b87baa9be3c3
 size 4091

 version https://git-lfs.github.com/spec/v1
+oid sha256:45c3fe017c0c07b9bcaa75e1e79e0a8080d4cbfec70c94bb7cd0ffb0d9d7faf3
 size 4091