Xmm
/

led-large-16384-cnn_dailymail

@@ -4,9 +4,24 @@ tags:
 - generated_from_trainer
 datasets:
 - cnn_dailymail
 model-index:
 - name: led-large-16384-cnn_dailymail
-  results: []
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -15,6 +30,12 @@ should probably proofread and complete it, then remove this comment. -->
 # led-large-16384-cnn_dailymail
 This model is a fine-tuned version of [allenai/led-base-16384](https://huggingface.co/allenai/led-base-16384) on the cnn_dailymail dataset.
 ## Model description
@@ -43,6 +64,24 @@ The following hyperparameters were used during training:
 - lr_scheduler_type: linear
 - num_epochs: 5
 ### Framework versions
 - Transformers 4.30.2

 - generated_from_trainer
 datasets:
 - cnn_dailymail
+metrics:
+- rouge
 model-index:
 - name: led-large-16384-cnn_dailymail
+  results:
+  - task:
+      name: Sequence-to-sequence Language Modeling
+      type: text2text-generation
+    dataset:
+      name: cnn_dailymail
+      type: cnn_dailymail
+      config: 3.0.0
+      split: test
+      args: 3.0.0
+    metrics:
+    - name: Rouge1
+      type: rouge
+      value: 0.3724824193877514
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You should probably proofread and complete it, then remove this comment. -->
 # led-large-16384-cnn_dailymail
 This model is a fine-tuned version of [allenai/led-base-16384](https://huggingface.co/allenai/led-base-16384) on the cnn_dailymail dataset.
+It achieves the following results on the evaluation set:
+- Loss: 1.9320
+- Rouge1: 0.3725
+- Rouge2: 0.1570
+- Rougel: 0.2429
+- Rougelsum: 0.3515
 ## Model description
 - lr_scheduler_type: linear
 - num_epochs: 5
+### Training results
+| Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum |
+|:-------------:|:-----:|:----:|:---------------:|:------:|:------:|:------:|:---------:|
+| 1.9531        | 0.4   | 500  | 1.8639          | 0.3485 | 0.1441 | 0.2275 | 0.3288    |
+| 1.9563        | 0.8   | 1000 | 1.8260          | 0.3538 | 0.1482 | 0.2315 | 0.3343    |
+| 1.7176        | 1.2   | 1500 | 1.8208          | 0.3628 | 0.1527 | 0.2383 | 0.3433    |
+| 1.7197        | 1.6   | 2000 | 1.8162          | 0.3696 | 0.1602 | 0.2434 | 0.3486    |
+| 1.8086        | 2.0   | 2500 | 1.7924          | 0.3558 | 0.1533 | 0.2334 | 0.3361    |
+| 1.2448        | 2.4   | 3000 | 1.8510          | 0.3703 | 0.1591 | 0.2447 | 0.3483    |
+| 1.3574        | 2.8   | 3500 | 1.8277          | 0.3741 | 0.1593 | 0.2422 | 0.3540    |
+| 1.0966        | 3.2   | 4000 | 1.8924          | 0.3682 | 0.1576 | 0.2424 | 0.3479    |
+| 0.9938        | 3.6   | 4500 | 1.8957          | 0.3723 | 0.1599 | 0.2451 | 0.3511    |
+| 1.0735        | 4.0   | 5000 | 1.8772          | 0.3653 | 0.1557 | 0.2399 | 0.3454    |
+| 0.9106        | 4.4   | 5500 | 1.9401          | 0.3720 | 0.1585 | 0.2436 | 0.3504    |
+| 1.015         | 4.8   | 6000 | 1.9320          | 0.3725 | 0.1570 | 0.2429 | 0.3515    |
 ### Framework versions
 - Transformers 4.30.2

generation_config.json CHANGED Viewed

@@ -8,6 +8,5 @@
   "min_length": 100,
   "no_repeat_ngram_size": 3,
   "pad_token_id": 1,
-  "transformers_version": "4.30.2",
-  "use_cache": false
 }

   "min_length": 100,
   "no_repeat_ngram_size": 3,
   "pad_token_id": 1,
+  "transformers_version": "4.30.2"
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:447e50f6b82e594486846219840ae65e68b4139d6c8dc692913cfb73e2695953
 size 647680813

 version https://git-lfs.github.com/spec/v1
+oid sha256:6edc4670ad32c8860fad7714a846e58bf71716b59c3722835cc4d6839af6aad8
 size 647680813