Spaces:

charlesapochi
/

plagiarism-detection-llm

Running

App Files Files Community

charlesapochi committed on Sep 26, 2024

Commit

56c1c60

1 Parent(s): 37ab146

initial commit

Browse files

Files changed (8) hide show

README.md +3 -12
__pycache__/app.cpython-310.pyc +0 -0
app.py +5 -2
components/__pycache__/utils.cpython-310.pyc +0 -0
components/utils.py +12 -0
experiments/results/detailed_results.json +0 -0
experiments/results/summary_metrics.json +124 -0
experiments/watermark_experiment.ipynb +0 -0

README.md CHANGED Viewed

@@ -1,13 +1,4 @@
----
-title: Plagiarism Detection Llm
-emoji: 👁
-colorFrom: blue
-colorTo: red
-sdk: gradio
-sdk_version: 4.41.0
-app_file: app.py
-pinned: false
-license: apache-2.0
----
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference


1	+ To run the demo locally with Gradio: python app.py (Make sure to install all dependencies and packages)
2	+
3	+ To test the app on Hugging Face: https://huggingface.co/spaces/charlesapochi/plagiarism-detection-llm








4

__pycache__/app.cpython-310.pyc CHANGED Viewed

Binary files a/__pycache__/app.cpython-310.pyc and b/__pycache__/app.cpython-310.pyc differ

app.py CHANGED Viewed

@@ -83,9 +83,11 @@ def run_gradio(args, model=None, device=None, tokenizer=None):
         def update_algorithm(session_state, value):
             if value == "advance":
                 session_state.run_extended = True
             elif value == "basic":
                 session_state.run_extended = False
-            return session_state,
         algorithm.change(update_algorithm,inputs=[session_args, algorithm], outputs=[session_args])
@@ -227,7 +229,8 @@ def analyze(input_text, args, device=None, tokenizer=None):
     return output, args
 if __name__ == "__main__":
-    args = get_default_args()
     # args = process_args(args)
     input_text = get_default_prompt()
     args.default_prompt = input_text

         def update_algorithm(session_state, value):
             if value == "advance":
                 session_state.run_extended = True
+                # args.run_extended = True
             elif value == "basic":
                 session_state.run_extended = False
+                # args.run_extended = False
+            return session_state
         algorithm.change(update_algorithm,inputs=[session_args, algorithm], outputs=[session_args])
     return output, args
 if __name__ == "__main__":
+    args = parse_args()
+    # args = get_default_args()
     # args = process_args(args)
     input_text = get_default_prompt()
     args.default_prompt = input_text

components/__pycache__/utils.cpython-310.pyc CHANGED Viewed

Binary files a/components/__pycache__/utils.cpython-310.pyc and b/components/__pycache__/utils.cpython-310.pyc differ

components/utils.py CHANGED Viewed

@@ -187,6 +187,12 @@ def parse_args():
         default=False,
         help="Skip the model loading to debug the interface.",
     )
     parser.add_argument(
         "--seed_separately",
         type=str2bool,
@@ -199,6 +205,12 @@ def parse_args():
         default=False,
         help="Whether to run model in float16 precsion.",
     )
     args = parser.parse_args()
     return args

         default=False,
         help="Skip the model loading to debug the interface.",
     )
+    parser.add_argument(
+        "--ignore_repeated_ngrams",
+        type=str2bool,
+        default=False,
+        help="Ignore repeated ngrams.",
+    )
     parser.add_argument(
         "--seed_separately",
         type=str2bool,
         default=False,
         help="Whether to run model in float16 precsion.",
     )
+    parser.add_argument(
+        "--run_extended",
+        type=str2bool,
+        default=False,
+        help="Whether to run basic or advance algorithm.",
+    )
     args = parser.parse_args()
     return args

experiments/results/detailed_results.json ADDED Viewed

The diff for this file is too large to render. See raw diff

experiments/results/summary_metrics.json ADDED Viewed

	@@ -0,0 +1,124 @@

+{
+  "sst2": {
+    "train": {
+      "accuracy_without_watermark": 0.49,
+      "accuracy_with_watermark": 0.56,
+      "f1_without_watermark": 0.5714285714285714,
+      "f1_with_watermark": 0.56
+    },
+    "validation": {
+      "accuracy_without_watermark": 0.44,
+      "accuracy_with_watermark": 0.51,
+      "f1_without_watermark": 0.44,
+      "f1_with_watermark": 0.5882352941176471
+    }
+  },
+  "cola": {
+    "train": {
+      "matthews_corr_without_watermark": -0.09611547479941228,
+      "matthews_corr_with_watermark": 0.11224602755526586
+    },
+    "validation": {
+      "matthews_corr_without_watermark": 0.2683870161053685,
+      "matthews_corr_with_watermark": 0.031219527052723135
+    }
+  },
+  "mrpc": {
+    "train": {
+      "accuracy_without_watermark": 0.53,
+      "accuracy_with_watermark": 0.44,
+      "f1_without_watermark": 0.6758620689655173,
+      "f1_with_watermark": 0.5882352941176471
+    },
+    "validation": {
+      "accuracy_without_watermark": 0.59,
+      "accuracy_with_watermark": 0.57,
+      "f1_without_watermark": 0.7210884353741497,
+      "f1_with_watermark": 0.6993006993006993
+    }
+  },
+  "qqp": {
+    "train": {
+      "accuracy_without_watermark": 0.53,
+      "accuracy_with_watermark": 0.51,
+      "f1_without_watermark": 0.38961038961038963,
+      "f1_with_watermark": 0.19672131147540983
+    },
+    "validation": {
+      "accuracy_without_watermark": 0.54,
+      "accuracy_with_watermark": 0.59,
+      "f1_without_watermark": 0.23333333333333334,
+      "f1_with_watermark": 0.22641509433962265
+    }
+  },
+  "stsb": {
+    "train": {
+      "pearson_corr_without_watermark": NaN,
+      "pearson_corr_with_watermark": -0.3385932975390179,
+      "spearman_corr_without_watermark": NaN,
+      "spearman_corr_with_watermark": -0.3389426353569145
+    },
+    "validation": {
+      "pearson_corr_without_watermark": 0.01675197019312319,
+      "pearson_corr_with_watermark": -0.0999659022196252,
+      "spearman_corr_without_watermark": -0.041560976173932014,
+      "spearman_corr_with_watermark": -0.07632988977600694
+    }
+  },
+  "mnli": {
+    "train": {
+      "accuracy_without_watermark": 0.47,
+      "accuracy_with_watermark": 0.37,
+      "f1_without_watermark": 0.39293604945778854,
+      "f1_with_watermark": 0.24262017885423737
+    },
+    "validation": {
+      "accuracy_without_watermark": 0.37,
+      "accuracy_with_watermark": 0.35,
+      "f1_without_watermark": 0.26940892298948566,
+      "f1_with_watermark": 0.25000682333033103
+    }
+  },
+  "qnli": {
+    "train": {
+      "accuracy_without_watermark": 0.56,
+      "accuracy_with_watermark": 0.54,
+      "f1_without_watermark": 0.5280995280995281,
+      "f1_with_watermark": 0.4875222816399287
+    },
+    "validation": {
+      "accuracy_without_watermark": 0.57,
+      "accuracy_with_watermark": 0.49,
+      "f1_without_watermark": 0.5501621508525996,
+      "f1_with_watermark": 0.4498975299320462
+    }
+  },
+  "rte": {
+    "train": {
+      "accuracy_without_watermark": 0.53,
+      "accuracy_with_watermark": 0.49,
+      "f1_without_watermark": 0.5123975516132379,
+      "f1_with_watermark": 0.4357782940590773
+    },
+    "validation": {
+      "accuracy_without_watermark": 0.53,
+      "accuracy_with_watermark": 0.55,
+      "f1_without_watermark": 0.5123975516132379,
+      "f1_with_watermark": 0.4950061721467849
+    }
+  },
+  "wnli": {
+    "train": {
+      "accuracy_without_watermark": 0.44,
+      "accuracy_with_watermark": 0.52,
+      "f1_without_watermark": 0.43977591036414565,
+      "f1_with_watermark": 0.5198079231692677
+    },
+    "validation": {
+      "accuracy_without_watermark": 0.4788732394366197,
+      "accuracy_with_watermark": 0.49295774647887325,
+      "f1_without_watermark": 0.47845940043676793,
+      "f1_with_watermark": 0.49043062200956933
+    }
+  }
+}

experiments/watermark_experiment.ipynb ADDED Viewed

The diff for this file is too large to render. See raw diff