{ "nbformat": 4, "nbformat_minor": 0, "metadata": { "colab": { "provenance": [], "gpuType": "T4", "collapsed_sections": [ "XvAe3EPARrBm", "BWCA5X_etylC", "3AQ19vC4t4vs", "NTZdY_8OuXC4", "Tb2Br2K1uf0H", "3GI4NqmeunVl", "oc9xnUMVRoS4", "4jiOX9DBo8Yp" ] }, "kernelspec": { "name": "python3", "display_name": "Python 3" }, "language_info": { "name": "python" }, "accelerator": "GPU", "widgets": { "application/vnd.jupyter.widget-state+json": { "a971d84b85cc4d868176a1421dc2a0f7": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_ca555e939bdb4736890800c58a23ec77", "IPY_MODEL_b7ac2f7ecd904a618626d66202170451", "IPY_MODEL_d91c3928ba1043919e6f7b10a0db9447" ], "layout": "IPY_MODEL_aff475d25e07496786680c38e409161a" } }, "ca555e939bdb4736890800c58a23ec77": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_bab23d3e8dce48788b69b7498fe68033", "placeholder": "​", "style": "IPY_MODEL_66ff1b38e57c45f18e085009d5d53f0d", "value": "Map: 100%" } }, "b7ac2f7ecd904a618626d66202170451": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", 
"_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2f48af6ab211491c9639ceb91a19248d", "max": 29908, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_a2a533503e83433299e1bc897743863a", "value": 29908 } }, "d91c3928ba1043919e6f7b10a0db9447": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_0e9f963127fc423f9a189b480657efcc", "placeholder": "​", "style": "IPY_MODEL_3a72ff8679f14ac689de8667571582d6", "value": " 29908/29908 [01:34<00:00, 196.50 examples/s]" } }, "aff475d25e07496786680c38e409161a": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, 
"object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "bab23d3e8dce48788b69b7498fe68033": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "66ff1b38e57c45f18e085009d5d53f0d": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "2f48af6ab211491c9639ceb91a19248d": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", 
"_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "a2a533503e83433299e1bc897743863a": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "0e9f963127fc423f9a189b480657efcc": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": 
null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "3a72ff8679f14ac689de8667571582d6": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "c08db8312d3e4cc6ada9443e5a32eb6d": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_968c745569084c12ac876b4c3dc8aede", "IPY_MODEL_27c90016d4ac49c2b870ba8967d4a5df", "IPY_MODEL_b59c4157290449269b98f135c09a844e" ], "layout": "IPY_MODEL_ec9ea53f168e4892acfc7b2272f48762" } }, "968c745569084c12ac876b4c3dc8aede": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", 
"description": "", "description_tooltip": null, "layout": "IPY_MODEL_0f0be4b403a04e25915758770b64a3bb", "placeholder": "​", "style": "IPY_MODEL_e749b52a2c9241dea2ccb390b1093a06", "value": "Map: 100%" } }, "27c90016d4ac49c2b870ba8967d4a5df": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_f221c8ae15a946e4b80ac2a84813dade", "max": 8257, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_17bd7bf9b90b42f4993e0a4a8d96f5fd", "value": 8257 } }, "b59c4157290449269b98f135c09a844e": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e407f7b6e1924087aed73c6ef7e1e180", "placeholder": "​", "style": "IPY_MODEL_befa179548c043debfeb7d5d59e12050", "value": " 8257/8257 [00:27<00:00, 408.10 examples/s]" } }, "ec9ea53f168e4892acfc7b2272f48762": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, 
"bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "0f0be4b403a04e25915758770b64a3bb": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "e749b52a2c9241dea2ccb390b1093a06": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { 
"_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "f221c8ae15a946e4b80ac2a84813dade": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "17bd7bf9b90b42f4993e0a4a8d96f5fd": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "e407f7b6e1924087aed73c6ef7e1e180": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": 
"1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "befa179548c043debfeb7d5d59e12050": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } } } } }, "cells": [ { "cell_type": "markdown", "source": [ "## Training" ], "metadata": { "id": "XvAe3EPARrBm" } }, { "cell_type": "markdown", "source": [ "### Load Training data" ], "metadata": { "id": "BWCA5X_etylC" } }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 107 }, "id": "vGEGzvTmmBWk", "outputId": "92846876-7e0f-4048-b5c7-d12cfc69da00" }, "outputs": [ { "output_type": "stream", "name": "stderr", "text": [ "Downloading...\n", "From: 
https://drive.google.com/uc?id=1j0SdyJ8gMrLtpFl1gDJ83s41TyUkKqUt\n", "To: /content/dataset.tsv\n", "100%|██████████| 78.4M/78.4M [00:00<00:00, 140MB/s]\n" ] }, { "output_type": "execute_result", "data": { "text/plain": [ "'dataset.tsv'" ], "application/vnd.google.colaboratory.intrinsic+json": { "type": "string" } }, "metadata": {}, "execution_count": 1 } ], "source": [ "import gdown\n", "\n", "# Link to your file (ID extracted from the URL)\n", "file_id = \"1j0SdyJ8gMrLtpFl1gDJ83s41TyUkKqUt\"\n", "gdown.download(f\"https://drive.google.com/uc?id={file_id}\", \"dataset.tsv\", quiet=False)" ] }, { "cell_type": "code", "source": [ "import pandas as pd\n", "pd.set_option('display.max_colwidth', 10000)" ], "metadata": { "id": "ALucBhN_t56l" }, "execution_count": null, "outputs": [] }, { "cell_type": "code", "source": [ "# The unnamed first column is presumably a saved row index (TODO confirm); drop it before counting exact duplicate rows.\n", "df = pd.read_csv(\"dataset.tsv\", sep=\"\\t\")\n", "df.drop(columns=[\"Unnamed: 0\"], inplace=True)\n", "df.duplicated().sum()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "SLb-3E-nn31D", "outputId": "678ac60a-7dea-4f70-d8bb-9f51a8e9db53" }, "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "92" ] }, "metadata": {}, "execution_count": 4 } ] }, { "cell_type": "code", "source": [ "df.drop_duplicates(inplace=True)\n", "df.info()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "SoMS0ZfaNs5W", "outputId": "97f5da96-a8e4-4484-e96b-110ad905f00d" }, "execution_count": null, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "\n", "Index: 29908 entries, 0 to 29999\n", "Data columns (total 5 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 title 29908 non-null object\n", " 1 text 29908 non-null object\n", " 2 subject 29908 non-null object\n", " 3 date 29908 non-null object\n", " 4 label 29908 non-null int64 \n", "dtypes: int64(1), object(4)\n", "memory usage: 1.4+ MB\n" ] } ] }, { "cell_type": 
"code", "source": [ "df.label.sum()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "JK-xgJUcXKgu", "outputId": "11c09e3a-daaa-44a4-faef-eb084cb4c9c0" }, "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "14432" ] }, "metadata": {}, "execution_count": 6 } ] }, { "cell_type": "code", "source": [ "# Combine features into one text field.\n", "# Every fragment is joined with an explicit +, so the expression does not depend on\n", "# Python silently merging adjacent string literals.\n", "df['combined_text'] = (\n", "    \"Title: \" + df['title'] + \" | \" +\n", "    \"Subject: \" + df['subject'] + \" | \" +\n", "    \"Date: \" + df['date'] + \" | \" +\n", "    \"Text: \" + df['text']\n", ")" ], "metadata": { "id": "W6E2U9ejqDcS" }, "execution_count": null, "outputs": [] }, { "cell_type": "code", "source": [ "max_length = df['combined_text'].str.len().max()\n", "print(f\"The maximum length of the 'combined_text' column is: {max_length}\")" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "jrx102ATqgxh", "outputId": "e0a096ab-9886-4533-e5bf-6e579642670e" }, "execution_count": null, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "The maximum length of the 'combined_text' column is: 51956\n" ] } ] }, { "cell_type": "code", "source": [ "(df['combined_text'].str.len() > 8000).sum()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "cTPDFaOaro3J", "outputId": "48b5d8d9-43c0-45c5-c7bc-e34facfd421e" }, "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "473" ] }, "metadata": {}, "execution_count": 9 } ] }, { "cell_type": "code", "source": [ "df[df['combined_text'].str.len() > 8000]['label'].sum()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "zabPj8SNr2x_", "outputId": "8385bdd9-4c7d-4ef7-fe87-4fafa4662265" }, "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "63" ] }, "metadata": {}, "execution_count": 10 } ] }, { "cell_type": "code", "source": [ 
"df['combined_text'].head()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 1000 }, "id": "BiF_rTsCqPyw", "outputId": "71b267f0-24b0-4cde-9be1-69d541e613d1" }, "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "0 Title: Ex-CIA head says Trump remarks on Russia interference 'disgraceful' | Subject: politicsNews | Date: July 22, 2017 | Text: Former CIA director John Brennan on Friday criticized as “disgraceful” President Donald Trump’s efforts to play down U.S. intelligence agencies’ assessment that Russia meddled in the 2016 U.S. election. Trump’s administration has been dogged by investigations into allegations of Russian interference in last year’s U.S. presidential election and possible ties with his campaign team. Speaking one day before his first meeting with Russian President Vladimir Putin in Hamburg earlier this month, Trump said he suspected Russian interference in the election but that no one knows for sure. “These types of comments are just disgraceful ... and the person who said them should be ashamed of himself,” said Brennan, CIA chief under former President Barack Obama, at the Aspen Security Forum. Special Counsel Robert Mueller and several U.S. congressional committees are investigating whether Russia interfered in the election and colluded with Trump’s campaign to try to swing the race in his favor over Democratic rival Hillary Clinton. Those probes are focused almost exclusively on Moscow’s actions, lawmakers and intelligence officials have said, and no evidence has surfaced publicly implicating other countries. Moscow has denied any interference, and Trump has said that his campaign did not collude with Russia. Brennan said he was disappointed by the president’s handling of security issues in his first six months in office. “I must say there are disappointments that I see in terms of what Mr. 
Trump is doing on the international stage that I think pose serious questions about how he is keeping safe our national security,” Brennan said. Speaking at the same event in Aspen, James Clapper, the former director of national intelligence under Obama, was also critical of Trump’s administration. Asked if Jared Kushner, Trump’s son-in-law and top adviser, should have his security clearance canceled for initially failing to list on a disclosure form contacts he had with Russians, Clapper said it should be suspended pending a review. “I do think the appropriate thing here is take a pause and at least suspend a clearance until you’ve had the opportunity to investigate and then decide whether the clearance should be restored or not,” Clapper told the same panel. Brennan and Clapper also criticized Trump’s remarks in a tweet earlier this year about U.S. spy agencies in which he accused them of practices reminiscent of Nazi Germany. “That (tweet) was a terrible insulting affront not to me or John. We get paid the big bucks to take that. But I’m talking about the rank and file, the people in the trenches, men and women, the patriots in the intelligence community and that was completely inappropriate,” said Clapper.\n", "1 Title: YOU WON’T BELIEVE HIS PUNISHMENT! HISPANIC STORE OWNER Swindles Tax Payers Out Of $1,116,924.27 In Latest Food Stamp Scam | Subject: Government News | Date: Jun 19, 2017 | Text: How did this man come to OWN this store? There is no information on much about this fraudster except that he stole from Americans and is getting just a slap on the wrist. It s no wonder these people are repeat offenders!A hispanic store owner testified in court through a Spanish translator (Why no English?) that he swindled the American tax payers out of millions via food stamp fraud. Eduardo Leonardo plead guilty to stealing from the USDA by illegally exchanging over a million dollars of food stamp benefits for cash for over two years. 
I stole from the USDA and the Food and Nutrition Service, Eduardo Leonardo said slowly in Spanish through a translator in Brooklyn Federal Court. It was an exchange of benefits for cash. Leonardo, 57, admitted to committing food stamp fraud between Oct. 2015 and March 2017 by giving customers cash in exchange for running their EBT cards for a higher amount, which the federal government would later reimburse.In one instance, an undercover witness from the USDA went into Super Economic and picked up a jar of peanut butter and jelly and crackers, totaling $5.48. The witness then asked Leonardo to exchange benefits for $200 cash and Leonardo charged an undercover EBT card $287.89 and gave the witness $200 in cash, making a $82.41 profit.The USDA lost a total of $1,116,924.27 in the transactions.The scammer has run his store, Super Economic One Way Supermarket out of 104-21 Glenwood Road in Canarsie since Dec. 2011. It became a registered SNAP business on May 25, 2012. Specifically I gave a discounted rate in cash in exchange for them [customers] allowing me to ring up the full amount, Leonardo said to Judge Ann Donnelly.Remember Ann Donnelly?Supplemental Nutrition Assistance Program (SNAP) previously called the food stamp program, uses federal tax dollars to aid low-income households in buying affordable and nutritious food. EBT cards are used like debit cards, to swipe at special terminals in retail food stores to use the benefits in exchange for food.Between Nov. 2015 and Jan. 2017, Super Economic conducted more than 57,000 SNAP transactions totaling more than $1.5 million, according to court documents.About 8 transactions were made for $50 or more, an amount that USDA officials say is high for a store that size, which would normally conduct $15 average transactions.Leonardo is set to be sentenced on Oct. 
31 and could face a maximum five years in prison WHAAAAT????THIS IS WHY THIS KEEPS HAPPENING!A man swindles more than a million dollars from Americans yet he gets only 5 years in prison? The punishment does not fit the crime!Via: Brooklyn Eagle\n", "2 Title: Federal Reserve governor Powell's policy views, in his own words | Subject: politicsNews | Date: November 2, 2017 | Text: President Donald Trump on Thursday tapped Federal Reserve Governor Jerome Powell to become head of the U.S. central bank, promoting a soft-spoken centrist to replace Janet Yellen when her term expires in February 2018. In five years as a Fed Governor Jerome Powell has been a consistent, middle of the road voice, backing the consensus crafted by Fed chair Janet Yellen that interest rates should be raised slowly so labor markets could recover, that financial stability risks were muted, and that new regulations had made the economy safer. Following is a collection of quotes from select policy speeches he has delivered since 2015: On Rates: “The financial crisis did significant damage to the productive capacity of our economy, and the damage was of a character, extent, and duration that cannot be fully known today…It seems plausible that at least part of this supply-side damage could be reversed if the economy enjoys a period of sustained growth.4 To encourage that outcome, as monetary policymakers consider removing accommodation, we should look for a little more proof than usual that labor markets are tightening or other supply-side constraints are binding.” - April 2015 speech to New York Council on Foreign Relations: (Graphic: U.S. labor market measures vs interest rates - reut.rs/2h7hsFx) On Financial Stability: “The bottom line is that there has not been an excessive buildup of leverage, maturity transformation, or broadly unsustainable asset prices…Overall, I do not see leveraged finance markets as posing undue financial stability risks. 
And if risk-taking does not threaten financial stability, it is not the Fed’s job to stop people from losing (or making) money.” - January 2017 speech to American Finance Association, Chicago (Graphic: U.S. stocks and leverage - reut.rs/2iolCp6) On Regulation: “We have substantially increased the capital, liquidity, and other prudential requirements for large banking firms. These measures are not free. Higher capital requirements increase bank costs, and at least some of those costs will be passed along to bank customers and shareholders. But in the longer term, stronger prudential requirements for large banking firms will produce more sustainable credit availability and economic growth.” - June 2017 speech to Salzburg Global Seminar, Salzburg, Austria (Graphic: Commercial credit and bank profitability - reut.rs/2h8lfCm) On the Current Economy: “Risks to the forecast now seem more balanced than they have been for some time. In particular, the global picture has brightened as growth and inflation have broadly moved up for the first time in several years. Here at home, risks seem both moderate and balanced, including the downside risk of lower inflation and the upside risk of labor market overheating. The Committee has been patient in raising rates, and that patience has paid dividends…. 
If the economy performs about as expected, I would view it as appropriate to continue to gradually raise rates.” - June 2017 speech to the Economic Club of New York (Graphic: The inflation conundrum - reut.rs/2za4ltY) Other issues may confront Powell in his confirmation hearings and as chair, such as whether to keep the current system of paying banks interest on their reserves as the main method of setting short term interest rates, and whether to rely on monetary policy rules: On Reserve Interest: “Simple to operate and has provided good control over the federal funds rate.” - June 2017 speech to the Economic Club of New York (Graphic: Bank reserves at the Fed - reut.rs/2z7Qdl8) On Policy Rules: “I am unable to think of any critical, complex human activity that could be safely reduced to a simple summary equation. In particular, no major central bank uses policy rules in a prescriptive way, and it is hard to predict the consequences of requiring the FOMC to do so, as some have proposed. Policy should be systematic, but not automatic.” - February 2017 speech to the Forecasters Club of New York (Graphic: Monetary policy rules vs reality - reut.rs/2h7mMZE)\n", "3 Title: SCOUNDREL HILLARY SUPPORTER STARTS “TrumpLeaks” Campaign…Desperate Move! | Subject: left-news | Date: Sep 17, 2016 | Text: Hillary Clinton ally David Brock is offering to pay for new information on Donald Trump, hoping that damaging audio or video on the Republican presidential candidate will be submitted to his super PAC.Brock, founder of the left-wing Media Matters and operator of Correct the Record super PAC, recently posted the plea on Correct the Record s website and is referring to the project as TrumpLeaks, NBC News reported.Brock asked for video or audio of Trump that has yet to be released. One of the most important things for voters to evaluate in any election is the full measure of a candidate s views, ideas, and temperament over time, the website states. 
In making a choice for president, voters must also consider how various candidates present themselves to the public and to the world. There are few things more important in that regard than access to video or audio in the form of prior television or radio interviews or more candid video from events a candidate may have attended. Brock s super PAC goes on to say they can offer compensation to anyone who has new video or audio that has been obtained legally.Read more: WFB\n", "4 Title: NANCY PELOSI ARROGANTLY DISMISSES Questions on Crooked Democrat IT Employees Under Investigation [Video] | Subject: politics | Date: May 26, 2017 | Text: Pleading ignorance is a perfect ploy for Nancy Pelosi Who wouldn t believe she s clueless on pretty much everything. Pelosi claims she s been busy with lots of things . That s laughable! This case is a big deal! Here s what The Daily Caller had to say about this stain on the Democrats:U.S. Capitol Police and other agencies are probing the cyber activities of three brothers who had jobs as congressional staffers at the office of information technology for lawmakers on the House Permanent Select Committee on Intelligence, The Daily Caller News Foundation first reported. Brothers Imran, Abid and Jamal Awan also provided their services for other Democratic members in the lower chamber.When they came under suspicion by law enforcement for accessing the House network without permission last February, they were all banned from accessing it. While some Democratic lawmakers dismissed Imran from their employ when the story, others, like Florida Democratic Rep. Debbie Wasserman Schultz kept him on.Are the Democrats helping these two men hide the evidence?\n", "Name: combined_text, dtype: object" ], "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
combined_text
0Title: Ex-CIA head says Trump remarks on Russia interference 'disgraceful' | Subject: politicsNews | Date: July 22, 2017 | Text: Former CIA director John Brennan on Friday criticized as “disgraceful” President Donald Trump’s efforts to play down U.S. intelligence agencies’ assessment that Russia meddled in the 2016 U.S. election. Trump’s administration has been dogged by investigations into allegations of Russian interference in last year’s U.S. presidential election and possible ties with his campaign team. Speaking one day before his first meeting with Russian President Vladimir Putin in Hamburg earlier this month, Trump said he suspected Russian interference in the election but that no one knows for sure. “These types of comments are just disgraceful ... and the person who said them should be ashamed of himself,” said Brennan, CIA chief under former President Barack Obama, at the Aspen Security Forum. Special Counsel Robert Mueller and several U.S. congressional committees are investigating whether Russia interfered in the election and colluded with Trump’s campaign to try to swing the race in his favor over Democratic rival Hillary Clinton. Those probes are focused almost exclusively on Moscow’s actions, lawmakers and intelligence officials have said, and no evidence has surfaced publicly implicating other countries. Moscow has denied any interference, and Trump has said that his campaign did not collude with Russia. Brennan said he was disappointed by the president’s handling of security issues in his first six months in office. “I must say there are disappointments that I see in terms of what Mr. Trump is doing on the international stage that I think pose serious questions about how he is keeping safe our national security,” Brennan said. Speaking at the same event in Aspen, James Clapper, the former director of national intelligence under Obama, was also critical of Trump’s administration. 
Asked if Jared Kushner, Trump’s son-in-law and top adviser, should have his security clearance canceled for initially failing to list on a disclosure form contacts he had with Russians, Clapper said it should be suspended pending a review. “I do think the appropriate thing here is take a pause and at least suspend a clearance until you’ve had the opportunity to investigate and then decide whether the clearance should be restored or not,” Clapper told the same panel. Brennan and Clapper also criticized Trump’s remarks in a tweet earlier this year about U.S. spy agencies in which he accused them of practices reminiscent of Nazi Germany. “That (tweet) was a terrible insulting affront not to me or John. We get paid the big bucks to take that. But I’m talking about the rank and file, the people in the trenches, men and women, the patriots in the intelligence community and that was completely inappropriate,” said Clapper.
1Title: YOU WON’T BELIEVE HIS PUNISHMENT! HISPANIC STORE OWNER Swindles Tax Payers Out Of $1,116,924.27 In Latest Food Stamp Scam | Subject: Government News | Date: Jun 19, 2017 | Text: How did this man come to OWN this store? There is no information on much about this fraudster except that he stole from Americans and is getting just a slap on the wrist. It s no wonder these people are repeat offenders!A hispanic store owner testified in court through a Spanish translator (Why no English?) that he swindled the American tax payers out of millions via food stamp fraud. Eduardo Leonardo plead guilty to stealing from the USDA by illegally exchanging over a million dollars of food stamp benefits for cash for over two years. I stole from the USDA and the Food and Nutrition Service, Eduardo Leonardo said slowly in Spanish through a translator in Brooklyn Federal Court. It was an exchange of benefits for cash. Leonardo, 57, admitted to committing food stamp fraud between Oct. 2015 and March 2017 by giving customers cash in exchange for running their EBT cards for a higher amount, which the federal government would later reimburse.In one instance, an undercover witness from the USDA went into Super Economic and picked up a jar of peanut butter and jelly and crackers, totaling $5.48. The witness then asked Leonardo to exchange benefits for $200 cash and Leonardo charged an undercover EBT card $287.89 and gave the witness $200 in cash, making a $82.41 profit.The USDA lost a total of $1,116,924.27 in the transactions.The scammer has run his store, Super Economic One Way Supermarket out of 104-21 Glenwood Road in Canarsie since Dec. 2011. It became a registered SNAP business on May 25, 2012. 
Specifically I gave a discounted rate in cash in exchange for them [customers] allowing me to ring up the full amount, Leonardo said to Judge Ann Donnelly.Remember Ann Donnelly?Supplemental Nutrition Assistance Program (SNAP) previously called the food stamp program, uses federal tax dollars to aid low-income households in buying affordable and nutritious food. EBT cards are used like debit cards, to swipe at special terminals in retail food stores to use the benefits in exchange for food.Between Nov. 2015 and Jan. 2017, Super Economic conducted more than 57,000 SNAP transactions totaling more than $1.5 million, according to court documents.About 8 transactions were made for $50 or more, an amount that USDA officials say is high for a store that size, which would normally conduct $15 average transactions.Leonardo is set to be sentenced on Oct. 31 and could face a maximum five years in prison WHAAAAT????THIS IS WHY THIS KEEPS HAPPENING!A man swindles more than a million dollars from Americans yet he gets only 5 years in prison? The punishment does not fit the crime!Via: Brooklyn Eagle
2Title: Federal Reserve governor Powell's policy views, in his own words | Subject: politicsNews | Date: November 2, 2017 | Text: President Donald Trump on Thursday tapped Federal Reserve Governor Jerome Powell to become head of the U.S. central bank, promoting a soft-spoken centrist to replace Janet Yellen when her term expires in February 2018. In five years as a Fed Governor Jerome Powell has been a consistent, middle of the road voice, backing the consensus crafted by Fed chair Janet Yellen that interest rates should be raised slowly so labor markets could recover, that financial stability risks were muted, and that new regulations had made the economy safer. Following is a collection of quotes from select policy speeches he has delivered since 2015: On Rates: “The financial crisis did significant damage to the productive capacity of our economy, and the damage was of a character, extent, and duration that cannot be fully known today…It seems plausible that at least part of this supply-side damage could be reversed if the economy enjoys a period of sustained growth.4 To encourage that outcome, as monetary policymakers consider removing accommodation, we should look for a little more proof than usual that labor markets are tightening or other supply-side constraints are binding.” - April 2015 speech to New York Council on Foreign Relations: (Graphic: U.S. labor market measures vs interest rates - reut.rs/2h7hsFx) On Financial Stability: “The bottom line is that there has not been an excessive buildup of leverage, maturity transformation, or broadly unsustainable asset prices…Overall, I do not see leveraged finance markets as posing undue financial stability risks. And if risk-taking does not threaten financial stability, it is not the Fed’s job to stop people from losing (or making) money.” - January 2017 speech to American Finance Association, Chicago (Graphic: U.S. 
stocks and leverage - reut.rs/2iolCp6) On Regulation: “We have substantially increased the capital, liquidity, and other prudential requirements for large banking firms. These measures are not free. Higher capital requirements increase bank costs, and at least some of those costs will be passed along to bank customers and shareholders. But in the longer term, stronger prudential requirements for large banking firms will produce more sustainable credit availability and economic growth.” - June 2017 speech to Salzburg Global Seminar, Salzburg, Austria (Graphic: Commercial credit and bank profitability - reut.rs/2h8lfCm) On the Current Economy: “Risks to the forecast now seem more balanced than they have been for some time. In particular, the global picture has brightened as growth and inflation have broadly moved up for the first time in several years. Here at home, risks seem both moderate and balanced, including the downside risk of lower inflation and the upside risk of labor market overheating. The Committee has been patient in raising rates, and that patience has paid dividends…. If the economy performs about as expected, I would view it as appropriate to continue to gradually raise rates.” - June 2017 speech to the Economic Club of New York (Graphic: The inflation conundrum - reut.rs/2za4ltY) Other issues may confront Powell in his confirmation hearings and as chair, such as whether to keep the current system of paying banks interest on their reserves as the main method of setting short term interest rates, and whether to rely on monetary policy rules: On Reserve Interest: “Simple to operate and has provided good control over the federal funds rate.” - June 2017 speech to the Economic Club of New York (Graphic: Bank reserves at the Fed - reut.rs/2z7Qdl8) On Policy Rules: “I am unable to think of any critical, complex human activity that could be safely reduced to a simple summary equation. 
In particular, no major central bank uses policy rules in a prescriptive way, and it is hard to predict the consequences of requiring the FOMC to do so, as some have proposed. Policy should be systematic, but not automatic.” - February 2017 speech to the Forecasters Club of New York (Graphic: Monetary policy rules vs reality - reut.rs/2h7mMZE)
3Title: SCOUNDREL HILLARY SUPPORTER STARTS “TrumpLeaks” Campaign…Desperate Move! | Subject: left-news | Date: Sep 17, 2016 | Text: Hillary Clinton ally David Brock is offering to pay for new information on Donald Trump, hoping that damaging audio or video on the Republican presidential candidate will be submitted to his super PAC.Brock, founder of the left-wing Media Matters and operator of Correct the Record super PAC, recently posted the plea on Correct the Record s website and is referring to the project as TrumpLeaks, NBC News reported.Brock asked for video or audio of Trump that has yet to be released. One of the most important things for voters to evaluate in any election is the full measure of a candidate s views, ideas, and temperament over time, the website states. In making a choice for president, voters must also consider how various candidates present themselves to the public and to the world. There are few things more important in that regard than access to video or audio in the form of prior television or radio interviews or more candid video from events a candidate may have attended. Brock s super PAC goes on to say they can offer compensation to anyone who has new video or audio that has been obtained legally.Read more: WFB
4Title: NANCY PELOSI ARROGANTLY DISMISSES Questions on Crooked Democrat IT Employees Under Investigation [Video] | Subject: politics | Date: May 26, 2017 | Text: Pleading ignorance is a perfect ploy for Nancy Pelosi Who wouldn t believe she s clueless on pretty much everything. Pelosi claims she s been busy with lots of things . That s laughable! This case is a big deal! Here s what The Daily Caller had to say about this stain on the Democrats:U.S. Capitol Police and other agencies are probing the cyber activities of three brothers who had jobs as congressional staffers at the office of information technology for lawmakers on the House Permanent Select Committee on Intelligence, The Daily Caller News Foundation first reported. Brothers Imran, Abid and Jamal Awan also provided their services for other Democratic members in the lower chamber.When they came under suspicion by law enforcement for accessing the House network without permission last February, they were all banned from accessing it. While some Democratic lawmakers dismissed Imran from their employ when the story, others, like Florida Democratic Rep. Debbie Wasserman Schultz kept him on.Are the Democrats helping these two men hide the evidence?
\n", "

" ] }, "metadata": {}, "execution_count": 11 } ] }, { "cell_type": "markdown", "source": [ "### Load necessary module for fine-tuning" ], "metadata": { "id": "3AQ19vC4t4vs" } }, { "cell_type": "code", "source": [ "!pip install git+https://github.com/huggingface/transformers.git\n", "!pip install datasets triton" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 0 }, "id": "FmcC1m5YVpu1", "outputId": "fe65ad65-af56-400a-92b4-01bb510b637f" }, "execution_count": 19, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Collecting git+https://github.com/huggingface/transformers.git\n", " Cloning https://github.com/huggingface/transformers.git to /tmp/pip-req-build-ff3t48wj\n", " Running command git clone --filter=blob:none --quiet https://github.com/huggingface/transformers.git /tmp/pip-req-build-ff3t48wj\n", " Resolved https://github.com/huggingface/transformers.git to commit 5c75087aeee7081025370e10d1f571a11600f1ae\n", " Installing build dependencies ... \u001b[?25l\u001b[?25hdone\n", " Getting requirements to build wheel ... \u001b[?25l\u001b[?25hdone\n", " Preparing metadata (pyproject.toml) ... 
\u001b[?25l\u001b[?25hdone\n", "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from transformers==4.48.0.dev0) (3.16.1)\n", "Requirement already satisfied: huggingface-hub<1.0,>=0.24.0 in /usr/local/lib/python3.10/dist-packages (from transformers==4.48.0.dev0) (0.27.0)\n", "Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from transformers==4.48.0.dev0) (1.26.4)\n", "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from transformers==4.48.0.dev0) (24.2)\n", "Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from transformers==4.48.0.dev0) (6.0.2)\n", "Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.10/dist-packages (from transformers==4.48.0.dev0) (2024.11.6)\n", "Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from transformers==4.48.0.dev0) (2.32.3)\n", "Requirement already satisfied: tokenizers<0.22,>=0.21 in /usr/local/lib/python3.10/dist-packages (from transformers==4.48.0.dev0) (0.21.0)\n", "Requirement already satisfied: safetensors>=0.4.1 in /usr/local/lib/python3.10/dist-packages (from transformers==4.48.0.dev0) (0.4.5)\n", "Requirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.10/dist-packages (from transformers==4.48.0.dev0) (4.67.1)\n", "Requirement already satisfied: fsspec>=2023.5.0 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.24.0->transformers==4.48.0.dev0) (2024.9.0)\n", "Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.24.0->transformers==4.48.0.dev0) (4.12.2)\n", "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests->transformers==4.48.0.dev0) (3.4.0)\n", "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from 
requests->transformers==4.48.0.dev0) (3.10)\n", "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->transformers==4.48.0.dev0) (2.2.3)\n", "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->transformers==4.48.0.dev0) (2024.12.14)\n", "Requirement already satisfied: datasets in /usr/local/lib/python3.10/dist-packages (3.2.0)\n", "Requirement already satisfied: triton in /usr/local/lib/python3.10/dist-packages (3.1.0)\n", "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from datasets) (3.16.1)\n", "Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from datasets) (1.26.4)\n", "Requirement already satisfied: pyarrow>=15.0.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (17.0.0)\n", "Requirement already satisfied: dill<0.3.9,>=0.3.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (0.3.8)\n", "Requirement already satisfied: pandas in /usr/local/lib/python3.10/dist-packages (from datasets) (2.2.2)\n", "Requirement already satisfied: requests>=2.32.2 in /usr/local/lib/python3.10/dist-packages (from datasets) (2.32.3)\n", "Requirement already satisfied: tqdm>=4.66.3 in /usr/local/lib/python3.10/dist-packages (from datasets) (4.67.1)\n", "Requirement already satisfied: xxhash in /usr/local/lib/python3.10/dist-packages (from datasets) (3.5.0)\n", "Requirement already satisfied: multiprocess<0.70.17 in /usr/local/lib/python3.10/dist-packages (from datasets) (0.70.16)\n", "Requirement already satisfied: fsspec<=2024.9.0,>=2023.1.0 in /usr/local/lib/python3.10/dist-packages (from fsspec[http]<=2024.9.0,>=2023.1.0->datasets) (2024.9.0)\n", "Requirement already satisfied: aiohttp in /usr/local/lib/python3.10/dist-packages (from datasets) (3.11.10)\n", "Requirement already satisfied: huggingface-hub>=0.23.0 in /usr/local/lib/python3.10/dist-packages (from datasets) 
(0.27.0)\n", "Requirement already satisfied: packaging in /usr/local/lib/python3.10/dist-packages (from datasets) (24.2)\n", "Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from datasets) (6.0.2)\n", "Requirement already satisfied: aiohappyeyeballs>=2.3.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (2.4.4)\n", "Requirement already satisfied: aiosignal>=1.1.2 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.3.2)\n", "Requirement already satisfied: async-timeout<6.0,>=4.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (4.0.3)\n", "Requirement already satisfied: attrs>=17.3.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (24.3.0)\n", "Requirement already satisfied: frozenlist>=1.1.1 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.5.0)\n", "Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (6.1.0)\n", "Requirement already satisfied: propcache>=0.2.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (0.2.1)\n", "Requirement already satisfied: yarl<2.0,>=1.17.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.18.3)\n", "Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub>=0.23.0->datasets) (4.12.2)\n", "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests>=2.32.2->datasets) (3.4.0)\n", "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests>=2.32.2->datasets) (3.10)\n", "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests>=2.32.2->datasets) (2.2.3)\n", "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests>=2.32.2->datasets) 
(2024.12.14)\n", "Requirement already satisfied: python-dateutil>=2.8.2 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets) (2.8.2)\n", "Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets) (2024.2)\n", "Requirement already satisfied: tzdata>=2022.7 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets) (2024.2)\n", "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.10/dist-packages (from python-dateutil>=2.8.2->pandas->datasets) (1.17.0)\n" ] } ] }, { "cell_type": "code", "source": [ "import torch\n", "torch.cuda.empty_cache()\n", "\n", "from transformers import AutoTokenizer, AutoModelForSequenceClassification, Trainer, TrainingArguments\n", "from datasets import Dataset\n", "from transformers import DataCollatorWithPadding" ], "metadata": { "id": "eIFZNvehXxMI" }, "execution_count": null, "outputs": [] }, { "cell_type": "code", "source": [ "print(torch.cuda.get_device_name(0))\n", "print(torch.cuda.is_available())\n", "print(torch.cuda.get_device_capability(0)) # Should be >= 8.0 for Flash Attention" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "1aHn0pNNbMvz", "outputId": "4a131e5b-e003-40e8-c00d-5cd1e93602e7" }, "execution_count": null, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Tesla T4\n", "True\n", "(7, 5)\n" ] } ] }, { "cell_type": "code", "source": [ "model_id = \"answerdotai/ModernBERT-base\"\n", "\n", "# Load the tokenizer for ModernBERT\n", "tokenizer = AutoTokenizer.from_pretrained(model_id)\n", "# Load the pre-trained ModernBERT model for sequence classification (Flash Attention 2 stays disabled: the T4 reports compute capability 7.5, below the 8.0 it needs)\n", "model = AutoModelForSequenceClassification.from_pretrained(\n", " model_id,\n", " num_labels=1,\n", " # attn_implementation=\"flash_attention_2\", # Enable Flash Attention 2.0\n", " torch_dtype=torch.float32, # Full float32 precision (no mixed precision is enabled here)\n", ").to(\"cuda\")" ], "metadata": { "colab": { "base_uri": 
"https://localhost:8080/" }, "id": "KZoQQQM9uvQ_", "outputId": "4ae0a6f0-327c-4598-f288-da27329508cb" }, "execution_count": null, "outputs": [ { "output_type": "stream", "name": "stderr", "text": [ "Some weights of ModernBertForSequenceClassification were not initialized from the model checkpoint at answerdotai/ModernBERT-base and are newly initialized: ['classifier.bias', 'classifier.weight']\n", "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n" ] } ] }, { "cell_type": "markdown", "source": [ "### Prepare dataset for training" ], "metadata": { "id": "NTZdY_8OuXC4" } }, { "cell_type": "code", "source": [ "# Tokenize the combined text\n", "def tokenize_data(batch):\n", " return tokenizer(\n", " batch['combined_text'],\n", " truncation=True,\n", " padding='longest', # Use dynamic padding to the longest sequence in the batch\n", " max_length=7000,\n", " return_tensors=\"pt\"\n", " )" ], "metadata": { "id": "syO9mbQruBOh" }, "execution_count": null, "outputs": [] }, { "cell_type": "code", "source": [ "# Convert to Hugging Face Dataset\n", "dataset = Dataset.from_pandas(pd.DataFrame(df['combined_text']))" ], "metadata": { "id": "NmqvgsogQ9Ag" }, "execution_count": null, "outputs": [] }, { "cell_type": "code", "source": [ "# Tokenize the dataset in batches\n", "batch_size = 16 # Adjust based on memory capacity\n", "tokenized_dataset = dataset.map(tokenize_data, batched=True, batch_size=batch_size)" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 49, "referenced_widgets": [ "a971d84b85cc4d868176a1421dc2a0f7", "ca555e939bdb4736890800c58a23ec77", "b7ac2f7ecd904a618626d66202170451", "d91c3928ba1043919e6f7b10a0db9447", "aff475d25e07496786680c38e409161a", "bab23d3e8dce48788b69b7498fe68033", "66ff1b38e57c45f18e085009d5d53f0d", "2f48af6ab211491c9639ceb91a19248d", "a2a533503e83433299e1bc897743863a", "0e9f963127fc423f9a189b480657efcc", "3a72ff8679f14ac689de8667571582d6" ] }, "id": 
"2slbmGKbPXHX", "outputId": "aa551d81-eb62-4c87-fe61-36f93b156358" }, "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "Map: 0%| | 0/29908 [00:00" ], "text/html": [ "\n", "
\n", " \n", " \n", " [6355/6355 1:54:34, Epoch 0/1]\n", "
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
EpochTraining LossValidation Loss
00.0000000.000004

" ] }, "metadata": {} }, { "output_type": "execute_result", "data": { "text/plain": [ "TrainOutput(global_step=6355, training_loss=0.021927670485696906, metrics={'train_runtime': 6876.3305, 'train_samples_per_second': 3.697, 'train_steps_per_second': 0.924, 'total_flos': 2.598128586619892e+16, 'train_loss': 0.021927670485696906, 'epoch': 0.9999606624444357})" ] }, "metadata": {}, "execution_count": 40 } ] }, { "cell_type": "markdown", "source": [ "### Save and download model" ], "metadata": { "id": "3GI4NqmeunVl" } }, { "cell_type": "code", "source": [ "# Save the model\n", "trainer.save_model('./saved_model') # Specify the directory to save the model\n", "tokenizer.save_pretrained('./saved_model') # Save the tokenizer" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "m9s6QFAIzdaN", "outputId": "166002d2-61de-4dfd-fa02-849377faee12" }, "execution_count": null, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "('./saved_model/tokenizer_config.json',\n", " './saved_model/special_tokens_map.json',\n", " './saved_model/tokenizer.json')" ] }, "metadata": {}, "execution_count": 41 } ] }, { "cell_type": "code", "source": [ "import shutil\n", "import os\n", "\n", "# Create a zip file of the saved model directory\n", "shutil.make_archive('./saved_model', 'zip', './saved_model')\n", "\n", "# Download the zip file\n", "from google.colab import files\n", "files.download('./saved_model.zip')" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 34 }, "id": "G-Gvqwiaze8Z", "outputId": "7c3b3ad1-a9e4-4293-d56a-42a4f9a7af38" }, "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "" ], "application/javascript": [ "\n", " async function download(id, filename, size) {\n", " if (!google.colab.kernel.accessAllowed) {\n", " return;\n", " }\n", " const div = document.createElement('div');\n", " const label = document.createElement('label');\n", " label.textContent = 
`Downloading \"${filename}\": `;\n", " div.appendChild(label);\n", " const progress = document.createElement('progress');\n", " progress.max = size;\n", " div.appendChild(progress);\n", " document.body.appendChild(div);\n", "\n", " const buffers = [];\n", " let downloaded = 0;\n", "\n", " const channel = await google.colab.kernel.comms.open(id);\n", " // Send a message to notify the kernel that we're ready.\n", " channel.send({})\n", "\n", " for await (const message of channel.messages) {\n", " // Send a message to notify the kernel that we're ready.\n", " channel.send({})\n", " if (message.buffers) {\n", " for (const buffer of message.buffers) {\n", " buffers.push(buffer);\n", " downloaded += buffer.byteLength;\n", " progress.value = downloaded;\n", " }\n", " }\n", " }\n", " const blob = new Blob(buffers, {type: 'application/binary'});\n", " const a = document.createElement('a');\n", " a.href = window.URL.createObjectURL(blob);\n", " a.download = filename;\n", " div.appendChild(a);\n", " a.click();\n", " div.remove();\n", " }\n", " " ] }, "metadata": {} }, { "output_type": "display_data", "data": { "text/plain": [ "" ], "application/javascript": [ "download(\"download_e56e2a4d-3008-4274-8653-a40602a7a2a9\", \"saved_model.zip\", 556546545)" ] }, "metadata": {} } ] }, { "cell_type": "code", "source": [ "!nvidia-smi" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "ePrD2WOVbNNe", "outputId": "5bdf58aa-129e-41a9-f3ad-6b68874534c5" }, "execution_count": null, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Sun Dec 29 11:35:58 2024 \n", "+---------------------------------------------------------------------------------------+\n", "| NVIDIA-SMI 535.104.05 Driver Version: 535.104.05 CUDA Version: 12.2 |\n", "|-----------------------------------------+----------------------+----------------------+\n", "| GPU Name Persistence-M | Bus-Id Disp.A | Volatile Uncorr. 
ECC |\n", "| Fan Temp Perf Pwr:Usage/Cap | Memory-Usage | GPU-Util Compute M. |\n", "| | | MIG M. |\n", "|=========================================+======================+======================|\n", "| 0 Tesla T4 Off | 00000000:00:04.0 Off | 0 |\n", "| N/A 73C P0 31W / 70W | 11167MiB / 15360MiB | 0% Default |\n", "| | | N/A |\n", "+-----------------------------------------+----------------------+----------------------+\n", " \n", "+---------------------------------------------------------------------------------------+\n", "| Processes: |\n", "| GPU GI CI PID Type Process name GPU Memory |\n", "| ID ID Usage |\n", "|=======================================================================================|\n", "+---------------------------------------------------------------------------------------+\n" ] } ] }, { "cell_type": "markdown", "source": [ "## Testing" ], "metadata": { "id": "oc9xnUMVRoS4" } }, { "cell_type": "code", "source": [ "!gdown --id 1fJOaVhtwzQuzpse8OtJSmV5UZjIuR_kN" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 0 }, "id": "uI0Fdp37OzRt", "outputId": "fa7beee1-2266-4a7e-b81d-878427651897" }, "execution_count": 1, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "/usr/local/lib/python3.10/dist-packages/gdown/__main__.py:140: FutureWarning: Option `--id` was deprecated in version 4.3.1 and will be removed in 5.0. 
You don't need to pass it anymore to use a file ID.\n", " warnings.warn(\n", "Downloading...\n", "From: https://drive.google.com/uc?id=1fJOaVhtwzQuzpse8OtJSmV5UZjIuR_kN\n", "To: /content/test.tsv\n", "100% 22.0M/22.0M [00:00<00:00, 54.1MB/s]\n" ] } ] }, { "cell_type": "code", "source": [ "import pandas as pd\n", "\n", "pd.set_option('display.max_colwidth', 10000)\n", "\n", "# Read the tab-separated test set and drop the `Unnamed: 0` column\n", "# (presumably a saved row index - confirm against the exporter).\n", "# Chained instead of mutating the frame in place.\n", "test = pd.read_csv(\"test.tsv\", sep=\"\\t\").drop(columns=[\"Unnamed: 0\"])\n", "\n", "# Count of fully duplicated rows (they are removed in the next cell)\n", "test.duplicated().sum()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 0 }, "id": "ILlMP7PEO-2E", "outputId": "33cb4fc8-f9a3-45bb-b731-77e1512d3bd5" }, "execution_count": 1, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "10" ] }, "metadata": {}, "execution_count": 1 } ] }, { "cell_type": "code", "source": [ "# Rebind instead of inplace=True. The original row labels are kept (no\n", "# reset_index), so the index is no longer contiguous after this step.\n", "test = test.drop_duplicates()\n", "test.info()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 0 }, "id": "uE88vtcJPbZV", "outputId": "22dd4bbe-ff23-48e6-d5f1-25b2939cb5e0" }, "execution_count": 2, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "\n", "Index: 8257 entries, 0 to 8266\n", "Data columns (total 5 columns):\n", " # Column Non-Null Count Dtype \n", "--- ------ -------------- ----- \n", " 0 title 8257 non-null object\n", " 1 text 8257 non-null object\n", " 2 subject 8257 non-null object\n", " 3 date 8257 non-null object\n", " 4 label 8257 non-null int64 \n", "dtypes: int64(1), object(4)\n", "memory usage: 387.0+ KB\n" ] } ] }, { "cell_type": "code", "source": [ "# Combine features into one text field.\n", "# Every piece is joined with an explicit `+`, so no separator depends on\n", "# implicit adjacent-literal concatenation.\n", "test['combined_text'] = (\n", "    \"Title: \" + test['title'] + \" | \" +\n", "    \"Subject: \" + test['subject'] + \" | \" +\n", "    \"Date: \" + test['date'] + \" | \" +\n", "    \"Text: \" + test['text']\n", ")" ], "metadata": { "id": "Mv55WKi_PoPG" }, "execution_count": 3, "outputs": [] }, { "cell_type": "code", "source": [ "import torch\n", "torch.cuda.empty_cache()\n", "\n", 
"from transformers import AutoTokenizer, AutoModelForSequenceClassification, Trainer, TrainingArguments\n", "from datasets import Dataset\n", "from transformers import DataCollatorWithPadding" ], "metadata": { "id": "SxoVTW4bR8Qr" }, "execution_count": 6, "outputs": [] }, { "cell_type": "code", "source": [ "# The Drive file ID is passed positionally: the `--id` flag is deprecated\n", "# since gdown 4.3.1 and announced for removal in 5.0.\n", "!gdown 1VCcfo0RxfjCPD7JBlWpx0_Z63Cmeur89" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 0 }, "id": "PZuA7u0YX9k3", "outputId": "9df30429-51a3-4cd4-eaec-672e445fea83" }, "execution_count": 11, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "/usr/local/lib/python3.10/dist-packages/gdown/__main__.py:140: FutureWarning: Option `--id` was deprecated in version 4.3.1 and will be removed in 5.0. You don't need to pass it anymore to use a file ID.\n", " warnings.warn(\n", "Downloading...\n", "From (original): https://drive.google.com/uc?id=1VCcfo0RxfjCPD7JBlWpx0_Z63Cmeur89\n", "From (redirected): https://drive.google.com/uc?id=1VCcfo0RxfjCPD7JBlWpx0_Z63Cmeur89&confirm=t&uuid=45c74e96-b387-4a05-957d-a462046d1454\n", "To: /content/saved_model.zip\n", "100% 557M/557M [00:24<00:00, 23.1MB/s]\n" ] } ] }, { "cell_type": "code", "source": [ "import zipfile\n", "import os\n", "\n", "# gdown writes into the current working directory, so a relative path is\n", "# used here (the same way test.tsv is read) instead of the Colab-only\n", "# /content prefix.\n", "zip_file_path = 'saved_model.zip'\n", "unzip_dir = 'model_directory' # Directory to extract to\n", "\n", "# Create the directory if it doesn't exist\n", "os.makedirs(unzip_dir, exist_ok=True)\n", "\n", "# Unzip the file\n", "with zipfile.ZipFile(zip_file_path, 'r') as zip_ref:\n", "    zip_ref.extractall(unzip_dir)" ], "metadata": { "id": "A7xap4b2VHBh" }, "execution_count": 12, "outputs": [] }, { "cell_type": "code", "source": [ "model_name = unzip_dir\n", "\n", "# Use the GPU when one is visible and fall back to CPU otherwise, instead of\n", "# hard-coding the cuda device (which raises on a CPU-only runtime).\n", "device = \"cuda\" if torch.cuda.is_available() else \"cpu\"\n", "model = AutoModelForSequenceClassification.from_pretrained(model_name).to(device)\n", "tokenizer = AutoTokenizer.from_pretrained(model_name)" ], "metadata": { "id": "HxcBHi-mV-Dj" }, "execution_count": 13, "outputs": [] }, { "cell_type": "code", "source": [ "# Tokenize the combined
text\n", "def tokenize_data(batch):\n", "    \"\"\"Encode one batch of `combined_text` strings with the notebook-level tokenizer.\n", "\n", "    Sequences are truncated to at most 7000 tokens and padded to the longest\n", "    sequence in the batch; the encoding is requested as PyTorch tensors.\n", "    \"\"\"\n", "    encoded = tokenizer(\n", "        batch['combined_text'],\n", "        truncation=True,\n", "        max_length=7000,\n", "        padding='longest',\n", "        return_tensors=\"pt\",\n", "    )\n", "    return encoded" ], "metadata": { "id": "GTOcz6puY1JZ" }, "execution_count": 14, "outputs": [] }, { "cell_type": "code", "source": [ "# Wrap the single text column in a Hugging Face Dataset\n", "test_dataset = Dataset.from_pandas(test[['combined_text']])\n", "\n", "# Rows handed to each tokenizer call; lower it if memory is tight\n", "batch_size = 16\n", "tokenized_dataset = test_dataset.map(\n", "    tokenize_data,\n", "    batched=True,\n", "    batch_size=batch_size,\n", ")" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 49, "referenced_widgets": [ "c08db8312d3e4cc6ada9443e5a32eb6d", "968c745569084c12ac876b4c3dc8aede", "27c90016d4ac49c2b870ba8967d4a5df", "b59c4157290449269b98f135c09a844e", "ec9ea53f168e4892acfc7b2272f48762", "0f0be4b403a04e25915758770b64a3bb", "e749b52a2c9241dea2ccb390b1093a06", "f221c8ae15a946e4b80ac2a84813dade", "17bd7bf9b90b42f4993e0a4a8d96f5fd", "e407f7b6e1924087aed73c6ef7e1e180", "befa179548c043debfeb7d5d59e12050" ] }, "id": "wJ9Ls4xqWd8p", "outputId": "3a736ec9-7fd1-4a07-f62c-0f92063b1301" }, "execution_count": 15, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "Map: 0%| | 0/8257 [00:00 0.5).long() # Convert probabilities to binary predictions\n", "\n", " # Store results\n", " predictions.extend(preds.cpu().numpy())\n", " probabilities.extend(probs.cpu().numpy())" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 0 }, "id": "kdmhybYfafBu", "outputId": "6989b63d-6038-4ca7-9535-b87d2e55f341" }, "execution_count": 23, "outputs": [ { "output_type": "stream", "name": "stderr", "text": [ "Running Inference: 100%|██████████| 517/517 [28:36<00:00, 3.32s/it]\n" ] } ] }, { "cell_type": "code", "source": [ "from sklearn.metrics import accuracy_score, precision_score,
recall_score, f1_score, roc_auc_score\n", "\n", "# Reference labels taken from the test frame\n", "true_labels = test['label']\n", "\n", "# Thresholded metrics are scored on `predictions`; ROC-AUC is scored on the\n", "# continuous `probabilities`.\n", "accuracy = accuracy_score(y_true=true_labels, y_pred=predictions)\n", "precision = precision_score(y_true=true_labels, y_pred=predictions)\n", "recall = recall_score(y_true=true_labels, y_pred=predictions)\n", "f1 = f1_score(y_true=true_labels, y_pred=predictions)\n", "auc_roc = roc_auc_score(y_true=true_labels, y_score=probabilities)\n", "\n", "# Report each metric to four decimal places\n", "print(f\"Accuracy: {accuracy:.4f}\")\n", "print(f\"Precision: {precision:.4f}\")\n", "print(f\"Recall: {recall:.4f}\")\n", "print(f\"F1 Score: {f1:.4f}\")\n", "print(f\"AUC-ROC: {auc_roc:.4f}\")" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 0 }, "id": "YDLrKth_bCUC", "outputId": "db27415b-f5a1-4b62-aaaf-66fad10fb7a8" }, "execution_count": 24, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Accuracy: 0.7027\n", "Precision: 0.6181\n", "Recall: 1.0000\n", "F1 Score: 0.7640\n", "AUC-ROC: 1.0000\n" ] } ] }, { "cell_type": "code", "source": [ "from sklearn.metrics import confusion_matrix\n", "import seaborn as sns\n", "import matplotlib.pyplot as plt\n", "\n", "# Rows are true classes, columns are predicted classes\n", "conf_matrix = confusion_matrix(y_true=true_labels, y_pred=predictions)\n", "\n", "# Draw the annotated heatmap on an explicit Axes\n", "fig, ax = plt.subplots()\n", "sns.heatmap(conf_matrix, annot=True, fmt='d', cmap='Blues', ax=ax)\n", "ax.set_title('Confusion Matrix')\n", "ax.set_xlabel('Predicted Labels')\n", "ax.set_ylabel('True Labels')\n", "plt.show()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 472 }, "id": "v-_7CEEPdE5T", "outputId": "8ede06f0-d250-4ead-b790-1a1a5cd39546" }, "execution_count": 28, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "

" ], "image/png": "\n" }, "metadata": {} } ] }, { "cell_type": "code", "source": [ "probabilities" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 0 }, "id": "9cz1_MhPkHXI", "outputId": "34ff1038-2d12-4b24-8494-93c5bee91acf" }, "execution_count": 31, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "[0.50001657,\n", " 0.73180765,\n", " 0.50006306,\n", " 0.73142564,\n", " 0.500457,\n", " 0.730648,\n", " 0.49988672,\n", " 0.5000267,\n", " 0.49966726,\n", " 0.5005572,\n", " 0.7317519,\n", " 0.7308919,\n", " 0.73081124,\n", " 0.49979952,\n", " 0.49989775,\n", " 0.50000733,\n", " 0.73092675,\n", " 0.5000122,\n", " 0.7308941,\n", " 0.7307099,\n", " 0.49981403,\n", " 0.4999174,\n", " 0.73107773,\n", " 0.5001563,\n", " 0.5001094,\n", " 0.73106664,\n", " 0.49960276,\n", " 0.7304853,\n", " 0.4989315,\n", " 0.73073626,\n", " 0.49933076,\n", " 0.7307914,\n", " 0.4995961,\n", " 0.7309542,\n", " 0.7305881,\n", " 0.730756,\n", " 0.730791,\n", " 0.73154485,\n", " 0.73174363,\n", " 0.7310429,\n", " 0.500371,\n", " 0.5003924,\n", " 0.49990276,\n", " 0.73099464,\n", " 0.49985507,\n", " 0.73004943,\n", " 0.7308039,\n", " 0.7303853,\n", " 0.7312729,\n", " 0.50049806,\n", " 0.73019195,\n", " 0.73089105,\n", " 0.73086566,\n", " 0.49970746,\n", " 0.5002459,\n", " 0.73114836,\n", " 0.49987105,\n", " 0.5000737,\n", " 0.73095727,\n", " 0.500732,\n", " 0.7308521,\n", " 0.7298369,\n", " 0.7311641,\n", " 0.5000605,\n", " 0.49954134,\n", " 0.7313265,\n", " 0.5002616,\n", " 0.5000128,\n", " 0.4991023,\n", " 0.7312981,\n", " 0.5001435,\n", " 0.7309735,\n", " 0.73123676,\n", " 0.5000661,\n", " 0.73077166,\n", " 0.5004365,\n", " 0.73055613,\n", " 0.49987772,\n", " 0.7314142,\n", " 0.4999144,\n", " 0.73112965,\n", " 0.49877167,\n", " 0.7313731,\n", " 0.731197,\n", " 0.7311808,\n", " 0.49961644,\n", " 0.7309114,\n", " 0.7303586,\n", " 0.7301574,\n", " 0.49988666,\n", " 0.49972376,\n", " 0.73140484,\n", " 0.4999733,\n", " 0.730716,\n", " 
0.5004749,\n", " 0.4994043,\n", " 0.49974388,\n", " 0.5002577,\n", " 0.49962893,\n", " 0.7308502,\n", " 0.49997282,\n", " 0.499783,\n", " 0.50014734,\n", " 0.7308109,\n", " 0.73124427,\n", " 0.7312501,\n", " 0.73095757,\n", " 0.73110074,\n", " 0.50029385,\n", " 0.7313042,\n", " 0.73149824,\n", " 0.7311425,\n", " 0.50030893,\n", " 0.5004289,\n", " 0.500374,\n", " 0.50037163,\n", " 0.50016004,\n", " 0.73062754,\n", " 0.7315118,\n", " 0.7312957,\n", " 0.4998365,\n", " 0.5003073,\n", " 0.73148024,\n", " 0.4994193,\n", " 0.50005054,\n", " 0.500043,\n", " 0.50019634,\n", " 0.50007564,\n", " 0.730816,\n", " 0.50061077,\n", " 0.50090617,\n", " 0.7308635,\n", " 0.4996257,\n", " 0.50052005,\n", " 0.500348,\n", " 0.730758,\n", " 0.49999827,\n", " 0.73082376,\n", " 0.73042804,\n", " 0.5003271,\n", " 0.49975848,\n", " 0.7308863,\n", " 0.4998739,\n", " 0.73089147,\n", " 0.5003052,\n", " 0.7312431,\n", " 0.730764,\n", " 0.73062205,\n", " 0.73086536,\n", " 0.49991062,\n", " 0.5000819,\n", " 0.7311548,\n", " 0.73074937,\n", " 0.500564,\n", " 0.7312144,\n", " 0.4992589,\n", " 0.4999196,\n", " 0.73085165,\n", " 0.4999324,\n", " 0.5005716,\n", " 0.49969357,\n", " 0.7312011,\n", " 0.4999647,\n", " 0.50017893,\n", " 0.73152333,\n", " 0.4994444,\n", " 0.4997599,\n", " 0.5004179,\n", " 0.73094785,\n", " 0.7309258,\n", " 0.73102075,\n", " 0.5001387,\n", " 0.50104,\n", " 0.5006729,\n", " 0.49937385,\n", " 0.49972317,\n", " 0.5000464,\n", " 0.50042987,\n", " 0.7308088,\n", " 0.73105025,\n", " 0.73084617,\n", " 0.73074925,\n", " 0.5000743,\n", " 0.73082197,\n", " 0.7307466,\n", " 0.5000672,\n", " 0.7315805,\n", " 0.73120266,\n", " 0.50014526,\n", " 0.500435,\n", " 0.7312897,\n", " 0.5002499,\n", " 0.73119897,\n", " 0.7310065,\n", " 0.500142,\n", " 0.5001808,\n", " 0.49962348,\n", " 0.4998913,\n", " 0.49960577,\n", " 0.5001439,\n", " 0.50102746,\n", " 0.49943832,\n", " 0.7311595,\n", " 0.4997947,\n", " 0.7307384,\n", " 0.7310632,\n", " 0.50013834,\n", " 0.500004,\n", " 0.73076284,\n", " 
0.73124766,\n", " 0.49981838,\n", " 0.50069183,\n", " 0.7311896,\n", " 0.7308603,\n", " 0.5003158,\n", " 0.49998748,\n", " 0.50050443,\n", " 0.50021243,\n", " 0.5001541,\n", " 0.5000111,\n", " 0.7316854,\n", " 0.73132277,\n", " 0.7311376,\n", " 0.73083353,\n", " 0.5003835,\n", " 0.7307755,\n", " 0.500229,\n", " 0.73131335,\n", " 0.499826,\n", " 0.50007015,\n", " 0.7306485,\n", " 0.7310175,\n", " 0.49972215,\n", " 0.73141825,\n", " 0.49995214,\n", " 0.73113877,\n", " 0.5002716,\n", " 0.7315377,\n", " 0.7305722,\n", " 0.73093694,\n", " 0.7310239,\n", " 0.50000787,\n", " 0.49976146,\n", " 0.50018376,\n", " 0.5004636,\n", " 0.7307527,\n", " 0.73130804,\n", " 0.49945676,\n", " 0.500953,\n", " 0.4996412,\n", " 0.73141664,\n", " 0.5001029,\n", " 0.730162,\n", " 0.5001869,\n", " 0.5000522,\n", " 0.7309768,\n", " 0.73109716,\n", " 0.7310637,\n", " 0.7317514,\n", " 0.5005362,\n", " 0.730811,\n", " 0.7309047,\n", " 0.7312777,\n", " 0.73080957,\n", " 0.50036913,\n", " 0.5002395,\n", " 0.7308375,\n", " 0.7310308,\n", " 0.7312786,\n", " 0.7308834,\n", " 0.50029564,\n", " 0.73095477,\n", " 0.5003481,\n", " 0.7316858,\n", " 0.7306523,\n", " 0.73072046,\n", " 0.4992834,\n", " 0.73100144,\n", " 0.7309423,\n", " 0.73151654,\n", " 0.7308609,\n", " 0.5004142,\n", " 0.7312314,\n", " 0.730987,\n", " 0.49999905,\n", " 0.5001001,\n", " 0.49988726,\n", " 0.50020576,\n", " 0.73091674,\n", " 0.49929896,\n", " 0.73074794,\n", " 0.7310196,\n", " 0.7305999,\n", " 0.7312425,\n", " 0.50066024,\n", " 0.5000778,\n", " 0.7310708,\n", " 0.730434,\n", " 0.5001822,\n", " 0.5007469,\n", " 0.7311102,\n", " 0.730909,\n", " 0.500285,\n", " 0.4995561,\n", " 0.5001437,\n", " 0.50045866,\n", " 0.500332,\n", " 0.7308288,\n", " 0.7310978,\n", " 0.730815,\n", " 0.500071,\n", " 0.73099023,\n", " 0.5006229,\n", " 0.50006354,\n", " 0.5001445,\n", " 0.49943706,\n", " 0.49958318,\n", " 0.7308718,\n", " 0.49988833,\n", " 0.7307979,\n", " 0.7308288,\n", " 0.4997801,\n", " 0.72984207,\n", " 0.7309019,\n", " 
0.49993968,\n", " 0.50042665,\n", " 0.4991538,\n", " 0.7306923,\n", " 0.49991822,\n", " 0.7305326,\n", " 0.4990314,\n", " 0.7312928,\n", " 0.73076284,\n", " 0.7308306,\n", " 0.7312268,\n", " 0.49976528,\n", " 0.7313183,\n", " 0.5003918,\n", " 0.49920478,\n", " 0.4997604,\n", " 0.5002339,\n", " 0.50038224,\n", " 0.50027645,\n", " 0.7314119,\n", " 0.49989405,\n", " 0.50065523,\n", " 0.7318524,\n", " 0.49947733,\n", " 0.50022995,\n", " 0.4997493,\n", " 0.7311692,\n", " 0.4998921,\n", " 0.73108864,\n", " 0.4995824,\n", " 0.7304818,\n", " 0.49986705,\n", " 0.7307681,\n", " 0.7310052,\n", " 0.50001013,\n", " 0.5000905,\n", " 0.7309694,\n", " 0.5003729,\n", " 0.5002992,\n", " 0.73014164,\n", " 0.72944176,\n", " 0.5001378,\n", " 0.7307642,\n", " 0.50077254,\n", " 0.5000701,\n", " 0.7310156,\n", " 0.5004385,\n", " 0.50050604,\n", " 0.4999058,\n", " 0.49915445,\n", " 0.5001234,\n", " 0.5005926,\n", " 0.5000082,\n", " 0.7308409,\n", " 0.5005899,\n", " 0.7308915,\n", " 0.73139936,\n", " 0.731134,\n", " 0.73121774,\n", " 0.7314008,\n", " 0.49982893,\n", " 0.73072773,\n", " 0.73078096,\n", " 0.73120624,\n", " 0.73133135,\n", " 0.7306902,\n", " 0.5001705,\n", " 0.50016993,\n", " 0.5002077,\n", " 0.7313388,\n", " 0.7312992,\n", " 0.5003303,\n", " 0.7313944,\n", " 0.4998766,\n", " 0.7305423,\n", " 0.500419,\n", " 0.5008216,\n", " 0.5003547,\n", " 0.73080605,\n", " 0.5006243,\n", " 0.5001484,\n", " 0.73151827,\n", " 0.731059,\n", " 0.49982077,\n", " 0.5008315,\n", " 0.49964952,\n", " 0.4997144,\n", " 0.7306063,\n", " 0.73182696,\n", " 0.50019133,\n", " 0.7307757,\n", " 0.7310945,\n", " 0.50014395,\n", " 0.73123246,\n", " 0.730297,\n", " 0.7307318,\n", " 0.73001206,\n", " 0.50063276,\n", " 0.7310584,\n", " 0.5002733,\n", " 0.50041026,\n", " 0.50025004,\n", " 0.73078346,\n", " 0.7302773,\n", " 0.7309084,\n", " 0.50112975,\n", " 0.49992394,\n", " 0.73106194,\n", " 0.4997635,\n", " 0.49989715,\n", " 0.7308779,\n", " 0.7309803,\n", " 0.73007214,\n", " 0.7313329,\n", " 0.73106337,\n", " 
0.73103523,\n", " 0.50003296,\n", " 0.49914697,\n", " 0.49993777,\n", " 0.7311219,\n", " 0.49961913,\n", " 0.7309497,\n", " 0.7316553,\n", " 0.49975872,\n", " 0.49949923,\n", " 0.5001163,\n", " 0.50044554,\n", " 0.5006988,\n", " 0.73081887,\n", " 0.73087275,\n", " 0.49998873,\n", " 0.50010955,\n", " 0.73076105,\n", " 0.73132974,\n", " 0.7313097,\n", " 0.73069715,\n", " 0.73104626,\n", " 0.49929303,\n", " 0.7311637,\n", " 0.730876,\n", " 0.7309419,\n", " 0.7304739,\n", " 0.50054276,\n", " 0.7308374,\n", " 0.49970663,\n", " 0.7315366,\n", " 0.7311337,\n", " 0.73107797,\n", " 0.7304013,\n", " 0.5003886,\n", " 0.7312597,\n", " 0.73072237,\n", " 0.7314522,\n", " 0.4995687,\n", " 0.49863273,\n", " 0.5002072,\n", " 0.7307129,\n", " 0.49996042,\n", " 0.7312544,\n", " 0.73110586,\n", " 0.50058234,\n", " 0.731725,\n", " 0.73114425,\n", " 0.730907,\n", " 0.7306095,\n", " 0.5005258,\n", " 0.73119164,\n", " 0.7313732,\n", " 0.73052484,\n", " 0.50010157,\n", " 0.73092484,\n", " 0.73038757,\n", " 0.73064625,\n", " 0.50040454,\n", " 0.49989793,\n", " 0.49962452,\n", " 0.7303551,\n", " 0.5004355,\n", " 0.7313864,\n", " 0.7310822,\n", " 0.50022,\n", " 0.5002571,\n", " 0.5001963,\n", " 0.73091304,\n", " 0.7310061,\n", " 0.5009337,\n", " 0.7313311,\n", " 0.49970573,\n", " 0.730657,\n", " 0.49975097,\n", " 0.50015086,\n", " 0.73106664,\n", " 0.73104453,\n", " 0.499516,\n", " 0.49997747,\n", " 0.5000285,\n", " 0.73059523,\n", " 0.7311692,\n", " 0.5001043,\n", " 0.7318259,\n", " 0.73156047,\n", " 0.5024217,\n", " 0.73113364,\n", " 0.730561,\n", " 0.50058687,\n", " 0.5003162,\n", " 0.49964982,\n", " 0.5000657,\n", " 0.7304006,\n", " 0.7315703,\n", " 0.4996328,\n", " 0.49996042,\n", " 0.7309194,\n", " 0.7315101,\n", " 0.730496,\n", " 0.50003767,\n", " 0.500382,\n", " 0.7313314,\n", " 0.7306768,\n", " 0.7305257,\n", " 0.5008147,\n", " 0.7313552,\n", " 0.50030243,\n", " 0.7311979,\n", " 0.73134893,\n", " 0.7314874,\n", " 0.7306652,\n", " 0.50004214,\n", " 0.73074484,\n", " 0.49986687,\n", " 
0.7314663,\n", " 0.49975306,\n", " 0.5002723,\n", " 0.730807,\n", " 0.7312264,\n", " 0.50018156,\n", " 0.4994822,\n", " 0.5004544,\n", " 0.5003985,\n", " 0.7312361,\n", " 0.73079085,\n", " 0.49990574,\n", " 0.4999764,\n", " 0.5003374,\n", " 0.49996448,\n", " 0.73110694,\n", " 0.5001881,\n", " 0.49990138,\n", " 0.73107797,\n", " 0.5002843,\n", " 0.49970704,\n", " 0.5004353,\n", " 0.4998111,\n", " 0.73076373,\n", " 0.7308362,\n", " 0.7319336,\n", " 0.5001459,\n", " 0.5002509,\n", " 0.50068533,\n", " 0.49993563,\n", " 0.50044036,\n", " 0.73117954,\n", " 0.73077327,\n", " 0.50049245,\n", " 0.7310929,\n", " 0.73068726,\n", " 0.73148036,\n", " 0.5001762,\n", " 0.7310852,\n", " 0.5008719,\n", " 0.7308255,\n", " 0.5000462,\n", " 0.7313136,\n", " 0.73085034,\n", " 0.50015134,\n", " 0.4999105,\n", " 0.73086154,\n", " 0.49963835,\n", " 0.5004522,\n", " 0.73121697,\n", " 0.49961406,\n", " 0.50015855,\n", " 0.5000798,\n", " 0.730612,\n", " 0.49959645,\n", " 0.5004222,\n", " 0.7308763,\n", " 0.49944985,\n", " 0.73103607,\n", " 0.73106295,\n", " 0.73037004,\n", " 0.7309959,\n", " 0.50060844,\n", " 0.50053835,\n", " 0.49980637,\n", " 0.50025,\n", " 0.5003451,\n", " 0.49976826,\n", " 0.73116064,\n", " 0.49976724,\n", " 0.49998033,\n", " 0.5004538,\n", " 0.7311511,\n", " 0.7307103,\n", " 0.7309412,\n", " 0.50051445,\n", " 0.49953556,\n", " 0.4998225,\n", " 0.50022995,\n", " 0.500384,\n", " 0.49997365,\n", " 0.50016415,\n", " 0.49943322,\n", " 0.7310104,\n", " 0.5000113,\n", " 0.499704,\n", " 0.7306636,\n", " 0.49981272,\n", " 0.50003964,\n", " 0.50030863,\n", " 0.49944475,\n", " 0.5000957,\n", " 0.73141354,\n", " 0.73135346,\n", " 0.731045,\n", " 0.5008514,\n", " 0.73128545,\n", " 0.7310206,\n", " 0.73093957,\n", " 0.49999076,\n", " 0.4999869,\n", " 0.4999746,\n", " 0.49971995,\n", " 0.73199904,\n", " 0.5005905,\n", " 0.72992,\n", " 0.5000127,\n", " 0.7307081,\n", " 0.73112535,\n", " 0.4994652,\n", " 0.500238,\n", " 0.49984127,\n", " 0.5001823,\n", " 0.73131835,\n", " 
0.49999475,\n", " 0.7307068,\n", " 0.4996887,\n", " 0.7308143,\n", " 0.49995798,\n", " 0.5005579,\n", " 0.7310634,\n", " 0.49969226,\n", " 0.73096895,\n", " 0.73092955,\n", " 0.50021064,\n", " 0.500414,\n", " 0.7318217,\n", " 0.730905,\n", " 0.49989417,\n", " 0.49978337,\n", " 0.73121667,\n", " 0.50032055,\n", " 0.49971464,\n", " 0.4997864,\n", " 0.7312036,\n", " 0.4998387,\n", " 0.7308906,\n", " 0.5006489,\n", " 0.73111737,\n", " 0.73128605,\n", " 0.7310055,\n", " 0.7312846,\n", " 0.7316134,\n", " 0.7308807,\n", " 0.5000009,\n", " 0.7309372,\n", " 0.4996325,\n", " 0.49940228,\n", " 0.7315719,\n", " 0.5004744,\n", " 0.4997873,\n", " 0.7315755,\n", " 0.5006533,\n", " 0.73243576,\n", " 0.7309701,\n", " 0.49973473,\n", " 0.7306138,\n", " 0.49967209,\n", " 0.7308692,\n", " 0.49989417,\n", " 0.499644,\n", " 0.7313076,\n", " 0.50007796,\n", " 0.49990037,\n", " 0.49981666,\n", " 0.73135585,\n", " 0.49960923,\n", " 0.5002801,\n", " 0.73111933,\n", " 0.7310726,\n", " 0.50022787,\n", " 0.50028414,\n", " 0.50056696,\n", " 0.5000613,\n", " 0.50014913,\n", " 0.50090104,\n", " 0.7303854,\n", " 0.5007454,\n", " 0.73085773,\n", " 0.73124987,\n", " 0.5002411,\n", " 0.73086977,\n", " 0.7310614,\n", " 0.50075513,\n", " 0.5003276,\n", " 0.49983174,\n", " 0.5000041,\n", " 0.49975735,\n", " 0.73104745,\n", " 0.7303503,\n", " 0.49990222,\n", " 0.50014263,\n", " 0.73122156,\n", " 0.73029953,\n", " 0.49983162,\n", " 0.5000852,\n", " 0.5002018,\n", " 0.7306648,\n", " 0.7312112,\n", " 0.7308832,\n", " 0.7316932,\n", " 0.7309973,\n", " 0.73141676,\n", " 0.73055524,\n", " 0.499847,\n", " 0.49998665,\n", " 0.73146766,\n", " 0.7311589,\n", " 0.7311979,\n", " 0.731412,\n", " 0.50014156,\n", " 0.73039633,\n", " 0.5000779,\n", " 0.73071265,\n", " 0.50006896,\n", " 0.7316255,\n", " 0.49966425,\n", " 0.7314927,\n", " 0.50023115,\n", " 0.7307656,\n", " 0.49892175,\n", " 0.50019544,\n", " 0.7305355,\n", " 0.4997086,\n", " 0.73106587,\n", " 0.4996937,\n", " 0.5002188,\n", " 0.49972323,\n", " 
0.49997258,\n", " 0.5,\n", " 0.5000477,\n", " 0.7305484,\n", " 0.73153144,\n", " 0.7305603,\n", " 0.731513,\n", " 0.4999985,\n", " 0.500033,\n", " 0.730511,\n", " 0.5001859,\n", " 0.5002162,\n", " 0.5000392,\n", " 0.5003162,\n", " 0.50051683,\n", " 0.49987152,\n", " 0.73094255,\n", " 0.7314224,\n", " 0.7317076,\n", " 0.5001249,\n", " 0.5003861,\n", " 0.5003823,\n", " 0.49978647,\n", " 0.7307335,\n", " 0.49969274,\n", " 0.7309814,\n", " 0.73066837,\n", " 0.4998887,\n", " 0.73090047,\n", " 0.50015575,\n", " 0.5001306,\n", " 0.73052865,\n", " 0.50056857,\n", " 0.731086,\n", " 0.5000559,\n", " 0.7310916,\n", " 0.499573,\n", " 0.73083526,\n", " 0.4999178,\n", " 0.5004368,\n", " 0.4993534,\n", " 0.5001315,\n", " 0.49975836,\n", " 0.5001921,\n", " 0.5005086,\n", " 0.5008587,\n", " 0.50013745,\n", " 0.7309396,\n", " 0.49960726,\n", " 0.5003342,\n", " 0.5004612,\n", " 0.7311579,\n", " 0.7307819,\n", " 0.73081374,\n", " 0.50042266,\n", " 0.7310185,\n", " 0.5002655,\n", " 0.7309653,\n", " 0.7305959,\n", " 0.7313126,\n", " 0.7305068,\n", " 0.5002971,\n", " 0.7309019,\n", " 0.50075233,\n", " 0.7304313,\n", " 0.7310129,\n", " 0.49991062,\n", " 0.7312488,\n", " 0.5006484,\n", " 0.49992967,\n", " 0.7309884,\n", " 0.49991313,\n", " 0.73051506,\n", " 0.50041944,\n", " 0.49943376,\n", " 0.7319001,\n", " 0.7306008,\n", " 0.49951178,\n", " 0.73072976,\n", " 0.5002419,\n", " 0.50051296,\n", " 0.73090947,\n", " 0.5014391,\n", " 0.5003769,\n", " 0.49992514,\n", " 0.4996707,\n", " 0.49956706,\n", " 0.73120433,\n", " 0.7311659,\n", " 0.49975836,\n", " 0.7309957,\n", " 0.499763,\n", " 0.73082197,\n", " 0.73051035,\n", " 0.5005948,\n", " 0.7309045,\n", " 0.5007808,\n", " 0.4995122,\n", " 0.7305514,\n", " 0.5014271,\n", " 0.7309703,\n", " 0.73084766,\n", " 0.7306834,\n", " 0.49974015,\n", " 0.49984068,\n", " 0.73100436,\n", " 0.7316026,\n", " 0.73037916,\n", " 0.7322349,\n", " 0.7324667,\n", " 0.50036365,\n", " 0.7314384,\n", " 0.7314505,\n", " 0.49977347,\n", " 0.50027525,\n", " 
0.7308401,\n", " 0.7313605,\n", " 0.5005531,\n", " 0.73100865,\n", " 0.7313817,\n", " 0.49972442,\n", " 0.7314638,\n", " 0.49981385,\n", " 0.73070544,\n", " 0.50021625,\n", " 0.50033945,\n", " 0.73121744,\n", " 0.5000397,\n", " 0.5002741,\n", " 0.7315321,\n", " 0.7311444,\n", " 0.49989268,\n", " 0.50027364,\n", " 0.5003563,\n", " 0.731936,\n", " 0.7310723,\n", " 0.730601,\n", " 0.5002467,\n", " 0.7309612,\n", " 0.4997855,\n", " 0.7309971,\n", " 0.4995927,\n", " 0.5003692,\n", " 0.7301233,\n", " 0.7303844,\n", " 0.5005204,\n", " 0.49985984,\n", " 0.73051286,\n", " 0.5001411,\n", " 0.7310744,\n", " 0.7300225,\n", " 0.5004673,\n", " 0.49988887,\n", " 0.7311421,\n", " 0.49943298,\n", " 0.7312286,\n", " 0.4998365,\n", " 0.73095655,\n", " 0.5001351,\n", " 0.49978837,\n", " 0.49977854,\n", " 0.73069614,\n", " 0.5001848,\n", " 0.7304375,\n", " 0.50112075,\n", " 0.49927607,\n", " 0.73103297,\n", " 0.5001429,\n", " 0.73104817,\n", " 0.7311691,\n", " 0.7313848,\n", " 0.5002024,\n", " 0.5002826,\n", " 0.73135656,\n", " 0.49949756,\n", " 0.49994028,\n", " 0.73069584,\n", " 0.73052484,\n", " 0.7310688,\n", " 0.49985936,\n", " 0.50001544,\n", " 0.49982065,\n", " 0.5007602,\n", " 0.50050986,\n", " 0.73093826,\n", " 0.7307535,\n", " 0.5006642,\n", " 0.5001168,\n", " 0.50004333,\n", " 0.73083025,\n", " 0.73080844,\n", " 0.7311554,\n", " 0.49976146,\n", " 0.50003576,\n", " 0.7307183,\n", " 0.4999683,\n", " 0.49980578,\n", " 0.49976695,\n", " 0.50103486,\n", " 0.73126686,\n", " 0.50042903,\n", " 0.7311433,\n", " 0.49924415,\n", " 0.7308227,\n", " 0.73050815,\n", " 0.7303354,\n", " 0.7309623,\n", " 0.73076224,\n", " 0.49968886,\n", " 0.73079187,\n", " 0.49998474,\n", " 0.73085666,\n", " 0.73052293,\n", " 0.4997768,\n", " 0.49978182,\n", " 0.7309219,\n", " 0.50016433,\n", " 0.49916515,\n", " ...]" ] }, "metadata": {}, "execution_count": 31 } ] }, { "cell_type": "code", "source": [ "import numpy as np\n", "\n", "# Generate thresholds to test (e.g., from 0.0 to 1.0 with a step of 
0.01)\n", "# NOTE: the grid below actually sweeps only [0.35, 0.70), not 0.0-1.0.\n", "thresholds = np.arange(0.35, 0.70, 0.01)\n", "\n", "# The inference loop collects `probabilities` in a plain Python list, and\n", "# `list >= float` raises TypeError. Convert once here; np.asarray leaves an\n", "# existing ndarray untouched, so re-running this cell is safe.\n", "probabilities = np.asarray(probabilities)\n", "\n", "# NOTE(review): the displayed scores cluster near 0.50 and 0.73, i.e.\n", "# sigmoid(0) and sigmoid(1). That pattern suggests a sigmoid is applied to\n", "# model outputs that are already close to 0/1 - confirm in the inference cell.\n", "# NOTE(review): the threshold is chosen on the same test labels it is then\n", "# scored on, so the resulting metrics are optimistic; prefer a validation split.\n", "\n", "# Accuracy measured at each threshold, in sweep order\n", "accuracies = []\n", "\n", "# Best threshold seen so far and the accuracy it achieved\n", "best_threshold = 0.0\n", "best_accuracy = 0.0\n", "\n", "# Loop through thresholds to calculate accuracy\n", "for threshold in thresholds:\n", "    # Binarize the scores at the current threshold. Loop-local names are used\n", "    # so the sweep does not overwrite the notebook-level `predictions` and\n", "    # `accuracy` computed by the evaluation cells.\n", "    threshold_preds = (probabilities >= threshold).astype(int)\n", "\n", "    threshold_accuracy = accuracy_score(true_labels, threshold_preds)\n", "    accuracies.append(threshold_accuracy)\n", "\n", "    # Strict `>` keeps the lowest threshold among ties\n", "    if threshold_accuracy > best_accuracy:\n", "        best_accuracy = threshold_accuracy\n", "        best_threshold = threshold\n", "\n", "# Plot accuracy vs threshold\n", "plt.figure(figsize=(8, 6))\n", "plt.plot(thresholds, accuracies, marker='o', label='Accuracy', color='blue')\n", "plt.axvline(best_threshold, color='red', linestyle='--', label=f'Best Threshold: {best_threshold:.2f}')\n", "plt.title(\"Threshold vs Accuracy\")\n", "plt.xlabel(\"Threshold\")\n", "plt.ylabel(\"Accuracy\")\n", "plt.legend()\n", "plt.grid()\n", "plt.show()\n", "\n", "# Print the optimal threshold and corresponding accuracy\n", "print(f\"Best Threshold: {best_threshold:.2f}\")\n", "print(f\"Best Accuracy: {best_accuracy:.4f}\")" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 600 }, "id": "sG9ebO39jqop", "outputId": "f255e33e-146d-46b9-d53a-17c96407c7e2" }, "execution_count": 37, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "
" ], "image/png": "\n" }, "metadata": {} }, { "output_type": "stream", "name": "stdout", "text": [ "Best Threshold: 0.51\n", "Best Accuracy: 1.0000\n" ] } ] }, { "cell_type": "code", "source": [ "# Predictions corresponding to best_threshold.\n", "# `probabilities` is an ndarray here (converted in the sweep cell), so the\n", "# element-wise comparison is valid.\n", "predictions = (probabilities >= best_threshold).astype(int)\n", "\n", "# Calculate evaluation metrics at the selected threshold; ROC-AUC does not\n", "# depend on the threshold because it is scored on the raw probabilities.\n", "accuracy = accuracy_score(true_labels, predictions)\n", "precision = precision_score(true_labels, predictions)\n", "recall = recall_score(true_labels, predictions)\n", "f1 = f1_score(true_labels, predictions)\n", "auc_roc = roc_auc_score(true_labels, probabilities)\n", "\n", "# Print metrics\n", "print(f\"Accuracy: {accuracy:.4f}\")\n", "print(f\"Precision: {precision:.4f}\")\n", "print(f\"Recall: {recall:.4f}\")\n", "print(f\"F1 Score: {f1:.4f}\")\n", "print(f\"AUC-ROC: {auc_roc:.4f}\")\n", "\n", "# Confusion matrix for the re-thresholded predictions\n", "conf_matrix = confusion_matrix(true_labels, predictions)\n", "sns.heatmap(conf_matrix, annot=True, fmt='d', cmap='Blues')\n", "plt.title('Confusion Matrix')\n", "plt.xlabel('Predicted Labels')\n", "plt.ylabel('True Labels')\n", "plt.show()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 561 }, "id": "O3kZy5V3luFh", "outputId": "c8b156ae-5ffd-4b91-d0b6-82c6c89a599e" }, "execution_count": 39, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Accuracy: 1.0000\n", "Precision: 1.0000\n", "Recall: 1.0000\n", "F1 Score: 1.0000\n", "AUC-ROC: 1.0000\n" ] }, { "output_type": "display_data", "data": { "text/plain": [ "
" ], "image/png": "iVBORw0KGgoAAAANSUhEUgAAAiQAAAHHCAYAAACPy0PBAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjguMCwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy81sbWrAAAACXBIWXMAAA9hAAAPYQGoP6dpAABOl0lEQVR4nO3de1xU1fo/8M9wGxAcEBQGjooohqB4L51M0URQ0eMFy1uKhhoe9KR4i3NMkUr6al7zVplihqVWWoKpiCKVeEPxWuQFw5IBb0AgDAL790c/9nEEHUZnu5E+7177dZy116z97HnJ8eFZa+1RCIIggIiIiEhGZnIHQERERMSEhIiIiGTHhISIiIhkx4SEiIiIZMeEhIiIiGTHhISIiIhkx4SEiIiIZMeEhIiIiGTHhISIiIhkx4SESEIXL15EQEAA7O3toVAosHPnTpOOf/XqVSgUCsTGxpp03GdZz5490bNnT7nDICIjMSGhOu/y5ct444030Lx5c1hbW0OlUqFbt25YsWIFiouLJb12SEgIzp49i/feew+bN29G586dJb3e0zRu3DgoFAqoVKpqP8eLFy9CoVBAoVDggw8+MHr869evIyoqCunp6SaIlohqOwu5AyCSUkJCAl555RUolUqMHTsWbdq0QWlpKX788UfMmjUL58+fx8cffyzJtYuLi5Gamor//ve/mDJliiTXcHd3R3FxMSwtLSUZ3xALCwvcvXsXu3btwquvvqp3Li4uDtbW1igpKXmssa9fv44FCxagWbNmaN++fY3ft2/fvse6HhHJiwkJ1VmZmZkYMWIE3N3dceDAAbi6uornwsPDcenSJSQkJEh2/Rs3bgAAHBwcJLuGQqGAtbW1ZOMbolQq0a1bN3zxxRdVEpItW7YgKCgIX3/99VOJ5e7du6hXrx6srKyeyvWIyLQ4ZUN11qJFi1BYWIhPP/1ULxmp5OnpiTfffFN8XVZWhnfeeQctWrSAUqlEs2bN8J///Ac6nU7vfc2aNcOAAQPw448/4oUXXoC1tTWaN2+Ozz77TOwTFRUFd3d3AMCsWbOgUCjQrFkzAH9NdVT++X5RUVFQKBR6bYmJiXjppZfg4OAAOzs7eHl54T//+Y94/mFrSA4cOIDu3bvD1tYWDg4OGDRoEH7++edqr3fp0iWMGzcODg4OsLe3x/jx43H37t2Hf7APGDVqFL7//nvk5eWJbcePH8fFixcxatSoKv1v376NmTNnwtfXF3Z2dlCpVOjXrx9Onz4t9klOTsbzzz8PABg/frw49VN5nz179kSbNm2QlpaGHj16oF69euLn8uAakpCQEFhbW1e5/8DAQDRo0ADXr1+v8b0SkXSYkFCdtWvXLjRv3hwvvvhijfpPmDAB8+bNQ8eOHbFs2TL4+fkhJiYGI0aMqNL30qVLGDZsGPr06YMlS5agQYMGGDduHM6fPw8AGDp0KJYtWwYAGDlyJDZv3ozly5cbFf/58+cxYMAA6HQ6REdHY8mSJfjnP/+Jn3766ZHv279/PwIDA5Gbm4uoqChERETg8OHD6NatG65evVql/6uvvoo///wTMTExePXVVxEbG4sFCxbUOM6hQ4dCoVDgm2++Edu2bNmCVq1aoWPHjlX6X7lyBTt37sSAAQOwdOlSzJo1C2fPnoWfn5+YHHh7eyM6OhoAMGnSJGzevBmbN29Gjx49xHFu3bqFfv36oX379li+fDl69epVbXwrVqxAo0aNEBISgvLycgDARx99hH379uHDDz+Em5tbje+ViCQkENVB+fn5AgBh0KBBNeqfnp4uABAmTJig1z5z5kwBgHDgwAGxzd3dXQAgpKSkiG25ubmCUqkUZsyYIbZlZmYKAITFixfrjRkSEiK4u7tXiWH+/PnC/T+Sy5YtEwAIN27ceGjcldfYuHGj2Na+fXvB2dlZuHXrlth2+vRpwczMTBg7dmyV673++ut6Yw4ZMkRwcnJ66DXvvw9bW1tBE
ARh2LBhQu/evQVBEITy8nJBrVYLCxYsqPYzKCkpEcrLy6vch1KpFKKjo8W248ePV7m3Sn5+fgIAYd26ddWe8/Pz02vbu3evAEB49913hStXrgh2dnbC4MGDDd4jET09rJBQnVRQUAAAqF+/fo367969GwAQERGh1z5jxgwAqLLWxMfHB927dxdfN2rUCF5eXrhy5cpjx/ygyrUn3377LSoqKmr0nuzsbKSnp2PcuHFwdHQU29u2bYs+ffqI93m/sLAwvdfdu3fHrVu3xM+wJkaNGoXk5GRotVocOHAAWq222uka4K91J2Zmf/1fT3l5OW7duiVOR508ebLG11QqlRg/fnyN+gYEBOCNN95AdHQ0hg4dCmtra3z00Uc1vhYRSY8JCdVJKpUKAPDnn3/WqP9vv/0GMzMzeHp66rWr1Wo4ODjgt99+02tv2rRplTEaNGiAO3fuPGbEVQ0fPhzdunXDhAkT4OLighEjRmDbtm2PTE4q4/Ty8qpyztvbGzdv3kRRUZFe+4P30qBBAwAw6l769++P+vXrY+vWrYiLi8Pzzz9f5bOsVFFRgWXLlqFly5ZQKpVo2LAhGjVqhDNnziA/P7/G1/zHP/5h1ALWDz74AI6OjkhPT8fKlSvh7Oxc4/cSkfSYkFCdpFKp4ObmhnPnzhn1vgcXlT6Mubl5te2CIDz2NSrXN1SysbFBSkoK9u/fjzFjxuDMmTMYPnw4+vTpU6Xvk3iSe6mkVCoxdOhQbNq0CTt27HhodQQAFi5ciIiICPTo0QOff/459u7di8TERLRu3brGlSDgr8/HGKdOnUJubi4A4OzZs0a9l4ikx4SE6qwBAwbg8uXLSE1NNdjX3d0dFRUVuHjxol57Tk4O8vLyxB0zptCgQQO9HSmVHqzCAICZmRl69+6NpUuX4sKFC3jvvfdw4MABHDx4sNqxK+PMyMiocu6XX35Bw4YNYWtr+2Q38BCjRo3CqVOn8Oeff1a7ELjSV199hV69euHTTz/FiBEjEBAQAH9//yqfSU2Tw5ooKirC+PHj4ePjg0mTJmHRokU4fvy4ycYnoifHhITqrNmzZ8PW1hYTJkxATk5OlfOXL1/GihUrAPw15QCgyk6YpUuXAgCCgoJMFleLFi2Qn5+PM2fOiG3Z2dnYsWOHXr/bt29XeW/lA8Ie3IpcydXVFe3bt8emTZv0/oE/d+4c9u3bJ96nFHr16oV33nkHq1atglqtfmg/c3PzKtWX7du3448//tBrq0ycqkvejDVnzhxkZWVh06ZNWLp0KZo1a4aQkJCHfo5E9PTxwWhUZ7Vo0QJbtmzB8OHD4e3trfek1sOHD2P79u0YN24cAKBdu3YICQnBxx9/jLy8PPj5+eHYsWPYtGkTBg8e/NAtpY9jxIgRmDNnDoYMGYJ///vfuHv3LtauXYvnnntOb1FndHQ0UlJSEBQUBHd3d+Tm5mLNmjVo3LgxXnrppYeOv3jxYvTr1w8ajQahoaEoLi7Ghx9+CHt7e0RFRZnsPh5kZmaGuXPnGuw3YMAAREdHY/z48XjxxRdx9uxZxMXFoXnz5nr9WrRoAQcHB6xbtw7169eHra0tunTpAg8PD6PiOnDgANasWYP58+eL25A3btyInj174u2338aiRYuMGo+IJCLzLh8iyf3666/CxIkThWbNmglWVlZC/fr1hW7dugkffvihUFJSIva7d++esGDBAsHDw0OwtLQUmjRpIkRGRur1EYS/tv0GBQVVuc6D200ftu1XEARh3759Qps2bQQrKyvBy8tL+Pzzz6ts+01KShIGDRokuLm5CVZWVoKbm5swcuRI4ddff61yjQe3xu7fv1/o1q2bYGNjI6hUKmHgwIHChQsX9PpUXu/BbcUbN24UAAiZmZkP/UwFQX/b78M8bNvvjBkzBFdXV8HGxkbo1q2bkJqaWu123W+//Vbw8fERLCws9O7Tz89PaN26dbXXvH+cgoICwd3dXejYsaNw7949vX7Tp08XzMzMh
NTU1EfeAxE9HQpBMGLlGhEREZEEuIaEiIiIZMeEhIiIiGTHhISIiIhkx4SEiIiIZMeEhIiIiGTHhISIiIhkx4SEiIiIZFcnn9Rq02GK3CEQ1Up3jq+SOwSiWsf6KfxLaKp/l4pP1d2fYVZIiIiISHZ1skJCRERUqyj4+78hTEiIiIikplDIHUGtx4SEiIhIaqyQGMRPiIiIiGTHCgkREZHUOGVjEBMSIiIiqXHKxiB+QkRERCQ7VkiIiIikxikbg5iQEBERSY1TNgbxEyIiIiLZsUJCREQkNU7ZGMSEhIiISGqcsjGInxARERHJjhUSIiIiqXHKxiAmJERERFLjlI1BTEiIiIikxgqJQUzZiIiISHaskBAREUmNUzYG8RMiIiKSmsLMNMcTeP/996FQKDBt2jSxraSkBOHh4XBycoKdnR2Cg4ORk5Oj976srCwEBQWhXr16cHZ2xqxZs1BWVqbXJzk5GR07doRSqYSnpydiY2ONjo8JCRERUR13/PhxfPTRR2jbtq1e+/Tp07Fr1y5s374dhw4dwvXr1zF06FDxfHl5OYKCglBaWorDhw9j06ZNiI2Nxbx588Q+mZmZCAoKQq9evZCeno5p06ZhwoQJ2Lt3r1ExMiEhIiKSmpnCNMdjKCwsxOjRo/HJJ5+gQYMGYnt+fj4+/fRTLF26FC+//DI6deqEjRs34vDhwzhy5AgAYN++fbhw4QI+//xztG/fHv369cM777yD1atXo7S0FACwbt06eHh4YMmSJfD29saUKVMwbNgwLFu2zLiP6LHujoiIiGpOximb8PBwBAUFwd/fX689LS0N9+7d02tv1aoVmjZtitTUVABAamoqfH194eLiIvYJDAxEQUEBzp8/L/Z5cOzAwEBxjJriolYiIqJnhE6ng06n02tTKpVQKpXV9v/yyy9x8uRJHD9+vMo5rVYLKysrODg46LW7uLhAq9WKfe5PRirPV557VJ+CggIUFxfDxsamRvfGCgkREZHUFAqTHDExMbC3t9c7YmJiqr3ktWvX8OabbyIuLg7W1tZP+YaNx4SEiIhIaiaasomMjER+fr7eERkZWe0l09LSkJubi44dO8LCwgIWFhY4dOgQVq5cCQsLC7i4uKC0tBR5eXl678vJyYFarQYAqNXqKrtuKl8b6qNSqWpcHQGYkBARET0zlEolVCqV3vGw6ZrevXvj7NmzSE9PF4/OnTtj9OjR4p8tLS2RlJQkvicjIwNZWVnQaDQAAI1Gg7NnzyI3N1fsk5iYCJVKBR8fH7HP/WNU9qkco6a4hoSIiEhqMjw6vn79+mjTpo1em62tLZycnMT20NBQREREwNHRESqVClOnToVGo0HXrl0BAAEBAfDx8cGYMWOwaNEiaLVazJ07F+Hh4WIiFBYWhlWrVmH27Nl4/fXXceDAAWzbtg0JCQlGxcuEhIiISGq19Emty5Ytg5mZGYKDg6HT6RAYGIg1a9aI583NzREfH4/JkydDo9HA1tYWISEhiI6OFvt4eHggISEB06dPx4oVK9C4cWOsX78egYGBRsWiEARBMNmd1RI2HabIHQJRrXTn+Cq5QyCqdayfwq/mNoEfmGSc4r0zTTJObVQ7UzYiIiL6W+GUDRERkdRq6ZRNbcKEhIiISGoyLGp91jBlIyIiItmxQkJERCQ1TtkYxISEiIhIapyyMYgpGxEREcmOFRIiIiKpccrGICYkREREUmNCYhA/ISIiIpIdKyRERERS46JWg5iQEBERSY1TNgYxISEiIpIaKyQGMWUjIiIi2bFCQkREJDVO2RjEhISIiEhqnLIxiCkbERERyY4VEiIiIokpWCExiAkJERGRxJiQGMYpGyIiIpIdKyRERERSY4HEICYkREREEuOUjWGcsiEiIiLZsUJCREQkMVZIDGNCQkREJDEmJIYxISEiIpIYExLDuIaEiIiIZMcKCRERkdRYIDGICQkREZHEOGVjGKdsiIiISHaskBAREUmMFRLDmJAQERFJj
AmJYZyyISIiqoPWrl2Ltm3bQqVSQaVSQaPR4PvvvxfP9+zZEwqFQu8ICwvTGyMrKwtBQUGoV68enJ2dMWvWLJSVlen1SU5ORseOHaFUKuHp6YnY2NjHipcVEiIiIonJUSFp3Lgx3n//fbRs2RKCIGDTpk0YNGgQTp06hdatWwMAJk6ciOjoaPE99erVE/9cXl6OoKAgqNVqHD58GNnZ2Rg7diwsLS2xcOFCAEBmZiaCgoIQFhaGuLg4JCUlYcKECXB1dUVgYKBR8SoEQRBMcN+1ik2HKXKHQFQr3Tm+Su4QiGod66fwq7lTyBcmGefWppFP9H5HR0csXrwYoaGh6NmzJ9q3b4/ly5dX2/f777/HgAEDcP36dbi4uAAA1q1bhzlz5uDGjRuwsrLCnDlzkJCQgHPnzonvGzFiBPLy8rBnzx6jYuOUDRERUR1XXl6OL7/8EkVFRdBoNGJ7XFwcGjZsiDZt2iAyMhJ3794Vz6WmpsLX11dMRgAgMDAQBQUFOH/+vNjH399f71qBgYFITU01OkZO2RAREUnMVFM2Op0OOp1Or02pVEKpVFbb/+zZs9BoNCgpKYGdnR127NgBHx8fAMCoUaPg7u4ONzc3nDlzBnPmzEFGRga++eYbAIBWq9VLRgCIr7Va7SP7FBQUoLi4GDY2NjW+NyYkREREEjNVQhITE4MFCxbotc2fPx9RUVHV9vfy8kJ6ejry8/Px1VdfISQkBIcOHYKPjw8mTZok9vP19YWrqyt69+6Ny5cvo0WLFiaJ1xhMSIiIiCRmqoQkMjISERERem0Pq44AgJWVFTw9PQEAnTp1wvHjx7FixQp89NFHVfp26dIFAHDp0iW0aNECarUax44d0+uTk5MDAFCr1eL/Vrbd30elUhlVHQG4hoSIiOiZoVQqxW28lcejEpIHVVRUVJnyqZSeng4AcHV1BQBoNBqcPXsWubm5Yp/ExESoVCpx2kej0SApKUlvnMTERL11KjXFCgkREZHUZHguWmRkJPr164emTZvizz//xJYtW5CcnIy9e/fi8uXL2LJlC/r37w8nJyecOXMG06dPR48ePdC2bVsAQEBAAHx8fDBmzBgsWrQIWq0Wc+fORXh4uJgEhYWFYdWqVZg9ezZef/11HDhwANu2bUNCQoLR8TIhISIikpgczyHJzc3F2LFjkZ2dDXt7e7Rt2xZ79+5Fnz59cO3aNezfvx/Lly9HUVERmjRpguDgYMydO1d8v7m5OeLj4zF58mRoNBrY2toiJCRE77klHh4eSEhIwPTp07FixQo0btwY69evN/oZJACfQ0L0t8LnkBBV9TSeQ+IyYbtJxslZ/4pJxqmNWCEhIiKSGL/LxjAmJERERBJjQmIYd9kQERGR7FghISIikhgrJIYxISEiIpIa8xGDOGVDREREsmOFhIiISGKcsjGMCQkREZHEmJAYxoSEiIhIYkxIDOMaEiIiIpIdKyRERERSY4HEICYkREREEuOUjWGcsiEiIiLZMSEho8wc3wfFp1Zh8cxgAEADVT0snfMKTu94G7dTl+LX3dFYMnsYVHbWeu/r5NMUu9dNRXbKIlw/tAjfrQ6H73P/qPYazZs0RO6PHyA7ZZHk90P0tH25JQ79+ryM5zv4YvSIV3D2zBm5Q6KnQKFQmOSoy5iQUI118mmK0OBuOPPr72KbayN7uDayR+SyHej0ykJMnP85+rzog3XzR4t9bG2s8O3qcFzT3kGPMR+g9/ilKLxbgu9Wh8PCQv+voIWFGT6LGY+fTl1+avdF9LTs+X43PlgUgzf+FY4vt++Al1crTH4jFLdu3ZI7NJIYExLDmJBQjdjaWGHjwnH41ztfIK+gWGy/cDkbI2eux+6Uc8j8/SYOHf8VUat2oX+PNjA3/+uvl5eHGk4OtnhnbTwu/paLn69o8d5H30PdUIWmro5614n610BkZObg630nn+r9ET0NmzdtxNBhr2LwkGC08PTE3PkLYG1tjZ3ffC13aESykzUhu
XnzJhYtWoQhQ4ZAo9FAo9FgyJAhWLx4MW7cuCFnaPSA5ZHDseeHczh4NMNgX1V9axQUlaC8vAIA8OvVHNy8U4iQwS/C0sIc1kpLjBuswc9XsvHb9dvi+/yefw5D+3TAtPe3SXYfRHK5V1qKny+cR1fNi2KbmZkZunZ9EWdOn5IxMnoaWCExTLaE5Pjx43juueewcuVK2Nvbo0ePHujRowfs7e2xcuVKtGrVCidOnJArPLrPK4Gd0L5VE7z94XcG+zo52CJyYj9s+Pqw2FZ4V4fAiSswsv/zuHNkGW7+tAR9XvTG4ClrxKTF0d4Wnyx4DRPnb8afRSWS3QuRXO7k3UF5eTmcnJz02p2cnHDz5k2ZoqKnRmGiow6Tbdvv1KlT8corr2DdunVVsj5BEBAWFoapU6ciNTX1kePodDrodDr991eUQ2FmbvKY/44auzhg8axgDJi8CrrSskf2rW9rjR0rJ+PnK9l496MEsd1aaYl180cj9fQVhERuhLm5GaaN7Y1vVk7GS68tRonuHta8PRJb95zATye5doSI6O9ItoTk9OnTiI2NrbYEpVAoMH36dHTo0MHgODExMViwYIFem7nL87B0fcFksf6ddfBuChcnFVK3zBHbLCzM8VLHFggb3gP2XaahokKAXT0lvlv9L/x5twTDIz5BWVmF2H94v85o6uYIv5AlEAQBABASGYvslEUY2LMttu9Ng98LzyHIzxfTxvQG8NffAXNzM/x5fAXC3/0Cn3175OneOJGJNXBoAHNz8yoLWG/duoWGDRvKFBU9LXV9usUUZEtI1Go1jh07hlatWlV7/tixY3BxcTE4TmRkJCIiIvTanLvPeUhvMtbBYxnoNOw9vbaPF7yGjMwcLIlNREWFgPq21ti1Jhy60jIMm/ZRlUpKPWsrVFQIYjICABWCAEEAzP7/D2nPkCUwN/vfDOKAnm0xY5w/eo1biuu5edLdINFTYmllBW+f1jh6JBUv9/YHAFRUVODo0VSMGPmazNGR1JiQGCZbQjJz5kxMmjQJaWlp6N27t5h85OTkICkpCZ988gk++OADg+MolUoolUq9Nk7XmE7hXR0uXM7WaysqLsXt/CJcuJyN+rbWiF8TDhtrK4z/7yaobK2hsv3rGSQ37hSiokJA0pFfsHDaYCyPfBVrvzwEM4UCM8cHoKy8HIdO/AoAyMjM0btGR5+mqBCEKtcmepaNCRmPt/8zB61bt0Eb37b4fPMmFBcXY/CQoXKHRhJjPmKYbAlJeHg4GjZsiGXLlmHNmjUoLy8HAJibm6NTp06IjY3Fq6++Kld4VEPtWzXBC209AAAXdkXpnfPqPw9Z2bfx69UcBL/5Ef77Rj8kb5qBigoBp3/5HYPC10B7s0CGqInk0bdff9y5fRtrVq3EzZs34NXKG2s+Wg8nTtkQQSHcX0eXyb1798RV5g0bNoSlpeUTjWfTYYopwiKqc+4cXyV3CES1jvVT+NW85aw9Jhnn4uK+JhmnNqoVX65naWkJV1dXucMgIiKSBKdsDOOTWomIiEh2taJCQkREVJdxl41hTEiIiIgkxnzEME7ZEBERkexYISEiIpKYmRlLJIYwISEiIpIYp2wM45QNERERyY4VEiIiIolxl41hrJAQERFJTKEwzWGMtWvXom3btlCpVFCpVNBoNPj+++/F8yUlJQgPD4eTkxPs7OwQHByMnBz97xXLyspCUFAQ6tWrB2dnZ8yaNQtlZfpfoJqcnIyOHTtCqVTC09MTsbGxj/UZMSEhIiKSmEKhMMlhjMaNG+P9999HWloaTpw4gZdffhmDBg3C+fPnAQDTp0/Hrl27sH37dhw6dAjXr1/H0KH/+6LH8vJyBAUFobS0FIcPH8amTZsQGxuLefPmiX0yMzMRFBSEXr16IT09HdOmTcOECROwd+9e4z+j2vBdNqbG77Ihqh6/y4aoqqfxXTZt5+03yThnov2f6P2Ojo5YvHgxhg0bhkaNGmHLli0YNmwYAOCXX36Bt
7c3UlNT0bVrV3z//fcYMGAArl+/DhcXFwDAunXrMGfOHNy4cQNWVlaYM2cOEhIScO7cOfEaI0aMQF5eHvbsMe77e1ghISIikpipKiQ6nQ4FBQV6h06nM3j98vJyfPnllygqKoJGo0FaWhru3bsHf///JTitWrVC06ZNkZqaCgBITU2Fr6+vmIwAQGBgIAoKCsQqS2pqqt4YlX0qxzAGExIiIiKJmWoNSUxMDOzt7fWOmJiYh1737NmzsLOzg1KpRFhYGHbs2AEfHx9otVpYWVnBwcFBr7+Liwu0Wi0AQKvV6iUjlecrzz2qT0FBAYqLi436jLjLhoiI6BkRGRmJiIgIvTalUvnQ/l5eXkhPT0d+fj6++uorhISE4NChQ1KH+ViYkBAREUnMVNt+lUrlIxOQB1lZWcHT0xMA0KlTJxw/fhwrVqzA8OHDUVpairy8PL0qSU5ODtRqNQBArVbj2LFjeuNV7sK5v8+DO3NycnKgUqlgY2Nj1L1xyoaIiEhicmz7rU5FRQV0Oh06deoES0tLJCUliecyMjKQlZUFjUYDANBoNDh79ixyc3PFPomJiVCpVPDx8RH73D9GZZ/KMYzBCgkREVEdFBkZiX79+qFp06b4888/sWXLFiQnJ2Pv3r2wt7dHaGgoIiIi4OjoCJVKhalTp0Kj0aBr164AgICAAPj4+GDMmDFYtGgRtFot5s6di/DwcLFKExYWhlWrVmH27Nl4/fXXceDAAWzbtg0JCQlGx8uEhIiISGJyPKk1NzcXY8eORXZ2Nuzt7dG2bVvs3bsXffr0AQAsW7YMZmZmCA4Ohk6nQ2BgINasWSO+39zcHPHx8Zg8eTI0Gg1sbW0REhKC6OhosY+HhwcSEhIwffp0rFixAo0bN8b69esRGBhodLx8DgnR3wifQ0JU1dN4Dknndw+aZJwTc3uZZJzaiGtIiIiISHacsiEiIpIYv1zPMCYkREREEmM+YhgTEiIiIomxQmIY15AQERGR7FghISIikhgLJIYxISEiIpIYp2wM45QNERERyY4VEiIiIomxQGIYExIiIiKJccrGME7ZEBERkexYISEiIpIYCySGMSEhIiKSGKdsDOOUDREREcmOFRIiIiKJsUJiGBMSIiIiiTEfMYwJCRERkcRYITGMa0iIiIhIdqyQEBERSYwFEsOYkBAREUmMUzaGccqGiIiIZMcKCRERkcRYIDGMCQkREZHEzJiRGMQpGyIiIpIdKyREREQSY4HEMCYkREREEuMuG8OYkBAREUnMjPmIQVxDQkRERLJjhYSIiEhinLIxzOgKyaZNm5CQkCC+nj17NhwcHPDiiy/it99+M2lwREREdYFCYZqjLjM6IVm4cCFsbGwAAKmpqVi9ejUWLVqEhg0bYvr06SYPkIiIiOo+o6dsrl27Bk9PTwDAzp07ERwcjEmTJqFbt27o2bOnqeMjIiJ65ilQx8sbJmB0hcTOzg63bt0CAOzbtw99+vQBAFhbW6O4uNi00REREdUBZgrTHMaIiYnB888/j/r168PZ2RmDBw9GRkaGXp+ePXtCoVDoHWFhYXp9srKyEBQUhHr16sHZ2RmzZs1CWVmZXp/k5GR07NgRSqUSnp6eiI2NNfozMrpC0qdPH0yYMAEdOnTAr7/+iv79+wMAzp8/j2bNmhkdABEREZneoUOHEB4ejueffx5lZWX4z3/+g4CAAFy4cAG2trZiv4kTJyI6Olp8Xa9ePfHP5eXlCAoKglqtxuHDh5GdnY2xY8fC0tISCxcuBABkZmYiKCgIYWFhiIuLQ1JSEiZMmABXV1cEBgbWOF6jE5LVq1dj7ty5uHbtGr7++ms4OTkBANLS0jBy5EhjhyMiIqrz5Nhls2fPHr3XsbGxcHZ2RlpaGnr06CG216tXD2q1utox9u3bhwsXLmD//v1wcXFB+/bt8c4772DOnDmIioqClZUV1q1bBw8PDyxZsgQA4O3tjR9//BHLli0zKiExesrGwcEBq1atwrfff
ou+ffuK7QsWLMB///tfY4cjIiKq80y1y0an06GgoEDv0Ol0NYohPz8fAODo6KjXHhcXh4YNG6JNmzaIjIzE3bt3xXOpqanw9fWFi4uL2BYYGIiCggKcP39e7OPv7683ZmBgIFJTU436jGpUITlz5kyNB2zbtq1RARAREVHNxMTEYMGCBXpt8+fPR1RU1CPfV1FRgWnTpqFbt25o06aN2D5q1Ci4u7vDzc0NZ86cwZw5c5CRkYFvvvkGAKDVavWSEQDia61W+8g+BQUFKC4uFnfmGlKjhKR9+/ZQKBQQBKHa85XnFAoFysvLa3RhIiKivwszE03ZREZGIiIiQq9NqVQafF94eDjOnTuHH3/8Ua990qRJ4p99fX3h6uqK3r174/Lly2jRooVJYq6pGiUkmZmZUsdBRERUZ5lqCYlSqaxRAnK/KVOmID4+HikpKWjcuPEj+3bp0gUAcOnSJbRo0QJqtRrHjh3T65OTkwMA4roTtVottt3fR6VS1bg6AtQwIXF3d6/xgERERKRPjkWtgiBg6tSp2LFjB5KTk+Hh4WHwPenp6QAAV1dXAIBGo8F7772H3NxcODs7AwASExOhUqng4+Mj9tm9e7feOImJidBoNEbF+1hfrrd582Z069YNbm5u4uPily9fjm+//fZxhiMiIiITCw8Px+eff44tW7agfv360Gq10Gq14jPDLl++jHfeeQdpaWm4evUqvvvuO4wdOxY9evQQ14MGBATAx8cHY8aMwenTp7F3717MnTsX4eHhYqUmLCwMV65cwezZs/HLL79gzZo12LZtm9FPbzc6IVm7di0iIiLQv39/5OXliWtGHBwcsHz5cmOHIyIiqvPk+C6btWvXIj8/Hz179oSrq6t4bN26FQBgZWWF/fv3IyAgAK1atcKMGTMQHByMXbt2iWOYm5sjPj4e5ubm0Gg0eO211zB27Fi955Z4eHggISEBiYmJaNeuHZYsWYL169cbteUXABTCw1aqPoSPjw8WLlyIwYMHo379+jh9+jSaN2+Oc+fOoWfPnrh586ZRAUjBpsMUuUMgqpXuHF8ldwhEtY71U/je++GbTplknK0hHUwyTm1kdIUkMzMTHTpU/UCUSiWKiopMEhQRERH9vRidkHh4eIiLXu63Z88eeHt7myImIiKiOkVhoqMuM7pQFRERgfDwcJSUlEAQBBw7dgxffPEFYmJisH79eiliJCIieqbJscvmWWN0QjJhwgTY2Nhg7ty5uHv3LkaNGgU3NzesWLECI0aMkCJGIiIiquMeaynP6NGjMXr0aNy9exeFhYXi3mQiIiKqyowFEoMee21xbm4uMjIyAPxVimrUqJHJgiIiIqpLOGVjmNGLWv/880+MGTMGbm5u8PPzg5+fH9zc3PDaa6+J3yRIREREZAyjE5IJEybg6NGjSEhIQF5eHvLy8hAfH48TJ07gjTfekCJGIiKiZ5ocD0Z71hg9ZRMfH4+9e/fipZdeEtsCAwPxySefoG/fviYNjoiIqC7glI1hRickTk5OsLe3r9Jub2+PBg0amCQoIiKiuoSLWg0zespm7ty5iIiIgFarFdu0Wi1mzZqFt99+26TBERER0d9DjSokHTp00Cs3Xbx4EU2bNkXTpk0BAFlZWVAqlbhx4wbXkRARET2AUzaG1SghGTx4sMRhEBER1V1MRwyrUUIyf/58qeMgIiKiv7Gn8KXLREREf29mnLIxyOiEpLy8HMuWLcO2bduQlZWF0tJSvfO3b982WXBERER1AfMRw4zeZbNgwQIsXboUw4cPR35+PiIiIjB06FCYmZkhKipKghCJiIiorjM6IYmLi8Mnn3yCGTNmwMLCAiNHjsT69esxb948HDlyRIoYiYiInmkKhcIkR11mdEKi1Wrh6+sLALCzsxO/v2bAgAFISEgwbXRERER1AB8db5jRCUnjxo2RnZ0NAGjRogX27dsHADh+/DiUSqVpoyMiIqK/BaMTkiFDhiApKQkAMHXqVLz99tto2
bIlxo4di9dff93kARIRET3rzBQKkxx1mdG7bN5//33xz8OHD4e7uzsOHz6Mli1bYuDAgSYNjoiIqC6o47mESRhdIXlQ165dERERgS5dumDhwoWmiImIiKhO4aJWw544IamUnZ3NL9cjIiKix1Inn9R65/gquUMgqpUa9H3fcCeiv5ni/W9Jfg2T/fZfh9XJhISIiKg2qevTLabApI2IiIhkV+MKSURExCPP37hx44mDISIiqovMWCAxqMYJyalTpwz26dGjxxMFQ0REVBcxITGsxgnJwYMHpYyDiIiI/sa4qJWIiEhiXNRqGBMSIiIiiXHKxjDusiEiIqqDYmJi8Pzzz6N+/fpwdnbG4MGDkZGRodenpKQE4eHhcHJygp2dHYKDg5GTk6PXJysrC0FBQahXrx6cnZ0xa9YslJWV6fVJTk5Gx44doVQq4enpidjYWKPjZUJCREQkMYXCNIcxDh06hPDwcBw5cgSJiYm4d+8eAgICUFRUJPaZPn06du3ahe3bt+PQoUO4fv06hg4dKp4vLy9HUFAQSktLcfjwYWzatAmxsbGYN2+e2CczMxNBQUHo1asX0tPTMW3aNEyYMAF79+417jMSBEEw7hZrv5Iyw32I/o74pFaiqp7Gk1rf2v2rScZ5v/9zj/3eGzduwNnZGYcOHUKPHj2Qn5+PRo0aYcuWLRg2bBgA4JdffoG3tzdSU1PRtWtXfP/99xgwYACuX78OFxcXAMC6deswZ84c3LhxA1ZWVpgzZw4SEhJw7tw58VojRoxAXl4e9uzZU+P4HqtC8sMPP+C1116DRqPBH3/8AQDYvHkzfvzxx8cZjoiIqE4zM9Gh0+lQUFCgd+h0uhrFkJ+fDwBwdHQEAKSlpeHevXvw9/cX+7Rq1QpNmzZFamoqACA1NRW+vr5iMgIAgYGBKCgowPnz58U+949R2adyjJoyOiH5+uuvERgYCBsbG5w6dUr8IPLz8/ltv0RERBKKiYmBvb293hETE2PwfRUVFZg2bRq6deuGNm3aAAC0Wi2srKzg4OCg19fFxQVarVbsc38yUnm+8tyj+hQUFKC4uLjG92Z0QvLuu+9i3bp1+OSTT2BpaSm2d+vWDSdPnjR2OCIiojrPVGtIIiMjkZ+fr3dERkYavH54eDjOnTuHL7/88inc7eMxettvRkZGtU9ktbe3R15eniliIiIiqlPMTPQcEqVSCaVSadR7pkyZgvj4eKSkpKBx48Ziu1qtRmlpKfLy8vSqJDk5OVCr1WKfY8eO6Y1XuQvn/j4P7szJycmBSqWCjY1NjeM0ukKiVqtx6dKlKu0//vgjmjdvbuxwREREJAFBEDBlyhTs2LEDBw4cgIeHh975Tp06wdLSEklJSWJbRkYGsrKyoNFoAAAajQZnz55Fbm6u2CcxMREqlQo+Pj5in/vHqOxTOUZNGZ2QTJw4EW+++SaOHj0KhUKB69evIy4uDjNnzsTkyZONHY6IiKjOk2Pbb3h4OD7//HNs2bIF9evXh1arhVarFdd12NvbIzQ0FBERETh48CDS0tIwfvx4aDQadO3aFQAQEBAAHx8fjBkzBqdPn8bevXsxd+5chIeHi5WasLAwXLlyBbNnz8Yvv/yCNWvWYNu2bZg+fbpR8Ro9ZfPWW2+hoqICvXv3xt27d9GjRw8olUrMnDkTU6dONXY4IiKiOk+OJ7WuXbsWANCzZ0+99o0bN2LcuHEAgGXLlsHMzAzBwcHQ6XQIDAzEmjVrxL7m5uaIj4/H5MmTodFoYGtri5CQEERHR4t9PDw8kJCQgOnTp2PFihVo3Lgx1q9fj8DAQKPifeznkJSWluLSpUsoLCyEj48P7OzsHmcYSfA5JETV43NIiKp6Gs8hidp30TTjBLQ0yTi10WN/l42VlZU4f0REREQPZ6pFrXWZ0QlJr169HvmthQcOHHiigIiIiOoa5iOGGZ2QtG/fXu/1vXv3kJ6ejnPnziEkJMRUcREREdHfiNEJybJly6ptj4qKQ
mFh4RMHREREVNfIsaj1WWOyb/t97bXXsGHDBlMNR0REVGcoTPRfXfbYi1oflJqaCmtra1MNR0REVGewQmKY0QnJ0KFD9V4LgoDs7GycOHECb7/9tskCIyIior8PoxMSe3t7vddmZmbw8vJCdHQ0AgICTBYYERFRXcEKiWFGJSTl5eUYP348fH190aBBA6liIiIiqlMe9bgM+otRi1rNzc0REBDAb/UlIiIikzJ6l02bNm1w5coVKWIhIiKqk8wUpjnqMqMTknfffRczZ85EfHw8srOzUVBQoHcQERGRPjm+7fdZU+M1JNHR0ZgxYwb69+8PAPjnP/+pNycmCAIUCgXKy8tNHyURERHVaTVOSBYsWICwsDAcPHhQyniIiIjqHH65nmE1TkgEQQAA+Pn5SRYMERFRXVTX13+YglFrSLhtiYiIiKRg1HNInnvuOYNJye3bt58oICIiorqGv88bZlRCsmDBgipPaiUiIqJHM6vjX4xnCkYlJCNGjICzs7NUsRAREdVJrJAYVuM1JFw/QkRERFIxepcNERERGYe7bAyrcUJSUVEhZRxERER1Fp9DYpjRj44nIiIiMjWjFrUSERGR8VggMYwJCRERkcQ4ZWMYp2yIiIhIdqyQEBERSYwFEsOYkBAREUmM0xGG8TMiIiIi2bFCQkREJDE+7dwwJiREREQSYzpiGBMSIiIiiXHbr2FcQ0JERFRHpaSkYODAgXBzc4NCocDOnTv1zo8bNw4KhULv6Nu3r16f27dvY/To0VCpVHBwcEBoaCgKCwv1+pw5cwbdu3eHtbU1mjRpgkWLFhkdKxMSIiIiiSlMdBirqKgI7dq1w+rVqx/ap2/fvsjOzhaPL774Qu/86NGjcf78eSQmJiI+Ph4pKSmYNGmSeL6goAABAQFwd3dHWloaFi9ejKioKHz88cdGxcopGyIiIonJNWPTr18/9OvX75F9lEol1Gp1ted+/vln7NmzB8ePH0fnzp0BAB9++CH69++PDz74AG5uboiLi0NpaSk2bNgAKysrtG7dGunp6Vi6dKle4mIIKyRERETPCJ1Oh4KCAr1Dp9M90ZjJyclwdnaGl5cXJk+ejFu3bonnUlNT4eDgICYjAODv7w8zMzMcPXpU7NOjRw9YWVmJfQIDA5GRkYE7d+7UOA4mJERERBJ7cJ3G4x4xMTGwt7fXO2JiYh47rr59++Kzzz5DUlIS/u///g+HDh1Cv379UF5eDgDQarVwdnbWe4+FhQUcHR2h1WrFPi4uLnp9Kl9X9qkJTtkQERFJzFS//UdGRiIiIkKvTalUPvZ4I0aMEP/s6+uLtm3bokWLFkhOTkbv3r0fe9zHwQoJERHRM0KpVEKlUukdT5KQPKh58+Zo2LAhLl26BABQq9XIzc3V61NWVobbt2+L607UajVycnL0+lS+ftjalOowISEiIpKYqaZspPb777/j1q1bcHV1BQBoNBrk5eUhLS1N7HPgwAFUVFSgS5cuYp+UlBTcu3dP7JOYmAgvLy80aNCgxtdmQkJERCQxubb9FhYWIj09Henp6QCAzMxMpKenIysrC4WFhZg1axaOHDmCq1evIikpCYMGDYKnpycCAwMBAN7e3ujbty8mTpyIY8eO4aeffsKUKVMwYsQIuLm5AQBGjRoFKysrhIaG4vz589i6dStWrFhRZWrJECYkREREddSJEyfQoUMHdOjQAQAQERGBDh06YN68eTA3N8eZM2fwz3/+E8899xxCQ0PRqVMn/PDDD3rTQHFxcWjVqhV69+6N/v3746WXXtJ7xoi9vT327duHzMxMdOrUCTNmzMC8efOM2vILAApBEATT3HbtUVImdwREtVODvu/LHQJRrVO8/y3Jr/HV6WyTjDOsnatJxqmNuMuGiIhIYpyOMIwJCRERkcSexoLUZx2TNiIiIpIdKyREREQSY33EMCYkREREEuOMjWGcsiEiIiLZsUJCREQkMTNO2hjEhISIiEhinLIxjFM2REREJDtWS
IiIiCSm4JSNQUxIiIiIJMYpG8M4ZUNERESyY4WEiIhIYtxlYxgTEiIiIolxysYwJiREREQSY0JiGNeQEBERkexYISEiIpIYt/0axoSEiIhIYmbMRwzilA0RERHJjhUSIiIiiXHKxjAmJERERBLjLhvDOGVDREREsmOFhIiISGKcsjGMCQkREZHEuMvGME7ZEBERkexYISHJfLklDps2foqbN2/gOa9WeOs/b8O3bVu5wyJ6YhMHdsDEgR3g7mIPAPj5t5tYuPkn7Dt+BQDg4eqA9994GZo2jaG0NEfiiSuI+DARuXl3AQDd2zXFviWjqh37pfBYpGVo0bKxIz6cFohW7g1hb6tE9q1CbD1wHu999hPKyiuezo2SyXDKxjAmJCSJPd/vxgeLYjB3/gL4+rZD3OZNmPxGKL6N3wMnJye5wyN6In/c+BNvr0/GpT/uQAHgtQBfbI8ORtewjfgtJx/x/zccZy/not+sLwAA88d1x9fvDkOPqZ9BEIAj539Hs1c+1Btz3vju6NWhGdIytACAe+XliEs8h/SLOcgvLIFvC2esjugHM4UC8zekPO1bpifEXTaGMSEhSWzetBFDh72KwUOCAQBz5y9ASkoydn7zNUInTpI5OqIns/vIJb3XURtTMHFgB7zg7Qa3hnZwd7FH17CN+PNuKQBgwqIEZO+Yhp4d3HHw5G+4V1aBnDtF4vstzM0wQNMSa3emiW1Xs/NxNfus+DortwA9ks6jm28Tie+OpMB8xDCuISGTu1daip8vnEdXzYtim5mZGbp2fRFnTp+SMTIi0zMzU+CVnt6wtbbE0Qt/QGlpAQGA7l652KektAwVgoAX21SfTAx4sSWcVDbYvPdstecBoLmbA/o83xw/nMky9S0Q1Qq1ukJy7do1zJ8/Hxs2bHhoH51OB51Op9cmmCuhVCqlDo8e4k7eHZSXl1eZmnFyckJm5hWZoiIyrdYejZC8cgysrSxQWFyK4VHf4JesW7iZfxdFJaV4b0JPzNtwCAqFAu9O6AkLczOoHW2rHSukb1sknsjEHzf/rHLu4IrX0L6lGtZWFlgffwrRsT9IfWskATPO2RhUqyskt2/fxqZNmx7ZJyYmBvb29nrH4v+LeUoREtHf1a/XbqHLGxvQY8omfLLrFD6ZPQCtmjrhZn4xRkfvRH+NJ27umoGcb6fD3laJk79qUSEIVcb5R8P66NPZA5v2nKn2OmPe/RaasI0Iee9b9OvSAtNf6SL1rZEEFCY66jJZKyTffffdI89fuWL4t+nIyEhERETotQnmrI7IqYFDA5ibm+PWrVt67bdu3ULDhg1liorItO6VVeDK9TwAwKmLOejk5YrwoZ0xdfleJKVdReuxH8FJZYOy8grkF+mQuW0KribnVRlnTKAvbhUUI/7wxWqv8/uNv6omv2TdgpmZGVZP74vlXx1DRUXV5IboWSZrhWTw4MEYMmQIBg8eXO3xYKJRHaVSCZVKpXdwukZellZW8PZpjaNHUsW2iooKHD2airbtOsgYGZF0zBQKKC31f8e7VVCM/CId/Nq7w9nBFvGHL1V539i+bbEl8VyNtvKamSlgaWHG8v+zSKYSSUpKCgYOHAg3NzcoFArs3LlT77wgCJg3bx5cXV1hY2MDf39/XLyonxzfvn0bo0ePhkqlgoODA0JDQ1FYWKjX58yZM+jevTusra3RpEkTLFq0yOhYZU1IXF1d8c0336CioqLa4+TJk3KGR09gTMh4fPPVNny3cweuXL6Md6OjUFxcjMFDhsodGtETiw71QzffJmjqYo/WHo0QHeqHHu2a4suk8wD+qnq84O0GD1cHjOjdGnHzBuPDr4/j4u+39cbp2cEdHq4O2Pj96SrXGPGyD4L9WsGrqROaudoj2K8V3gn1w1fJP/M5JM8ghYn+M1ZRURHatWuH1atXV3t+0aJFWLlyJdatW4ejR4/C1tYWgYGBKCkpEfuMHj0a58+fR2JiIuLj45GSkoJJk/63W7KgoAABA
QFwd3dHWloaFi9ejKioKHz88cdGxSrrlE2nTp2QlpaGQYMGVXteoVBAqGbOlWq/vv36487t21izaiVu3rwBr1beWPPRejhxyobqgEYO9fDpnAFQO9oiv0iHc5k3MPCtrThw8ioA4LkmjogO9YNjfRv8lpOPRXGHsfLr41XGGdevLVLP/Y5fr92ucq6sogIRw7uiZeMGUCgUyMrJx9pv0/DhV1XHIXqYfv36oV+/ftWeEwQBy5cvx9y5c8V/hz/77DO4uLhg586dGDFiBH7++Wfs2bMHx48fR+fOnQEAH374Ifr3748PPvgAbm5uiIuLQ2lpKTZs2AArKyu0bt0a6enpWLp0qV7iYohCkPFf/B9++AFFRUXo27dvteeLiopw4sQJ+Pn5GTVuSZkpoiOqexr0fV/uEIhqneL9b0l+jWNX8k0yTrt/WFfZWapU1mxnqUKhwI4dOzB48GAAf63TbNGiBU6dOoX27duL/fz8/NC+fXusWLECGzZswIwZM3Dnzh3xfFlZGaytrbF9+3YMGTIEY8eORUFBgd500MGDB/Hyyy/j9u3baNCgQY3uTdYpm+7duz80GQEAW1tbo5MRIiKi2sZUS0iq21kaE/N4O0u12r+eCuzi4qLX7uLiIp7TarVwdnbWO29hYQFHR0e9PtWNcf81aqJWP4eEiIiI/qe6naV1ZSMHExIiIiKpmWhjVE2nZ2pCrVYDAHJycuDq6iq25+TkiFM4arUaubm5eu8rKyvD7du3xfer1Wrk5OTo9al8XdmnJmr1g9GIiIjqArl22TyKh4cH1Go1kpKSxLaCggIcPXoUGo0GAKDRaJCXl4e0tP99z9KBAwdQUVGBLl26iH1SUlJw7949sU9iYiK8vLxqvH4EYEJCREQkOYXCNIexCgsLkZ6ejvT0dABAZmYm0tPTkZWVBYVCgWnTpuHdd9/Fd999h7Nnz2Ls2LFwc3MTF756e3ujb9++mDhxIo4dO4affvoJU6ZMwYgRI+Dm5gYAGDVqFKysrBAaGorz589j69atWLFiRY2eJXY/TtkQERHVUSdOnECvXr3E15VJQkhICGJjYzF79mwUFRVh0qRJyMvLw0svvYQ9e/bA2tpafE9cXBymTJmC3r17w8zMDMHBwVi5cqV43t7eHvv27UN4eDg6deqEhg0bYt68eUZt+QVk3vYrFW77Jaoet/0SVfU0tv2evFpgknE6NlOZZJzaiBUSIiIiqfFp/wZxDQkRERHJjhUSIiIiiZl6h0xdxISEiIhIYvyCZsM4ZUNERESyY4WEiIhIYiyQGMaEhIiISGrMSAzilA0RERHJjhUSIiIiiXGXjWFMSIiIiCTGXTaGMSEhIiKSGPMRw7iGhIiIiGTHCgkREZHUWCIxiAkJERGRxLio1TBO2RAREZHsWCEhIiKSGHfZGMaEhIiISGLMRwzjlA0RERHJjhUSIiIiqbFEYhATEiIiIolxl41hnLIhIiIi2bFCQkREJDHusjGMCQkREZHEmI8YxoSEiIhIasxIDOIaEiIiIpIdKyREREQS4y4bw5iQEBERSYyLWg3jlA0RERHJjhUSIiIiibFAYhgTEiIiIqkxIzGIUzZEREQkO1ZIiIiIJMZdNoaxQkJERCQxhcI0hzGioqKgUCj0jlatWonnS0pKEB4eDicnJ9jZ2SE4OBg5OTl6Y2RlZSEoKAj16tWDs7MzZs2ahbKyMlN8JFWwQkJERFRHtW7dGvv37xdfW1j875/96dOnIyEhAdu3b4e9vT2mTJmCoUOH4qeffgIAlJeXIygoCGq1GocPH0Z2djbGjh0LS0tLLFy40OSxMiEhIiKSmFwTNhYWFlCr1VXa8/Pz8emnn2LLli14+eWXAQAbN26Et7c3jhw5gq5du2Lfvn24cOEC9u/fDxcXF7Rv3x7vvPMO5syZg6ioKFhZWZk0Vk7ZEBERSU1hosNIFy9ehJubG5o3b47Ro0cjKysLAJCWloZ79+7B399f7NuqVSs0bdoUq
ampAIDU1FT4+vrCxcVF7BMYGIiCggKcP3/e+GAMYIWEiIhIYqZa1KrT6aDT6fTalEollEpllb5dunRBbGwsvLy8kJ2djQULFqB79+44d+4ctFotrKys4ODgoPceFxcXaLVaAIBWq9VLRirPV54zNVZIiIiInhExMTGwt7fXO2JiYqrt269fP7zyyito27YtAgMDsXv3buTl5WHbtm1POeqaYUJCREQkMVPtsomMjER+fr7eERkZWaMYHBwc8Nxzz+HSpUtQq9UoLS1FXl6eXp+cnBxxzYlara6y66bydXXrUp4UExIiIiKJmWoJiVKphEql0juqm66pTmFhIS5fvgxXV1d06tQJlpaWSEpKEs9nZGQgKysLGo0GAKDRaHD27Fnk5uaKfRITE6FSqeDj4/MkH0e1uIaEiIioDpo5cyYGDhwId3d3XL9+HfPnz4e5uTlGjhwJe3t7hIaGIiIiAo6OjlCpVJg6dSo0Gg26du0KAAgICICPjw/GjBmDRYsWQavVYu7cuQgPD69xEmQMJiREREQSM/ahZqbw+++/Y+TIkbh16xYaNWqEl156CUeOHEGjRo0AAMuWLYOZmRmCg4Oh0+kQGBiINWvWiO83NzdHfHw8Jk+eDI1GA1tbW4SEhCA6OlqSeBWCIAiSjCyjEmkeIkf0zGvQ9325QyCqdYr3vyX5NX6/U2qScRo3MO2zP2oTriEhIiIi2XHKhoiISGJyTNk8a5iQEBERSYz5iGGcsiEiIiLZsUJCREQkMU7ZGMaEhIiISGKm+i6buowJCRERkdSYjxjENSREREQkO1ZIiIiIJMYCiWFMSIiIiCTGRa2GccqGiIiIZMcKCRERkcS4y8YwJiRERERSYz5iEKdsiIiISHaskBAREUmMBRLDmJAQERFJjLtsDOOUDREREcmOFRIiIiKJcZeNYUxIiIiIJMYpG8M4ZUNERESyY0JCREREsuOUDRERkcQ4ZWMYExIiIiKJcVGrYZyyISIiItmxQkJERCQxTtkYxoSEiIhIYsxHDOOUDREREcmOFRIiIiKpsURiEBMSIiIiiXGXjWGcsiEiIiLZsUJCREQkMe6yMYwJCRERkcSYjxjGKRsiIiKpKUx0PIbVq1ejWbNmsLa2RpcuXXDs2LEnuhWpMCEhIiKqo7Zu3YqIiAjMnz8fJ0+eRLt27RAYGIjc3Fy5Q6uCCQkREZHEFCb6z1hLly7FxIkTMX78ePj4+GDdunWoV68eNmzYIMFdPhkmJERERBJTKExzGKO0tBRpaWnw9/cX28zMzODv74/U1FQT3+GT46JWIiKiZ4ROp4NOp9NrUyqVUCqVVfrevHkT5eXlcHFx0Wt3cXHBL7/8Immcj6NOJiTWdfKunj06nQ4xMTGIjIys9oeFnr7i/W/JHQKBPxt/R6b6dynq3RgsWLBAr23+/PmIiooyzQVkpBAEQZA7CKqbCgoKYG9vj/z8fKhUKrnDIao1+LNBj8uYCklpaSnq1auHr776CoMHDxbbQ0JCkJeXh2+//VbqcI3CNSRERETPCKVSCZVKpXc8rMpmZWWFTp06ISkpSWyrqKhAUlISNBrN0wq5xji5QUREVEdFREQgJCQEnTt3xgsvvIDly5ejqKgI48ePlzu0KpiQEBER1VHDhw/HjRs3MG/ePGi1WrRv3x579uypstC1NmBCQpJRKpWYP38+F+0RPYA/G/Q0TZkyBVOmTJE7DIO4qJWIiIhkx0WtREREJDsmJERERCQ7JiREREQkOyYkREREJDsmJCSZ1atXo1mzZrC2tkaXLl1w7NgxuUMiklVKSgoGDhwINzc3KBQK7Ny5U+6QiGoNJiQkia1btyIiIgLz58/HyZMn0a5dOwQGBiI3N1fu0IhkU1RUhHbt2mH16tVyh0JU63DbL0miS5cueP7557Fq1SoAfz2uuEmTJpg6dSreeotf8EakUCiwY8cOve8YIfo7Y4WETK60tBRpaWnw9/cX28zMzODv74/U1FQZIyMio
tqKCQmZ3M2bN1FeXl7l0cQuLi7QarUyRUVERLUZExIiIiKSHRMSMrmGDRvC3NwcOTk5eu05OTlQq9UyRUVERLUZExIyOSsrK3Tq1AlJSUliW0VFBZKSkqDRaGSMjIiIait+2y9JIiIiAiEhIejcuTNeeOEFLF++HEVFRRg/frzcoRHJprCwEJcuXRJfZ2ZmIj09HY6OjmjatKmMkRHJj9t+STKrVq3C4sWLodVq0b59e6xcuRJdunSROywi2SQnJ6NXr15V2kNCQhAbG/v0AyKqRZiQEBERkey4hoSIiIhkx4SEiIiIZMeEhIiIiGTHhISIiIhkx4SEiIiIZMeEhIiIiGTHhISIiIhkx4SESAbjxo3D4MGDxdc9e/bEtGnTnnocycnJUCgUyMvLk+waD97r43gacRKRvJiQEP1/48aNg0KhgEKhgJWVFTw9PREdHY2ysjLJr/3NN9/gnXfeqVHfp/2Pc7NmzbB8+fKnci0i+vvid9kQ3adv377YuHEjdDoddu/ejfDwcFhaWiIyMrJK39LSUlhZWZnkuo6OjiYZh4joWcUKCdF9lEol1Go13N3dMXnyZPj7++O7774D8L+ph/feew9ubm7w8vICAFy7dg2vvvoqHBwc4OjoiEGDBuHq1avimOXl5YiIiICDgwOcnJwwe/ZsPPiNDQ9O2eh0OsyZMwdNmjSBUqmEp6cnPv30U1y9elX8LpQGDRpAoVBg3LhxAP76RuWYmBh4eHjAxsYG7dq1w1dffaV3nd27d+O5556DjY0NevXqpRfn4ygvL0doaKh4TS8vL6xYsaLavgsWLECjRo2gUqkQFhaG0tJS8VxNYr/fb7/9hoEDB6JBgwawtbVF69atsXv37ie6FyKSFyskRI9gY2ODW7duia+TkpKgUqmQmJgIALh37x4CAwOh0Wjwww8/wMLCAu+++y769u2LM2fOwMrKCkuWLEFsbCw2bNgAb29vLFmyBDt27MDLL7/80OuOHTsWqampWLlyJdq1a4fMzEzcvHkTTZo0wddff43g4GBkZGRApVLBxsYGABATE4PPP/8c69atQ8uWLZGSkoLXXnsNjRo1gp+fH65du4ahQ4ciPDwckyZNwokTJzBjxown+nwqKirQuHFjbN++HU5OTjh8+DAmTZoEV1dXvPrqq3qfm7W1NZKTk3H16lWMHz8eTk5OeO+992oU+4PCw8NRWlqKlJQU2Nra4sKFC7Czs3uieyEimQlEJAiCIISEhAiDBg0SBEEQKioqhMTEREGpVAozZ84Uz7u4uAg6nU58z+bNmwUvLy+hoqJCbNPpdIKNjY2wd+9eQRAEwdXVVVi0aJF4/t69e0Ljxo3FawmCIPj5+QlvvvmmIAiCkJGRIQAQEhMTq43z4MGDAgDhzp07YltJSYlQr1494fDhw3p9Q0NDhZEjRwqCIAiRkZGCj4+P3vk5c+ZUGetB7u7uwrJlyx56/kHh4eFCcHCw+DokJERwdHQUioqKxLa1a9cKdnZ2Qnl5eY1if/CefX19haioqBrHRES1HyskRPeJj4+HnZ0d7t27h4qKCowaNQpRUVHieV9fX711I6dPn8alS5dQv359vXFKSkpw+fJl5OfnIzs7G126dBHPWVhYoHPnzlWmbSqlp6fD3Ny82srAw1y6dAl3795Fnz599NpLS0vRoUMHAMDPP/+sFwcAaDSaGl/jYVavXo0NGzYgKysLxcXFKC0tRfv27fX6tGvXDvXq1dO7bmFhIa5du4bCwkKDsT/o3//+NyZPnox9+/bB398fwcHBaNu27RPfCxHJhwkJ0X169eqFtWvXwsrKCm5ubrCw0P8RsbW11XtdWFiITp06IS4urspYjRo1eqwYKqdgjFFYWAgASEhIwD/+8Q+9c0ql8rHiqIkvv/wSM2fOxJIlS6DRaFC/fn0sXrwYR48erfEYjxP7hAkTEBgYiISEBOzbtw8xMTFYsmQJpk6d+vg3Q0SyYkJCdB9bW1t4enrWuH/Hj
h2xdetWODs7Q6VSVdvH1dUVR48eRY8ePQAAZWVlSEtLQ8eOHavt7+vri4qKChw6dAj+/v5VzldWaMrLy8U2Hx8fKJVKZGVlPbSy4u3tLS7QrXTkyBHDN/kIP/30E1588UX861//EtsuX75cpd/p06dRXFwsJltHjhyBnZ0dmjRpAkdHR4OxV6dJkyYICwtDWFgYIiMj8cknnzAhIXqGcZcN0RMYPXo0GjZsiEGDBuGHH35AZmYmkpOT8e9//xu///47AODNN9/E+++/j507d+KXX37Bv/71r0c+Q6RZs2YICQnB66+/jp07d4pjbtu2DQDg7u4OhUKB+Ph43LhxA4WFhahfvz5mzpyJ6dOnY9OmTbh8+TJOnjyJDz/8EJs2bQIAhIWF4eLFi5g1axYyMjKwZcsWxMbG1ug+//jjD6Snp+sdd+7cQcuWLXHixAns3bsXv/76K95++20cP368yvtLS0sRGhqKCxcuYPfu3Zg/fz6mTJkCMzOzGsX+oGnTpmHv3r3IzMzEyZMncfDgQXh7e9foXoiolpJ7EQtRbXH/olZjzmdnZwtjx44VGjZsKCiVSqF58+bCxIkThfz8fEEQ/lrE+uabbwoqlUpwcHAQIiIihLFjxz50UasgCEJxcbEwffp0wdXVVbCyshI8PT2FDRs2iOejo6MFtVotKBQKISQkRBCEvxbiLl++XPDy8hIsLS2FRo0aCYGBgcKhQ4fE9+3atUvw9PQUlEql0L17d2HDhg01WtQKoMqxefNmoaSkRBg3bpxgb28vODg4CJMnTxbeeustoV27dlU+t3nz5glOTk6CnZ2dMHHiRKGkpETsYyj2Bxe1TpkyRWjRooWgVCqFRo0aCWPGjBFu3rz50HsgotpPIQgPWVlHRERE9JRwyoaIiIhkx4SEiIiIZMeEhIiIiGTHhISIiIhkx4SEiIiIZMeEhIiIiGTHhISIiIhkx4SEiIiIZMeEhIiIiGTHhISIiIhkx4SEiIiIZMeEhIiIiGT3/wBI0zEPvpUqmgAAAABJRU5ErkJggg==\n" }, "metadata": {} } ] }, { "cell_type": "markdown", "source": [ "## Pipeline" ], "metadata": { "id": "4jiOX9DBo8Yp" } }, { "cell_type": "code", "source": [ "# Define the prediction pipeline\n", "def predict_pipeline(input_df, tokenizer, model):\n", "\n", " model.eval() # Set model to evaluation mode\n", "\n", " # Combine inputs into a single text column (you can customize this)\n", " input_df['combined_text'] = (\n", " \"Title: \" + input_df['title'] + \" | \" +\n", " \"Subject: \" + input_df['subject'] + \" | \" +\n", " \"Date: \" + input_df['date'] + \" | \"\n", " \"Text: \" + input_df['text']\n", " )\n", "\n", " # Tokenize the combined text\n", " tokenized = tokenizer(\n", " input_df['combined_text'].tolist(),\n", " truncation=True,\n", " padding='longest',\n", " max_length=7000,\n", " return_tensors=\"pt\"\n", " )\n", "\n", " # Move tensors to GPU if available\n", " device = torch.device(\"cuda\" if torch.cuda.is_available() else 
\"cpu\")\n", " model.to(device)\n", " input_ids = tokenized['input_ids'].to(device)\n", " attention_mask = tokenized['attention_mask'].to(device)\n", "\n", " # Get model predictions\n", " with torch.no_grad():\n", " outputs = model(input_ids=input_ids, attention_mask=attention_mask)\n", " logits = outputs.logits.squeeze(-1) # Ensure logits is 1D for binary classification\n", "\n", " # Apply sigmoid to get probabilities\n", " probs = torch.sigmoid(logits)\n", " preds = (probs > 0.51).long()\n", "\n", " # Combine results into desired format\n", " results = [{\"title\": row['title'], \"predicted_class\": pred_class.item()}\n", " for row, pred_class in zip(input_df.to_dict(orient='records'), preds)]\n", "\n", " return results" ], "metadata": { "id": "4RBYibMvneLv" }, "execution_count": 51, "outputs": [] }, { "cell_type": "code", "source": [ "# Example DataFrame\n", "data = {\n", " \"title\": [\"Trump's new policy reviewed\", \"Shocking claims about health!\"],\n", " \"text\": [\"Policy details are emerging about new measures.\", \"A new study claims unbelievable results.\"],\n", " \"subject\": [\"Politics\", \"Health\"],\n", " \"date\": [\"2024-12-28\", \"2024-12-29\"]\n", "}\n", "input_df = pd.DataFrame(data)\n", "\n", "# Run the prediction pipeline\n", "output = predict_pipeline(input_df, tokenizer, model)\n", "\n", "# Display the output\n", "print(output)" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "6qyIetsHqUak", "outputId": "f825afb3-0dd5-4ffa-a438-66c1d95e6172" }, "execution_count": 52, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "[{'title': \"Trump's new policy reviewed\", 'predicted_class': 0}, {'title': 'Shocking claims about health!', 'predicted_class': 0}]\n" ] } ] }, { "cell_type": "code", "source": [], "metadata": { "id": "1d74YbR6sOFz" }, "execution_count": null, "outputs": [] } ] }