{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Watermark Detection in Large Language Models Analysis\n", "# ==================================================\n" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "# !pip install transformers torch datasets scikit-learn matplotlib seaborn" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [], "source": [ "from datasets import load_dataset\n", "from argparse import Namespace\n", "\n", "import sys\n", "sys.path.append('../')\n", "from app import load_model, generate, analyze\n", "import pandas as pd\n", "import matplotlib.pyplot as plt\n", "import seaborn as sns" ] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [], "source": [ "args = Namespace()" ] }, { "cell_type": "code", "execution_count": 12, "metadata": {}, "outputs": [], "source": [ "arg_dict = {\n", " 'model_name_or_path': 'bigscience/bloom-560m',\n", " 'load_fp16' : False,\n", " 'prompt_max_length': None, \n", " 'max_new_tokens': 200, \n", " 'generation_seed': 123, \n", " 'use_sampling': True, \n", " 'n_beams': 1, # 1, 2, 5\n", " 'sampling_temp': 0.7,\n", " 'use_gpu': True, \n", " 'seeding_scheme': 'simple_1', \n", " 'gamma': 0.25, # 0.1, 0.25. 0.5\n", " 'delta': 2.0, # 1.0, 2.0, 5.0\n", " 'normalizers': '', \n", " 'skip_repeated_bigrams': False,\n", " 'ignore_repeated_ngrams': False, \n", " 'detection_z_threshold': 4.0, # 4.0, 5.0, 6.0 >>>\n", " 'select_green_tokens': True,\n", " 'seed_separately': True,\n", " 'run_extended': True\n", "}\n", "args.__dict__.update(arg_dict)" ] }, { "cell_type": "code", "execution_count": 13, "metadata": {}, "outputs": [], "source": [ "model, tokenizer, device = load_model(args)" ] }, { "cell_type": "code", "execution_count": 10, "metadata": {}, "outputs": [], "source": [ "# # List to hold all results\n", "# dataset = []" ] }, { "cell_type": "code", "execution_count": 12, "metadata": {}, "outputs": [], "source": [ "# prompts = [\n", "# \"Describe the process of photosynthesis.\",\n", "# \"What is the significance of the Turing test?\",\n", "# \"How does blockchain technology work?\",\n", "# \"What are the principles of quantum mechanics?\",\n", "# \"Why is artificial intelligence valuable?\",\n", "# ]" ] }, { "cell_type": "code", "execution_count": 7, "metadata": {}, "outputs": [], "source": [ "# # Columns for detection results\n", "# columns = [\"tokens_counted\", \"tokens_in_greelist\", \"fraction_t_greenlist\", \"z_score\", \"p_value\", \"prediction\", \"confidence\"]" ] }, { "cell_type": "code", "execution_count": 17, "metadata": {}, "outputs": [], "source": [ "# Helper function to convert the first element (list of key-value pairs) to a dictionary\n", "def result_list_to_dict(result_tuple):\n", " key_value_pairs = result_tuple[0]\n", " # Ensure we only extract the values and not keep them as lists\n", " return {key.strip(): value.strip() for key, value in key_value_pairs}" ] }, { "cell_type": "code", "execution_count": 77, "metadata": {}, "outputs": [], "source": [ "# # Iterate over each prompt\n", "# for prompt in prompts:\n", "# print(f\"Processing prompt: {prompt}\")\n", " \n", "# # Dictionary to hold the result for the current prompt\n", "# result = {\"prompt\": prompt, \"use_sampling\": args.use_sampling, \"sampling_temp\": args.sampling_temp, \"delta\": args.delta, \"gamma\": args.gamma, \"n_beams\": args.n_beams, \"detection_z_threshold\": args.detection_z_threshold}\n", "\n", " \n", "# if args.run_extended:\n", "# # Call generate with the current prompt\n", "# _, _, advance_decoded_output_without_watermark, advance_decoded_output_with_watermark, _ = generate(\n", "# prompt, args, model=model, device=device, tokenizer=tokenizer\n", "# )\n", " \n", "# # Analyze the output\n", "# advance_without_watermark_detection_result = analyze(\n", "# advance_decoded_output_without_watermark, args, device=device, tokenizer=tokenizer\n", "# )\n", "# advance_with_watermark_detection_result = analyze(\n", "# advance_decoded_output_with_watermark, args, device=device, tokenizer=tokenizer\n", "# )\n", " \n", "# # Convert results list to dictionary\n", "# advance_without_watermark_dict = result_list_to_dict(advance_without_watermark_detection_result)\n", "# advance_with_watermark_dict = result_list_to_dict(advance_with_watermark_detection_result)\n", " \n", " \n", "# # Store the extended results\n", "# result[\"type\"] = \"extended\"\n", " \n", "# # Add detection results for both without and with watermark using the key names as column names\n", "# for key, value in advance_without_watermark_dict.items():\n", "# result[f\"without_watermark_{key.replace(' ', '_')}\"] = value \n", "# for key, value in advance_with_watermark_dict.items():\n", "# result[f\"with_watermark_{key.replace(' ', '_')}\"] = value\n", " \n", "# else:\n", "# # Call generate with the current prompt\n", "# _, _, basic_decoded_output_without_watermark, basic_decoded_output_with_watermark, _ = generate(\n", "# prompt, args, model=model, device=device, tokenizer=tokenizer\n", "# )\n", " \n", "# # Analyze the output\n", "# basic_without_watermark_detection_result = analyze(\n", "# basic_decoded_output_without_watermark, args, device=device, tokenizer=tokenizer\n", "# )\n", "# basic_with_watermark_detection_result = analyze(\n", "# basic_decoded_output_with_watermark, args, device=device, tokenizer=tokenizer\n", "# )\n", " \n", "# # Convert results list to dictionary\n", "# basic_without_watermark_dict = result_list_to_dict(basic_without_watermark_detection_result)\n", "# basic_with_watermark_dict = result_list_to_dict(basic_with_watermark_detection_result)\n", " \n", "# # print(basic_with_watermark_dict)\n", "\n", "# # Store the basic results\n", "# result[\"type\"] = \"basic\"\n", " \n", "# # Add detection results for both without and with watermark using the key names as column names\n", "# for key, value in basic_without_watermark_dict.items():\n", "# # Assign only the value to the result, not the list\n", "# result[f\"without_watermark_{key.replace(' ', '_')}\"] = value # Replacing spaces with underscores for column names\n", "\n", "# for key, value in basic_with_watermark_dict.items():\n", "# result[f\"with_watermark_{key.replace(' ', '_')}\"] = value\n", " \n", "# # Append the result for this prompt to the dataset\n", "# dataset.append(result)\n", "# # print(dataset)" ] }, { "cell_type": "code", "execution_count": 56, "metadata": {}, "outputs": [], "source": [ "# # Save the dataset as a CSV\n", "# df = pd.DataFrame(dataset)\n", "# df.to_csv(\"dataset.csv\", index=False)\n", "\n", "# print(\"Dataset created and saved successfully!\")" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "# # Group by \"type\" (basic vs extended) and calculate mean values for each group\n", "# print(\"\\nGroup Analysis by Type (basic vs extended):\")\n", "# grouped_stats = df.groupby('type').mean()\n", "# print(grouped_stats)\n", "\n", "# # Visualize group-wise mean for key parameters\n", "# grouped_stats[['sampling_temp', 'gamma', 'delta']].plot(kind='bar', figsize=(10, 6), title='Mean Parameters by Type')\n", "# plt.ylabel('Mean Value')\n", "# plt.show()" ] }, { "cell_type": "code", "execution_count": 72, "metadata": {}, "outputs": [], "source": [ "# # Add columns to compare outputs with and without watermark\n", "# # For example, difference in tokens counted\n", "# df['tokens_difference'] = pd.to_numeric(df['without_watermark_tokens_counted'], errors='coerce') - pd.to_numeric(df['with_watermark_tokens_counted'], errors='coerce')\n", "\n", "# # Visualize the difference in tokens counted\n", "# plt.figure(figsize=(10, 6))\n", "# sns.histplot(df['tokens_difference'], kde=True)\n", "# plt.title('Difference in Tokens Counted (Without vs With Watermark)')\n", "# plt.show()\n", "\n", "# # Group by type and compare watermark/no-watermark results\n", "# print(\"\\nWatermark vs No Watermark Comparison:\")\n", "# watermark_comparison = df[['type', 'without_watermark_tokens_counted', 'with_watermark_tokens_counted', \n", "# 'without_watermark_z_score', 'with_watermark_z_score']]\n", "\n", "# # Show the comparison for the first few rows\n", "# print(watermark_comparison.head())\n", "\n", "# # Compare Z-scores for without and with watermark by type\n", "# print(\"\\nMean Z-Scores (Without vs With Watermark):\")\n", "# mean_z_scores = df.groupby('type')[['without_watermark_z_score', 'with_watermark_z_score']].mean()\n", "# print(mean_z_scores)" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "# move visualization here..." ] }, { "cell_type": "code", "execution_count": 76, "metadata": {}, "outputs": [], "source": [ "# import matplotlib.pyplot as plt\n", "# import seaborn as sns" ] }, { "cell_type": "code", "execution_count": 75, "metadata": {}, "outputs": [], "source": [ "# # Confusion Matrix Visualization for Basic Watermark\n", "# plt.figure(figsize=(8, 6))\n", "# sns.heatmap(cm_basic, annot=True, fmt=\"d\", cmap=\"Blues\", xticklabels=[\"Non-Watermarked\", \"Basic Watermarked\", \"Advanced Watermarked\"], yticklabels=[\"Non-Watermarked\", \"Basic Watermarked\", \"Advanced Watermarked\"])\n", "# plt.xlabel(\"Predicted Label\")\n", "# plt.ylabel(\"True Label\")\n", "# plt.title(\"Confusion Matrix - Basic Watermark\")\n", "# plt.show()" ] }, { "cell_type": "code", "execution_count": 74, "metadata": {}, "outputs": [], "source": [ "# # Confusion Matrix Visualization for Advanced Watermark\n", "# plt.figure(figsize=(8, 6))\n", "# sns.heatmap(cm_advanced, annot=True, fmt=\"d\", cmap=\"Greens\", xticklabels=[\"Non-Watermarked\", \"Basic Watermarked\", \"Advanced Watermarked\"], yticklabels=[\"Non-Watermarked\", \"Basic Watermarked\", \"Advanced Watermarked\"])\n", "# plt.xlabel(\"Predicted Label\")\n", "# plt.ylabel(\"True Label\")\n", "# plt.title(\"Confusion Matrix - Advanced Watermark\")\n", "# plt.show()" ] }, { "cell_type": "code", "execution_count": 73, "metadata": {}, "outputs": [], "source": [ "# # Bar Plot of True Positives and False Positives for Basic and Advanced Watermarks\n", "# results = {\n", "# \"Basic - True Positives\": basic_true_positives,\n", "# \"Basic - False Positives\": basic_false_positives,\n", "# \"Advanced - True Positives\": advanced_true_positives,\n", "# \"Advanced - False Positives\": advanced_false_positives,\n", "# }" ] }, { "cell_type": "code", "execution_count": 68, "metadata": {}, "outputs": [], "source": [ "# plt.figure(figsize=(10, 6))\n", "# sns.barplot(x=list(results.keys()), y=list(results.values()), palette=\"viridis\")\n", "# plt.title(\"Watermark Detection Results\")\n", "# plt.ylabel(\"Count\")\n", "# plt.show()" ] }, { "cell_type": "code", "execution_count": 67, "metadata": {}, "outputs": [], "source": [ "# from datasets import load_dataset\n", "# import random\n", "# from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_score" ] }, { "cell_type": "code", "execution_count": 66, "metadata": {}, "outputs": [], "source": [ "# # Load the SST-2 dataset from GLUE\n", "# dataset = load_dataset(\"glue\", \"sst2\")\n", "\n", "# # # For paraphrase detection (MRPC)\n", "# # dataset = load_dataset(\"glue\", \"mrpc\")\n", "\n", "# # # For grammatical acceptability (CoLA)\n", "# # dataset = load_dataset(\"glue\", \"cola\")" ] }, { "cell_type": "code", "execution_count": 65, "metadata": {}, "outputs": [], "source": [ "# # Print the first 5 rows of the 'train' split\n", "# print(\"First 5 rows of the training set:\")\n", "# for i in range(5):\n", "# print(dataset['train'][i])" ] }, { "cell_type": "code", "execution_count": 64, "metadata": {}, "outputs": [], "source": [ "# # Iterate over each prompt\n", "# for prompt in prompts:\n", "# print(f\"Processing prompt: {prompt}\")\n", " \n", "# # Dictionary to hold the result for the current prompt\n", "# result = {\"prompt\": prompt, \"use_sampling\": args.use_sampling, \"sampling_temp\": args.sampling_temp, \"delta\": args.delta, \"gamma\": args.gamma, \"n_beams\": args.n_beams, \"detection_z_threshold\": args.detection_z_threshold}\n", "\n", " \n", "# if args.run_extended:\n", "# # Call generate with the current prompt\n", "# _, _, advance_decoded_output_without_watermark, advance_decoded_output_with_watermark, _ = generate(\n", "# prompt, args, model=model, device=device, tokenizer=tokenizer\n", "# )\n", " \n", "# # Analyze the output\n", "# advance_without_watermark_detection_result = analyze(\n", "# advance_decoded_output_without_watermark, args, device=device, tokenizer=tokenizer\n", "# )\n", "# advance_with_watermark_detection_result = analyze(\n", "# advance_decoded_output_with_watermark, args, device=device, tokenizer=tokenizer\n", "# )\n", " \n", "# # Convert results list to dictionary\n", "# advance_without_watermark_dict = result_list_to_dict(advance_without_watermark_detection_result)\n", "# advance_with_watermark_dict = result_list_to_dict(advance_with_watermark_detection_result)\n", " \n", " \n", "# # Store the extended results\n", "# result[\"type\"] = \"extended\"\n", " \n", "# # Add detection results for both without and with watermark using the key names as column names\n", "# for key, value in advance_without_watermark_dict.items():\n", "# result[f\"without_watermark_{key.replace(' ', '_')}\"] = value \n", "# for key, value in advance_with_watermark_dict.items():\n", "# result[f\"with_watermark_{key.replace(' ', '_')}\"] = value\n", " \n", "# else:\n", "# # Call generate with the current prompt\n", "# _, _, basic_decoded_output_without_watermark, basic_decoded_output_with_watermark, _ = generate(\n", "# prompt, args, model=model, device=device, tokenizer=tokenizer\n", "# )\n", " \n", "# # Analyze the output\n", "# basic_without_watermark_detection_result = analyze(\n", "# basic_decoded_output_without_watermark, args, device=device, tokenizer=tokenizer\n", "# )\n", "# basic_with_watermark_detection_result = analyze(\n", "# basic_decoded_output_with_watermark, args, device=device, tokenizer=tokenizer\n", "# )\n", " \n", "# # Convert results list to dictionary\n", "# basic_without_watermark_dict = result_list_to_dict(basic_without_watermark_detection_result)\n", "# basic_with_watermark_dict = result_list_to_dict(basic_with_watermark_detection_result)\n", " \n", "# # print(basic_with_watermark_dict)\n", "\n", "# # Store the basic results\n", "# result[\"type\"] = \"basic\"\n", " \n", "# # Add detection results for both without and with watermark using the key names as column names\n", "# for key, value in basic_without_watermark_dict.items():\n", "# # Assign only the value to the result, not the list\n", "# result[f\"without_watermark_{key.replace(' ', '_')}\"] = value # Replacing spaces with underscores for column names\n", "\n", "# for key, value in basic_with_watermark_dict.items():\n", "# result[f\"with_watermark_{key.replace(' ', '_')}\"] = value\n", " \n", "# # Append the result for this prompt to the dataset\n", "# dataset.append(result)\n", "# # print(dataset)" ] }, { "cell_type": "code", "execution_count": 63, "metadata": {}, "outputs": [], "source": [ "# # Function to simulate model response generation\n", "# def generate_response(sentence, watermark=False):\n", "# # Simulate generating a response based on sentiment\n", "# if 'good' in sentence or 'great' in sentence or 'fantastic' in sentence:\n", "# response = \"The sentiment is positive.\"\n", "# else:\n", "# response = \"The sentiment is negative.\"\n", " \n", "# # Append watermark if requested\n", "# if watermark:\n", "# response += f\" [WM-ID: {random.randint(1000, 9999)}]\"\n", " \n", "# return response\n", "\n", "# # Function to detect watermark in the response\n", "# def detect_watermark(response):\n", "# return \"[WM-ID:\" in response" ] }, { "cell_type": "code", "execution_count": 62, "metadata": {}, "outputs": [], "source": [ "\n", "\n", "\n", "\n", "# # Evaluate the watermark detection and task performance\n", "# def evaluate_system(dataset):\n", "# detection_results = []\n", "# task_performance = []\n", "# original_labels = []\n", " \n", "# # Use the first 100 examples for evaluation\n", "# for example in dataset[\"train\"].select(range(100)): # Use `select()` to get rows\n", "# sentence = example['sentence']\n", "# original_label = example['label']\n", "# original_labels.append(original_label) # SST-2: 1 for positive, 0 for negative\n", " \n", "# # Generate non-watermarked and watermarked responses\n", "# non_watermarked_response = generate_response(sentence, watermark=False)\n", "# watermarked_response = generate_response(sentence, watermark=True)\n", " \n", "# # Detect watermark\n", "# non_watermarked_detected = detect_watermark(non_watermarked_response)\n", "# watermarked_detected = detect_watermark(watermarked_response)\n", " \n", "# # Append detection results\n", "# detection_results.append((non_watermarked_detected, watermarked_detected))\n", " \n", "# # Simulate task-specific performance (assume response gives correct sentiment classification)\n", "# non_watermarked_label = 1 if \"positive\" in non_watermarked_response else 0\n", "# watermarked_label = 1 if \"positive\" in watermarked_response else 0\n", " \n", "# task_performance.append((non_watermarked_label, watermarked_label))\n", " \n", "# return detection_results, task_performance, original_labels\n", "\n", "# # Function to calculate metrics for watermark detection and task performance\n", "# def calculate_metrics(detection_results, task_performance, original_labels):\n", "# # Extract watermark detection results\n", "# non_watermarked_detected = [1 if not detected else 0 for detected, _ in detection_results]\n", "# watermarked_detected = [1 if detected else 0 for _, detected in detection_results]\n", " \n", "# # Watermark detection accuracy metrics\n", "# detection_accuracy = accuracy_score([0] * len(non_watermarked_detected), non_watermarked_detected)\n", "# watermark_detection_accuracy = accuracy_score([1] * len(watermarked_detected), watermarked_detected)\n", " \n", "# # Extract task performance\n", "# non_watermarked_labels = [pred for pred, _ in task_performance]\n", "# watermarked_labels = [pred for _, pred in task_performance]\n", " \n", "# # Task performance accuracy\n", "# non_watermarked_accuracy = accuracy_score(original_labels, non_watermarked_labels)\n", "# watermarked_accuracy = accuracy_score(original_labels, watermarked_labels)\n", " \n", "# # F1 score for watermark detection\n", "# f1_detection = f1_score([1] * len(watermarked_detected), watermarked_detected)\n", " \n", "# # Output metrics\n", "# print(\"Watermark Detection Accuracy (non-watermarked):\", detection_accuracy)\n", "# print(\"Watermark Detection Accuracy (watermarked):\", watermark_detection_accuracy)\n", "# print(\"F1 Score for Watermark Detection:\", f1_detection)\n", " \n", "# print(\"Task Performance Accuracy (non-watermarked):\", non_watermarked_accuracy)\n", "# print(\"Task Performance Accuracy (watermarked):\", watermarked_accuracy)\n", "\n", "# # Main function to run the evaluation\n", "# def main():\n", "# # Step 1: Run the system evaluation on SST-2 dataset\n", "# detection_results, task_performance, original_labels = evaluate_system(dataset)\n", " \n", "# # Step 2: Calculate and print metrics\n", "# calculate_metrics(detection_results, task_performance, original_labels)\n", "\n", "# # Run the evaluation\n", "# main()\n" ] }, { "cell_type": "code", "execution_count": 86, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Processing task: sst2\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 0/67349 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 1/67349 [01:28<1649:05:29, 88.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 2/67349 [02:43<1508:02:44, 80.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 3/67349 [03:58<1464:28:04, 78.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 4/67349 [05:22<1502:59:01, 80.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 5/67349 [06:46<1525:21:07, 81.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 6/67349 [08:07<1522:26:44, 81.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 7/67349 [09:17<1452:27:36, 77.65s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 8/67349 [10:20<1369:32:06, 73.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 9/67349 [11:35<1379:28:37, 73.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 10/67349 [12:49<1378:56:59, 73.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 11/67349 [14:03<1378:22:15, 73.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 12/67349 [15:08<1333:43:30, 71.30s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 13/67349 [16:12<1292:11:35, 69.08s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 14/67349 [17:24<1307:20:29, 69.90s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 15/67349 [18:32<1296:16:21, 69.30s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 16/67349 [19:40<1289:37:16, 68.95s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 17/67349 [20:49<1286:44:48, 68.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 18/67349 [21:55<1274:56:11, 68.17s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 19/67349 [23:04<1275:11:24, 68.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 20/67349 [24:13<1281:46:43, 68.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 21/67349 [25:18<1262:36:40, 67.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 22/67349 [26:24<1251:47:54, 66.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 23/67349 [27:29<1244:26:59, 66.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 24/67349 [28:32<1225:11:14, 65.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 25/67349 [29:37<1218:52:05, 65.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 26/67349 [30:40<1209:16:38, 64.66s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 27/67349 [31:45<1210:36:18, 64.74s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 28/67349 [32:51<1218:59:52, 65.19s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 29/67349 [33:58<1226:45:28, 65.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 30/67349 [35:05<1237:13:29, 66.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 31/67349 [36:13<1245:51:17, 66.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 32/67349 [37:21<1252:02:53, 66.96s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 33/67349 [38:29<1257:28:55, 67.25s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 34/67349 [39:36<1259:01:11, 67.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 35/67349 [40:42<1247:09:56, 66.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 36/67349 [41:49<1252:27:58, 66.98s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 37/67349 [42:58<1263:48:02, 67.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 38/67349 [44:05<1260:53:01, 67.44s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 39/67349 [45:10<1245:16:04, 66.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 40/67349 [46:17<1249:55:56, 66.85s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 41/67349 [47:26<1262:19:48, 67.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 42/67349 [48:34<1260:49:41, 67.44s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 43/67349 [49:41<1260:29:25, 67.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 44/67349 [50:49<1263:50:50, 67.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 45/67349 [51:56<1259:26:58, 67.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 46/67349 [53:04<1261:24:27, 67.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 47/67349 [54:11<1263:07:05, 67.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 48/67349 [55:19<1263:17:43, 67.57s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 49/67349 [56:27<1267:10:37, 67.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 50/67349 [57:35<1266:04:03, 67.73s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 51/67349 [58:42<1261:35:32, 67.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 52/67349 [59:52<1275:48:45, 68.25s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 53/67349 [1:01:00<1273:32:17, 68.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 54/67349 [1:02:07<1269:49:40, 67.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 55/67349 [1:03:15<1268:53:25, 67.88s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 56/67349 [1:04:21<1259:36:34, 67.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 57/67349 [1:05:30<1266:19:21, 67.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 58/67349 [1:06:38<1269:21:20, 67.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 59/67349 [1:07:46<1268:13:51, 67.85s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 60/67349 [1:08:53<1267:09:23, 67.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 61/67349 [1:10:01<1268:00:38, 67.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 62/67349 [1:11:09<1266:50:39, 67.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 63/67349 [1:12:17<1268:14:24, 67.85s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 64/67349 [1:13:21<1248:19:41, 66.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 65/67349 [1:14:30<1257:26:36, 67.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 66/67349 [1:15:37<1259:03:05, 67.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 67/67349 [1:16:45<1261:23:04, 67.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 68/67349 [1:17:53<1263:31:58, 67.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 69/67349 [1:19:02<1269:22:30, 67.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 70/67349 [1:20:11<1275:17:46, 68.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 71/67349 [1:21:18<1270:47:25, 68.00s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 72/67349 [1:22:27<1273:07:29, 68.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 73/67349 [1:23:31<1252:15:46, 67.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 74/67349 [1:24:35<1235:13:40, 66.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 75/67349 [1:25:37<1215:02:00, 65.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 76/67349 [1:26:45<1230:59:29, 65.87s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 77/67349 [1:27:53<1239:08:01, 66.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 78/67349 [1:28:54<1213:03:06, 64.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 79/67349 [1:29:53<1176:36:32, 62.97s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 80/67349 [1:31:01<1204:26:15, 64.46s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 81/67349 [1:32:00<1173:33:31, 62.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 82/67349 [1:33:07<1199:45:27, 64.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 83/67349 [1:34:12<1204:48:33, 64.48s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 84/67349 [1:35:17<1207:34:00, 64.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 85/67349 [1:36:24<1222:22:50, 65.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 86/67349 [1:37:33<1242:19:19, 66.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 87/67349 [1:38:41<1247:11:30, 66.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 88/67349 [1:39:49<1257:01:01, 67.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 89/67349 [1:40:40<1166:01:13, 62.41s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 90/67349 [1:41:43<1169:20:27, 62.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 91/67349 [1:42:50<1194:49:58, 63.95s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 92/67349 [1:43:56<1203:33:27, 64.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 93/67349 [1:45:04<1222:07:33, 65.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 94/67349 [1:46:06<1206:48:40, 64.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 95/67349 [1:46:51<1096:20:32, 58.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 96/67349 [1:47:58<1143:24:42, 61.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 97/67349 [1:49:06<1179:50:28, 63.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 98/67349 [1:50:14<1203:50:50, 64.44s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 99/67349 [1:51:21<1219:14:29, 65.27s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 train set: 0%| | 100/67349 [1:52:28<1260:38:41, 67.49s/it]\n", "Processing sst2 validation set: 0%| | 0/872 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 0%| | 1/872 [01:07<16:17:08, 67.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 0%| | 2/872 [02:14<16:16:57, 67.38s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 0%| | 3/872 [03:19<15:59:59, 66.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 0%| | 4/872 [04:27<16:09:28, 67.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 1%| | 5/872 [05:20<14:56:02, 62.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 1%| | 6/872 [06:28<15:23:05, 63.96s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 1%| | 7/872 [07:36<15:39:48, 65.19s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 1%| | 8/872 [08:44<15:51:23, 66.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 1%| | 9/872 [09:31<14:23:58, 60.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 1%| | 10/872 [10:39<14:57:00, 62.44s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 1%|▏ | 11/872 [11:47<15:20:40, 64.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 1%|▏ | 12/872 [12:55<15:39:14, 65.53s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 1%|▏ | 13/872 [13:57<15:20:20, 64.29s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 2%|▏ | 14/872 [15:05<15:37:56, 65.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 2%|▏ | 15/872 [16:14<15:49:55, 66.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 2%|▏ | 16/872 [17:22<15:56:48, 67.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 2%|▏ | 17/872 [18:30<16:00:33, 67.41s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 2%|▏ | 18/872 [19:40<16:08:20, 68.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 2%|▏ | 19/872 [20:45<15:53:01, 67.04s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 2%|▏ | 20/872 [21:43<15:16:28, 64.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 2%|▏ | 21/872 [22:52<15:34:02, 65.85s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 3%|▎ | 22/872 [24:00<15:38:44, 66.26s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 3%|▎ | 23/872 [25:02<15:21:47, 65.14s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 3%|▎ | 24/872 [26:10<15:33:34, 66.05s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 3%|▎ | 25/872 [27:17<15:37:08, 66.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 3%|▎ | 26/872 [28:25<15:42:02, 66.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 3%|▎ | 27/872 [29:35<15:51:55, 67.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 3%|▎ | 28/872 [30:43<15:54:49, 67.88s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 3%|▎ | 29/872 [31:52<15:56:09, 68.05s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 3%|▎ | 30/872 [33:00<15:54:17, 68.00s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 4%|▎ | 31/872 [34:09<15:58:43, 68.40s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 4%|▎ | 32/872 [35:02<14:54:04, 63.86s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 4%|▍ | 33/872 [36:00<14:27:18, 62.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 4%|▍ | 34/872 [37:08<14:51:45, 63.85s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 4%|▍ | 35/872 [38:17<15:10:36, 65.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 4%|▍ | 36/872 [39:26<15:25:41, 66.44s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 4%|▍ | 37/872 [40:36<15:40:09, 67.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 4%|▍ | 38/872 [41:44<15:42:22, 67.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 4%|▍ | 39/872 [42:51<15:36:00, 67.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 5%|▍ | 40/872 [43:59<15:39:00, 67.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 5%|▍ | 41/872 [45:05<15:30:15, 67.17s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 5%|▍ | 42/872 [46:14<15:36:23, 67.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 5%|▍ | 43/872 [47:22<15:34:43, 67.65s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 5%|▌ | 44/872 [48:30<15:36:31, 67.86s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 5%|▌ | 45/872 [49:39<15:39:04, 68.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 5%|▌ | 46/872 [50:47<15:39:28, 68.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 5%|▌ | 47/872 [51:56<15:40:23, 68.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 6%|▌ | 48/872 [53:04<15:39:39, 68.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 6%|▌ | 49/872 [54:13<15:38:29, 68.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 6%|▌ | 50/872 [55:22<15:39:39, 68.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 6%|▌ | 51/872 [56:32<15:43:38, 68.96s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 6%|▌ | 52/872 [57:39<15:34:49, 68.40s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 6%|▌ | 53/872 [58:42<15:12:52, 66.88s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 6%|▌ | 54/872 [59:49<15:10:31, 66.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 6%|▋ | 55/872 [1:00:56<15:11:29, 66.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 6%|▋ | 56/872 [1:02:04<15:16:41, 67.40s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 7%|▋ | 57/872 [1:03:13<15:18:41, 67.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 7%|▋ | 58/872 [1:04:00<13:56:33, 61.66s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 7%|▋ | 59/872 [1:05:09<14:22:56, 63.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 7%|▋ | 60/872 [1:06:19<14:48:42, 65.67s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 7%|▋ | 61/872 [1:07:26<14:55:00, 66.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 7%|▋ | 62/872 [1:08:36<15:07:30, 67.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 7%|▋ | 63/872 [1:09:45<15:12:17, 67.66s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 7%|▋ | 64/872 [1:10:53<15:15:03, 67.95s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 7%|▋ | 65/872 [1:12:00<15:06:43, 67.41s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 8%|▊ | 66/872 [1:13:04<14:51:46, 66.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 8%|▊ | 67/872 [1:14:08<14:44:48, 65.95s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 8%|▊ | 68/872 [1:15:17<14:52:40, 66.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 8%|▊ | 69/872 [1:16:24<14:56:16, 66.97s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 8%|▊ | 70/872 [1:17:31<14:54:06, 66.89s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 8%|▊ | 71/872 [1:18:40<15:00:18, 67.44s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 8%|▊ | 72/872 [1:19:33<14:03:43, 63.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 8%|▊ | 73/872 [1:20:40<14:15:10, 64.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 8%|▊ | 74/872 [1:21:46<14:22:06, 64.82s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 9%|▊ | 75/872 [1:22:54<14:33:37, 65.77s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 9%|▊ | 76/872 [1:24:02<14:39:48, 66.32s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 9%|▉ | 77/872 [1:25:10<14:46:21, 66.89s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 9%|▉ | 78/872 [1:26:20<14:59:54, 68.00s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 9%|▉ | 79/872 [1:27:10<13:45:49, 62.48s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 9%|▉ | 80/872 [1:28:20<14:12:34, 64.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 9%|▉ | 81/872 [1:29:29<14:28:57, 65.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 9%|▉ | 82/872 [1:30:37<14:39:31, 66.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 10%|▉ | 83/872 [1:31:43<14:35:22, 66.57s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 10%|▉ | 84/872 [1:32:50<14:34:47, 66.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 10%|▉ | 85/872 [1:33:59<14:43:58, 67.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 10%|▉ | 86/872 [1:35:08<14:47:41, 67.76s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 10%|▉ | 87/872 [1:36:17<14:51:04, 68.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 10%|█ | 88/872 [1:37:26<14:52:58, 68.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 10%|█ | 89/872 [1:38:36<14:59:14, 68.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 10%|█ | 90/872 [1:39:44<14:55:28, 68.71s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 10%|█ | 91/872 [1:40:53<14:52:29, 68.57s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 11%|█ | 92/872 [1:42:00<14:48:43, 68.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 11%|█ | 93/872 [1:43:09<14:48:40, 68.45s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 11%|█ | 94/872 [1:44:16<14:40:17, 67.89s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 11%|█ | 95/872 [1:45:25<14:44:46, 68.32s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 11%|█ | 96/872 [1:46:32<14:39:12, 67.98s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 11%|█ | 97/872 [1:47:37<14:26:52, 67.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 11%|█ | 98/872 [1:48:33<13:42:41, 63.77s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 11%|█▏ | 99/872 [1:49:35<13:35:17, 63.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing sst2 validation set: 11%|█▏ | 100/872 [1:50:40<14:14:27, 66.41s/it]\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Task: sst2\n", "Train metrics: {'accuracy_without_watermark': 0.49, 'accuracy_with_watermark': 0.56, 'f1_without_watermark': 0.5714285714285714, 'f1_with_watermark': 0.56}\n", "Validation metrics: {'accuracy_without_watermark': 0.44, 'accuracy_with_watermark': 0.51, 'f1_without_watermark': 0.44, 'f1_with_watermark': 0.5882352941176471}\n", "Processing task: cola\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 0/8551 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 1/8551 [00:32<76:16:46, 32.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 2/8551 [01:39<126:06:35, 53.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 3/8551 [01:43<72:39:30, 30.60s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 4/8551 [02:51<107:39:42, 45.35s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 5/8551 [03:20<93:46:55, 39.51s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 6/8551 [03:34<72:42:46, 30.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 7/8551 [04:41<100:56:31, 42.53s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 8/8551 [05:10<90:37:47, 38.19s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 9/8551 [06:12<108:22:59, 45.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 10/8551 [06:47<100:26:40, 42.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 11/8551 [07:25<97:11:26, 40.97s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 12/8551 [08:25<110:59:15, 46.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 13/8551 [08:56<99:56:54, 42.14s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 14/8551 [10:01<116:16:30, 49.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 15/8551 [11:09<129:27:14, 54.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 16/8551 [11:53<122:09:06, 51.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 17/8551 [12:30<111:36:56, 47.08s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 18/8551 [13:37<126:14:37, 53.26s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 19/8551 [14:45<136:46:45, 57.71s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 20/8551 [15:52<143:20:40, 60.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 21/8551 [16:39<133:10:38, 56.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 22/8551 [17:14<118:12:37, 49.90s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 23/8551 [17:49<107:33:08, 45.40s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 24/8551 [18:09<89:30:25, 37.79s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 25/8551 [18:45<88:37:41, 37.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 26/8551 [19:52<109:19:38, 46.17s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 27/8551 [20:28<102:23:59, 43.25s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 28/8551 [21:34<117:59:27, 49.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 29/8551 [21:58<100:10:07, 42.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 30/8551 [23:06<118:25:43, 50.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 31/8551 [24:15<131:21:28, 55.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 32/8551 [24:48<115:47:02, 48.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 33/8551 [25:35<114:04:06, 48.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 34/8551 [26:21<112:56:26, 47.74s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 35/8551 [27:30<127:26:19, 53.87s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 36/8551 [28:16<122:03:40, 51.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 37/8551 [29:02<117:57:56, 49.88s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 38/8551 [29:47<114:32:29, 48.44s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 39/8551 [30:33<113:02:07, 47.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 40/8551 [31:20<112:08:37, 47.43s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 41/8551 [31:53<102:28:45, 43.35s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 0%| | 42/8551 [32:33<99:55:16, 42.27s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 43/8551 [33:28<108:34:06, 45.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 44/8551 [34:36<124:02:10, 52.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 45/8551 [35:11<111:52:52, 47.35s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 46/8551 [35:58<111:22:20, 47.14s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 47/8551 [37:04<125:18:53, 53.05s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 48/8551 [37:29<104:51:41, 44.40s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 49/8551 [38:35<120:36:01, 51.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 50/8551 [39:43<132:29:28, 56.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 51/8551 [40:46<137:27:57, 58.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 52/8551 [41:00<105:42:12, 44.77s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 53/8551 [41:44<105:34:26, 44.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 54/8551 [42:20<98:54:38, 41.91s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 55/8551 [43:06<101:51:21, 43.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 56/8551 [43:48<101:24:51, 42.98s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 57/8551 [44:21<94:02:55, 39.86s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 58/8551 [44:58<92:05:33, 39.04s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 59/8551 [45:43<96:39:44, 40.98s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 60/8551 [46:29<99:51:21, 42.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 61/8551 [46:54<87:25:26, 37.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 62/8551 [47:31<87:39:49, 37.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 63/8551 [48:37<108:15:40, 45.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 64/8551 [49:45<123:17:10, 52.30s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 65/8551 [50:48<130:59:19, 55.57s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 66/8551 [51:52<136:43:21, 58.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 67/8551 [52:59<143:37:58, 60.95s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 68/8551 [54:05<147:13:47, 62.48s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 69/8551 [54:51<135:32:59, 57.53s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 70/8551 [55:16<112:24:58, 47.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 71/8551 [56:09<115:46:46, 49.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 72/8551 [57:16<128:43:31, 54.65s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 73/8551 [57:45<110:20:14, 46.85s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 74/8551 [58:24<105:05:02, 44.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 75/8551 [59:00<98:29:25, 41.83s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 76/8551 [1:00:05<115:01:41, 48.86s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 77/8551 [1:01:12<127:41:34, 54.25s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 78/8551 [1:01:36<106:49:23, 45.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 79/8551 [1:02:16<102:44:49, 43.66s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 80/8551 [1:02:19<73:49:30, 31.37s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 81/8551 [1:03:04<83:52:34, 35.65s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 82/8551 [1:03:22<70:54:23, 30.14s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 83/8551 [1:04:08<82:13:41, 34.96s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 84/8551 [1:04:42<81:59:41, 34.86s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 85/8551 [1:05:50<105:22:36, 44.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 86/8551 [1:06:49<114:55:31, 48.88s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 87/8551 [1:07:56<127:48:28, 54.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 88/8551 [1:08:58<133:16:52, 56.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 89/8551 [1:10:01<137:24:28, 58.46s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 90/8551 [1:11:03<140:14:53, 59.67s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 91/8551 [1:11:56<135:22:12, 57.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 92/8551 [1:12:38<124:41:05, 53.06s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 93/8551 [1:13:18<115:25:26, 49.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 94/8551 [1:14:26<128:31:41, 54.71s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 95/8551 [1:15:29<134:21:49, 57.20s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 96/8551 [1:16:22<131:36:00, 56.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 97/8551 [1:17:27<137:23:55, 58.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 98/8551 [1:17:48<111:25:53, 47.46s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 99/8551 [1:18:53<123:45:40, 52.71s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola train set: 1%| | 100/8551 [1:19:32<112:02:31, 47.73s/it]\n", "Processing cola validation set: 0%| | 0/1043 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 0%| | 1/1043 [00:45<13:15:52, 45.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 0%| | 2/1043 [01:20<11:25:56, 39.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 0%| | 3/1043 [02:06<12:09:17, 42.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 0%| | 4/1043 [03:02<13:45:17, 47.66s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 0%| | 5/1043 [03:15<10:06:36, 35.06s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 1%| | 6/1043 [04:23<13:21:31, 46.38s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 1%| | 7/1043 [05:26<14:58:04, 52.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 1%| | 8/1043 [06:01<13:18:46, 46.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 1%| | 9/1043 [06:41<12:47:05, 44.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 1%| | 10/1043 [07:15<11:48:33, 41.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 1%| | 11/1043 [08:22<14:06:18, 49.20s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 1%| | 12/1043 [08:58<12:55:28, 45.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 1%| | 13/1043 [09:55<13:58:15, 48.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 1%|▏ | 14/1043 [11:03<15:36:00, 54.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 1%|▏ | 15/1043 [11:50<14:53:40, 52.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 2%|▏ | 16/1043 [12:23<13:17:23, 46.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 2%|▏ | 17/1043 [13:29<14:54:48, 52.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 2%|▏ | 18/1043 [14:16<14:24:56, 50.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 2%|▏ | 19/1043 [15:24<15:55:37, 55.99s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 2%|▏ | 20/1043 [16:33<16:58:43, 59.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 2%|▏ | 21/1043 [17:38<17:25:58, 61.41s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 2%|▏ | 22/1043 [18:37<17:12:46, 60.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 2%|▏ | 23/1043 [19:14<15:09:10, 53.48s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 2%|▏ | 24/1043 [20:22<16:21:40, 57.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 2%|▏ | 25/1043 [21:30<17:12:26, 60.85s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 2%|▏ | 26/1043 [22:37<17:45:48, 62.88s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 3%|▎ | 27/1043 [23:45<18:10:38, 64.41s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 3%|▎ | 28/1043 [24:31<16:35:26, 58.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 3%|▎ | 29/1043 [24:45<12:48:16, 45.46s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 3%|▎ | 30/1043 [25:49<14:19:08, 50.89s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 3%|▎ | 31/1043 [26:25<13:04:39, 46.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 3%|▎ | 32/1043 [27:26<14:14:09, 50.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 3%|▎ | 33/1043 [28:26<15:03:15, 53.66s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 3%|▎ | 34/1043 [29:29<15:49:14, 56.45s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 3%|▎ | 35/1043 [30:12<14:39:20, 52.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 3%|▎ | 36/1043 [31:19<15:50:38, 56.64s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 4%|▎ | 37/1043 [32:26<16:42:56, 59.82s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 4%|▎ | 38/1043 [33:12<15:31:40, 55.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 4%|▎ | 39/1043 [33:51<14:09:31, 50.77s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 4%|▍ | 40/1043 [34:14<11:47:22, 42.32s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 4%|▍ | 41/1043 [35:07<12:42:31, 45.66s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 4%|▍ | 42/1043 [36:07<13:50:59, 49.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 4%|▍ | 43/1043 [36:49<13:12:50, 47.57s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 4%|▍ | 44/1043 [37:51<14:23:47, 51.88s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 4%|▍ | 45/1043 [38:36<13:51:13, 49.97s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 4%|▍ | 46/1043 [39:09<12:23:11, 44.73s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 5%|▍ | 47/1043 [40:00<12:55:05, 46.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 5%|▍ | 48/1043 [41:03<14:13:43, 51.48s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 5%|▍ | 49/1043 [41:16<11:02:49, 40.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 5%|▍ | 50/1043 [41:57<11:08:06, 40.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 5%|▍ | 51/1043 [42:51<12:11:42, 44.26s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 5%|▍ | 52/1043 [43:30<11:45:10, 42.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 5%|▌ | 53/1043 [44:06<11:11:59, 40.73s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 5%|▌ | 54/1043 [44:41<10:43:18, 39.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 5%|▌ | 55/1043 [45:23<10:57:21, 39.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 5%|▌ | 56/1043 [46:27<12:58:28, 47.32s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 5%|▌ | 57/1043 [47:03<11:58:04, 43.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 6%|▌ | 58/1043 [48:11<13:56:21, 50.95s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 6%|▌ | 59/1043 [48:55<13:25:06, 49.09s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 6%|▌ | 60/1043 [49:58<14:31:18, 53.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 6%|▌ | 61/1043 [50:51<14:27:09, 52.98s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 6%|▌ | 62/1043 [51:56<15:27:35, 56.73s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 6%|▌ | 63/1043 [52:59<15:55:26, 58.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 6%|▌ | 64/1043 [54:06<16:39:59, 61.29s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 6%|▌ | 65/1043 [55:11<16:53:22, 62.17s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 6%|▋ | 66/1043 [56:17<17:12:45, 63.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 6%|▋ | 67/1043 [57:25<17:31:55, 64.67s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 7%|▋ | 68/1043 [57:39<13:24:32, 49.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 7%|▋ | 69/1043 [58:47<14:54:44, 55.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 7%|▋ | 70/1043 [59:54<15:53:43, 58.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 7%|▋ | 71/1043 [1:00:54<15:58:32, 59.17s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 7%|▋ | 72/1043 [1:02:02<16:39:52, 61.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 7%|▋ | 73/1043 [1:02:48<15:21:47, 57.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 7%|▋ | 74/1043 [1:03:41<14:58:42, 55.65s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 7%|▋ | 75/1043 [1:04:47<15:50:25, 58.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 7%|▋ | 76/1043 [1:05:54<16:30:06, 61.43s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 7%|▋ | 77/1043 [1:06:23<13:49:54, 51.55s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 7%|▋ | 78/1043 [1:07:00<12:38:26, 47.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 8%|▊ | 79/1043 [1:08:03<13:53:56, 51.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 8%|▊ | 80/1043 [1:08:49<13:23:38, 50.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 8%|▊ | 81/1043 [1:09:35<13:06:08, 49.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 8%|▊ | 82/1043 [1:10:12<12:04:11, 45.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 8%|▊ | 83/1043 [1:11:19<13:52:00, 52.00s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 8%|▊ | 84/1043 [1:12:01<13:03:01, 48.99s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 8%|▊ | 85/1043 [1:12:48<12:50:08, 48.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 8%|▊ | 86/1043 [1:13:56<14:22:33, 54.08s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 8%|▊ | 87/1043 [1:14:48<14:15:01, 53.66s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 8%|▊ | 88/1043 [1:15:53<15:08:43, 57.09s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 9%|▊ | 89/1043 [1:16:54<15:24:41, 58.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 9%|▊ | 90/1043 [1:17:53<15:29:34, 58.53s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 9%|▊ | 91/1043 [1:18:49<15:17:03, 57.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 9%|▉ | 92/1043 [1:19:35<14:17:06, 54.08s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 9%|▉ | 93/1043 [1:19:55<11:32:58, 43.77s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 9%|▉ | 94/1043 [1:21:01<13:18:48, 50.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 9%|▉ | 95/1043 [1:22:08<14:37:15, 55.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 9%|▉ | 96/1043 [1:23:14<15:26:23, 58.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 9%|▉ | 97/1043 [1:24:29<16:42:24, 63.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 9%|▉ | 98/1043 [1:25:09<14:51:24, 56.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 9%|▉ | 99/1043 [1:26:37<17:18:35, 66.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing cola validation set: 10%|▉ | 100/1043 [1:27:23<13:44:06, 52.43s/it]\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Task: cola\n", "Train metrics: {'matthews_corr_without_watermark': -0.09611547479941228, 'matthews_corr_with_watermark': 0.11224602755526586}\n", "Validation metrics: {'matthews_corr_without_watermark': 0.2683870161053685, 'matthews_corr_with_watermark': 0.031219527052723135}\n", "Processing task: mrpc\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 0/3668 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 1/3668 [00:59<60:06:10, 59.00s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 2/3668 [02:26<77:23:38, 76.00s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 3/3668 [03:53<82:14:35, 80.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 4/3668 [05:19<84:19:46, 82.86s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 5/3668 [06:12<73:16:08, 72.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 6/3668 [07:11<68:58:02, 67.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 7/3668 [08:38<75:07:27, 73.87s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 8/3668 [09:35<69:52:37, 68.73s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 9/3668 [10:28<64:37:56, 63.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 10/3668 [11:55<71:58:38, 70.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 11/3668 [13:22<76:54:23, 75.71s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 12/3668 [14:47<79:50:33, 78.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 13/3668 [16:12<81:45:08, 80.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 14/3668 [17:39<83:56:00, 82.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 15/3668 [19:01<83:40:13, 82.46s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 16/3668 [20:09<79:12:30, 78.08s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 17/3668 [21:14<75:10:40, 74.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 0%| | 18/3668 [22:04<67:41:20, 66.76s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 19/3668 [23:02<65:01:22, 64.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 20/3668 [24:11<66:28:36, 65.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 21/3668 [24:59<61:14:06, 60.45s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 22/3668 [25:47<57:16:48, 56.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 23/3668 [26:50<59:17:44, 58.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 24/3668 [27:59<62:30:43, 61.76s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 25/3668 [28:50<59:17:34, 58.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 26/3668 [29:59<62:27:30, 61.74s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 27/3668 [31:08<64:31:48, 63.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 28/3668 [31:52<58:21:23, 57.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 29/3668 [32:40<55:25:16, 54.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 30/3668 [33:49<59:45:11, 59.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 31/3668 [34:37<56:23:26, 55.82s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 32/3668 [35:42<59:03:27, 58.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 33/3668 [36:48<61:31:37, 60.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 34/3668 [37:34<56:58:03, 56.43s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 35/3668 [38:43<60:43:47, 60.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 36/3668 [39:51<62:55:09, 62.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 37/3668 [40:31<56:15:20, 55.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 38/3668 [41:41<60:27:14, 59.95s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 39/3668 [42:26<55:52:31, 55.43s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 40/3668 [43:18<54:56:32, 54.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 41/3668 [44:00<51:14:00, 50.85s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 42/3668 [44:48<50:13:00, 49.86s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 43/3668 [45:37<49:58:20, 49.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 44/3668 [46:47<56:10:54, 55.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%| | 45/3668 [47:55<59:42:40, 59.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%|▏ | 46/3668 [49:00<61:22:45, 61.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%|▏ | 47/3668 [50:09<63:59:39, 63.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%|▏ | 48/3668 [50:34<52:13:57, 51.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%|▏ | 49/3668 [51:44<57:30:54, 57.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%|▏ | 50/3668 [52:52<60:44:20, 60.44s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%|▏ | 51/3668 [54:01<63:27:21, 63.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%|▏ | 52/3668 [55:09<64:52:48, 64.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%|▏ | 53/3668 [56:18<66:07:00, 65.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%|▏ | 54/3668 [57:27<67:14:51, 66.99s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 1%|▏ | 55/3668 [57:54<55:01:38, 54.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 56/3668 [59:22<64:59:08, 64.77s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 57/3668 [1:00:14<61:15:59, 61.08s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 58/3668 [1:01:41<68:53:17, 68.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 59/3668 [1:02:36<64:41:51, 64.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 60/3668 [1:03:00<52:36:22, 52.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 61/3668 [1:04:18<60:21:10, 60.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 62/3668 [1:05:12<58:28:00, 58.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 63/3668 [1:06:30<64:11:05, 64.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 64/3668 [1:07:54<70:11:44, 70.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 65/3668 [1:08:45<64:22:51, 64.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 66/3668 [1:09:43<62:38:14, 62.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 67/3668 [1:10:54<65:11:15, 65.17s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 68/3668 [1:11:55<63:39:55, 63.67s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 69/3668 [1:12:27<54:13:09, 54.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 70/3668 [1:13:50<62:50:02, 62.87s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 71/3668 [1:15:10<68:07:30, 68.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 72/3668 [1:16:34<72:36:08, 72.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 73/3668 [1:17:53<74:31:22, 74.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 74/3668 [1:18:17<59:18:26, 59.41s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 75/3668 [1:19:24<61:48:34, 61.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 76/3668 [1:20:19<59:29:29, 59.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 77/3668 [1:21:29<62:31:17, 62.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 78/3668 [1:22:14<57:15:46, 57.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 79/3668 [1:23:21<60:18:46, 60.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 80/3668 [1:24:30<62:43:26, 62.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 81/3668 [1:25:37<63:52:01, 64.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 82/3668 [1:26:48<65:50:51, 66.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 83/3668 [1:27:26<57:28:17, 57.71s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 84/3668 [1:28:30<59:33:18, 59.82s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 85/3668 [1:29:10<53:21:57, 53.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 86/3668 [1:29:56<51:04:33, 51.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 87/3668 [1:30:55<53:32:36, 53.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 88/3668 [1:32:00<56:53:43, 57.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 89/3668 [1:33:07<59:46:45, 60.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 90/3668 [1:33:56<56:13:56, 56.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 2%|▏ | 91/3668 [1:34:39<52:24:50, 52.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 3%|▎ | 92/3668 [1:35:48<57:11:27, 57.57s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 3%|▎ | 93/3668 [1:36:56<60:20:41, 60.77s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 3%|▎ | 94/3668 [1:37:42<55:46:25, 56.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 3%|▎ | 95/3668 [1:38:50<59:16:32, 59.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 3%|▎ | 96/3668 [1:39:38<55:48:42, 56.25s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 3%|▎ | 97/3668 [1:40:47<59:41:57, 60.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 3%|▎ | 98/3668 [1:41:33<55:13:19, 55.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 3%|▎ | 99/3668 [1:42:32<56:12:53, 56.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc train set: 3%|▎ | 100/3668 [1:43:35<61:36:07, 62.15s/it]\n", "Processing mrpc validation set: 0%| | 0/408 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 0%| | 1/408 [00:47<5:19:11, 47.06s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 0%| | 2/408 [01:54<6:39:04, 58.98s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 1%| | 3/408 [03:02<7:04:50, 62.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 1%| | 4/408 [04:09<7:16:56, 64.89s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 1%| | 5/408 [05:18<7:24:51, 66.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 1%|▏ | 6/408 [06:05<6:40:53, 59.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 2%|▏ | 7/408 [07:14<6:58:48, 62.66s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 2%|▏ | 8/408 [08:18<7:00:15, 63.04s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 2%|▏ | 9/408 [09:25<7:08:40, 64.46s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 2%|▏ | 10/408 [10:30<7:08:28, 64.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 3%|▎ | 11/408 [11:39<7:15:36, 65.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 3%|▎ | 12/408 [12:48<7:20:05, 66.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 3%|▎ | 13/408 [13:30<6:31:42, 59.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 3%|▎ | 14/408 [14:41<6:51:39, 62.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 4%|▎ | 15/408 [15:48<7:00:25, 64.19s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 4%|▍ | 16/408 [16:57<7:08:11, 65.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 4%|▍ | 17/408 [18:05<7:11:22, 66.20s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 4%|▍ | 18/408 [18:48<6:26:29, 59.46s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 5%|▍ | 19/408 [19:48<6:26:07, 59.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 5%|▍ | 20/408 [20:20<5:31:15, 51.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 5%|▌ | 21/408 [21:19<5:46:16, 53.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 5%|▌ | 22/408 [22:25<6:08:36, 57.30s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 6%|▌ | 23/408 [22:58<5:20:20, 49.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 6%|▌ | 24/408 [23:45<5:14:57, 49.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 6%|▌ | 25/408 [24:56<5:54:17, 55.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 6%|▋ | 26/408 [26:01<6:12:33, 58.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 7%|▋ | 27/408 [26:49<5:51:05, 55.29s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 7%|▋ | 28/408 [27:59<6:17:57, 59.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 7%|▋ | 29/408 [28:45<5:50:31, 55.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 7%|▋ | 30/408 [29:39<5:47:43, 55.19s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 8%|▊ | 31/408 [30:49<6:14:20, 59.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 8%|▊ | 32/408 [31:56<6:27:39, 61.86s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 8%|▊ | 33/408 [33:01<6:32:35, 62.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 8%|▊ | 34/408 [34:11<6:45:20, 65.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 9%|▊ | 35/408 [35:34<7:17:44, 70.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 9%|▉ | 36/408 [37:04<7:51:44, 76.09s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 9%|▉ | 37/408 [38:32<8:13:05, 79.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 9%|▉ | 38/408 [39:25<7:22:13, 71.71s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 10%|▉ | 39/408 [40:50<7:46:03, 75.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 10%|▉ | 40/408 [42:14<8:00:04, 78.27s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 10%|█ | 41/408 [43:23<7:41:20, 75.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 10%|█ | 42/408 [44:48<7:58:01, 78.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 11%|█ | 43/408 [46:15<8:12:14, 80.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 11%|█ | 44/408 [47:42<8:20:59, 82.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 11%|█ | 45/408 [48:54<8:01:01, 79.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 11%|█▏ | 46/408 [50:20<8:12:10, 81.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 12%|█▏ | 47/408 [51:47<8:19:24, 83.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 12%|█▏ | 48/408 [53:13<8:23:45, 83.96s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 12%|█▏ | 49/408 [54:33<8:16:18, 82.95s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 12%|█▏ | 50/408 [55:59<8:20:25, 83.87s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 12%|█▎ | 51/408 [57:21<8:14:09, 83.05s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 13%|█▎ | 52/408 [57:56<6:48:55, 68.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 13%|█▎ | 53/408 [59:03<6:43:45, 68.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 13%|█▎ | 54/408 [1:00:07<6:34:31, 66.87s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 13%|█▎ | 55/408 [1:01:16<6:38:09, 67.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 14%|█▎ | 56/408 [1:02:26<6:40:29, 68.27s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 14%|█▍ | 57/408 [1:03:31<6:34:22, 67.41s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 14%|█▍ | 58/408 [1:04:41<6:36:18, 67.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 14%|█▍ | 59/408 [1:05:47<6:32:10, 67.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 15%|█▍ | 60/408 [1:06:57<6:36:30, 68.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 15%|█▍ | 61/408 [1:08:08<6:38:41, 68.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 15%|█▌ | 62/408 [1:08:55<6:00:59, 62.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 15%|█▌ | 63/408 [1:10:00<6:02:47, 63.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 16%|█▌ | 64/408 [1:11:10<6:13:17, 65.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 16%|█▌ | 65/408 [1:11:57<5:42:02, 59.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 16%|█▌ | 66/408 [1:12:39<5:09:44, 54.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 16%|█▋ | 67/408 [1:13:26<4:57:19, 52.32s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 17%|█▋ | 68/408 [1:14:36<5:26:50, 57.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 17%|█▋ | 69/408 [1:15:45<5:44:37, 61.00s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 17%|█▋ | 70/408 [1:16:53<5:55:09, 63.05s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 17%|█▋ | 71/408 [1:18:03<6:05:44, 65.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 18%|█▊ | 72/408 [1:18:19<4:42:40, 50.48s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 18%|█▊ | 73/408 [1:19:05<4:34:45, 49.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 18%|█▊ | 74/408 [1:20:05<4:51:22, 52.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 18%|█▊ | 75/408 [1:20:56<4:48:39, 52.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 19%|█▊ | 76/408 [1:22:01<5:08:37, 55.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 19%|█▉ | 77/408 [1:23:07<5:25:06, 58.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 19%|█▉ | 78/408 [1:24:08<5:27:05, 59.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 19%|█▉ | 79/408 [1:24:53<5:01:39, 55.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 20%|█▉ | 80/408 [1:25:40<4:48:35, 52.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 20%|█▉ | 81/408 [1:26:48<5:11:57, 57.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 20%|██ | 82/408 [1:27:34<4:52:27, 53.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 20%|██ | 83/408 [1:28:25<4:48:13, 53.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 21%|██ | 84/408 [1:29:13<4:37:38, 51.41s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 21%|██ | 85/408 [1:30:22<5:05:51, 56.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 21%|██ | 86/408 [1:31:31<5:24:23, 60.45s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 21%|██▏ | 87/408 [1:32:41<5:39:10, 63.40s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 22%|██▏ | 88/408 [1:33:49<5:45:18, 64.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 22%|██▏ | 89/408 [1:34:38<5:18:57, 59.99s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 22%|██▏ | 90/408 [1:35:25<4:56:53, 56.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 22%|██▏ | 91/408 [1:36:18<4:51:40, 55.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 23%|██▎ | 92/408 [1:37:17<4:56:05, 56.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 23%|██▎ | 93/408 [1:38:10<4:50:47, 55.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 23%|██▎ | 94/408 [1:39:18<5:08:42, 58.99s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 23%|██▎ | 95/408 [1:40:26<5:23:03, 61.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 24%|██▎ | 96/408 [1:41:29<5:22:40, 62.05s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 24%|██▍ | 97/408 [1:42:39<5:34:13, 64.48s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 24%|██▍ | 98/408 [1:43:49<5:41:37, 66.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 24%|██▍ | 99/408 [1:44:58<5:45:27, 67.08s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mrpc validation set: 25%|██▍ | 100/408 [1:45:48<5:25:54, 63.49s/it]\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Task: mrpc\n", "Train metrics: {'accuracy_without_watermark': 0.53, 'accuracy_with_watermark': 0.44, 'f1_without_watermark': 0.6758620689655173, 'f1_with_watermark': 0.5882352941176471}\n", "Validation metrics: {'accuracy_without_watermark': 0.59, 'accuracy_with_watermark': 0.57, 'f1_without_watermark': 0.7210884353741497, 'f1_with_watermark': 0.6993006993006993}\n", "Processing task: qqp\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 0/363846 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 1/363846 [01:07<6791:08:12, 67.19s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 2/363846 [01:53<5564:38:31, 55.06s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 3/363846 [03:01<6161:13:49, 60.96s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 4/363846 [04:03<6182:56:37, 61.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 5/363846 [05:12<6492:36:53, 64.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 6/363846 [05:56<5771:41:36, 57.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 7/363846 [07:01<6055:06:29, 59.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 8/363846 [08:10<6346:03:54, 62.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 9/363846 [09:21<6588:47:27, 65.19s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 10/363846 [10:13<6175:27:05, 61.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 11/363846 [10:54<5576:26:28, 55.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 12/363846 [12:03<5990:48:31, 59.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 13/363846 [13:10<6237:46:32, 61.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 14/363846 [14:19<6454:53:50, 63.87s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 15/363846 [15:28<6588:09:12, 65.19s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 16/363846 [16:31<6539:34:36, 64.71s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 17/363846 [17:21<6099:33:55, 60.35s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 18/363846 [18:26<6230:28:25, 61.65s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 19/363846 [19:35<6440:00:36, 63.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 20/363846 [20:43<6583:17:28, 65.14s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 21/363846 [21:53<6717:55:00, 66.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 22/363846 [23:01<6770:51:17, 67.00s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 23/363846 [24:10<6847:10:27, 67.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 24/363846 [25:17<6826:31:15, 67.55s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 25/363846 [26:24<6782:15:26, 67.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 26/363846 [27:32<6820:56:04, 67.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 27/363846 [28:41<6854:49:08, 67.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 28/363846 [29:49<6871:27:40, 67.99s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 29/363846 [30:48<6592:17:43, 65.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 30/363846 [31:51<6520:40:45, 64.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 31/363846 [32:56<6561:49:04, 64.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 32/363846 [34:05<6672:45:42, 66.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 33/363846 [35:11<6672:14:14, 66.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 34/363846 [35:56<6048:46:07, 59.85s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 35/363846 [37:03<6260:59:15, 61.95s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 36/363846 [37:35<5349:56:23, 52.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 37/363846 [38:22<5163:43:15, 51.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 38/363846 [39:32<5735:50:06, 56.76s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 39/363846 [40:03<4956:54:38, 49.05s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 40/363846 [41:13<5580:36:19, 55.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 41/363846 [42:19<5905:34:07, 58.44s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 42/363846 [43:27<6204:17:03, 61.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 43/363846 [44:33<6359:09:35, 62.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 44/363846 [45:43<6546:45:16, 64.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 45/363846 [46:24<5833:21:51, 57.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 46/363846 [47:00<5191:48:19, 51.38s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 47/363846 [47:44<4942:45:52, 48.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 48/363846 [48:44<5292:08:51, 52.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 49/363846 [49:46<5586:24:22, 55.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 50/363846 [50:52<5917:44:00, 58.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 51/363846 [52:00<6194:38:38, 61.30s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 52/363846 [53:06<6349:31:52, 62.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 53/363846 [54:11<6415:40:44, 63.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 54/363846 [55:20<6571:51:31, 65.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 55/363846 [56:28<6661:38:07, 65.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 56/363846 [57:15<6073:04:46, 60.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 57/363846 [58:07<5843:32:10, 57.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 58/363846 [59:10<5987:44:12, 59.25s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 59/363846 [1:00:18<6252:54:29, 61.88s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 60/363846 [1:01:38<6808:41:16, 67.38s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 61/363846 [1:03:06<7424:26:12, 73.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 62/363846 [1:04:33<7860:01:41, 77.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 63/363846 [1:05:49<7802:57:09, 77.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 64/363846 [1:06:51<7348:12:29, 72.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 65/363846 [1:08:16<7692:14:16, 76.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 66/363846 [1:09:40<7954:21:59, 78.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 67/363846 [1:10:43<7459:01:49, 73.82s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 68/363846 [1:12:06<7760:40:19, 76.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 69/363846 [1:13:03<7141:09:00, 70.67s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 70/363846 [1:14:02<6801:33:34, 67.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 71/363846 [1:15:25<7276:34:58, 72.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 72/363846 [1:16:47<7582:08:43, 75.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 73/363846 [1:18:11<7842:46:29, 77.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 74/363846 [1:19:08<7209:09:01, 71.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 75/363846 [1:20:32<7604:11:42, 75.25s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 76/363846 [1:21:56<7857:21:39, 77.76s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 77/363846 [1:23:08<7704:25:00, 76.25s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 78/363846 [1:24:26<7750:24:13, 76.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 79/363846 [1:25:34<7480:30:49, 74.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 80/363846 [1:26:42<7290:36:33, 72.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 81/363846 [1:27:45<7018:49:28, 69.46s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 82/363846 [1:28:46<6765:31:10, 66.96s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 83/363846 [1:29:24<5885:10:18, 58.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 84/363846 [1:30:28<6057:03:17, 59.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 85/363846 [1:31:35<6261:50:16, 61.97s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 86/363846 [1:32:25<5910:10:21, 58.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 87/363846 [1:33:32<6184:36:15, 61.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 88/363846 [1:34:36<6255:07:44, 61.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 89/363846 [1:35:42<6377:14:19, 63.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 90/363846 [1:36:47<6445:28:44, 63.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 91/363846 [1:37:51<6437:40:57, 63.71s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 92/363846 [1:38:32<5741:36:27, 56.82s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 93/363846 [1:39:41<6110:15:51, 60.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 94/363846 [1:40:37<5979:42:57, 59.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 95/363846 [1:41:23<5574:29:06, 55.17s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 96/363846 [1:42:30<5957:55:59, 58.97s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 97/363846 [1:43:17<5596:17:04, 55.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 98/363846 [1:44:21<5857:20:58, 57.97s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 99/363846 [1:45:27<6100:44:12, 60.38s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp train set: 0%| | 100/363846 [1:46:15<6441:33:11, 63.75s/it]\n", "Processing qqp validation set: 0%| | 0/40430 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 1/40430 [01:08<766:15:24, 68.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 2/40430 [02:17<775:47:51, 69.08s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 3/40430 [03:22<752:03:18, 66.97s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 4/40430 [04:29<751:52:31, 66.96s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 5/40430 [05:35<750:49:03, 66.86s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 6/40430 [05:59<585:51:40, 52.17s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 7/40430 [06:34<523:06:14, 46.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 8/40430 [07:18<512:41:38, 45.66s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 9/40430 [08:25<586:28:14, 52.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 10/40430 [09:09<560:01:23, 49.88s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 11/40430 [10:13<607:40:04, 54.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 12/40430 [11:18<645:19:50, 57.48s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 13/40430 [12:25<676:41:13, 60.27s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 14/40430 [13:33<704:36:34, 62.76s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 15/40430 [14:39<715:47:16, 63.76s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 16/40430 [15:17<627:45:33, 55.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 17/40430 [16:26<672:27:07, 59.90s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 18/40430 [17:32<691:01:46, 61.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 19/40430 [18:41<715:31:09, 63.74s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 20/40430 [19:18<626:56:44, 55.85s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 21/40430 [20:22<654:45:38, 58.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 22/40430 [21:21<657:05:13, 58.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 23/40430 [22:03<601:08:01, 53.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 24/40430 [23:11<649:15:58, 57.85s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 25/40430 [24:19<683:25:15, 60.89s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 26/40430 [25:28<711:08:11, 63.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 27/40430 [26:33<717:28:57, 63.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 28/40430 [27:41<730:46:07, 65.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 29/40430 [28:49<739:14:11, 65.87s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 30/40430 [29:37<680:15:37, 60.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 31/40430 [30:43<698:30:17, 62.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 32/40430 [31:52<722:11:37, 64.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 33/40430 [32:58<724:43:25, 64.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 34/40430 [33:48<676:14:22, 60.26s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 35/40430 [34:51<685:17:36, 61.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 36/40430 [36:00<711:54:58, 63.45s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 37/40430 [37:07<725:26:00, 64.65s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 38/40430 [38:02<691:05:46, 61.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 39/40430 [39:10<712:34:13, 63.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 40/40430 [40:14<715:04:07, 63.73s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 41/40430 [40:47<611:07:06, 54.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 42/40430 [41:45<624:34:03, 55.67s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 43/40430 [42:52<661:13:47, 58.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 44/40430 [43:56<678:45:47, 60.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 45/40430 [44:52<664:57:37, 59.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 46/40430 [45:58<687:11:07, 61.26s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 47/40430 [47:03<697:36:42, 62.19s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 48/40430 [48:10<714:15:12, 63.67s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 49/40430 [49:18<729:17:05, 65.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 50/40430 [50:06<673:27:29, 60.04s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 51/40430 [51:07<673:58:07, 60.09s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 52/40430 [52:10<686:45:52, 61.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 53/40430 [53:18<706:57:14, 63.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 54/40430 [54:18<698:31:18, 62.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 55/40430 [55:25<713:36:01, 63.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 56/40430 [56:27<706:51:46, 63.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 57/40430 [57:12<646:13:26, 57.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 58/40430 [58:18<675:32:59, 60.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 59/40430 [59:27<704:24:37, 62.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 60/40430 [1:00:35<723:46:33, 64.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 61/40430 [1:01:40<725:19:05, 64.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 62/40430 [1:02:49<740:21:19, 66.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 63/40430 [1:03:55<739:23:52, 65.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 64/40430 [1:04:49<698:55:25, 62.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 65/40430 [1:05:57<718:59:48, 64.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 66/40430 [1:07:07<737:21:16, 65.76s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 67/40430 [1:08:15<745:19:28, 66.48s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 68/40430 [1:09:18<732:51:22, 65.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 69/40430 [1:10:09<684:03:22, 61.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 70/40430 [1:11:17<708:50:21, 63.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 71/40430 [1:12:24<720:48:26, 64.30s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 72/40430 [1:13:01<628:37:14, 56.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 73/40430 [1:13:57<629:43:38, 56.17s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 74/40430 [1:15:03<662:28:24, 59.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 75/40430 [1:16:12<694:25:14, 61.95s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 76/40430 [1:17:19<712:56:05, 63.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 77/40430 [1:18:24<718:14:52, 64.08s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 78/40430 [1:19:33<731:47:40, 65.29s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 79/40430 [1:20:37<729:25:20, 65.08s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 80/40430 [1:21:15<638:10:24, 56.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 81/40430 [1:22:23<675:48:17, 60.30s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 82/40430 [1:23:33<706:23:58, 63.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 83/40430 [1:24:39<719:09:50, 64.17s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 84/40430 [1:25:47<730:53:46, 65.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 85/40430 [1:26:48<717:36:46, 64.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 86/40430 [1:27:56<730:05:42, 65.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 87/40430 [1:28:59<721:36:25, 64.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 88/40430 [1:29:49<672:41:15, 60.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 89/40430 [1:30:52<684:45:04, 61.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 90/40430 [1:31:48<666:17:01, 59.46s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 91/40430 [1:32:52<682:44:50, 60.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 92/40430 [1:34:01<707:32:26, 63.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 93/40430 [1:35:08<723:10:38, 64.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 94/40430 [1:36:16<732:59:43, 65.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 95/40430 [1:37:22<734:47:00, 65.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 96/40430 [1:38:28<737:50:57, 65.86s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 97/40430 [1:39:13<667:22:43, 59.57s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 98/40430 [1:40:19<689:55:38, 61.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 99/40430 [1:41:28<714:56:11, 63.82s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qqp validation set: 0%| | 100/40430 [1:42:26<688:31:40, 61.46s/it]\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Task: qqp\n", "Train metrics: {'accuracy_without_watermark': 0.53, 'accuracy_with_watermark': 0.51, 'f1_without_watermark': 0.38961038961038963, 'f1_with_watermark': 0.19672131147540983}\n", "Validation metrics: {'accuracy_without_watermark': 0.54, 'accuracy_with_watermark': 0.59, 'f1_without_watermark': 0.23333333333333334, 'f1_with_watermark': 0.22641509433962265}\n", "Processing task: stsb\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 0/5749 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 1/5749 [01:07<107:51:57, 67.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 2/5749 [02:15<108:20:32, 67.87s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 3/5749 [03:25<109:43:42, 68.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 4/5749 [04:29<106:49:17, 66.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 5/5749 [05:38<108:01:34, 67.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 6/5749 [06:46<108:12:59, 67.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 7/5749 [07:54<108:04:50, 67.76s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 8/5749 [09:02<108:08:26, 67.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 9/5749 [10:11<108:55:17, 68.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 10/5749 [11:21<109:31:29, 68.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 11/5749 [12:30<109:38:59, 68.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 12/5749 [13:39<109:54:35, 68.97s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 13/5749 [14:49<110:08:51, 69.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 14/5749 [15:49<105:56:47, 66.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 15/5749 [16:57<106:23:28, 66.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 16/5749 [18:04<106:30:01, 66.88s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 17/5749 [19:10<106:01:38, 66.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 18/5749 [20:15<105:36:49, 66.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 19/5749 [21:24<106:50:17, 67.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 20/5749 [22:32<107:17:27, 67.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 21/5749 [23:41<108:04:29, 67.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 22/5749 [24:49<107:49:34, 67.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 23/5749 [25:51<104:52:35, 65.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 24/5749 [26:59<106:17:08, 66.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 25/5749 [28:09<107:20:54, 67.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 26/5749 [29:16<107:05:22, 67.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 27/5749 [30:22<106:46:49, 67.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 0%| | 28/5749 [31:32<107:52:57, 67.89s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 29/5749 [32:41<108:35:01, 68.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 30/5749 [33:50<108:55:23, 68.57s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 31/5749 [34:59<109:10:26, 68.73s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 32/5749 [36:02<106:01:49, 66.77s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 33/5749 [37:07<105:21:58, 66.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 34/5749 [38:13<105:20:47, 66.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 35/5749 [39:22<106:21:12, 67.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 36/5749 [40:31<107:16:36, 67.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 37/5749 [41:40<107:43:17, 67.89s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 38/5749 [42:49<108:25:58, 68.35s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 39/5749 [43:58<108:54:04, 68.66s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 40/5749 [45:03<107:08:07, 67.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 41/5749 [46:08<105:44:17, 66.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 42/5749 [47:16<106:11:48, 66.99s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 43/5749 [48:18<104:05:51, 65.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 44/5749 [49:28<105:58:47, 66.88s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 45/5749 [50:37<106:58:22, 67.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 46/5749 [51:47<107:55:55, 68.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 47/5749 [52:52<106:42:04, 67.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 48/5749 [54:00<107:05:33, 67.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 49/5749 [55:10<107:54:23, 68.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 50/5749 [56:12<104:53:45, 66.26s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 51/5749 [57:16<103:52:33, 65.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 52/5749 [58:25<105:25:42, 66.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 53/5749 [59:28<103:46:52, 65.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 54/5749 [1:00:31<102:25:31, 64.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 55/5749 [1:01:38<103:52:16, 65.67s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 56/5749 [1:02:48<105:42:46, 66.85s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 57/5749 [1:03:56<106:24:43, 67.30s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 58/5749 [1:05:04<106:44:43, 67.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 59/5749 [1:06:10<105:59:09, 67.06s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 60/5749 [1:07:17<105:39:49, 66.86s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 61/5749 [1:08:24<105:56:19, 67.05s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 62/5749 [1:09:34<107:07:24, 67.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 63/5749 [1:10:41<106:49:22, 67.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 64/5749 [1:11:49<106:59:07, 67.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 65/5749 [1:12:59<107:50:25, 68.30s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 66/5749 [1:14:05<106:38:56, 67.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 67/5749 [1:15:12<106:35:08, 67.53s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 68/5749 [1:16:20<106:34:50, 67.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 69/5749 [1:17:29<107:18:39, 68.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 70/5749 [1:18:38<107:48:23, 68.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%| | 71/5749 [1:19:47<108:15:21, 68.64s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%|▏ | 72/5749 [1:20:56<108:15:03, 68.65s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%|▏ | 73/5749 [1:22:03<107:26:39, 68.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%|▏ | 74/5749 [1:23:12<108:06:53, 68.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%|▏ | 75/5749 [1:24:20<107:35:55, 68.27s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%|▏ | 76/5749 [1:25:29<108:05:32, 68.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%|▏ | 77/5749 [1:26:38<108:02:10, 68.57s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%|▏ | 78/5749 [1:27:43<106:28:13, 67.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%|▏ | 79/5749 [1:28:53<107:27:49, 68.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%|▏ | 80/5749 [1:30:02<107:57:47, 68.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%|▏ | 81/5749 [1:31:08<106:51:15, 67.87s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%|▏ | 82/5749 [1:32:11<104:32:36, 66.41s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%|▏ | 83/5749 [1:33:19<105:15:30, 66.88s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%|▏ | 84/5749 [1:34:28<105:59:40, 67.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%|▏ | 85/5749 [1:35:31<104:09:15, 66.20s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 1%|▏ | 86/5749 [1:36:40<105:12:33, 66.88s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 2%|▏ | 87/5749 [1:37:49<106:27:14, 67.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 2%|▏ | 88/5749 [1:38:58<107:04:34, 68.09s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 2%|▏ | 89/5749 [1:40:07<107:26:01, 68.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 2%|▏ | 90/5749 [1:41:16<107:40:19, 68.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 2%|▏ | 91/5749 [1:42:26<108:14:25, 68.87s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 2%|▏ | 92/5749 [1:43:35<108:28:02, 69.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 2%|▏ | 93/5749 [1:44:42<107:25:20, 68.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 2%|▏ | 94/5749 [1:45:51<107:25:55, 68.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 2%|▏ | 95/5749 [1:46:50<102:59:07, 65.57s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 2%|▏ | 96/5749 [1:47:57<103:43:12, 66.05s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 2%|▏ | 97/5749 [1:49:06<105:19:56, 67.09s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 2%|▏ | 98/5749 [1:50:14<105:46:11, 67.38s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 2%|▏ | 99/5749 [1:51:23<106:11:51, 67.67s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb train set: 2%|▏ | 100/5749 [1:52:31<105:56:59, 67.52s/it]\n", "Processing stsb validation set: 0%| | 0/1500 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 0%| | 1/1500 [01:08<28:39:03, 68.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 0%| | 2/1500 [02:15<28:08:59, 67.65s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 0%| | 3/1500 [03:24<28:19:32, 68.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 0%| | 4/1500 [04:30<27:54:37, 67.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 0%| | 5/1500 [05:32<27:15:36, 65.64s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 0%| | 6/1500 [06:41<27:35:11, 66.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 0%| | 7/1500 [07:46<27:27:50, 66.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 1%| | 8/1500 [08:54<27:36:25, 66.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 1%| | 9/1500 [10:01<27:36:58, 66.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 1%| | 10/1500 [11:02<26:54:52, 65.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 1%| | 11/1500 [12:10<27:19:44, 66.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 1%| | 12/1500 [13:13<26:55:55, 65.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 1%| | 13/1500 [14:23<27:25:51, 66.41s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 1%| | 14/1500 [15:30<27:31:23, 66.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 1%| | 15/1500 [16:39<27:46:43, 67.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 1%| | 16/1500 [17:46<27:40:51, 67.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 1%| | 17/1500 [18:47<26:54:50, 65.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 1%| | 18/1500 [19:56<27:25:29, 66.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 1%|▏ | 19/1500 [21:02<27:18:18, 66.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 1%|▏ | 20/1500 [22:04<26:46:55, 65.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 1%|▏ | 21/1500 [23:13<27:09:48, 66.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 1%|▏ | 22/1500 [24:21<27:26:46, 66.85s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 2%|▏ | 23/1500 [25:29<27:31:53, 67.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 2%|▏ | 24/1500 [26:37<27:36:54, 67.35s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 2%|▏ | 25/1500 [27:45<27:42:15, 67.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 2%|▏ | 26/1500 [28:47<27:01:17, 66.00s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 2%|▏ | 27/1500 [29:52<26:47:43, 65.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 2%|▏ | 28/1500 [31:01<27:16:26, 66.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 2%|▏ | 29/1500 [32:08<27:13:05, 66.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 2%|▏ | 30/1500 [33:16<27:26:53, 67.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 2%|▏ | 31/1500 [34:26<27:46:49, 68.08s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 2%|▏ | 32/1500 [35:31<27:21:58, 67.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 2%|▏ | 33/1500 [36:34<26:48:03, 65.77s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 2%|▏ | 34/1500 [37:37<26:26:14, 64.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 2%|▏ | 35/1500 [38:44<26:41:09, 65.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 2%|▏ | 36/1500 [39:52<27:02:17, 66.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 2%|▏ | 37/1500 [41:02<27:25:45, 67.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 3%|▎ | 38/1500 [42:12<27:40:35, 68.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 3%|▎ | 39/1500 [43:21<27:42:02, 68.26s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 3%|▎ | 40/1500 [44:27<27:26:54, 67.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 3%|▎ | 41/1500 [45:34<27:23:21, 67.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 3%|▎ | 42/1500 [46:43<27:34:32, 68.09s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 3%|▎ | 43/1500 [47:53<27:41:50, 68.44s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 3%|▎ | 44/1500 [49:00<27:31:24, 68.05s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 3%|▎ | 45/1500 [50:07<27:24:45, 67.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 3%|▎ | 46/1500 [51:13<27:10:04, 67.27s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 3%|▎ | 47/1500 [52:23<27:24:52, 67.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 3%|▎ | 48/1500 [53:32<27:32:36, 68.29s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 3%|▎ | 49/1500 [54:40<27:29:37, 68.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 3%|▎ | 50/1500 [55:43<26:49:52, 66.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 3%|▎ | 51/1500 [56:51<27:03:10, 67.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 3%|▎ | 52/1500 [57:59<27:07:12, 67.43s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 4%|▎ | 53/1500 [59:09<27:21:12, 68.05s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 4%|▎ | 54/1500 [1:00:18<27:31:31, 68.53s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 4%|▎ | 55/1500 [1:01:26<27:26:43, 68.38s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 4%|▎ | 56/1500 [1:02:33<27:13:47, 67.89s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 4%|▍ | 57/1500 [1:03:35<26:32:03, 66.20s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 4%|▍ | 58/1500 [1:04:45<26:54:46, 67.19s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 4%|▍ | 59/1500 [1:05:53<27:02:08, 67.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 4%|▍ | 60/1500 [1:07:02<27:11:26, 67.98s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 4%|▍ | 61/1500 [1:08:07<26:45:19, 66.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 4%|▍ | 62/1500 [1:09:16<27:03:17, 67.73s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 4%|▍ | 63/1500 [1:10:25<27:08:52, 68.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 4%|▍ | 64/1500 [1:11:33<27:11:06, 68.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 4%|▍ | 65/1500 [1:12:40<26:59:06, 67.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 4%|▍ | 66/1500 [1:13:42<26:15:22, 65.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 4%|▍ | 67/1500 [1:14:49<26:24:26, 66.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 5%|▍ | 68/1500 [1:15:59<26:45:38, 67.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 5%|▍ | 69/1500 [1:17:08<27:01:19, 67.98s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 5%|▍ | 70/1500 [1:18:16<26:54:55, 67.76s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 5%|▍ | 71/1500 [1:19:21<26:38:12, 67.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 5%|▍ | 72/1500 [1:20:30<26:49:23, 67.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 5%|▍ | 73/1500 [1:21:40<27:04:52, 68.32s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 5%|▍ | 74/1500 [1:22:48<27:04:53, 68.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 5%|▌ | 75/1500 [1:23:57<27:02:11, 68.30s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 5%|▌ | 76/1500 [1:25:03<26:48:38, 67.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 5%|▌ | 77/1500 [1:26:10<26:40:15, 67.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 5%|▌ | 78/1500 [1:27:15<26:21:32, 66.73s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 5%|▌ | 79/1500 [1:28:24<26:39:59, 67.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 5%|▌ | 80/1500 [1:29:33<26:49:25, 68.00s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 5%|▌ | 81/1500 [1:30:40<26:39:59, 67.65s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 5%|▌ | 82/1500 [1:31:49<26:46:43, 67.99s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 6%|▌ | 83/1500 [1:32:57<26:49:26, 68.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 6%|▌ | 84/1500 [1:34:06<26:52:00, 68.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 6%|▌ | 85/1500 [1:35:13<26:42:01, 67.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 6%|▌ | 86/1500 [1:36:21<26:41:08, 67.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 6%|▌ | 87/1500 [1:37:31<26:53:14, 68.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 6%|▌ | 88/1500 [1:38:39<26:45:40, 68.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 6%|▌ | 89/1500 [1:39:45<26:30:49, 67.65s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 6%|▌ | 90/1500 [1:40:55<26:45:26, 68.32s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 6%|▌ | 91/1500 [1:42:03<26:45:30, 68.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 6%|▌ | 92/1500 [1:43:07<26:11:12, 66.95s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 6%|▌ | 93/1500 [1:44:13<26:02:38, 66.64s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 6%|▋ | 94/1500 [1:45:22<26:21:55, 67.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 6%|▋ | 95/1500 [1:46:30<26:23:00, 67.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 6%|▋ | 96/1500 [1:47:37<26:19:52, 67.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 6%|▋ | 97/1500 [1:48:47<26:32:20, 68.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 7%|▋ | 98/1500 [1:49:56<26:35:30, 68.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 7%|▋ | 99/1500 [1:51:05<26:42:50, 68.64s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing stsb validation set: 7%|▋ | 100/1500 [1:52:13<26:11:09, 67.34s/it]\n", "/var/folders/8q/4np1n05x6wdcmh29jq9rpp840000gn/T/ipykernel_72349/1105967355.py:154: ConstantInputWarning: An input array is constant; the correlation coefficient is not defined.\n", " metrics[\"pearson_corr_without_watermark\"] = pearsonr(true_scores, pred_scores_without_watermark)[0]\n", "/var/folders/8q/4np1n05x6wdcmh29jq9rpp840000gn/T/ipykernel_72349/1105967355.py:156: ConstantInputWarning: An input array is constant; the correlation coefficient is not defined.\n", " metrics[\"spearman_corr_without_watermark\"] = spearmanr(true_scores, pred_scores_without_watermark)[0]\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Task: stsb\n", "Train metrics: {'pearson_corr_without_watermark': nan, 'pearson_corr_with_watermark': -0.3385932975390179, 'spearman_corr_without_watermark': nan, 'spearman_corr_with_watermark': -0.3389426353569145}\n", "Validation metrics: {'pearson_corr_without_watermark': 0.01675197019312319, 'pearson_corr_with_watermark': -0.0999659022196252, 'spearman_corr_without_watermark': -0.041560976173932014, 'spearman_corr_with_watermark': -0.07632988977600694}\n", "Processing task: mnli\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 0/392702 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 1/392702 [01:03<6980:35:15, 63.99s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 2/392702 [02:15<7455:21:51, 68.35s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 3/392702 [03:24<7515:18:01, 68.90s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 4/392702 [04:34<7539:16:13, 69.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 5/392702 [05:42<7514:19:03, 68.89s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 6/392702 [06:20<6364:30:05, 58.35s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 7/392702 [07:29<6727:25:07, 61.67s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 8/392702 [08:38<6996:34:42, 64.14s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 9/392702 [09:41<6954:25:59, 63.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 10/392702 [10:52<7194:41:37, 65.96s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 11/392702 [12:00<7270:36:30, 66.65s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 12/392702 [13:02<7104:18:20, 65.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 13/392702 [14:10<7217:30:16, 66.17s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 14/392702 [15:17<7240:23:02, 66.38s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 15/392702 [16:28<7384:20:09, 67.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 16/392702 [17:36<7399:43:18, 67.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 17/392702 [18:46<7453:00:02, 68.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 18/392702 [19:50<7328:39:07, 67.19s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 19/392702 [20:52<7152:17:43, 65.57s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 20/392702 [22:02<7290:13:39, 66.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 21/392702 [23:12<7395:59:57, 67.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 22/392702 [24:20<7392:48:02, 67.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 23/392702 [25:29<7445:01:13, 68.25s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 24/392702 [26:36<7394:28:06, 67.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 25/392702 [27:41<7330:43:12, 67.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 26/392702 [28:53<7474:25:07, 68.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 27/392702 [30:03<7516:09:52, 68.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 28/392702 [31:09<7437:18:39, 68.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 29/392702 [32:19<7491:39:05, 68.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 30/392702 [33:29<7516:43:18, 68.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 31/392702 [34:41<7615:57:12, 69.82s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 32/392702 [35:50<7586:58:13, 69.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 33/392702 [36:58<7534:23:53, 69.08s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 34/392702 [38:05<7474:02:25, 68.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 35/392702 [39:19<7649:11:40, 70.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 36/392702 [40:30<7674:21:00, 70.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 37/392702 [41:16<6905:04:51, 63.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 38/392702 [42:19<6873:17:33, 63.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 39/392702 [43:28<7090:24:35, 65.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 40/392702 [44:37<7208:14:41, 66.09s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 41/392702 [45:47<7348:50:11, 67.38s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 42/392702 [46:56<7403:05:55, 67.87s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 43/392702 [48:04<7389:21:05, 67.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 44/392702 [49:14<7461:57:55, 68.41s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 45/392702 [50:05<6899:58:00, 63.26s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 46/392702 [51:14<7084:58:51, 64.96s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 47/392702 [52:23<7220:29:26, 66.20s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 48/392702 [53:32<7303:15:33, 66.96s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 49/392702 [54:41<7392:36:19, 67.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 50/392702 [55:52<7479:17:24, 68.57s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 51/392702 [56:57<7371:14:11, 67.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 52/392702 [58:04<7359:12:29, 67.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 53/392702 [58:54<6770:17:49, 62.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 54/392702 [1:00:02<6972:19:52, 63.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 55/392702 [1:01:09<7063:30:54, 64.76s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 56/392702 [1:02:17<7189:31:12, 65.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 57/392702 [1:03:05<6586:14:19, 60.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 58/392702 [1:04:13<6829:41:11, 62.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 59/392702 [1:05:07<6554:37:41, 60.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 60/392702 [1:06:15<6809:48:08, 62.44s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 61/392702 [1:07:24<7038:03:30, 64.53s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 62/392702 [1:08:34<7223:18:46, 66.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 63/392702 [1:09:43<7312:27:44, 67.05s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 64/392702 [1:10:53<7397:41:44, 67.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 65/392702 [1:11:41<6761:12:34, 61.99s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 66/392702 [1:12:48<6906:47:56, 63.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 67/392702 [1:14:01<7239:06:10, 66.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 68/392702 [1:15:10<7311:40:35, 67.04s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 69/392702 [1:16:18<7332:19:13, 67.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 70/392702 [1:17:25<7327:54:15, 67.19s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 71/392702 [1:18:33<7370:40:09, 67.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 72/392702 [1:19:45<7513:32:34, 68.89s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 73/392702 [1:20:53<7492:54:12, 68.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 74/392702 [1:21:40<6765:17:36, 62.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 75/392702 [1:22:48<6947:30:15, 63.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 76/392702 [1:23:55<7083:13:54, 64.95s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 77/392702 [1:24:51<6764:47:23, 62.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 78/392702 [1:25:56<6874:57:03, 63.04s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 79/392702 [1:27:06<7101:43:32, 65.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 80/392702 [1:28:15<7237:53:14, 66.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 81/392702 [1:29:22<7251:51:11, 66.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 82/392702 [1:30:28<7226:25:56, 66.26s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 83/392702 [1:31:36<7308:07:44, 67.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 84/392702 [1:32:47<7429:46:53, 68.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 85/392702 [1:34:00<7589:00:44, 69.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 86/392702 [1:34:53<7026:38:17, 64.43s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 87/392702 [1:35:59<7086:53:05, 64.98s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 88/392702 [1:37:09<7246:39:26, 66.45s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 89/392702 [1:38:19<7375:26:44, 67.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 90/392702 [1:39:29<7435:47:02, 68.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 91/392702 [1:40:41<7561:53:05, 69.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 92/392702 [1:41:30<6921:34:02, 63.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 93/392702 [1:42:38<7060:37:57, 64.74s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 94/392702 [1:43:49<7255:36:49, 66.53s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 95/392702 [1:44:57<7310:12:19, 67.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 96/392702 [1:46:07<7392:52:53, 67.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 97/392702 [1:47:17<7470:42:25, 68.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 98/392702 [1:48:26<7507:56:37, 68.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 99/392702 [1:49:14<6804:35:38, 62.40s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli train set: 0%| | 100/392702 [1:50:20<7220:26:08, 66.21s/it]\n", "Processing mnli validation_matched set: 0%| | 0/9815 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 1/9815 [01:09<189:31:27, 69.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 2/9815 [02:19<189:57:22, 69.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 3/9815 [03:26<187:10:14, 68.67s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 4/9815 [04:35<187:31:47, 68.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 5/9815 [05:43<185:56:33, 68.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 6/9815 [06:50<185:34:03, 68.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 7/9815 [08:00<186:58:09, 68.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 8/9815 [09:12<189:29:43, 69.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 9/9815 [10:22<190:03:32, 69.77s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 10/9815 [11:30<188:31:49, 69.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 11/9815 [12:38<187:36:27, 68.89s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 12/9815 [13:48<188:35:32, 69.26s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 13/9815 [15:01<191:37:56, 70.38s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 14/9815 [16:09<189:35:51, 69.64s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 15/9815 [17:23<192:47:37, 70.82s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 16/9815 [18:32<191:38:42, 70.41s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 17/9815 [19:41<190:03:45, 69.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 18/9815 [20:52<191:08:32, 70.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 19/9815 [21:58<188:03:47, 69.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 20/9815 [23:07<188:03:37, 69.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 21/9815 [24:16<188:01:29, 69.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 22/9815 [25:07<172:29:18, 63.41s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 23/9815 [26:17<178:08:36, 65.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 24/9815 [27:26<180:44:02, 66.45s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 25/9815 [28:30<179:05:24, 65.86s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 26/9815 [29:37<180:14:18, 66.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 27/9815 [30:40<177:10:18, 65.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 28/9815 [31:49<180:47:53, 66.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 29/9815 [32:57<181:57:33, 66.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 30/9815 [34:06<183:09:45, 67.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 31/9815 [35:12<182:12:50, 67.05s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 32/9815 [36:23<185:13:59, 68.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 33/9815 [37:31<185:27:39, 68.25s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 34/9815 [38:42<187:28:11, 69.00s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 35/9815 [39:48<184:47:08, 68.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 36/9815 [40:55<184:09:16, 67.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 37/9815 [42:01<182:49:10, 67.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 38/9815 [43:07<181:25:55, 66.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 39/9815 [44:16<183:26:44, 67.55s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 40/9815 [45:23<182:44:01, 67.30s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 41/9815 [46:09<165:03:47, 60.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 42/9815 [47:12<167:28:08, 61.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 43/9815 [48:21<173:09:33, 63.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 44/9815 [49:31<178:36:02, 65.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 45/9815 [50:35<177:05:27, 65.25s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 46/9815 [51:43<178:53:05, 65.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 47/9815 [52:45<175:32:25, 64.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 48/9815 [53:51<176:41:53, 65.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 0%| | 49/9815 [54:58<178:28:55, 65.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 50/9815 [55:49<166:06:51, 61.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 51/9815 [56:57<172:01:30, 63.43s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 52/9815 [58:05<175:41:09, 64.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 53/9815 [59:07<172:54:29, 63.76s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 54/9815 [1:00:20<180:38:06, 66.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 55/9815 [1:01:51<200:03:41, 73.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 56/9815 [1:03:22<214:11:52, 79.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 57/9815 [1:04:51<222:05:47, 81.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 58/9815 [1:06:17<225:36:07, 83.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 59/9815 [1:07:43<228:17:55, 84.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 60/9815 [1:09:16<235:22:40, 86.86s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 61/9815 [1:10:20<216:33:32, 79.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 62/9815 [1:11:43<218:33:07, 80.67s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 63/9815 [1:13:09<223:35:49, 82.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 64/9815 [1:14:32<223:26:07, 82.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 65/9815 [1:15:58<226:04:04, 83.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 66/9815 [1:17:23<227:36:35, 84.05s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 67/9815 [1:18:49<229:26:22, 84.73s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 68/9815 [1:20:01<219:14:29, 80.98s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 69/9815 [1:21:08<207:31:04, 76.65s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 70/9815 [1:22:35<215:52:06, 79.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 71/9815 [1:24:02<221:58:15, 82.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 72/9815 [1:25:30<226:49:42, 83.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 73/9815 [1:26:58<229:42:02, 84.88s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 74/9815 [1:28:26<232:11:10, 85.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 75/9815 [1:29:41<223:35:46, 82.64s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 76/9815 [1:31:07<226:32:42, 83.74s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 77/9815 [1:32:37<231:11:15, 85.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 78/9815 [1:34:02<230:50:18, 85.35s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 79/9815 [1:35:28<231:29:58, 85.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 80/9815 [1:36:57<234:27:29, 86.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 81/9815 [1:38:25<235:12:02, 86.99s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 82/9815 [1:39:42<226:45:17, 83.87s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 83/9815 [1:40:50<214:01:21, 79.17s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 84/9815 [1:42:00<207:09:09, 76.64s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 85/9815 [1:43:06<198:17:40, 73.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 86/9815 [1:44:13<192:56:01, 71.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 87/9815 [1:45:24<192:49:59, 71.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 88/9815 [1:46:32<189:35:15, 70.17s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 89/9815 [1:47:38<186:53:00, 69.17s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 90/9815 [1:48:47<186:42:29, 69.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 91/9815 [1:49:56<186:09:44, 68.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 92/9815 [1:51:06<187:20:37, 69.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 93/9815 [1:52:16<187:20:31, 69.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 94/9815 [1:53:25<187:31:29, 69.45s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 95/9815 [1:54:34<187:11:47, 69.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 96/9815 [1:55:44<187:03:53, 69.29s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 97/9815 [1:56:50<184:42:11, 68.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 98/9815 [1:57:58<184:33:09, 68.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 99/9815 [1:59:08<185:27:53, 68.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing mnli validation_matched set: 1%| | 100/9815 [1:59:57<194:13:41, 71.97s/it]\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Task: mnli\n", "Train metrics: {'accuracy_without_watermark': 0.47, 'accuracy_with_watermark': 0.37, 'f1_without_watermark': 0.39293604945778854, 'f1_with_watermark': 0.24262017885423737}\n", "Validation metrics: {'accuracy_without_watermark': 0.37, 'accuracy_with_watermark': 0.35, 'f1_without_watermark': 0.26940892298948566, 'f1_with_watermark': 0.25000682333033103}\n", "Processing task: qnli\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 0/104743 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 1/104743 [01:15<2183:47:59, 75.06s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 2/104743 [02:07<1804:31:54, 62.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 3/104743 [03:14<1859:51:30, 63.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 4/104743 [04:09<1764:28:50, 60.65s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 5/104743 [05:08<1744:44:05, 59.97s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 6/104743 [06:15<1810:07:52, 62.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 7/104743 [07:14<1787:38:00, 61.44s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 8/104743 [08:24<1858:35:21, 63.88s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 9/104743 [09:34<1917:34:13, 65.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 10/104743 [10:26<1792:25:59, 61.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 11/104743 [11:37<1875:38:08, 64.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 12/104743 [12:48<1932:59:42, 66.44s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 13/104743 [13:50<1899:19:24, 65.29s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 14/104743 [14:07<1469:40:03, 50.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 15/104743 [15:17<1638:13:10, 56.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 16/104743 [16:25<1740:44:16, 59.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 17/104743 [17:35<1833:13:37, 63.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 18/104743 [18:46<1906:54:16, 65.55s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 19/104743 [19:56<1943:22:44, 66.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 20/104743 [21:07<1974:46:14, 67.89s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 21/104743 [22:17<2000:22:47, 68.77s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 22/104743 [23:14<1889:55:35, 64.97s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 23/104743 [24:24<1935:36:05, 66.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 24/104743 [25:13<1782:32:23, 61.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 25/104743 [26:19<1824:20:01, 62.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 26/104743 [27:26<1861:24:16, 63.99s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 27/104743 [28:13<1718:14:52, 59.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 28/104743 [29:25<1823:15:08, 62.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 29/104743 [30:35<1889:33:48, 64.96s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 30/104743 [31:39<1882:18:15, 64.71s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 31/104743 [32:22<1691:31:18, 58.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 32/104743 [33:31<1786:12:20, 61.41s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 33/104743 [34:42<1875:23:34, 64.48s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 34/104743 [35:54<1936:55:29, 66.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 35/104743 [36:41<1766:10:02, 60.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 36/104743 [37:22<1590:07:32, 54.67s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 37/104743 [38:31<1721:41:04, 59.19s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 38/104743 [39:42<1821:05:43, 62.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 39/104743 [40:54<1904:38:27, 65.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 40/104743 [41:41<1747:13:13, 60.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 41/104743 [42:52<1835:11:34, 63.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 42/104743 [44:03<1905:31:09, 65.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 43/104743 [45:13<1950:10:19, 67.05s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 44/104743 [46:24<1981:51:14, 68.14s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 45/104743 [47:34<1998:36:44, 68.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 46/104743 [48:43<1995:20:08, 68.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 47/104743 [49:55<2027:29:14, 69.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 48/104743 [51:08<2053:30:56, 70.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 49/104743 [52:17<2042:28:03, 70.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 50/104743 [53:28<2046:51:08, 70.38s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 51/104743 [54:37<2040:12:27, 70.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 52/104743 [55:40<1974:01:21, 67.88s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 53/104743 [56:51<2006:58:36, 69.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 54/104743 [58:01<2007:16:36, 69.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 55/104743 [58:59<1918:43:42, 65.98s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 56/104743 [1:00:07<1934:58:44, 66.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 57/104743 [1:00:59<1809:44:13, 62.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 58/104743 [1:02:11<1891:42:44, 65.05s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 59/104743 [1:03:10<1835:32:20, 63.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 60/104743 [1:04:20<1900:06:36, 65.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 61/104743 [1:05:32<1955:33:46, 67.25s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 62/104743 [1:06:40<1963:04:35, 67.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 63/104743 [1:07:50<1986:17:40, 68.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 64/104743 [1:09:01<2003:52:15, 68.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 65/104743 [1:10:11<2016:54:29, 69.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 66/104743 [1:11:21<2021:54:48, 69.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 67/104743 [1:12:26<1983:47:37, 68.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 68/104743 [1:13:35<1987:53:10, 68.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 69/104743 [1:14:46<2012:14:19, 69.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 70/104743 [1:15:57<2028:39:49, 69.77s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 71/104743 [1:17:08<2036:00:17, 70.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 72/104743 [1:18:16<2017:40:36, 69.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 73/104743 [1:19:11<1896:09:32, 65.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 74/104743 [1:20:23<1957:59:14, 67.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 75/104743 [1:21:35<1991:40:37, 68.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 76/104743 [1:22:46<2017:38:35, 69.40s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 77/104743 [1:23:33<1824:14:05, 62.74s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 78/104743 [1:24:44<1896:16:28, 65.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 79/104743 [1:25:33<1755:36:34, 60.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 80/104743 [1:26:15<1590:03:46, 54.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 81/104743 [1:27:25<1721:55:02, 59.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 82/104743 [1:28:35<1817:28:01, 62.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 83/104743 [1:29:25<1710:38:23, 58.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 84/104743 [1:30:32<1784:10:15, 61.37s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 85/104743 [1:31:43<1864:22:52, 64.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 86/104743 [1:32:47<1867:04:45, 64.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 87/104743 [1:33:57<1912:20:04, 65.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 88/104743 [1:35:02<1912:00:38, 65.77s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 89/104743 [1:36:11<1934:40:57, 66.55s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 90/104743 [1:36:55<1738:09:26, 59.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 91/104743 [1:38:06<1841:07:25, 63.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 92/104743 [1:39:19<1921:39:35, 66.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 93/104743 [1:40:09<1779:18:28, 61.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 94/104743 [1:41:19<1854:26:09, 63.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 95/104743 [1:42:30<1920:18:53, 66.06s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 96/104743 [1:43:36<1918:39:17, 66.00s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 97/104743 [1:44:39<1893:39:55, 65.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 98/104743 [1:45:38<1841:46:53, 63.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 99/104743 [1:46:44<1866:54:58, 64.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli train set: 0%| | 100/104743 [1:47:50<1880:55:17, 64.71s/it]\n", "Processing qnli validation set: 0%| | 0/5463 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 1/5463 [01:03<96:05:36, 63.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 2/5463 [02:14<103:12:37, 68.04s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 3/5463 [03:21<102:30:22, 67.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 4/5463 [04:28<102:08:29, 67.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 5/5463 [05:40<104:18:28, 68.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 6/5463 [06:51<105:48:53, 69.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 7/5463 [07:41<95:40:34, 63.13s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 8/5463 [08:51<99:13:25, 65.48s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 9/5463 [09:50<95:52:35, 63.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 10/5463 [11:00<98:55:44, 65.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 11/5463 [11:21<78:30:07, 51.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 12/5463 [12:23<83:17:49, 55.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 13/5463 [13:34<90:30:22, 59.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 14/5463 [14:31<89:14:52, 58.96s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 15/5463 [15:38<92:55:25, 61.40s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 16/5463 [16:51<98:13:02, 64.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 17/5463 [18:05<102:19:39, 67.64s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 18/5463 [19:11<101:33:46, 67.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 19/5463 [20:16<100:38:29, 66.55s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 20/5463 [21:07<93:28:51, 61.83s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 21/5463 [22:00<89:32:56, 59.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 22/5463 [23:11<94:56:56, 62.82s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 23/5463 [24:20<97:34:27, 64.57s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 24/5463 [25:24<97:10:31, 64.32s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 25/5463 [26:35<100:23:00, 66.45s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 26/5463 [27:46<102:08:16, 67.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 0%| | 27/5463 [28:54<102:16:00, 67.73s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 28/5463 [29:42<93:30:21, 61.94s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 29/5463 [30:43<93:05:29, 61.67s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 30/5463 [31:56<98:03:35, 64.98s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 31/5463 [33:07<100:45:24, 66.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 32/5463 [34:18<102:36:32, 68.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 33/5463 [34:59<90:20:10, 59.89s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 34/5463 [36:07<94:05:13, 62.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 35/5463 [37:02<91:03:47, 60.40s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 36/5463 [38:13<95:30:13, 63.35s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 37/5463 [39:19<96:59:55, 64.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 38/5463 [40:29<99:25:34, 65.98s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 39/5463 [41:33<98:28:51, 65.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 40/5463 [42:19<89:35:04, 59.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 41/5463 [43:26<92:49:27, 61.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 42/5463 [44:35<96:10:19, 63.87s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 43/5463 [45:45<99:13:40, 65.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 44/5463 [46:56<101:15:21, 67.27s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 45/5463 [48:04<101:31:54, 67.46s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 46/5463 [49:07<99:36:04, 66.19s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 47/5463 [50:16<100:56:16, 67.09s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 48/5463 [51:28<103:11:49, 68.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 49/5463 [52:12<92:02:08, 61.20s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 50/5463 [53:23<96:31:46, 64.20s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 51/5463 [54:35<99:44:02, 66.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 52/5463 [55:42<100:01:19, 66.55s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 53/5463 [56:51<101:18:53, 67.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 54/5463 [58:03<103:09:59, 68.66s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 55/5463 [59:09<102:12:39, 68.04s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 56/5463 [1:00:21<103:48:23, 69.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 57/5463 [1:01:30<103:34:37, 68.97s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 58/5463 [1:02:40<104:22:55, 69.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 59/5463 [1:03:53<105:43:02, 70.43s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 60/5463 [1:05:03<105:24:38, 70.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 61/5463 [1:06:13<105:19:19, 70.19s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 62/5463 [1:07:20<103:59:19, 69.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 63/5463 [1:08:34<106:03:54, 70.71s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 64/5463 [1:09:46<106:42:22, 71.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 65/5463 [1:10:49<102:47:18, 68.55s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 66/5463 [1:11:59<103:44:22, 69.20s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 67/5463 [1:13:04<101:44:51, 67.88s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%| | 68/5463 [1:14:13<102:07:49, 68.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%|▏ | 69/5463 [1:15:19<100:57:07, 67.38s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%|▏ | 70/5463 [1:16:14<95:24:23, 63.69s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%|▏ | 71/5463 [1:17:26<99:12:04, 66.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%|▏ | 72/5463 [1:18:33<99:49:24, 66.66s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%|▏ | 73/5463 [1:19:44<101:44:01, 67.95s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%|▏ | 74/5463 [1:20:43<97:22:56, 65.05s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%|▏ | 75/5463 [1:21:47<97:12:33, 64.95s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%|▏ | 76/5463 [1:22:30<86:58:19, 58.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%|▏ | 77/5463 [1:23:38<91:40:44, 61.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%|▏ | 78/5463 [1:24:44<93:37:41, 62.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%|▏ | 79/5463 [1:25:35<88:28:19, 59.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%|▏ | 80/5463 [1:26:15<79:45:14, 53.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 1%|▏ | 81/5463 [1:27:26<87:51:34, 58.77s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 82/5463 [1:28:37<93:21:43, 62.46s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 83/5463 [1:29:47<96:39:55, 64.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 84/5463 [1:30:58<99:35:24, 66.65s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 85/5463 [1:32:09<101:20:08, 67.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 86/5463 [1:33:11<98:51:31, 66.19s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 87/5463 [1:34:07<94:16:31, 63.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 88/5463 [1:35:11<94:40:56, 63.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 89/5463 [1:36:15<94:46:52, 63.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 90/5463 [1:37:03<87:48:29, 58.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 91/5463 [1:38:10<91:18:00, 61.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 92/5463 [1:39:15<93:04:09, 62.38s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 93/5463 [1:40:18<93:34:48, 62.74s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 94/5463 [1:41:21<93:20:16, 62.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 95/5463 [1:42:30<96:09:03, 64.48s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 96/5463 [1:43:26<92:39:28, 62.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 97/5463 [1:44:36<96:10:53, 64.53s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 98/5463 [1:45:16<85:05:41, 57.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 99/5463 [1:46:27<91:03:53, 61.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing qnli validation set: 2%|▏ | 100/5463 [1:47:33<96:08:12, 64.53s/it]\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Task: qnli\n", "Train metrics: {'accuracy_without_watermark': 0.56, 'accuracy_with_watermark': 0.54, 'f1_without_watermark': 0.5280995280995281, 'f1_with_watermark': 0.4875222816399287}\n", "Validation metrics: {'accuracy_without_watermark': 0.57, 'accuracy_with_watermark': 0.49, 'f1_without_watermark': 0.5501621508525996, 'f1_with_watermark': 0.4498975299320462}\n", "Processing task: rte\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 0%| | 0/2490 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 0%| | 1/2490 [01:00<41:37:04, 60.19s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 0%| | 2/2490 [01:59<41:25:07, 59.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 0%| | 3/2490 [02:20<28:59:56, 41.98s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 0%| | 4/2490 [03:25<35:16:27, 51.08s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 0%| | 5/2490 [04:31<38:55:52, 56.40s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 0%| | 6/2490 [05:22<37:39:04, 54.57s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 0%| | 7/2490 [06:25<39:30:59, 57.29s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 0%| | 8/2490 [07:36<42:36:09, 61.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 0%| | 9/2490 [08:44<43:58:18, 63.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 0%| | 10/2490 [09:43<42:46:39, 62.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 0%| | 11/2490 [10:57<45:24:57, 65.95s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 0%| | 12/2490 [12:09<46:39:45, 67.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 13/2490 [13:17<46:34:26, 67.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 14/2490 [14:21<45:45:17, 66.53s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 15/2490 [15:28<45:47:50, 66.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 16/2490 [16:36<46:12:51, 67.25s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 17/2490 [17:45<46:33:18, 67.77s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 18/2490 [18:57<47:22:55, 69.00s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 19/2490 [20:15<49:12:51, 71.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 20/2490 [21:25<48:47:43, 71.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 21/2490 [22:30<47:34:17, 69.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 22/2490 [23:38<47:14:57, 68.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 23/2490 [24:38<45:17:06, 66.08s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 24/2490 [25:48<46:16:11, 67.55s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 25/2490 [27:00<46:59:17, 68.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 26/2490 [28:07<46:42:44, 68.25s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 27/2490 [29:16<46:53:07, 68.53s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 28/2490 [30:22<46:15:07, 67.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 29/2490 [31:19<44:09:34, 64.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 30/2490 [32:16<42:33:27, 62.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%| | 31/2490 [33:28<44:27:27, 65.09s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%|▏ | 32/2490 [34:11<40:00:06, 58.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%|▏ | 33/2490 [35:19<41:52:23, 61.35s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%|▏ | 34/2490 [35:59<37:32:13, 55.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%|▏ | 35/2490 [37:09<40:34:24, 59.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%|▏ | 36/2490 [38:21<43:06:27, 63.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 1%|▏ | 37/2490 [39:30<44:10:52, 64.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 38/2490 [40:40<45:15:21, 66.44s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 39/2490 [41:50<45:59:29, 67.55s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 40/2490 [43:01<46:39:53, 68.57s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 41/2490 [43:53<43:16:36, 63.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 42/2490 [45:04<44:51:12, 65.96s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 43/2490 [46:15<45:42:28, 67.25s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 44/2490 [47:25<46:12:46, 68.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 45/2490 [48:31<45:47:46, 67.43s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 46/2490 [49:42<46:39:02, 68.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 47/2490 [50:56<47:34:35, 70.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 48/2490 [52:09<48:09:22, 70.99s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 49/2490 [53:20<48:13:45, 71.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 50/2490 [54:28<47:32:35, 70.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 51/2490 [55:35<46:56:17, 69.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 52/2490 [56:47<47:25:22, 70.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 53/2490 [57:49<45:44:48, 67.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 54/2490 [58:10<36:21:07, 53.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 55/2490 [59:21<39:50:39, 58.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 56/2490 [1:00:28<41:27:26, 61.32s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 57/2490 [1:01:32<41:57:05, 62.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 58/2490 [1:02:46<44:18:19, 65.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 59/2490 [1:03:58<45:34:04, 67.48s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 60/2490 [1:05:06<45:38:08, 67.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 61/2490 [1:06:15<45:57:31, 68.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 2%|▏ | 62/2490 [1:07:26<46:36:21, 69.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 63/2490 [1:08:38<47:01:08, 69.74s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 64/2490 [1:09:34<44:18:03, 65.74s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 65/2490 [1:10:44<45:05:02, 66.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 66/2490 [1:11:46<44:05:58, 65.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 67/2490 [1:12:52<44:12:16, 65.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 68/2490 [1:14:02<44:58:07, 66.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 69/2490 [1:15:03<43:55:59, 65.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 70/2490 [1:16:19<45:57:49, 68.38s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 71/2490 [1:17:22<44:48:26, 66.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 72/2490 [1:18:26<44:17:26, 65.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 73/2490 [1:19:24<42:38:56, 63.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 74/2490 [1:20:33<43:48:54, 65.29s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 75/2490 [1:21:41<44:23:44, 66.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 76/2490 [1:22:47<44:15:50, 66.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 77/2490 [1:23:49<43:29:55, 64.90s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 78/2490 [1:24:49<42:32:59, 63.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 79/2490 [1:25:56<43:05:44, 64.35s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 80/2490 [1:27:07<44:23:32, 66.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 81/2490 [1:28:21<45:54:39, 68.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 82/2490 [1:29:37<47:24:26, 70.87s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 83/2490 [1:30:30<43:47:28, 65.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 84/2490 [1:31:41<44:49:37, 67.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 85/2490 [1:32:52<45:40:10, 68.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 86/2490 [1:34:02<46:01:39, 68.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 3%|▎ | 87/2490 [1:35:14<46:33:04, 69.74s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 4%|▎ | 88/2490 [1:36:08<43:27:50, 65.14s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 4%|▎ | 89/2490 [1:37:18<44:22:14, 66.53s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 4%|▎ | 90/2490 [1:38:20<43:27:23, 65.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 4%|▎ | 91/2490 [1:39:18<42:04:48, 63.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 4%|▎ | 92/2490 [1:40:29<43:34:30, 65.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 4%|▎ | 93/2490 [1:41:39<44:23:49, 66.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 4%|▍ | 94/2490 [1:42:55<46:21:15, 69.65s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 4%|▍ | 95/2490 [1:43:39<41:06:07, 61.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 4%|▍ | 96/2490 [1:44:17<36:27:41, 54.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 4%|▍ | 97/2490 [1:45:29<39:48:43, 59.89s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 4%|▍ | 98/2490 [1:46:09<35:55:03, 54.06s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 4%|▍ | 99/2490 [1:47:17<38:36:04, 58.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte train set: 4%|▍ | 100/2490 [1:48:25<43:11:18, 65.05s/it]\n", "Processing rte validation set: 0%| | 0/277 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 0%| | 1/277 [01:11<5:30:58, 71.95s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 1%| | 2/277 [02:07<4:46:12, 62.45s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 1%| | 3/277 [03:18<5:03:15, 66.41s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 1%|▏ | 4/277 [04:20<4:53:32, 64.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 2%|▏ | 5/277 [05:17<4:40:46, 61.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 2%|▏ | 6/277 [06:23<4:45:47, 63.27s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 3%|▎ | 7/277 [07:38<5:01:07, 66.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 3%|▎ | 8/277 [08:27<4:34:29, 61.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 3%|▎ | 9/277 [09:40<4:50:50, 65.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 4%|▎ | 10/277 [11:07<5:19:31, 71.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 4%|▍ | 11/277 [12:32<5:36:13, 75.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 4%|▍ | 12/277 [12:43<4:08:11, 56.19s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 5%|▍ | 13/277 [14:12<4:50:57, 66.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 5%|▌ | 14/277 [15:26<4:59:32, 68.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 5%|▌ | 15/277 [16:52<5:21:18, 73.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 6%|▌ | 16/277 [18:18<5:37:22, 77.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 6%|▌ | 17/277 [19:47<5:50:07, 80.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 6%|▋ | 18/277 [21:17<6:01:44, 83.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 7%|▋ | 19/277 [22:42<6:01:43, 84.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 7%|▋ | 20/277 [23:44<5:31:35, 77.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 8%|▊ | 21/277 [25:14<5:45:41, 81.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 8%|▊ | 22/277 [26:48<6:00:53, 84.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 8%|▊ | 23/277 [27:38<5:16:01, 74.65s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 9%|▊ | 24/277 [29:12<5:39:34, 80.53s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 9%|▉ | 25/277 [30:22<5:23:54, 77.12s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 9%|▉ | 26/277 [31:01<4:35:37, 65.89s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 10%|▉ | 27/277 [32:11<4:39:00, 66.96s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 10%|█ | 28/277 [32:59<4:14:43, 61.38s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 10%|█ | 29/277 [34:08<4:22:26, 63.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 11%|█ | 30/277 [35:19<4:31:33, 65.96s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 11%|█ | 31/277 [36:31<4:37:45, 67.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 12%|█▏ | 32/277 [37:48<4:48:03, 70.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 12%|█▏ | 33/277 [38:46<4:31:44, 66.82s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 12%|█▏ | 34/277 [39:39<4:12:50, 62.43s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 13%|█▎ | 35/277 [40:48<4:20:28, 64.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 13%|█▎ | 36/277 [42:00<4:27:58, 66.71s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 13%|█▎ | 37/277 [43:13<4:34:25, 68.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 14%|█▎ | 38/277 [44:26<4:38:49, 70.00s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 14%|█▍ | 39/277 [45:04<3:59:34, 60.40s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 14%|█▍ | 40/277 [46:14<4:09:47, 63.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 15%|█▍ | 41/277 [47:26<4:18:58, 65.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 15%|█▌ | 42/277 [48:39<4:26:27, 68.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 16%|█▌ | 43/277 [49:55<4:34:37, 70.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 16%|█▌ | 44/277 [51:03<4:30:08, 69.57s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 16%|█▌ | 45/277 [52:14<4:30:44, 70.02s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 17%|█▋ | 46/277 [53:29<4:35:11, 71.48s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 17%|█▋ | 47/277 [54:40<4:33:40, 71.40s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 17%|█▋ | 48/277 [55:08<3:42:34, 58.32s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 18%|█▊ | 49/277 [56:17<3:54:09, 61.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 18%|█▊ | 50/277 [57:29<4:05:10, 64.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 18%|█▊ | 51/277 [58:39<4:09:29, 66.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 19%|█▉ | 52/277 [59:50<4:13:57, 67.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 19%|█▉ | 53/277 [1:01:01<4:16:54, 68.81s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 19%|█▉ | 54/277 [1:02:13<4:18:32, 69.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 20%|█▉ | 55/277 [1:03:20<4:15:18, 69.00s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 20%|██ | 56/277 [1:04:06<3:48:11, 61.95s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 21%|██ | 57/277 [1:05:11<3:50:43, 62.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 21%|██ | 58/277 [1:06:16<3:52:12, 63.62s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 21%|██▏ | 59/277 [1:07:20<3:51:34, 63.74s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 22%|██▏ | 60/277 [1:08:33<3:59:55, 66.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 22%|██▏ | 61/277 [1:09:57<4:18:08, 71.71s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 22%|██▏ | 62/277 [1:11:25<4:34:09, 76.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 23%|██▎ | 63/277 [1:12:53<4:45:43, 80.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 23%|██▎ | 64/277 [1:14:25<4:57:10, 83.71s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 23%|██▎ | 65/277 [1:15:53<4:59:34, 84.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 24%|██▍ | 66/277 [1:17:21<5:01:49, 85.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 24%|██▍ | 67/277 [1:18:46<4:59:16, 85.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 25%|██▍ | 68/277 [1:20:15<5:01:37, 86.59s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 25%|██▍ | 69/277 [1:21:43<5:02:19, 87.21s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 25%|██▌ | 70/277 [1:23:14<5:04:45, 88.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 26%|██▌ | 71/277 [1:24:39<4:59:11, 87.14s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 26%|██▌ | 72/277 [1:25:48<4:39:03, 81.67s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 26%|██▋ | 73/277 [1:27:09<4:37:51, 81.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 27%|██▋ | 74/277 [1:28:29<4:33:59, 80.98s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 27%|██▋ | 75/277 [1:29:38<4:20:38, 77.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 27%|██▋ | 76/277 [1:30:30<3:53:49, 69.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 28%|██▊ | 77/277 [1:31:39<3:51:36, 69.48s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 28%|██▊ | 78/277 [1:32:51<3:53:49, 70.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 29%|██▊ | 79/277 [1:33:34<3:25:08, 62.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 29%|██▉ | 80/277 [1:34:44<3:31:34, 64.44s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 29%|██▉ | 81/277 [1:35:54<3:35:50, 66.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 30%|██▉ | 82/277 [1:37:05<3:39:32, 67.55s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 30%|██▉ | 83/277 [1:38:15<3:40:56, 68.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 30%|███ | 84/277 [1:39:25<3:41:11, 68.76s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 31%|███ | 85/277 [1:40:36<3:42:54, 69.66s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 31%|███ | 86/277 [1:41:46<3:41:21, 69.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 31%|███▏ | 87/277 [1:42:52<3:36:58, 68.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 32%|███▏ | 88/277 [1:44:04<3:39:28, 69.68s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 32%|███▏ | 89/277 [1:44:45<3:11:38, 61.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 32%|███▏ | 90/277 [1:46:01<3:23:52, 65.41s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 33%|███▎ | 91/277 [1:47:13<3:29:12, 67.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 33%|███▎ | 92/277 [1:48:16<3:24:02, 66.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 34%|███▎ | 93/277 [1:49:32<3:31:51, 69.08s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 34%|███▍ | 94/277 [1:50:37<3:26:59, 67.87s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 34%|███▍ | 95/277 [1:51:45<3:25:59, 67.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 35%|███▍ | 96/277 [1:53:03<3:33:26, 70.76s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 35%|███▌ | 97/277 [1:54:16<3:34:54, 71.63s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 35%|███▌ | 98/277 [1:55:29<3:34:17, 71.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 36%|███▌ | 99/277 [1:56:39<3:32:19, 71.57s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing rte validation set: 36%|███▌ | 100/277 [1:57:55<3:28:44, 70.76s/it]\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Task: rte\n", "Train metrics: {'accuracy_without_watermark': 0.53, 'accuracy_with_watermark': 0.49, 'f1_without_watermark': 0.5123975516132379, 'f1_with_watermark': 0.4357782940590773}\n", "Validation metrics: {'accuracy_without_watermark': 0.53, 'accuracy_with_watermark': 0.55, 'f1_without_watermark': 0.5123975516132379, 'f1_with_watermark': 0.4950061721467849}\n", "Processing task: wnli\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 0%| | 0/635 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 0%| | 1/635 [01:09<12:12:21, 69.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 0%| | 2/635 [01:13<5:24:06, 30.72s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 0%| | 3/635 [02:24<8:39:06, 49.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 1%| | 4/635 [03:29<9:43:42, 55.50s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 1%| | 5/635 [04:39<10:38:44, 60.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 1%| | 6/635 [05:30<10:02:28, 57.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 1%| | 7/635 [06:38<10:38:35, 61.01s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 1%|▏ | 8/635 [07:41<10:42:49, 61.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 1%|▏ | 9/635 [08:29<9:58:02, 57.32s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 2%|▏ | 10/635 [09:37<10:30:47, 60.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 2%|▏ | 11/635 [10:45<10:54:34, 62.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 2%|▏ | 12/635 [11:20<9:24:38, 54.38s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 2%|▏ | 13/635 [12:29<10:10:44, 58.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 2%|▏ | 14/635 [13:36<10:33:38, 61.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 2%|▏ | 15/635 [14:48<11:07:32, 64.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 3%|▎ | 16/635 [15:58<11:21:39, 66.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 3%|▎ | 17/635 [17:08<11:33:21, 67.32s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 3%|▎ | 18/635 [18:22<11:51:33, 69.20s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 3%|▎ | 19/635 [19:33<11:57:05, 69.85s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 3%|▎ | 20/635 [20:21<10:48:23, 63.26s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 3%|▎ | 21/635 [21:32<11:12:39, 65.73s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 3%|▎ | 22/635 [22:42<11:22:57, 66.85s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 4%|▎ | 23/635 [23:46<11:13:35, 66.04s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 4%|▍ | 24/635 [24:53<11:13:44, 66.16s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 4%|▍ | 25/635 [25:56<11:03:59, 65.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 4%|▍ | 26/635 [27:07<11:20:46, 67.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 4%|▍ | 27/635 [28:17<11:27:26, 67.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 4%|▍ | 28/635 [29:28<11:37:42, 68.97s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 5%|▍ | 29/635 [30:26<11:02:06, 65.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 5%|▍ | 30/635 [31:37<11:18:53, 67.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 5%|▍ | 31/635 [32:43<11:12:25, 66.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 5%|▌ | 32/635 [33:48<11:05:09, 66.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 5%|▌ | 33/635 [34:58<11:15:30, 67.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 5%|▌ | 34/635 [36:10<11:28:45, 68.76s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 6%|▌ | 35/635 [37:21<11:33:48, 69.38s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 6%|▌ | 36/635 [38:36<11:50:58, 71.22s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 6%|▌ | 37/635 [39:35<11:13:51, 67.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 6%|▌ | 38/635 [41:02<12:10:40, 73.43s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 6%|▌ | 39/635 [42:33<13:00:30, 78.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 6%|▋ | 40/635 [43:20<11:25:38, 69.14s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 6%|▋ | 41/635 [44:47<12:17:53, 74.53s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 7%|▋ | 42/635 [45:35<10:58:11, 66.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 7%|▋ | 43/635 [47:01<11:55:03, 72.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 7%|▋ | 44/635 [48:05<11:26:36, 69.71s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 7%|▋ | 45/635 [49:32<12:19:08, 75.17s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 7%|▋ | 46/635 [51:00<12:55:10, 78.97s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 7%|▋ | 47/635 [52:24<13:09:03, 80.52s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 8%|▊ | 48/635 [53:53<13:32:31, 83.05s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 8%|▊ | 49/635 [55:22<13:47:46, 84.76s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 8%|▊ | 50/635 [56:51<13:59:34, 86.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 8%|▊ | 51/635 [58:21<14:09:39, 87.29s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 8%|▊ | 52/635 [59:31<13:17:26, 82.07s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 8%|▊ | 53/635 [1:00:35<12:21:05, 76.40s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 9%|▊ | 54/635 [1:01:44<11:59:37, 74.32s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 9%|▊ | 55/635 [1:02:50<11:34:40, 71.86s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 9%|▉ | 56/635 [1:03:57<11:19:20, 70.40s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 9%|▉ | 57/635 [1:05:06<11:14:56, 70.06s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 9%|▉ | 58/635 [1:06:19<11:21:28, 70.86s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 9%|▉ | 59/635 [1:07:30<11:21:04, 70.94s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 9%|▉ | 60/635 [1:08:41<11:18:38, 70.82s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 10%|▉ | 61/635 [1:09:48<11:07:55, 69.82s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 10%|▉ | 62/635 [1:10:59<11:09:29, 70.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 10%|▉ | 63/635 [1:11:47<10:04:42, 63.43s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 10%|█ | 64/635 [1:12:58<10:26:01, 65.78s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 10%|█ | 65/635 [1:14:10<10:41:31, 67.53s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 10%|█ | 66/635 [1:15:13<10:28:54, 66.32s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 11%|█ | 67/635 [1:16:27<10:49:32, 68.61s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 11%|█ | 68/635 [1:17:36<10:50:01, 68.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 11%|█ | 69/635 [1:18:44<10:44:20, 68.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 11%|█ | 70/635 [1:19:56<10:53:31, 69.40s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 11%|█ | 71/635 [1:21:02<10:43:06, 68.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 11%|█▏ | 72/635 [1:21:46<9:33:07, 61.08s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 11%|█▏ | 73/635 [1:22:49<9:37:48, 61.69s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 12%|█▏ | 74/635 [1:24:03<10:11:53, 65.44s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 12%|█▏ | 75/635 [1:25:14<10:26:58, 67.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 12%|█▏ | 76/635 [1:25:59<9:22:29, 60.38s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 12%|█▏ | 77/635 [1:27:09<9:48:04, 63.23s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 12%|█▏ | 78/635 [1:28:20<10:09:31, 65.66s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 12%|█▏ | 79/635 [1:29:29<10:16:45, 66.56s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 13%|█▎ | 80/635 [1:30:40<10:30:22, 68.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 13%|█▎ | 81/635 [1:31:49<10:30:27, 68.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 13%|█▎ | 82/635 [1:32:46<9:57:54, 64.87s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 13%|█▎ | 83/635 [1:33:57<10:14:04, 66.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 13%|█▎ | 84/635 [1:35:03<10:11:56, 66.64s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 13%|█▎ | 85/635 [1:36:16<10:28:20, 68.55s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 14%|█▎ | 86/635 [1:37:07<9:38:21, 63.21s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 14%|█▎ | 87/635 [1:38:12<9:42:44, 63.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 14%|█▍ | 88/635 [1:39:12<9:31:05, 62.64s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 14%|█▍ | 89/635 [1:40:24<9:55:50, 65.48s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 14%|█▍ | 90/635 [1:41:36<10:11:44, 67.35s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 14%|█▍ | 91/635 [1:42:46<10:17:30, 68.11s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 14%|█▍ | 92/635 [1:43:54<10:15:04, 67.96s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 15%|█▍ | 93/635 [1:45:03<10:17:28, 68.35s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 15%|█▍ | 94/635 [1:46:10<10:12:24, 67.92s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 15%|█▍ | 95/635 [1:47:10<9:49:45, 65.53s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 15%|█▌ | 96/635 [1:48:18<9:55:03, 66.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 15%|█▌ | 97/635 [1:49:27<10:01:03, 67.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 15%|█▌ | 98/635 [1:50:38<10:12:26, 68.43s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 16%|█▌ | 99/635 [1:51:50<10:19:35, 69.36s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli train set: 16%|█▌ | 100/635 [1:53:04<10:04:56, 67.84s/it]\n", "Processing wnli validation set: 0%| | 0/71 [00:00, ?it/s]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 1%|▏ | 1/71 [01:11<1:23:50, 71.87s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 3%|▎ | 2/71 [02:00<1:06:51, 58.14s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 4%|▍ | 3/71 [03:05<1:09:21, 61.20s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 6%|▌ | 4/71 [04:07<1:09:00, 61.80s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 7%|▋ | 5/71 [05:12<1:09:00, 62.73s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 8%|▊ | 6/71 [06:21<1:10:11, 64.79s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 10%|▉ | 7/71 [07:28<1:10:09, 65.77s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 11%|█▏ | 8/71 [08:06<59:41, 56.85s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 13%|█▎ | 9/71 [09:11<1:01:24, 59.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 14%|█▍ | 10/71 [10:02<57:46, 56.83s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 15%|█▌ | 11/71 [11:15<1:01:35, 61.60s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 17%|█▋ | 12/71 [12:21<1:02:06, 63.17s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 18%|█▊ | 13/71 [13:30<1:02:45, 64.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 20%|█▉ | 14/71 [14:40<1:02:53, 66.19s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 21%|██ | 15/71 [15:51<1:03:12, 67.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 23%|██▎ | 16/71 [17:03<1:03:10, 68.93s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 24%|██▍ | 17/71 [18:03<59:42, 66.35s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 25%|██▌ | 18/71 [18:42<51:19, 58.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 27%|██▋ | 19/71 [19:50<53:05, 61.26s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 28%|██▊ | 20/71 [21:06<55:38, 65.47s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 30%|██▉ | 21/71 [22:38<1:01:11, 73.43s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 31%|███ | 22/71 [23:41<57:36, 70.54s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 32%|███▏ | 23/71 [25:07<1:00:08, 75.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 34%|███▍ | 24/71 [26:36<1:01:57, 79.10s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 35%|███▌ | 25/71 [28:04<1:02:39, 81.72s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 37%|███▋ | 26/71 [29:28<1:01:55, 82.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 38%|███▊ | 27/71 [30:57<1:01:54, 84.42s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 39%|███▉ | 28/71 [32:23<1:00:58, 85.09s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 41%|████ | 29/71 [33:53<1:00:31, 86.46s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 42%|████▏ | 30/71 [35:22<59:36, 87.23s/it] " ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 44%|████▎ | 31/71 [36:09<50:07, 75.19s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 45%|████▌ | 32/71 [37:41<52:10, 80.26s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 46%|████▋ | 33/71 [39:08<52:02, 82.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 48%|████▊ | 34/71 [39:52<43:40, 70.83s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 49%|████▉ | 35/71 [41:07<43:13, 72.04s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 51%|█████ | 36/71 [42:15<41:14, 70.70s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 52%|█████▏ | 37/71 [43:26<40:09, 70.86s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 54%|█████▎ | 38/71 [44:37<38:54, 70.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 55%|█████▍ | 39/71 [45:43<37:05, 69.54s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 56%|█████▋ | 40/71 [46:51<35:43, 69.15s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 58%|█████▊ | 41/71 [48:01<34:33, 69.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 59%|█████▉ | 42/71 [49:12<33:42, 69.75s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 61%|██████ | 43/71 [50:23<32:41, 70.06s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 62%|██████▏ | 44/71 [51:32<31:22, 69.73s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 63%|██████▎ | 45/71 [52:43<30:23, 70.13s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 65%|██████▍ | 46/71 [53:53<29:16, 70.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 66%|██████▌ | 47/71 [55:00<27:45, 69.39s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 68%|██████▊ | 48/71 [56:06<26:09, 68.24s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 69%|██████▉ | 49/71 [57:18<25:25, 69.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 70%|███████ | 50/71 [57:58<21:12, 60.58s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 72%|███████▏ | 51/71 [59:10<21:18, 63.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 73%|███████▎ | 52/71 [1:00:19<20:45, 65.55s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 75%|███████▍ | 53/71 [1:01:29<20:04, 66.91s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 76%|███████▌ | 54/71 [1:02:41<19:22, 68.41s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 77%|███████▋ | 55/71 [1:03:26<16:21, 61.34s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 79%|███████▉ | 56/71 [1:04:32<15:41, 62.77s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 80%|████████ | 57/71 [1:05:36<14:43, 63.08s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 82%|████████▏ | 58/71 [1:06:14<12:01, 55.49s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 83%|████████▎ | 59/71 [1:06:50<09:58, 49.84s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 85%|████████▍ | 60/71 [1:08:15<11:03, 60.31s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 86%|████████▌ | 61/71 [1:09:28<10:41, 64.14s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 87%|████████▋ | 62/71 [1:10:58<10:45, 71.73s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 89%|████████▊ | 63/71 [1:12:27<10:17, 77.18s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 90%|█████████ | 64/71 [1:13:56<09:23, 80.51s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 92%|█████████▏| 65/71 [1:15:22<08:14, 82.38s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 93%|█████████▎| 66/71 [1:16:51<07:01, 84.28s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 94%|█████████▍| 67/71 [1:18:19<05:41, 85.43s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 96%|█████████▌| 68/71 [1:19:46<04:17, 85.89s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 97%|█████████▋| 69/71 [1:21:13<02:52, 86.03s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 99%|█████████▊| 70/71 [1:22:40<01:26, 86.33s/it]" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Generating with Namespace(model_name_or_path='bigscience/bloom-560m', load_fp16=False, prompt_max_length=1848, max_new_tokens=200, generation_seed=123, use_sampling=True, n_beams=1, sampling_temp=0.7, use_gpu=True, seeding_scheme='simple_1', gamma=0.25, delta=2.0, normalizers='', skip_repeated_bigrams=False, ignore_repeated_ngrams=False, detection_z_threshold=4.0, select_green_tokens=True, seed_separately=True, run_extended=True, is_decoder_only_model=True)\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Processing wnli validation set: 100%|██████████| 71/71 [1:24:09<00:00, 71.12s/it]\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Task: wnli\n", "Train metrics: {'accuracy_without_watermark': 0.44, 'accuracy_with_watermark': 0.52, 'f1_without_watermark': 0.43977591036414565, 'f1_with_watermark': 0.5198079231692677}\n", "Validation metrics: {'accuracy_without_watermark': 0.4788732394366197, 'accuracy_with_watermark': 0.49295774647887325, 'f1_without_watermark': 0.47845940043676793, 'f1_with_watermark': 0.49043062200956933}\n", "Overall GLUE score: 0.40536016077856096\n", "Results saved in results\n" ] } ], "source": [ "from datasets import load_dataset\n", "from sklearn.metrics import accuracy_score, f1_score, matthews_corrcoef, precision_recall_fscore_support\n", "from scipy.stats import pearsonr, spearmanr\n", "import torch\n", "from tqdm import tqdm\n", "import json\n", "import os\n", "import re\n", "\n", "\n", "def create_prompt(example, task_name):\n", " if task_name == \"sst2\":\n", " return f\"Classify the sentiment of the following sentence as positive or negative:\\n{example['sentence']}\\nSentiment:\"\n", " elif task_name == \"cola\":\n", " return f\"Is the following sentence grammatically acceptable? Answer 'yes' or 'no':\\n{example['sentence']}\\nAnswer:\"\n", " elif task_name == \"mrpc\":\n", " return f\"Are the following two sentences paraphrases of each other? Answer 'yes' or 'no':\\nSentence 1: {example['sentence1']}\\nSentence 2: {example['sentence2']}\\nAnswer:\"\n", " elif task_name == \"qqp\":\n", " return f\"Are the following two questions asking the same thing? Answer 'yes' or 'no':\\nQuestion 1: {example['question1']}\\nQuestion 2: {example['question2']}\\nAnswer:\"\n", " elif task_name == \"stsb\":\n", " return f\"Rate the semantic similarity of the following sentences on a scale from 0 to 5, where 0 means no similarity and 5 means semantic equivalence:\\nSentence 1: {example['sentence1']}\\nSentence 2: {example['sentence2']}\\nSimilarity score:\"\n", " elif task_name == \"mnli\":\n", " return f\"Determine if the premise entails the hypothesis. Answer with 'entailment', 'contradiction', or 'neutral':\\nPremise: {example['premise']}\\nHypothesis: {example['hypothesis']}\\nRelation:\"\n", " elif task_name == \"qnli\":\n", " return f\"Does the given context contain the answer to the question? Answer 'yes' or 'no':\\nQuestion: {example['question']}\\nContext: {example['sentence']}\\nAnswer:\"\n", " elif task_name == \"rte\":\n", " return f\"Determine if the premise entails the hypothesis. Answer 'yes' for entailment or 'no' for not entailment:\\nPremise: {example['sentence1']}\\nHypothesis: {example['sentence2']}\\nEntailment:\"\n", " elif task_name == \"wnli\":\n", " return f\"Determine if the sentence with the pronoun replaced is entailed by the original sentence. Answer 'yes' for entailment or 'no' for not entailment:\\nOriginal: {example['sentence1']}\\nWith pronoun replaced: {example['sentence2']}\\nEntailment:\"\n", " else:\n", " raise ValueError(f\"Unknown task: {task_name}\")\n", " \n", "\n", "def process_glue_dataset(task_name, split, args, model, tokenizer, device, limit=100):\n", " dataset = load_dataset(\"glue\", task_name)\n", " results = []\n", " \n", " # Handle the special case for MNLI\n", " if task_name == \"mnli\" and split == \"validation\":\n", " split = \"validation_matched\"\n", " else:\n", " split = split\n", "\n", " for i, example in enumerate(tqdm(dataset[split], desc=f\"Processing {task_name} {split} set\")):\n", " # for example in tqdm(dataset[split], desc=f\"Processing {task_name} {split} set\"):\n", " if i >= limit:\n", " break\n", " \n", " prompt = create_prompt(example, task_name)\n", " true_label = example[\"label\"]\n", "\n", " result = {\n", " \"prompt\": prompt,\n", " \"true_label\": true_label,\n", " \"use_sampling\": args.use_sampling,\n", " \"sampling_temp\": args.sampling_temp,\n", " \"delta\": args.delta,\n", " \"gamma\": args.gamma,\n", " \"n_beams\": args.n_beams,\n", " \"detection_z_threshold\": args.detection_z_threshold\n", " }\n", "\n", " # Generate outputs with and without watermark\n", " _, _, outputs_without_watermark, outputs_with_watermark, _ = generate(\n", " prompt, args, model=model, device=device, tokenizer=tokenizer\n", " )\n", " \n", " # Analyze outputs\n", " result_without_watermark = analyze(outputs_without_watermark, args, device=device, tokenizer=tokenizer)\n", " result_with_watermark = analyze(outputs_with_watermark, args, device=device, tokenizer=tokenizer)\n", " \n", " # Convert results list to dictionary\n", " result_without_watermark_dict = result_list_to_dict(result_without_watermark)\n", " result_with_watermark_dict = result_list_to_dict(result_with_watermark)\n", "\n", " # Store results\n", " result[\"without_watermark\"] = result_without_watermark_dict\n", " result[\"with_watermark\"] = result_with_watermark_dict\n", "\n", " # Predict label based on model output\n", " predicted_label_without_watermark = predict_label(outputs_without_watermark, task_name)\n", " predicted_label_with_watermark = predict_label(outputs_with_watermark, task_name)\n", "\n", " result[\"predicted_label_without_watermark\"] = predicted_label_without_watermark\n", " result[\"predicted_label_with_watermark\"] = predicted_label_with_watermark\n", "\n", " results.append(result)\n", "\n", " return results\n", "\n", "def predict_label(model_output, task_name):\n", " model_output = model_output.lower().strip()\n", " \n", " if task_name == \"sst2\":\n", " return 1 if \"positive\" in model_output else 0\n", " elif task_name == \"cola\":\n", " return 1 if \"yes\" in model_output else 0\n", " elif task_name == \"mrpc\" or task_name == \"qqp\":\n", " return 1 if \"yes\" in model_output else 0\n", " elif task_name == \"stsb\":\n", " # Extract the first number from the output\n", " match = re.search(r'\\d+(\\.\\d+)?', model_output)\n", " if match:\n", " score = float(match.group())\n", " return min(max(score, 0), 5) # Clamp between 0 and 5\n", " else:\n", " return 2.5 # Default to middle score if no number found\n", " elif task_name == \"mnli\":\n", " if \"entailment\" in model_output:\n", " return 0\n", " elif \"contradiction\" in model_output:\n", " return 1\n", " else:\n", " return 2 # Neutral\n", " elif task_name == \"qnli\":\n", " return 0 if \"yes\" in model_output else 1 # 0 for entailment, 1 for not entailment\n", " elif task_name == \"rte\" or task_name == \"wnli\":\n", " return 0 if \"yes\" in model_output else 1 # 0 for entailment, 1 for not entailment\n", " else:\n", " raise ValueError(f\"Unknown task: {task_name}\")\n", "\n", "\n", "\n", "def calculate_metrics(results, task_name):\n", " true_labels = [r[\"true_label\"] for r in results]\n", " pred_labels_without_watermark = [r[\"predicted_label_without_watermark\"] for r in results]\n", " pred_labels_with_watermark = [r[\"predicted_label_with_watermark\"] for r in results]\n", "\n", " # Initialize a dictionary to hold the metrics\n", " metrics = {}\n", "\n", " # Determine the metrics based on the task\n", " if task_name in [\"sst2\", \"mrpc\", \"qqp\"]: # Binary classification tasks\n", " metrics[\"accuracy_without_watermark\"] = accuracy_score(true_labels, pred_labels_without_watermark)\n", " metrics[\"accuracy_with_watermark\"] = accuracy_score(true_labels, pred_labels_with_watermark)\n", " metrics[\"f1_without_watermark\"] = f1_score(true_labels, pred_labels_without_watermark, average='binary')\n", " metrics[\"f1_with_watermark\"] = f1_score(true_labels, pred_labels_with_watermark, average='binary')\n", "\n", " elif task_name == \"cola\": # CoLA task, uses Matthews correlation coefficient\n", " metrics[\"matthews_corr_without_watermark\"] = matthews_corrcoef(true_labels, pred_labels_without_watermark)\n", " metrics[\"matthews_corr_with_watermark\"] = matthews_corrcoef(true_labels, pred_labels_with_watermark)\n", "\n", " elif task_name in [\"mnli\", \"qnli\", \"rte\", \"wnli\"]: # Multi-class classification tasks\n", " metrics[\"accuracy_without_watermark\"] = accuracy_score(true_labels, pred_labels_without_watermark)\n", " metrics[\"accuracy_with_watermark\"] = accuracy_score(true_labels, pred_labels_with_watermark)\n", " metrics[\"f1_without_watermark\"] = f1_score(true_labels, pred_labels_without_watermark, average='macro')\n", " metrics[\"f1_with_watermark\"] = f1_score(true_labels, pred_labels_with_watermark, average='macro')\n", "\n", " elif task_name == \"stsb\": # STS-B task, uses Pearson and Spearman correlation\n", " true_scores = [float(label) for label in true_labels]\n", " pred_scores_without_watermark = [float(score) for score in pred_labels_without_watermark]\n", " pred_scores_with_watermark = [float(score) for score in pred_labels_with_watermark]\n", "\n", " metrics[\"pearson_corr_without_watermark\"] = pearsonr(true_scores, pred_scores_without_watermark)[0]\n", " metrics[\"pearson_corr_with_watermark\"] = pearsonr(true_scores, pred_scores_with_watermark)[0]\n", " metrics[\"spearman_corr_without_watermark\"] = spearmanr(true_scores, pred_scores_without_watermark)[0]\n", " metrics[\"spearman_corr_with_watermark\"] = spearmanr(true_scores, pred_scores_with_watermark)[0]\n", "\n", " return metrics\n", "\n", "\n", "def calculate_glue_score(all_results):\n", " # Define weights for each task in GLUE score calculation\n", " weights = {\n", " \"cola\": 0.05, \"sst2\": 0.05, \"mrpc\": 0.1, \"qqp\": 0.1, \"stsb\": 0.1,\n", " \"mnli\": 0.2, \"qnli\": 0.2, \"rte\": 0.1, \"wnli\": 0.1\n", " }\n", " \n", " scores = []\n", " \n", " for task, weight in weights.items():\n", " if task in all_results:\n", " # Select appropriate metric based on the task\n", " task_metrics = all_results[task][\"validation\"][\"metrics\"]\n", "\n", " if task == \"cola\": # Use Matthews correlation coefficient for CoLA\n", " task_score = task_metrics.get(\"matthews_corr_with_watermark\", 0)\n", " elif task == \"stsb\": # Use Pearson correlation for STS-B\n", " task_score = task_metrics.get(\"pearson_corr_with_watermark\", 0)\n", " else: # Use accuracy for all other tasks\n", " task_score = task_metrics.get(\"accuracy_with_watermark\", 0)\n", " \n", " # Add weighted task score to the list\n", " scores.append(weight * task_score)\n", " \n", " # Return weighted average of the task scores\n", " return sum(scores) / sum(weights.values())\n", "\n", "\n", "def save_results(all_results, output_dir):\n", " if not os.path.exists(output_dir):\n", " os.makedirs(output_dir)\n", " \n", " # Save detailed results\n", " with open(os.path.join(output_dir, \"detailed_results.json\"), \"w\") as f:\n", " json.dump(all_results, f, indent=2)\n", " \n", " # Save summary metrics\n", " summary = {}\n", " for task, data in all_results.items():\n", " summary[task] = {\n", " \"train\": data[\"train\"][\"metrics\"],\n", " \"validation\": data[\"validation\"][\"metrics\"]\n", " }\n", " \n", " with open(os.path.join(output_dir, \"summary_metrics.json\"), \"w\") as f:\n", " json.dump(summary, f, indent=2)\n", " \n", " print(f\"Results saved in {output_dir}\")\n", "\n", "\n", "glue_tasks = [\"sst2\", \"cola\", \"mrpc\", \"qqp\", \"stsb\", \"mnli\", \"qnli\", \"rte\", \"wnli\" ]\n", " \n", "all_results = {}\n", "for task in glue_tasks:\n", " print(f\"Processing task: {task}\")\n", " train_results = process_glue_dataset(task, \"train\", args, model, tokenizer, device)\n", " val_results = process_glue_dataset(task, \"validation\", args, model, tokenizer, device)\n", " \n", " train_metrics = calculate_metrics(train_results, task)\n", " val_metrics = calculate_metrics(val_results, task)\n", "\n", " all_results[task] = {\n", " \"train\": {\"results\": train_results, \"metrics\": train_metrics},\n", " \"validation\": {\"results\": val_results, \"metrics\": val_metrics}\n", " }\n", "\n", " print(f\"Task: {task}\")\n", " print(f\"Train metrics: {train_metrics}\")\n", " print(f\"Validation metrics: {val_metrics}\")\n", "\n", "\n", "# Calculate overall GLUE score\n", "glue_score = calculate_glue_score(all_results)\n", "print(f\"Overall GLUE score: {glue_score}\")\n", "\n", "# Save results\n", "save_results(all_results, \"results\")" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [], "source": [ "# Load the detailed results\n", "import json\n", "with open('results/detailed_results.json', 'r') as f:\n", " all_results = json.load(f)\n", "\n", "# # Convert to DataFrame for easier manipulation\n", "# df = pd.json_normalize(all_results[\"sst2\"][\"train\"][\"results\"])\n", "# df.head()" ] }, { "cell_type": "code", "execution_count": 90, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | prompt | \n", "true_label | \n", "use_sampling | \n", "sampling_temp | \n", "delta | \n", "gamma | \n", "n_beams | \n", "detection_z_threshold | \n", "predicted_label_without_watermark | \n", "predicted_label_with_watermark | \n", "... | \n", "with_watermark.Confidence | \n", "without_watermark.Confidence | \n", "task | \n", "set | \n", "Fraction of T in Greenlist_without | \n", "Fraction of T in Greenlist_with | \n", "z_score_without_watermark | \n", "z_score_with_watermark | \n", "label_match_without_watermark | \n", "label_match_with_watermark | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "Is the following sentence grammatically accept... | \n", "1 | \n", "True | \n", "0.7 | \n", "2.0 | \n", "0.25 | \n", "1 | \n", "4.0 | \n", "1 | \n", "0 | \n", "... | \n", "100.000% | \n", "NaN | \n", "cola | \n", "train | \n", "0.000 | \n", "0.571 | \n", "-0.577 | \n", "10.40 | \n", "True | \n", "False | \n", "
1 | \n", "Is the following sentence grammatically accept... | \n", "1 | \n", "True | \n", "0.7 | \n", "2.0 | \n", "0.25 | \n", "1 | \n", "4.0 | \n", "1 | \n", "0 | \n", "... | \n", "100.000% | \n", "NaN | \n", "cola | \n", "train | \n", "0.261 | \n", "0.719 | \n", "0.368 | \n", "15.30 | \n", "True | \n", "False | \n", "
2 | \n", "Is the following sentence grammatically accept... | \n", "1 | \n", "True | \n", "0.7 | \n", "2.0 | \n", "0.25 | \n", "1 | \n", "4.0 | \n", "1 | \n", "0 | \n", "... | \n", "NaN | \n", "NaN | \n", "cola | \n", "train | \n", "0.000 | \n", "0.400 | \n", "-0.577 | \n", "1.34 | \n", "True | \n", "False | \n", "
3 | \n", "Is the following sentence grammatically accept... | \n", "1 | \n", "True | \n", "0.7 | \n", "2.0 | \n", "0.25 | \n", "1 | \n", "4.0 | \n", "1 | \n", "0 | \n", "... | \n", "100.000% | \n", "NaN | \n", "cola | \n", "train | \n", "0.191 | \n", "0.663 | \n", "-1.920 | \n", "13.50 | \n", "True | \n", "False | \n", "
4 | \n", "Is the following sentence grammatically accept... | \n", "1 | \n", "True | \n", "0.7 | \n", "2.0 | \n", "0.25 | \n", "1 | \n", "4.0 | \n", "1 | \n", "0 | \n", "... | \n", "NaN | \n", "NaN | \n", "cola | \n", "train | \n", "0.189 | \n", "0.417 | \n", "-1.790 | \n", "1.33 | \n", "True | \n", "False | \n", "
5 rows × 36 columns
\n", "