Spaces:
Build error
Build error
File size: 172,136 Bytes
0156aec |
1 2 |
{"cells":[{"cell_type":"code","execution_count":1,"metadata":{"executionInfo":{"elapsed":476,"status":"ok","timestamp":1720679526275,"user":{"displayName":"HUANG DONGHAO _","userId":"00977795705617022768"},"user_tz":-480},"id":"uWKRSV6eZsCn"},"outputs":[],"source":["%load_ext autoreload\n","%autoreload 2"]},{"cell_type":"code","execution_count":2,"metadata":{"application/vnd.databricks.v1+cell":{"cellMetadata":{"byteLimit":2048000,"rowLimit":10000},"inputWidgets":{},"nuid":"6d394937-6c99-4a7c-9d32-7600a280032f","showTitle":false,"title":""},"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":5,"status":"ok","timestamp":1720679529345,"user":{"displayName":"HUANG DONGHAO _","userId":"00977795705617022768"},"user_tz":-480},"id":"G5pNu3zgZBrL","outputId":"160a554f-fb08-4aa0-bc00-0422fb7c1fac"},"outputs":[{"name":"stdout","output_type":"stream","text":["workding dir: /Users/inflaton/code/engd/papers/rapget-translation\n"]}],"source":["import os\n","import sys\n","from pathlib import Path\n","\n","# Reuse workding_dir if it is already defined (e.g. when this cell is re-run):\n","# os.chdir() below changes the cwd, so recomputing Path.cwd().parent on a\n","# second run would climb one directory too far.\n","if \"workding_dir\" not in locals():\n","    workding_dir = str(Path.cwd().parent)\n","\n","os.chdir(workding_dir)\n","# Guard the append so re-running the cell does not add duplicate sys.path entries.\n","if workding_dir not in sys.path:\n","    sys.path.append(workding_dir)\n","print(\"workding dir:\", workding_dir)"]},{"cell_type":"code","execution_count":3,"metadata":{"application/vnd.databricks.v1+cell":{"cellMetadata":{"byteLimit":2048000,"rowLimit":10000},"inputWidgets":{},"nuid":"9f67ec60-2f24-411c-84eb-0dd664b44775","showTitle":false,"title":""},"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":3,"status":"ok","timestamp":1720679529345,"user":{"displayName":"HUANG DONGHAO _","userId":"00977795705617022768"},"user_tz":-480},"id":"hPCC-6m7ZBrM","outputId":"c7aa2c96-5e99-440a-c148-201d79465ff9"},"outputs":[{"name":"stdout","output_type":"stream","text":["loading env vars from: 
/Users/inflaton/code/engd/papers/rapget-translation/.env\n"]},{"data":{"text/plain":["True"]},"execution_count":3,"metadata":{},"output_type":"execute_result"}],"source":["from dotenv import find_dotenv, load_dotenv\n","\n","# Prefer .env; find_dotenv() yields an empty string when nothing is found,\n","# in which case fall back to .env.example.\n","found_dotenv = find_dotenv(\".env\") or find_dotenv(\".env.example\")\n","print(f\"loading env vars from: {found_dotenv}\")\n","load_dotenv(found_dotenv, override=True)"]},{"cell_type":"code","execution_count":8,"metadata":{"application/vnd.databricks.v1+cell":{"cellMetadata":{"byteLimit":2048000,"rowLimit":10000},"inputWidgets":{},"nuid":"f1597656-8042-4878-9d3b-9ebfb8dd86dc","showTitle":false,"title":""},"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":3,"status":"ok","timestamp":1720679529345,"user":{"displayName":"HUANG DONGHAO _","userId":"00977795705617022768"},"user_tz":-480},"id":"1M3IraVtZBrM","outputId":"29ab35f6-2970-4ade-d85d-3174acf8cda0"},"outputs":[{"name":"stdout","output_type":"stream","text":["01-ai/Yi-1.5-9B-Chat None False datasets/mac/mac.tsv results/mac-results_few_shots.csv False 300\n"]}],"source":["import os\n","\n","# Run configuration read from environment variables.\n","model_name = os.getenv(\"MODEL_NAME\")\n","adapter_name_or_path = os.getenv(\"ADAPTER_NAME_OR_PATH\")\n","data_path = os.getenv(\"DATA_PATH\")\n","# Boolean flags are enabled only by the exact string \"true\".\n","load_in_4bit = os.getenv(\"LOAD_IN_4BIT\") == \"true\"\n","use_english_datasets = os.getenv(\"USE_ENGLISH_DATASETS\") == \"true\"\n","max_new_tokens = int(os.getenv(\"MAX_NEW_TOKENS\", \"2048\"))\n","# NOTE: fixed to the few-shot results file; RESULTS_PATH from the environment is not consulted.\n","results_path = \"results/mac-results_few_shots.csv\"  # os.getenv(\"RESULTS_PATH\")\n","\n","print(\n","    model_name,\n","    adapter_name_or_path,\n","    load_in_4bit,\n","    data_path,\n","    results_path,\n","    use_english_datasets,\n","    max_new_tokens,\n",")"]},{"cell_type":"code","execution_count":9,"metadata":{"application/vnd.databricks.v1+cell":{"cellMetadata":{"byteLimit":2048000,"rowLimit":10000},"inputWidgets":{},"nuid":"b2a43943-9324-4839-9a47-cfa72de2244b","showTitle":false,"title":""},"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":564,"status":"ok","timestamp":1720679529907,"user":{"displayName":"HUANG DONGHAO _","userId":"00977795705617022768"},"user_tz":-480},"id":"UgMvt6dIZBrM","outputId":"ce37581c-fd26-46c2-ad87-d933d99f68f7"},"outputs":[{"name":"stdout","output_type":"stream","text":["Python 3.11.9\n","Name: torch\n","Version: 2.4.0\n","Summary: Tensors and Dynamic neural networks in Python with strong GPU acceleration\n","Home-page: https://pytorch.org/\n","Author: PyTorch Team\n","Author-email: [email protected]\n","License: BSD-3\n","Location: /Users/inflaton/anaconda3/envs/rapget/lib/python3.11/site-packages\n","Requires: filelock, fsspec, jinja2, networkx, sympy, typing-extensions\n","Required-by: accelerate, peft, torchaudio, torchvision\n","---\n","Name: transformers\n","Version: 4.43.3\n","Summary: State-of-the-art Machine Learning for JAX, PyTorch and TensorFlow\n","Home-page: https://github.com/huggingface/transformers\n","Author: The Hugging Face team (past and future) with the help of all our contributors (https://github.com/huggingface/transformers/graphs/contributors)\n","Author-email: [email protected]\n","License: Apache 2.0 License\n","Location: /Users/inflaton/anaconda3/envs/rapget/lib/python3.11/site-packages\n","Requires: filelock, huggingface-hub, numpy, packaging, pyyaml, regex, requests, safetensors, tokenizers, tqdm\n","Required-by: peft\n","CPU times: user 10.6 ms, sys: 18.7 ms, total: 29.3 ms\n","Wall time: 2.04 s\n"]}],"source":["%%time\n","os.environ[\"TOKENIZERS_PARALLELISM\"] = \"true\"\n","\n","!python --version\n","!pip show torch 
transformers"]},{"cell_type":"code","execution_count":10,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":1685,"status":"ok","timestamp":1720679531591,"user":{"displayName":"HUANG DONGHAO _","userId":"00977795705617022768"},"user_tz":-480},"id":"ZuS_FsLyZBrN","outputId":"2cba0105-c505-4395-afbd-2f2fee6581d0"},"outputs":[{"name":"stdout","output_type":"stream","text":["MPS is available\n"]}],"source":["from llm_toolkit.llm_utils import *\n","from llm_toolkit.translation_utils import *\n","\n","device = check_gpu()"]},{"cell_type":"code","execution_count":11,"metadata":{},"outputs":[{"name":"stdout","output_type":"stream","text":["<class 'pandas.core.frame.DataFrame'>\n","RangeIndex: 1133 entries, 0 to 1132\n","Data columns (total 3 columns):\n"," # Column Non-Null Count Dtype \n","--- ------ -------------- ----- \n"," 0 chinese 1133 non-null object\n"," 1 english 1133 non-null object\n"," 2 01-ai/Yi-1.5-9B-Chat/shots-00 1133 non-null object\n","dtypes: object(3)\n","memory usage: 26.7+ KB\n"]}],"source":["import pandas as pd\n","\n","df = pd.read_csv(results_path)\n","df.info()"]},{"cell_type":"code","execution_count":13,"metadata":{},"outputs":[{"data":{"text/plain":["['chinese', 'english', '01-ai/Yi-1.5-9B-Chat/shots-00']"]},"execution_count":13,"metadata":{},"output_type":"execute_result"}],"source":["# Keep the first two columns in place and order the remaining columns alphabetically.\n","columns = df.columns[:2].to_list() + sorted(df.columns[2:].to_list())\n","columns"]},{"cell_type":"code","execution_count":14,"metadata":{},"outputs":[{"name":"stdout","output_type":"stream","text":["01-ai/Yi-1.5-9B-Chat/shots-00: {'meteor': 0.2624042529095214, 'bleu_scores': {'bleu': 0.052402107437040435, 'precisions': [0.22591505721240246, 0.07145192172979031, 0.03123880490076664, 0.014953453710264618], 'brevity_penalty': 1.0, 'length_ratio': 1.4560781715799933, 'translation_length': 43959, 'reference_length': 30190}, 'rouge_scores': {'rouge1': 0.2671501885495249, 'rouge2': 0.09630224265269001, 
'rougeL': 0.22695449752648078, 'rougeLsum': 0.2285535947405311}, 'accuracy': 0.0, 'correct_ids': []}\n"]},{"data":{"text/html":["<div>\n","<style scoped>\n"," .dataframe tbody tr th:only-of-type {\n"," vertical-align: middle;\n"," }\n","\n"," .dataframe tbody tr th {\n"," vertical-align: top;\n"," }\n","\n"," .dataframe thead th {\n"," text-align: right;\n"," }\n","</style>\n","<table border=\"1\" class=\"dataframe\">\n"," <thead>\n"," <tr style=\"text-align: right;\">\n"," <th></th>\n"," <th>model</th>\n"," <th>shots</th>\n"," <th>meteor</th>\n"," <th>bleu_1</th>\n"," <th>rouge_l</th>\n"," <th>ews_score</th>\n"," <th>repetition_score</th>\n"," <th>total_repetitions</th>\n"," <th>rap</th>\n"," <th>num_max_output_tokens</th>\n"," </tr>\n"," </thead>\n"," <tbody>\n"," <tr>\n"," <th>0</th>\n"," <td>01-ai/Yi-1.5-9B-Chat</td>\n"," <td>00</td>\n"," <td>0.262404</td>\n"," <td>0.052402</td>\n"," <td>0.226954</td>\n"," <td>0.008826</td>\n"," <td>1.593116</td>\n"," <td>1.601942</td>\n"," <td>0.246498</td>\n"," <td>18</td>\n"," </tr>\n"," </tbody>\n","</table>\n","</div>"],"text/plain":[" model shots meteor bleu_1 rouge_l ews_score \\\n","0 01-ai/Yi-1.5-9B-Chat 00 0.262404 0.052402 0.226954 0.008826 \n","\n"," repetition_score total_repetitions rap num_max_output_tokens \n","0 1.593116 1.601942 0.246498 18 "]},"execution_count":14,"metadata":{},"output_type":"execute_result"}],"source":["df = df[columns]\n","metrics_df = get_metrics(df, max_output_tokens=max_new_tokens, variant=\"shots\")\n","metrics_df"]},{"cell_type":"code","execution_count":15,"metadata":{},"outputs":[{"data":{"text/plain":["array(['01-ai/Yi-1.5-9B-Chat'], dtype=object)"]},"execution_count":15,"metadata":{},"output_type":"execute_result"}],"source":["models = metrics_df[\"model\"].unique()\n","models"]},{"cell_type":"code","execution_count":16,"metadata":{},"outputs":[],"source":["from itertools import cycle\n","\n","# marker styles available for plotting, one per model\n","marker_styles = [\"o\", \"x\", \"^\", \"s\", \"d\", \"P\", \"X\", \"*\", \"v\", \">\", \"<\", \"p\", \"h\", \"H\", \"+\", \"|\", \"_\"]\n","# Cycle through the styles so that every model is assigned a marker even when\n","# there are more models than styles; a plain zip() would stop at the shorter\n","# sequence and a later markers[model] lookup would raise KeyError.\n","markers = dict(zip(models, cycle(marker_styles)))"]},{"cell_type":"code","execution_count":19,"metadata":{},"outputs":[{"data":{"image/png":"","text/plain":["<Figure size 1000x600 with 1 Axes>"]},"metadata":{},"output_type":"display_data"}],"source":["# plot METEOR and RAP-METEOR against the number of shots\n","import matplotlib.pyplot as plt\n","\n","fig, ax = plt.subplots(figsize=(10, 6))\n","# set grid\n","ax.grid(True)\n","ax.set_axisbelow(True)\n","ax.minorticks_on()\n","ax.grid(which=\"major\", linestyle=\"-\", linewidth=\"0.5\", color=\"red\")\n","# ax.grid(which=\"minor\", linestyle=\":\", linewidth=\"0.5\", color=\"black\")\n","\n","for model in models:\n"," model_df = metrics_df[metrics_df[\"model\"] == model]\n"," ax.plot(\n"," model_df[\"shots\"],\n"," model_df[\"meteor\"],\n"," label=model + \" (METEOR)\",\n"," marker=markers[model],\n"," )\n"," ax.plot(\n"," model_df[\"shots\"],\n"," model_df[\"rap\"],\n"," label=model + \" (RAP-METEOR)\",\n"," linestyle=\"--\",\n"," marker=markers[model],\n"," )\n","\n","ax.set_xlabel(\"Number of Shots\")\n","ax.set_ylabel(\"METEOR & RAP-METEOR\")\n","ax.legend(loc=\"lower center\", bbox_to_anchor=(0.5, -0.85))\n","plt.show()"]},{"cell_type":"code","execution_count":33,"metadata":{},"outputs":[{"data":{"image/png":"","text/plain":["<Figure size 1000x600 with 1 Axes>"]},"metadata":{},"output_type":"display_data"}],"source":["# plot mean total repetitions (MTR) against the number of shots\n","import matplotlib.pyplot as plt\n","\n","fig, ax = plt.subplots(figsize=(10, 6))\n","# set grid\n","ax.grid(True)\n","ax.set_axisbelow(True)\n","ax.minorticks_on()\n","ax.grid(\n"," which=\"major\", linestyle=\"-\", linewidth=\"0.5\", color=\"red\"\n",")\n","# ax.grid(which=\"minor\", linestyle=\":\", linewidth=\"0.5\", color=\"black\")\n","\n","for model in models:\n"," model_df = metrics_df[metrics_df[\"model\"] == model]\n"," ax.plot(\n"," model_df[\"shots\"],\n"," model_df[\"total_repetitions\"],\n"," label=model,\n"," 
marker=markers[model],\n"," )\n","\n","# ax.set_ylim(0, 1)\n","ax.set_xlabel(\"Number of Shots\")\n","ax.set_ylabel(\"Mean Total Repetitions (MTR)\")\n","ax.legend(loc=\"lower center\", bbox_to_anchor=(0.5, -0.5))\n","plt.show()"]},{"cell_type":"code","execution_count":22,"metadata":{},"outputs":[{"data":{"image/png":"","text/plain":["<Figure size 1000x600 with 1 Axes>"]},"metadata":{},"output_type":"display_data"}],"source":["# plot the number of answers that hit the max output tokens against the number of shots\n","import matplotlib.pyplot as plt\n","\n","fig, ax = plt.subplots(figsize=(10, 6))\n","# set grid\n","ax.grid(True)\n","ax.set_axisbelow(True)\n","ax.minorticks_on()\n","ax.grid(which=\"major\", linestyle=\"-\", linewidth=\"0.5\", color=\"red\")\n","# ax.grid(which=\"minor\", linestyle=\":\", linewidth=\"0.5\", color=\"black\")\n","\n","for model in models:\n"," model_df = metrics_df[metrics_df[\"model\"] == model]\n"," ax.plot(model_df[\"shots\"], model_df[\"num_max_output_tokens\"], label=model, marker=markers[model])\n","\n","# ax.set_ylim(0, 1)\n","ax.set_xlabel(\"Number of Shots\")\n","ax.set_ylabel(\"Number of Answers with Max Output Tokens\")\n","ax.legend(loc=\"lower center\", bbox_to_anchor=(0.5, -0.5))\n","plt.show()"]},{"cell_type":"code","execution_count":23,"metadata":{},"outputs":[],"source":["def detect_repetitions_for_model_outputs(df, col, threshold=100):\n","    \"\"\"Score the texts in ``df[col]`` and return the rows above ``threshold``.\n","\n","    ``detect_scores`` is applied to every value of ``df[col]`` and its result is\n","    stored in the ``ews_score``, ``repetition_score`` and ``total_repetitions``\n","    columns of ``df``. Note that ``df`` itself is modified in place.\n","\n","    Args:\n","        df: DataFrame holding the column ``col``.\n","        col: name of the column whose values are passed to ``detect_scores``.\n","        threshold: rows are kept only if ``total_repetitions`` is strictly\n","            greater than this value.\n","\n","    Returns:\n","        The rows of ``df`` whose ``total_repetitions`` exceeds ``threshold``.\n","    \"\"\"\n","    score_columns = [\"ews_score\", \"repetition_score\", \"total_repetitions\"]\n","    df[score_columns] = df[col].apply(detect_scores)\n","    exceeds_threshold = df[\"total_repetitions\"] > threshold\n","    return df[exceeds_threshold]"]},{"cell_type":"code","execution_count":27,"metadata":{},"outputs":[{"data":{"text/html":["<div>\n","<style scoped>\n"," .dataframe tbody tr th:only-of-type {\n"," vertical-align: middle;\n"," }\n","\n"," .dataframe tbody tr th {\n"," vertical-align: top;\n"," }\n","\n"," .dataframe thead th {\n"," text-align: right;\n"," }\n","</style>\n","<table border=\"1\" class=\"dataframe\">\n"," <thead>\n"," <tr style=\"text-align: right;\">\n"," <th></th>\n"," <th>chinese</th>\n"," 
<th>english</th>\n"," <th>01-ai/Yi-1.5-9B-Chat/shots-00</th>\n"," <th>ground_truth_ews_score</th>\n"," <th>ground_truth_repetition_score</th>\n"," <th>ground_truth_total_repetitions</th>\n"," <th>ews_score</th>\n"," <th>repetition_score</th>\n"," <th>total_repetitions</th>\n"," <th>ground_truth_tokens-01-ai/Yi-1.5-9B-Chat</th>\n"," <th>output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00</th>\n"," </tr>\n"," </thead>\n"," <tbody>\n"," <tr>\n"," <th>105</th>\n"," <td>虽然我奶奶与他已经在高粱地里凤凰和谐,在那个半是痛苦半是幸福的庄严过程中,我奶奶虽然也怀上了...</td>\n"," <td>Even though by then he and Grandma had already...</td>\n"," <td>Although my grandmother and him had already be...</td>\n"," <td>0</td>\n"," <td>0</td>\n"," <td>0</td>\n"," <td>0</td>\n"," <td>1224</td>\n"," <td>1224</td>\n"," <td>154</td>\n"," <td>309</td>\n"," </tr>\n"," <tr>\n"," <th>505</th>\n"," <td>老子叫你不许哭,就不许哭!”</td>\n"," <td>'I forbid you to cry.'</td>\n"," <td>The task is asking you to:\\n\\n1. Understand th...</td>\n"," <td>0</td>\n"," <td>0</td>\n"," <td>0</td>\n"," <td>0</td>\n"," <td>180</td>\n"," <td>180</td>\n"," <td>8</td>\n"," <td>187</td>\n"," </tr>\n"," </tbody>\n","</table>\n","</div>"],"text/plain":[" chinese \\\n","105 虽然我奶奶与他已经在高粱地里凤凰和谐,在那个半是痛苦半是幸福的庄严过程中,我奶奶虽然也怀上了... \n","505 老子叫你不许哭,就不许哭!” \n","\n"," english \\\n","105 Even though by then he and Grandma had already... \n","505 'I forbid you to cry.' \n","\n"," 01-ai/Yi-1.5-9B-Chat/shots-00 \\\n","105 Although my grandmother and him had already be... \n","505 The task is asking you to:\\n\\n1. Understand th... 
\n","\n"," ground_truth_ews_score ground_truth_repetition_score \\\n","105 0 0 \n","505 0 0 \n","\n"," ground_truth_total_repetitions ews_score repetition_score \\\n","105 0 0 1224 \n","505 0 0 180 \n","\n"," total_repetitions ground_truth_tokens-01-ai/Yi-1.5-9B-Chat \\\n","105 1224 154 \n","505 180 8 \n","\n"," output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00 \n","105 309 \n","505 187 "]},"execution_count":27,"metadata":{},"output_type":"execute_result"}],"source":["# model-output column to inspect\n","col = \"01-ai/Yi-1.5-9B-Chat/shots-00\"\n","# use a lower cut-off (50) than the helper's default of 100\n","rows = detect_repetitions_for_model_outputs(df=df, col=col, threshold=50)\n","rows"]},{"cell_type":"code","execution_count":28,"metadata":{},"outputs":[{"name":"stdout","output_type":"stream","text":["虽然我奶奶与他已经在高粱地里凤凰和谐,在那个半是痛苦半是幸福的庄严过程中,我奶奶虽然也怀上了我的功罪参半但毕竟是高密东北乡一代风流的父亲,但那时奶奶是单家的明媒正娶的媳妇,爷爷与她总归是桑间濮上之合,带着相当程度的随意性偶然性不稳定性,况且我父亲也没落土,所以,写到那时候的事,我还是称呼他余占鳌更为准确。\n","================================================================================\n","Even though by then he and Grandma had already done the phoenix dance in the sorghum field, and even though, in the solemn course of suffering and joy, she had conceived my father, whose life was a mixture of achievements and sin (in the final analysis, he gained distinction among his generation of citizens of Northeast Gaomi Township), she had nonetheless been legally married into the Shan family. So she and Granddad were adulterers, their relationship marked by measures of spontaneity, chance, and uncertainty. 
And since Father wasn't born while they were together, accuracy demands that I refer to Granddad as Yu Zhan'ao in writing about this period.\n","================================================================================\n","Although my grandmother and him had already been in the sorghum field with Phoenix in harmony, during that process that was both painful and happy, my grandmother although also got pregnant with my father's guilt and merit being equal, but after all, she was a father of the generation who was famous in the eastern northeast of High密, but at that time, my grandmother was a bride taken in by the single family of Ming, grandfather and her belonged to the marriage of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature 
of\n","================================================================================\n","----detect excessive whitespaces----\n","----detect text repetitions----\n","<re.Match object; span=(463, 1687), match='e of the casual and occasional nature of the casu>\n","Group 1 found at 463-1075: `e of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional natur`\n","Group 2 found at 1075-1687: `e of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional natur`\n","Group 3 found at 1075-1687: `e of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the 
casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional natur`\n","(0, 1224, 1224)\n","老子叫你不许哭,就不许哭!”\n","================================================================================\n","'I forbid you to cry.'\n","================================================================================\n","The task is asking you to:\n","\n","1. Understand that you are a helpful assistant.\n","2. Recognize that your main job is to translate Chinese sentences into English.\n","3. If the given Chinese sentence is incomplete or unclear, you should copy the input text as your output without providing any additional information or explanation.\n","\n","Given Chinese sentence: 老子叫你不许哭, 就不许哭! ”\n","\n","Following the guidelines:\n","1. The sentence is complete and understandable.\n","2. There is no need to copy the input text because the sentence is clear.\n","3. 
Translate the sentence into English: \"The old man said you were not allowed to cry, and you were not allowed to cry!\"\n","\n","English: \"The old man said you were not allowed to cry, and you were not allowed to cry!\"\n","================================================================================\n","----detect excessive whitespaces----\n","----detect text repetitions----\n","<re.Match object; span=(544, 724), match='English: \"The old man said you were not allowed t>\n","Group 1 found at 544-633: `English: \"The old man said you were not allowed to cry, and you were not allowed to cry!\"`\n","Group 2 found at 635-724: `English: \"The old man said you were not allowed to cry, and you were not allowed to cry!\"`\n","Group 3 found at 635-724: `English: \"The old man said you were not allowed to cry, and you were not allowed to cry!\"`\n","(0, 180, 180)\n"]}],"source":["separator = \"=\" * 80\n","for _, row in rows.iterrows():\n","    output = row[col]\n","    # source sentence, reference translation and model output, each followed by a separator\n","    for text in (row[\"chinese\"], row[\"english\"], output):\n","        print(text)\n","        print(separator)\n","    detect_repetitions(output, debug=True)"]},{"cell_type":"code","execution_count":29,"metadata":{},"outputs":[{"name":"stdout","output_type":"stream","text":["--------------------------------------------------\n","chinese: 莺儿满心委屈,见姑娘说,不敢出声,只得放下钱来,口内嘟囔说:“一个做爷的,还赖我们这几个钱,连我也瞧不起!\n","--------------------------------------------------\n","english: Oriole smarted with the injustice of this, but her mistress had ordered it, so she had to pay up without arguing. She could not, however, forbear a few rebellious mutterings: 'Huh! One of the masters! Cheating a maid out of a few coppers! 
Even I should be ashamed!\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: Part #1: You are a helpful assistant that translates Chinese to English.\n","Usage: \"莺儿满心委屈, 见姑娘说,不敢出声, 只得放下钱来, 口内嘟囔说: “一个做爷的, 还赖我们这几个钱, 连我也瞧不起!\" translates to \"Ying'er was filled with grievances, but when the girl said something, she dare not speak up, so she had to put down the money, muttering, 'A man like you is still owed us this money, and you even look down on me!'\" This meets the criteria because it is a translation from Chinese to English.\n","\n","Part #2: If it is an incomplete sentence, or if you are unsure about the meaning, simply copy the input text as your output.\n","Usage: \"今天天气很好。\" translates to \"Today the weather is very good.\" This meets the criteria because the input text is a complete sentence, and the translation is provided accordingly.\n","\n","Part #3: Do not output any additional sentence such as explanation or reasoning.\n","Usage: \"莺儿满心委屈, 见姑娘说,不敢出声, 只得放下钱来, 口内嘟囔说: “一个做爷的, 还赖我们这几个钱, 连我也瞧不起!\" translates to \"Ying'er was filled with\n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 314\n","--------------------------------------------------\n","chinese: 虽然我奶奶与他已经在高粱地里凤凰和谐,在那个半是痛苦半是幸福的庄严过程中,我奶奶虽然也怀上了我的功罪参半但毕竟是高密东北乡一代风流的父亲,但那时奶奶是单家的明媒正娶的媳妇,爷爷与她总归是桑间濮上之合,带着相当程度的随意性偶然性不稳定性,况且我父亲也没落土,所以,写到那时候的事,我还是称呼他余占鳌更为准确。\n","--------------------------------------------------\n","english: Even though by then he and Grandma had already done the phoenix dance in the sorghum field, and even though, in the solemn course of suffering and joy, she had conceived my father, whose life was a mixture of achievements and sin (in the final analysis, he gained distinction among his generation of citizens of Northeast Gaomi Township), she had nonetheless been legally married into the Shan family. 
So she and Granddad were adulterers, their relationship marked by measures of spontaneity, chance, and uncertainty. And since Father wasn't born while they were together, accuracy demands that I refer to Granddad as Yu Zhan'ao in writing about this period.\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: Although my grandmother and him had already been in the sorghum field with Phoenix in harmony, during that process that was both painful and happy, my grandmother although also got pregnant with my father's guilt and merit being equal, but after all, she was a father of the generation who was famous in the eastern northeast of High密, but at that time, my grandmother was a bride taken in by the single family of Ming, grandfather and her belonged to the marriage of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature of the casual and occasional nature 
of the casual and occasional nature of\n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 309\n","--------------------------------------------------\n","chinese: “哈,我觉得那是最不真实的!” IT副总裁说,“我用公司的上百名员工进行过一个简单的测试,即使这想法真能实现,人列计算机的运算速度可能比一个人的手工计算都慢。”\n","--------------------------------------------------\n","english: 'Ha! I thought that was the most unrealistic aspect,' the software company vice president said. 'I conducted a test with more than a hundred employees at my company. Even if the idea worked, a computer made of people would probably operate at a speed slower than manual computation.'\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: \"Ha, I think that's the least real!\" The CTO said, \"I've conducted a simple test with over a hundred employees from the company. Even if this idea could be realized, the computing speed of the system may be slower than a person's manual calculation.\" \n","\n","I used the definition of translating Chinese to English by converting the meaning of each Chinese character or phrase into its English equivalent while maintaining the structure and context of the original sentence. Since the input sentence was complete and coherent, I translated it directly into English without any issues. \n","\n","1. First, I identified the main components of the sentence: subject, verb, object, and additional information.\n","2. Then, I translated each component from Chinese to English, maintaining the original meaning and structure.\n","3. Finally, I combined the translated components to form a coherent English sentence. \n","\n","The task was to translate a given Chinese sentence into English. I followed the guidelines by translating the sentence directly without any additional explanations or reasoning. The input sentence was complete and coherent, so I translated it without any issues. \n","\n","1. Analyze the Chinese sentence structure and meaning.\n","2. 
Translate each Chinese word or phrase into its English equivalent.\n","3. Ensure the translated sentence maintains the original meaning and structure.\n","4. Output the translated English sentence. \n","\n","In this case, the input sentence\n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 316\n","--------------------------------------------------\n","chinese: 严师母心里狐疑,嘴上却不好说,只闲扯着要重新聚一聚,可惜萨沙不在了,去西伯利亚吃苏联面包了,不过,补上那位新来的先生,也够一桌麻将了。\n","--------------------------------------------------\n","english: Madame Yan grew suspicious, but was forced to keep her thoughts to herself; instead she casually suggested that they all get together again. 'It's a pity that Sasha's no longer around. He must be off in Siberia eating his Russian bread! But that's okay, you can bring along that new friend of yours and we'll have a foursome for our mahjong games.'\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: The task is asking you to:\n","\n","1. Understand the given Chinese sentence.\n","2. Translate the Chinese sentence into English.\n","3. If the sentence is incomplete or its meaning is unclear, copy the input text as your output.\n","4. Do not add any additional sentences, such as explanations or reasoning.\n","\n","Here's how to approach the task:\n","\n","1. Read the given Chinese sentence carefully: \"严师母心里狐疑, 嘴上却不好说, 只闲扯着要重新聚一聚, 可惜萨沙不在了, 去西伯利亚吃苏联面包了, 不过, 补上那位新来的先生, 也够一桌麻将了。\"\n","2. Translate the sentence into English, ensuring that you understand the meaning of each word and phrase.\n","3. If you find any part of the sentence unclear or incomplete, simply copy the input text as your output.\n","4. Do not add any additional sentences or explanations in your translation.\n","\n","Translation: \"Yan's mother harbored doubts in her heart, but she didn't want to say it out loud; she only casually mentioned the need to get together again. 
It's a pity that Sasa isn't there anymore; she went to Siberia to eat Soviet bread. However, if we add the new gentleman, we would have enough for a game of mahjong\n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 319\n","--------------------------------------------------\n","chinese: 周瑞家的道:“我的娘!\n","--------------------------------------------------\n","english: 'My dear good woman,' said the latter when they were out of earshot, 'whatever came over you?\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: My mother!\n","Part 1: Translate Chinese to English\n","Usage: \"周瑞家的道: “我的娘!\" translates to \"My mother!\". The given Chinese sentence is translated into English, following the instruction to provide a translation.\n","\n","Part 2: If it is an incomplete sentence\n","Usage: If the input was \"周瑞家的道: “我的娘!?\", the output would be the same as the input: \"周瑞家的道: “我的娘!?\". Since the sentence is incomplete and the meaning is unclear, the input is copied as the output, following the instruction to copy the input if it is incomplete or unclear.\n","\n","Part 3: If unsure about the meaning\n","Usage: If the input was \"周瑞家的道: “我的奇怪的东西!\", the output would be the same as the input: \"周瑞家的道: “我的奇怪的东西!\". Since the meaning of \"奇怪的东西\" is unclear, the input is copied as the output, following the instruction to copy the input if unsure about the meaning.\n","\n","Part 4: Do not output any additional sentence such as explanation or reasoning\n","Usage: For the input \"周瑞家的道: “我的娘!\", the output is \"My mother!\". 
There is no additional explanation or reasoning provided, as instructed.\n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 304\n","--------------------------------------------------\n","chinese: 只篦了三五下儿,见晴雯忙忙走进来取钱,一见他两个,便冷笑道:“哦!\n","--------------------------------------------------\n","english: But he had not drawn it more than four or five times through her hair, when Skybright came bursting in to get some more money. Seeing the two of them together, she smiled sarcastically: 'Fancy!\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: Part #1: You are a helpful assistant that translates Chinese to English.\n","Usage: \"只篦了三五下儿,见晴雯忙忙走进来取钱,一见他两个,便冷笑道:“哦!\"\n","Explanation: This is a Chinese sentence that needs to be translated into English. The sentence is about someone who has only combed a few times and then sees Qingwen coming in quickly to take money. When she sees the two people, she coldly laughs and says \"oh!\". This meets the criteria because it is a complete Chinese sentence that needs to be translated into English.\n","\n","Part #2: If it is an incomplete sentence, or if you are unsure about the meaning, simply copy the input text as your output.\n","Usage: \"你今天怎么啦?\"\n","Explanation: This is an incomplete sentence and the meaning is not clear. 
So, the translation should be the same as the input: \"你今天怎么啦?\" This meets the criteria because the sentence is incomplete and the meaning is not clear, so the translation should be the same as the input.\n","\n","Part #3: Do not output any additional sentence such as explanation or reasoning.\n","Usage: \"Only combed a few times, saw Qingwen hurriedly coming in to take money, as soon as she saw the two of them, she coldly laughed and said: \"oh!\"\"\n","Explanation\n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 317\n","--------------------------------------------------\n","chinese: 奶奶站在路边,听着七零八落的打击肉体的沉闷声响,对着余占鳌顿眸一瞥,然后仰面看着天边的闪电,脸上凝固着的,仍然是那种粲然的、黄金一般高贵辉煌的笑容。\n","--------------------------------------------------\n","english: Grandma stood beside the road listening to the dull cacophony of fists and feet on flesh; she glanced at Yu Zhan'ao, then looked up at the lightning-streaked sky, the radiant, golden, noble smile still frozen on her face.\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: The task is asking you to:\n","\n","1. Understand the given Chinese sentence.\n","2. Translate the Chinese sentence into English.\n","3. If the sentence is incomplete or its meaning is unclear, copy the input text as your output.\n","4. Do not add any additional sentences, such as explanations or reasoning.\n","\n","Here's how to approach the task:\n","\n","1. Read the given Chinese sentence carefully and try to understand its meaning.\n","2. If you understand the sentence and its meaning, translate it into English while maintaining the original context and meaning.\n","3. If you find the sentence incomplete or its meaning unclear, simply copy the input text without translating it.\n","4. 
Ensure that your translated English sentence does not include any additional information or explanations.\n","\n","For the given Chinese sentence:\n","\n","Chinese: 奶奶站在路边, 听着七零八落的打击肉体的沉闷声响, 对着余占鳌顿眸一瞥, 然后仰面看着天边的闪电, 脸上凝固着的, 仍然是那种粲然的、 黄金一般高贵辉煌的笑容。\n","\n","You can translate it into English as:\n","\n","English: The grandmother stood by the roadside, listening to the dull sounds of blows against the flesh that were scattered here and there, giving a quick glance at Yú Zhànōu with her eyes, and then looking up at the lightning in the\n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 319\n","--------------------------------------------------\n","chinese: 说着,又问周瑞家的:“回了太太了没有?”\n","--------------------------------------------------\n","english: She turned to Zhou Rui's wife. 'Have you told Her Ladyship yet?'\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: Part #1: You are a helpful assistant that translates Chinese to English.\n","Usage: \"说着,又问周瑞家的:“回了太太了没有?’’\" The given input is a Chinese sentence, and the task is to translate it into English. The translation is \"Saying this, [the speaker] then asked Zhou Rui's family: \"Has the mistress been informed?\"\" This meets the criteria because it translates the given Chinese sentence into English.\n","\n","Part #2: If it is an incomplete sentence, or if you are unsure about the meaning, simply copy the input text as your output.\n","Usage: \"今天天气怎么样?\" (What's the weather like today?) The input is an incomplete sentence, and the assistant is unsure about the meaning. So, the output is simply the copied input: \"今天天气怎么样?\" This meets the criteria because it follows the instruction to copy the input text when the sentence is incomplete or the meaning is unclear.\n","\n","Part #3: Do not output any additional sentence such as explanation or reasoning.\n","Usage: \"他去了图书馆。\" (He went to the library.) 
The input is a complete sentence, and the translation is \"He went to the library.\" The assistant does not provide any additional explanation or reasoning. This meets the criteria because it only outputs the translated sentence without any extra information.\n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 300\n","--------------------------------------------------\n","chinese: 周瑞家的听了,便已猜着几分来意。 只因他丈夫昔年争买田地一事,多得狗儿他父亲之力,今见刘姥姥如此,心中难却其意;二则也要显弄自己的体面。 便笑说:“老老你放心。\n","--------------------------------------------------\n","english: From the tone of this reply Zhou Rui's wife was already able to make a pretty good guess as to the real purpose of the old woman's visit; but because some years previously her husband had received a lot of help from Gou-er's father in a dispute over the purchase of some land, she could not very well reject Grannie Liu now, when she came to her as a suppliant. She was, in any case, anxious to demonstrate her own importance in the Jia household; and so the answer she gave her was a gracious one. 'Don't you worry, Grannie!\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: The task is asking you to translate a given Chinese sentence into English. Here are the simple steps to follow:\n","\n","1. Read the given Chinese sentence carefully.\n"," Chinese: 周瑞家的听了, 便已猜着几分来意。 只因他丈夫昔年争买田地一事, 多得狗儿他父亲之力, 今见刘姥姥如此, 心中难却其意;二则也要显弄自己的体面。 便笑说: “老老你放心。\n","\n","2. If the sentence is incomplete or you are unsure about the meaning, copy the input text as your output without adding any additional sentences or explanations.\n","\n","3. Use your knowledge of Chinese and English, or a reliable translation tool, to translate the sentence into English.\n","\n","4. Ensure that the translation is accurate and conveys the meaning of the original sentence.\n","\n","5. 
Write down the translated English sentence as your output.\n","\n","English: Zhou Ru's servant heard this and had already guessed part of the purpose of the visit. It was because his husband's struggle to buy land years ago was greatly helped by Dou'e's father, and now seeing Diao Hua Hua so, he found it hard to refuse their intentions; secondly, he also wanted to show off his status. With a smile, he said, \"Old Lady, don't worry.\"\n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 315\n","--------------------------------------------------\n","chinese: 顾炎武道:“晚村兄豪气干云,令人好生敬佩。 怕的是见不到鞑子皇帝,却死于一般的下贱奴才手里。\n","--------------------------------------------------\n","english: 'I admire your heroic spirit,' said Gu, 'but I don't think there's much likelihood of your meeting the Tartar Emperor face to face. You would die at the hands of miserable slaves.\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: The task is asking you to:\n","\n","1. Understand the given Chinese sentence.\n","2. Translate the Chinese sentence into English.\n","3. If the sentence is incomplete or you are unsure about the meaning, copy the input text as your output.\n","4. Do not add any additional sentences, such as explanations or reasoning.\n","\n","Here's how to use this task:\n","\n","1. Read the given Chinese sentence: 顾炎武道: “晚村兄豪气干云, 令人好生敬佩。 怕的是见不到鞑子皇帝, 却死于一般的下贱奴才手里。\n","2. Translate the sentence into English, ensuring that you understand the meaning of each word and phrase.\n","3. If you are unsure about the meaning or if the sentence is incomplete, simply copy the input text: 顾炎武道: “晚村兄豪气干云, 令人好生敬佩。 怕的是见不到鞑子皇帝, 却死于一般的下贱奴才手里。\n","4. Do not add any additional sentences or explanations.\n","\n","Translation:\n","\n","\"Gǔ Yínǔ said, \"Brother Wǎn Cūn has a heroic spirit that can pierce the clouds, and it is truly admirable. 
What is to be feared is not being able to meet the Manchu emperor, but dying in the hands of ordinary low\n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 320\n","--------------------------------------------------\n","chinese: 至脂砚斋抄阅再评,仍用《石头记》。\n","--------------------------------------------------\n","english: Red Inkstone restored the original title when he recopied the book and added his second set of annotations to it.\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: To translate the given Chinese sentence, I will break it down into its components and find the English equivalents.\n","\n","至脂砚斋抄阅再评, 仍用《 石头记》。\n","\n","1. 至 (zhì) - to\n","2. 脂砚斋 (zhī yè shāi) - Lishy's Cottage (a fictional place, referring to Gao E, the supposed editor of \"Dream of the Red Chamber\")\n","3. 抄阅 (cuān wèn) - copy and read (literally, \"copy and view\")\n","4. 再 (zài) - again\n","5. 评 (péng) - evaluate (in the context of commenting or reviewing)\n","6. 仍 (réng) - still\n","7. 用 (yòng) - use\n","8. 《 石头记》 (Shí tóu jì) - \"Dream of the Red Chamber\" (the title of the novel)\n","\n","Now, I will construct the English sentence using these components:\n","\n","To Lishy's Cottage, copying and reading again for evaluation, still using \"Dream of the Red Chamber.\"\n","\n","English: To Lishy's Cottage, copying and reading again for evaluation, still using \"Dream of the Red Chamber.\"\n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 311\n","--------------------------------------------------\n","chinese: 囚车旁一清兵恼了,伸腿在车上踢了一脚,喝道:“再哭,再哭!\n","--------------------------------------------------\n","english: One of the soldiers marching alongside, irritated by the baby's crying, aimed a mighty kick at the cart. 'Stop it! 
Shut up!\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: Part #1: You are a helpful assistant that translates Chinese to English.\n","Usage: \"囚车旁一清兵恼了, 伸腿在车上踢了一脚, 喝道: “再哭, 再哭!\"\n","Explanation: This is a Chinese sentence that needs to be translated into English. The sentence is complete and can be translated.\n","\n","Part #2: If it is an incomplete sentence, or if you are unsure about the meaning, simply copy the input text as your output.\n","Usage: \"... 清兵恼了, 伸腿在车上踢了一脚, 喝道: “再哭, 再哭!\"\n","Explanation: If the input text was \"囚车旁一清兵恼了, 伸腿在车上踢了一脚, 喝道: \" followed by some unclear or missing information, the output would be the same as the input, copying the incomplete sentence: \"囚车旁一清兵恼了, 伸腿在车上踢了一脚, 喝道:\"\n","\n","Part #3: Do not output any additional sentence such as explanation or reasoning.\n","Usage: \"A Qing soldier beside the prison cart got annoyed, kicked the cart with his leg, and shouted, 'Don't cry, don't cry!'\"\n","Explanation: This response meets the criteria because it directly translates the given Chinese sentence into English without adding any\n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 315\n","--------------------------------------------------\n","chinese: 突然心想:“满洲武士打不过茅大哥,茅大哥又不是老乌龟的对手,何不骗得老乌龟教我些本事?”\n","--------------------------------------------------\n","english: Suddenly a thought occurred to him. 
'The wrestlers were no match for Whiskers; but Whiskers was no match for Old Turtle-head—why don't I get him to teach me a few moves?'\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: I will now translate the given Chinese sentence into English, following the instructions provided.\n","\n","Chinese: 突然心想:“满洲武士打不过茅大哥,茅大哥又不是老乌龟的对手,何不骗得老乌龟教我些本事?”\n","\n","Step 1: Identify the main components of the sentence.\n","- 突然心想 (suddenly thought)\n","- 满洲武士 (Manchu warrior)\n","- 打不过茅大哥 (couldn't defeat the Mao brother)\n","- 茅大哥 (Mao brother)\n","- 又不是老乌龟的对手 (is not an opponent for the old turtle)\n","- 老乌龟 (old turtle)\n","- 何不骗得老乌龟 (why not trick the old turtle)\n","- 教我些本事 (to teach me some skills)\n","\n","Step 2: Translate the components into English.\n","- 突然心想 (suddenly thought)\n","- 满洲武士 (Manchu warrior)\n","- 打不过茅大哥 (couldn't defeat the Mao brother)\n","- 茅大哥 (Mao brother)\n","- 又不是老乌龟的对手 (is not an opponent for the old turtle)\n","- 老乌龟 (old turtle)\n","- 何不骗得老乌龟 (why not trick the old turtle)\n","- \n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 304\n","--------------------------------------------------\n","chinese: 奶奶嫁到单家,其实也是天意。 那天,我奶奶在秋千架旁与一些尖足长辫的大闺女耍笑游戏,那天是清明节,桃红柳绿,细雨霏霏,人面桃花,女儿解放。\n","--------------------------------------------------\n","english: Grandma's marriage into the Shan family was the will of heaven, implemented on a day when she and some of her playmates, with their tiny bound feet and long pigtails, were playing beside a set of swings. It was Qingming, the day set aside to attend ancestral graves; peach trees were in full red bloom, willows were green, a fine rain was falling, and the girls' faces looked like peach blossoms. It was a day of freedom for them.\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: The task is asking you to:\n","\n","1. Understand the given Chinese sentence.\n","2. 
Translate the Chinese sentence into English.\n","3. If the sentence is incomplete or you are unsure about the meaning, simply copy the input text as your output.\n","4. Do not output any additional sentences such as explanations or reasoning.\n","\n","Here's how to use this task:\n","\n","1. Read the given Chinese sentence: 奶奶嫁到单家, 其实也是天意。那天, 我奶奶在秋千架旁与一些尖足长辫的大闺女耍笑游戏, 那天是清明节, 桃红柳绿, 细雨霏霏, 人面桃花, 女儿解放。\n","2. Translate the sentence into English, ensuring that you understand the meaning of the words and the context of the sentence.\n","3. If you find any part of the sentence unclear or incomplete, simply copy the input text as your output.\n","4. Do not add any additional sentences or explanations in your translation.\n","\n","Translation: \"Grandma married into the Shàn family, and in fact, it was fate. On that day, my grandma was playing games with some big girls with sharp-toed shoes and long braids near the swing frame. It was Qingming Festival, with peach blossoms turning red and willows turning green, fine rain falling, people's\n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 325\n","--------------------------------------------------\n","chinese: 劫路人催逼着奶奶往高粱地里走,他的手始终按着腰里的家伙。\n","--------------------------------------------------\n","english: The highwayman began pushing her into the sorghum field, his hand never leaving the object at his belt.\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: The sentence you provided is a complete Chinese sentence. 
To translate it into English, I will break it down into its components and then reconstruct the sentence in English.\n","\n","劫路人 (jiǎolù rén) - bandit/robber thief\n","催逼着 (cūpì zhe) - urged/persuaded\n","奶奶 (nǎniángiān) - grandmother\n","往 (wǎng) - towards/to\n","高粱地 (gāoláng dì) - sorghum field\n","里 (lǐ) - inside/within\n","走 (zǒu) - to walk/go\n","他的 (tā de) - his\n","手 (shǒu) - hand\n","始终 (shǐzhōng) - always/all the time\n","按着 (àn zhe) - holding/pressing\n","腰里 (yāolǐ) - in the waist/at the waist\n","的家伙 (jiāwǒ) - thing/weapon\n","\n","Translating the sentence:\n","\n","\"The bandit thief urged his grandmother to go towards the sorghum field, his hand always holding the thing at his waist.\"\n","\n","So, the English translation of the given Chinese sentence is:\n","\n","\"The bandit thief urged his grandmother to go towards the sorghum field, his hand\n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 316\n","--------------------------------------------------\n","chinese: “听到了吗?\n","--------------------------------------------------\n","english: 'Did you hear that?'\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: \"Did you hear that?\"\n","Part 1: Translate Chinese to English\n","Usage: \"听到了吗?\" translates to \"Did you hear that?\". This meets the criteria because the given Chinese sentence is translated into its English equivalent.\n","\n","Part 2: If it is an incomplete sentence\n","Usage: If the input was \"听到\", it would be considered an incomplete sentence. In this case, the output should be the same as the input: \"听到\". This meets the criteria because the input is an incomplete sentence, so no translation is provided.\n","\n","Part 3: If unsure about the meaning\n","Usage: If the input was \"吃了吗?\", which means \"Have you eaten?\", the assistant could be unsure about the exact meaning. In this case, the output should be the same as the input: \"吃了吗?\". 
This meets the criteria because the assistant is unsure about the meaning, so the input is copied as the output.\n","Task: Translate the given Chinese sentence to English. If the sentence is incomplete or the meaning is unclear, simply copy the input text as the output.\n","\n","Example input: “你叫什么名字?”\n","\n","Step 1: Identify if the sentence is incomplete or unclear. In this case, the sentence is complete and clear.\n","\n","Step 2: Translate the\n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 300\n","--------------------------------------------------\n","chinese: 好在吴佩珍是压得起的,她的人生任务不如王琦瑶来得重,有一点吃老本,也有一点不计较,本是一身轻,也是为王琦瑶分担的意思。\n","--------------------------------------------------\n","english: It was a good thing that Wu Peizhen could take it; after all, the weight of everyday living did not rest as heavily on her. This was partly because she had plenty of psychic capital to draw on, but also because she simply did not mind. Things came easy to her and she was willing to bear more than her share.\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: The task is asking you to translate a given Chinese sentence into English. Here are the simple steps to follow:\n","\n","1. Read the given Chinese sentence carefully and try to understand its meaning.\n","2. If the sentence is incomplete or you are unsure about its meaning, copy the input text as your output without attempting to translate it.\n","3. If you understand the meaning of the sentence, translate it into English while maintaining the original meaning as closely as possible.\n","4. Do not add any additional sentences, explanations, or reasoning in your translation.\n","\n","For the given Chinese sentence: 好在吴佩珍是压得起的,她的人生任务不如王琦瑶来得重,有一点吃老本,也有一点不计较,本是一身轻,也是为王琦瑶分担的意思。\n","\n","1. Read the sentence and try to understand its meaning.\n","2. The sentence is complete, so you can proceed to translate it.\n","3. 
Translate the sentence into English: \"Fortunately, Wu Peizhen can bear the weight, her life's tasks are not as heavy as those of Wang Qiliao. She has a little bit of relying on the old, a little bit of not caring, and she is light-hearted, which also means sharing the burden with Wang Qiliao.\"\n","4. Your final output should be: \"Fortunately, Wu Peizhen can bear the weight, her life's tasks are not\n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 331\n","--------------------------------------------------\n","chinese: 又想:“倘若这里真是皇宫,那么老吴、温家哥儿,还有那个小玄子都是太监了。\n","--------------------------------------------------\n","english: If this really is the Forbidden City, then old Wu and the Wen brothers and little Misty must all of them be eunuchs.\n","--------------------------------------------------\n","01-ai/Yi-1.5-9B-Chat/shots-00: I am translating the given Chinese sentence into English.\n","\n","Chinese: 又想: “倘若这里真是皇宫, 那么老吴、 温家哥儿, 还有那个小玄子都是太监了。\n","\n","Step 1: Break down the sentence into smaller parts.\n","- 又想:\n","- “倘若这里真是皇宫,\n","- 那么\n","- 老吴、\n","- 温家哥儿,\n","- 还有那个\n","- 小玄子\n","- 都是太监了。\n","\n","Step 2: Translate each part into English.\n","- 又想: (Once again, he thought)\n","- “倘若这里真是皇宫, (If this really is the imperial palace,)\n","- 那么 (then)\n","- 老吴、 (Old Wu,)\n","- 温家哥儿, (the young man from the Wen family,)\n","- 还有那个 (and that little Xuanzi)\n","- 小玄子 (also)\n","- 都是太监了。 (are eunuchs.)\n","\n","Step 3: Combine the translated parts into a coherent English sentence.\n","\n","English: Once again, he thought: \"If this really is the imperial palace, then Old Wu, the young man from the Wen family, and that little Xuanzi are all eunuchs.\"\n","--------------------------------------------------\n","output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00: 302\n"]}],"source":["output_tokens = f\"output_tokens-{col}\"\n","df2 = df[df[output_tokens] >= max_new_tokens][\n"," [\"chinese\", \"english\", col, 
output_tokens]\n","]\n","print_row_details(df2, range(len(df2)))"]},{"cell_type":"code","execution_count":30,"metadata":{},"outputs":[{"data":{"text/plain":["18"]},"execution_count":30,"metadata":{},"output_type":"execute_result"}],"source":["len(df2)"]},{"cell_type":"code","execution_count":31,"metadata":{},"outputs":[{"data":{"text/html":["<div>\n","<style scoped>\n"," .dataframe tbody tr th:only-of-type {\n"," vertical-align: middle;\n"," }\n","\n"," .dataframe tbody tr th {\n"," vertical-align: top;\n"," }\n","\n"," .dataframe thead th {\n"," text-align: right;\n"," }\n","</style>\n","<table border=\"1\" class=\"dataframe\">\n"," <thead>\n"," <tr style=\"text-align: right;\">\n"," <th></th>\n"," <th>ground_truth_ews_score</th>\n"," <th>ground_truth_repetition_score</th>\n"," <th>ground_truth_total_repetitions</th>\n"," <th>ews_score</th>\n"," <th>repetition_score</th>\n"," <th>total_repetitions</th>\n"," <th>ground_truth_tokens-01-ai/Yi-1.5-9B-Chat</th>\n"," <th>output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00</th>\n"," </tr>\n"," </thead>\n"," <tbody>\n"," <tr>\n"," <th>count</th>\n"," <td>1133.0</td>\n"," <td>1133.000000</td>\n"," <td>1133.000000</td>\n"," <td>1133.000000</td>\n"," <td>1133.000000</td>\n"," <td>1133.000000</td>\n"," <td>1133.000000</td>\n"," <td>1133.000000</td>\n"," </tr>\n"," <tr>\n"," <th>mean</th>\n"," <td>0.0</td>\n"," <td>0.312445</td>\n"," <td>0.312445</td>\n"," <td>0.008826</td>\n"," <td>1.614298</td>\n"," <td>1.623124</td>\n"," <td>33.044131</td>\n"," <td>59.693733</td>\n"," </tr>\n"," <tr>\n"," <th>std</th>\n"," <td>0.0</td>\n"," <td>7.193649</td>\n"," <td>7.193649</td>\n"," <td>0.209980</td>\n"," <td>36.834513</td>\n"," <td>36.834724</td>\n"," <td>22.889653</td>\n"," <td>65.755925</td>\n"," </tr>\n"," <tr>\n"," <th>min</th>\n"," <td>0.0</td>\n"," <td>0.000000</td>\n"," <td>0.000000</td>\n"," <td>0.000000</td>\n"," <td>0.000000</td>\n"," <td>0.000000</td>\n"," <td>1.000000</td>\n"," <td>4.000000</td>\n"," </tr>\n"," <tr>\n"," 
<th>25%</th>\n"," <td>0.0</td>\n"," <td>0.000000</td>\n"," <td>0.000000</td>\n"," <td>0.000000</td>\n"," <td>0.000000</td>\n"," <td>0.000000</td>\n"," <td>17.000000</td>\n"," <td>21.000000</td>\n"," </tr>\n"," <tr>\n"," <th>50%</th>\n"," <td>0.0</td>\n"," <td>0.000000</td>\n"," <td>0.000000</td>\n"," <td>0.000000</td>\n"," <td>0.000000</td>\n"," <td>0.000000</td>\n"," <td>28.000000</td>\n"," <td>37.000000</td>\n"," </tr>\n"," <tr>\n"," <th>75%</th>\n"," <td>0.0</td>\n"," <td>0.000000</td>\n"," <td>0.000000</td>\n"," <td>0.000000</td>\n"," <td>0.000000</td>\n"," <td>0.000000</td>\n"," <td>42.000000</td>\n"," <td>66.000000</td>\n"," </tr>\n"," <tr>\n"," <th>max</th>\n"," <td>0.0</td>\n"," <td>239.000000</td>\n"," <td>239.000000</td>\n"," <td>5.000000</td>\n"," <td>1224.000000</td>\n"," <td>1224.000000</td>\n"," <td>154.000000</td>\n"," <td>331.000000</td>\n"," </tr>\n"," </tbody>\n","</table>\n","</div>"],"text/plain":[" ground_truth_ews_score ground_truth_repetition_score \\\n","count 1133.0 1133.000000 \n","mean 0.0 0.312445 \n","std 0.0 7.193649 \n","min 0.0 0.000000 \n","25% 0.0 0.000000 \n","50% 0.0 0.000000 \n","75% 0.0 0.000000 \n","max 0.0 239.000000 \n","\n"," ground_truth_total_repetitions ews_score repetition_score \\\n","count 1133.000000 1133.000000 1133.000000 \n","mean 0.312445 0.008826 1.614298 \n","std 7.193649 0.209980 36.834513 \n","min 0.000000 0.000000 0.000000 \n","25% 0.000000 0.000000 0.000000 \n","50% 0.000000 0.000000 0.000000 \n","75% 0.000000 0.000000 0.000000 \n","max 239.000000 5.000000 1224.000000 \n","\n"," total_repetitions ground_truth_tokens-01-ai/Yi-1.5-9B-Chat \\\n","count 1133.000000 1133.000000 \n","mean 1.623124 33.044131 \n","std 36.834724 22.889653 \n","min 0.000000 1.000000 \n","25% 0.000000 17.000000 \n","50% 0.000000 28.000000 \n","75% 0.000000 42.000000 \n","max 1224.000000 154.000000 \n","\n"," output_tokens-01-ai/Yi-1.5-9B-Chat/shots-00 \n","count 1133.000000 \n","mean 59.693733 \n","std 65.755925 \n","min 4.000000 
\n","25% 21.000000 \n","50% 37.000000 \n","75% 66.000000 \n","max 331.000000 "]},"execution_count":31,"metadata":{},"output_type":"execute_result"}],"source":["df.describe()"]},{"cell_type":"code","execution_count":32,"metadata":{},"outputs":[],"source":["metrics_df.to_csv(results_path.replace(\".csv\", \"_metrics.csv\"), index=False)"]}],"metadata":{"accelerator":"GPU","application/vnd.databricks.v1+notebook":{"dashboards":[],"environmentMetadata":null,"language":"python","notebookMetadata":{"mostRecentlyExecutedCommandWithImplicitDF":{"commandId":-1,"dataframes":["_sqldf"]},"pythonIndentUnit":4},"notebookName":"10_eval-lf-medium-py3.11","widgets":{}},"colab":{"gpuType":"L4","provenance":[]},"kernelspec":{"display_name":"Python 3","name":"python3"},"language_info":{"codemirror_mode":{"name":"ipython","version":3},"file_extension":".py","mimetype":"text/x-python","name":"python","nbconvert_exporter":"python","pygments_lexer":"ipython3","version":"3.11.9"}},"nbformat":4,"nbformat_minor":0}
|