diff --git a/analyze_scores.ipynb b/analyze_scores.ipynb new file mode 100644 index 0000000..e62b14a --- /dev/null +++ b/analyze_scores.ipynb @@ -0,0 +1,13171 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "id": "9169e316-80c7-460e-86d1-bca78ce044d3", + "metadata": {}, + "outputs": [], + "source": [ + "import csv\n", + "from pathlib import Path\n", + "\n", + "import numpy as np\n", + "import pandas as pd" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "9573a7f9-058c-47af-9af1-50fb4d454abb", + "metadata": {}, + "outputs": [], + "source": [ + "pd.set_option('display.max_colwidth', None)\n", + "pd.set_option('display.colheader_justify', 'center')" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "a199810d-893f-494d-b560-a1a82612bd13", + "metadata": {}, + "outputs": [], + "source": [ + "SAMPLE_AUDIO_PATH = \"generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wav\"\n", + "EVAL_MAP_PATH = \"reports/eval_map.csv\"\n", + "SCORES_PATH = \"data/scores_results.xlsx\"" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "ac502266-1c5e-4dce-add2-a57d107571ed", + "metadata": {}, + "outputs": [], + "source": [ + "## NOTE: all model keys need to be composed of a single letter followed by a number\n", + "model2folder = {\n", + " \"m1\": 'generated_hifi/esd_tune/g_3164999',\n", + " \"m2\": 'generated_hifi/esd_tune_reversal/g_3164999',\n", + " \"m3\": 'generated_hifi/esd_tune_advloss0/g_3164999',\n", + "}" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "b79125a1-4e4a-483a-a498-ea95ed0eb61d", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "{'generated_hifi/esd_tune/g_3164999': 'm1',\n", + " 'generated_hifi/esd_tune_reversal/g_3164999': 'm2',\n", + " 'generated_hifi/esd_tune_advloss0/g_3164999': 'm3'}" + ] + }, + "execution_count": 5, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "folder2model = {v: k for k, v in model2folder.items()}\n", + "folder2model" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "id": "8a2711f2-14ea-48f8-b8a4-bd6e5d845a0d", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
012345
0--id_1id_2id_3-
1We got few vegetables and fruits , and became fish eaters .0011generated_hifi/esd_tune_reversal/g_3164999/0011/angry/1.wavgenerated_hifi/esd_tune/g_3164999/0011/angry/1.wavgenerated_hifi/esd_tune_advloss0/g_3164999/0011/angry/1.wavWe got few vegetables and fruits , and became fish eaters .
2--id_4id_5id_6-
3Humans also judge distance by using the relative sizes of objects.0011generated_hifi/esd_tune_reversal/g_3164999/0011/angry/10.wavgenerated_hifi/esd_tune_advloss0/g_3164999/0011/angry/10.wavgenerated_hifi/esd_tune/g_3164999/0011/angry/10.wavHumans also judge distance by using the relative sizes of objects.
4--id_7id_8id_9-
.....................
2695The Claudine was leaving next morning for Honolulu .0020generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/7.wavgenerated_hifi/esd_tune/g_3164999/0020/surprise/7.wavgenerated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/7.wavThe Claudine was leaving next morning for Honolulu .
2696--id_4045id_4046id_4047-
2697Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.0020generated_hifi/esd_tune/g_3164999/0020/surprise/8.wavgenerated_hifi/esd_tune_reversal/g_3164999/0020/surprise/8.wavgenerated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/8.wavProsecutors have opened a massive investigation into allegations of fixing games and illegal betting.
2698--id_4048id_4049id_4050-
2699Different telescope designs perform differently, and have different strengths and weaknesses.0020generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wavgenerated_hifi/esd_tune_reversal/g_3164999/0020/surprise/9.wavgenerated_hifi/esd_tune/g_3164999/0020/surprise/9.wavDifferent telescope designs perform differently, and have different strengths and weaknesses.
\n", + "

2700 rows × 6 columns

\n", + "
" + ], + "text/plain": [ + " 0 \\\n", + "0 - \n", + "1 We got few vegetables and fruits , and became fish eaters . \n", + "2 - \n", + "3 Humans also judge distance by using the relative sizes of objects. \n", + "4 - \n", + "... ... \n", + "2695 The Claudine was leaving next morning for Honolulu . \n", + "2696 - \n", + "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n", + "2698 - \n", + "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n", + "\n", + " 1 2 \\\n", + "0 - id_1 \n", + "1 0011 generated_hifi/esd_tune_reversal/g_3164999/0011/angry/1.wav \n", + "2 - id_4 \n", + "3 0011 generated_hifi/esd_tune_reversal/g_3164999/0011/angry/10.wav \n", + "4 - id_7 \n", + "... ... ... \n", + "2695 0020 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/7.wav \n", + "2696 - id_4045 \n", + "2697 0020 generated_hifi/esd_tune/g_3164999/0020/surprise/8.wav \n", + "2698 - id_4048 \n", + "2699 0020 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wav \n", + "\n", + " 3 \\\n", + "0 id_2 \n", + "1 generated_hifi/esd_tune/g_3164999/0011/angry/1.wav \n", + "2 id_5 \n", + "3 generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/10.wav \n", + "4 id_8 \n", + "... ... \n", + "2695 generated_hifi/esd_tune/g_3164999/0020/surprise/7.wav \n", + "2696 id_4046 \n", + "2697 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/8.wav \n", + "2698 id_4049 \n", + "2699 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/9.wav \n", + "\n", + " 4 \\\n", + "0 id_3 \n", + "1 generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/1.wav \n", + "2 id_6 \n", + "3 generated_hifi/esd_tune/g_3164999/0011/angry/10.wav \n", + "4 id_9 \n", + "... ... \n", + "2695 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/7.wav \n", + "2696 id_4047 \n", + "2697 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/8.wav \n", + "2698 id_4050 \n", + "2699 generated_hifi/esd_tune/g_3164999/0020/surprise/9.wav \n", + "\n", + " 5 \n", + "0 - \n", + "1 We got few vegetables and fruits , and became fish eaters . \n", + "2 - \n", + "3 Humans also judge distance by using the relative sizes of objects. \n", + "4 - \n", + "... ... \n", + "2695 The Claudine was leaving next morning for Honolulu . \n", + "2696 - \n", + "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n", + "2698 - \n", + "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n", + "\n", + "[2700 rows x 6 columns]" + ] + }, + "execution_count": 6, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_map = pd.read_csv(\n", + " EVAL_MAP_PATH,\n", + " sep = \"\\t\",\n", + " header = None,\n", + " quoting = csv.QUOTE_NONE,\n", + ")\n", + "\n", + "df_map" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "cb751630-b2aa-41e4-a8ad-333c4c514c4e", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "{'model': 'm3', 'sent_id': 9, 'speaker': '0020', 'accent': None}" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "def get_audio_details(f):\n", + " f_path = Path(f)\n", + " model_ = folder2model[str(f_path.parent.parent.parent)]\n", + " basename_ = f_path.name\n", + " sentence_id = int(f_path.stem)\n", + " speaker = f_path.parent.parent.name\n", + " accent = None\n", + " return {\n", + " 'model': model_,\n", + " 'sent_id': sentence_id,\n", + " 'speaker': speaker,\n", + " 'accent': accent\n", + " }\n", + "\n", + "\n", + "get_audio_details(SAMPLE_AUDIO_PATH)" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "id": "0e1d24c8-b8a8-4dfe-a5b1-e390dbf939bd", + "metadata": {}, + "outputs": [], + "source": [ + "def process_cell(f):\n", + " if Path(f).exists():\n", + " return get_audio_details(f)\n", + " return (f)" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "id": "b016e6c7-a310-443b-83ca-6b477d5efb3d", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
text_leftspeakerm1m2m3text_right
0--id_1id_2id_3-
1We got few vegetables and fruits , and became fish eaters .0011{'model': 'm2', 'sent_id': 1, 'speaker': '0011', 'accent': None}{'model': 'm1', 'sent_id': 1, 'speaker': '0011', 'accent': None}{'model': 'm3', 'sent_id': 1, 'speaker': '0011', 'accent': None}We got few vegetables and fruits , and became fish eaters .
2--id_4id_5id_6-
3Humans also judge distance by using the relative sizes of objects.0011{'model': 'm2', 'sent_id': 10, 'speaker': '0011', 'accent': None}{'model': 'm3', 'sent_id': 10, 'speaker': '0011', 'accent': None}{'model': 'm1', 'sent_id': 10, 'speaker': '0011', 'accent': None}Humans also judge distance by using the relative sizes of objects.
4--id_7id_8id_9-
.....................
2695The Claudine was leaving next morning for Honolulu .0020{'model': 'm2', 'sent_id': 7, 'speaker': '0020', 'accent': None}{'model': 'm1', 'sent_id': 7, 'speaker': '0020', 'accent': None}{'model': 'm3', 'sent_id': 7, 'speaker': '0020', 'accent': None}The Claudine was leaving next morning for Honolulu .
2696--id_4045id_4046id_4047-
2697Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.0020{'model': 'm1', 'sent_id': 8, 'speaker': '0020', 'accent': None}{'model': 'm2', 'sent_id': 8, 'speaker': '0020', 'accent': None}{'model': 'm3', 'sent_id': 8, 'speaker': '0020', 'accent': None}Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.
2698--id_4048id_4049id_4050-
2699Different telescope designs perform differently, and have different strengths and weaknesses.0020{'model': 'm3', 'sent_id': 9, 'speaker': '0020', 'accent': None}{'model': 'm2', 'sent_id': 9, 'speaker': '0020', 'accent': None}{'model': 'm1', 'sent_id': 9, 'speaker': '0020', 'accent': None}Different telescope designs perform differently, and have different strengths and weaknesses.
\n", + "

2700 rows × 6 columns

\n", + "
" + ], + "text/plain": [ + " text_left \\\n", + "0 - \n", + "1 We got few vegetables and fruits , and became fish eaters . \n", + "2 - \n", + "3 Humans also judge distance by using the relative sizes of objects. \n", + "4 - \n", + "... ... \n", + "2695 The Claudine was leaving next morning for Honolulu . \n", + "2696 - \n", + "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n", + "2698 - \n", + "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n", + "\n", + " speaker \\\n", + "0 - \n", + "1 0011 \n", + "2 - \n", + "3 0011 \n", + "4 - \n", + "... ... \n", + "2695 0020 \n", + "2696 - \n", + "2697 0020 \n", + "2698 - \n", + "2699 0020 \n", + "\n", + " m1 \\\n", + "0 id_1 \n", + "1 {'model': 'm2', 'sent_id': 1, 'speaker': '0011', 'accent': None} \n", + "2 id_4 \n", + "3 {'model': 'm2', 'sent_id': 10, 'speaker': '0011', 'accent': None} \n", + "4 id_7 \n", + "... ... \n", + "2695 {'model': 'm2', 'sent_id': 7, 'speaker': '0020', 'accent': None} \n", + "2696 id_4045 \n", + "2697 {'model': 'm1', 'sent_id': 8, 'speaker': '0020', 'accent': None} \n", + "2698 id_4048 \n", + "2699 {'model': 'm3', 'sent_id': 9, 'speaker': '0020', 'accent': None} \n", + "\n", + " m2 \\\n", + "0 id_2 \n", + "1 {'model': 'm1', 'sent_id': 1, 'speaker': '0011', 'accent': None} \n", + "2 id_5 \n", + "3 {'model': 'm3', 'sent_id': 10, 'speaker': '0011', 'accent': None} \n", + "4 id_8 \n", + "... ... \n", + "2695 {'model': 'm1', 'sent_id': 7, 'speaker': '0020', 'accent': None} \n", + "2696 id_4046 \n", + "2697 {'model': 'm2', 'sent_id': 8, 'speaker': '0020', 'accent': None} \n", + "2698 id_4049 \n", + "2699 {'model': 'm2', 'sent_id': 9, 'speaker': '0020', 'accent': None} \n", + "\n", + " m3 \\\n", + "0 id_3 \n", + "1 {'model': 'm3', 'sent_id': 1, 'speaker': '0011', 'accent': None} \n", + "2 id_6 \n", + "3 {'model': 'm1', 'sent_id': 10, 'speaker': '0011', 'accent': None} \n", + "4 id_9 \n", + "... ... \n", + "2695 {'model': 'm3', 'sent_id': 7, 'speaker': '0020', 'accent': None} \n", + "2696 id_4047 \n", + "2697 {'model': 'm3', 'sent_id': 8, 'speaker': '0020', 'accent': None} \n", + "2698 id_4050 \n", + "2699 {'model': 'm1', 'sent_id': 9, 'speaker': '0020', 'accent': None} \n", + "\n", + " text_right \n", + "0 - \n", + "1 We got few vegetables and fruits , and became fish eaters . \n", + "2 - \n", + "3 Humans also judge distance by using the relative sizes of objects. \n", + "4 - \n", + "... ... \n", + "2695 The Claudine was leaving next morning for Honolulu . \n", + "2696 - \n", + "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n", + "2698 - \n", + "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n", + "\n", + "[2700 rows x 6 columns]" + ] + }, + "execution_count": 9, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_detailed = df_map.applymap(lambda f: process_cell(f))\n", + "df_detailed.columns = ['text_left', 'speaker', 'm1', 'm2', 'm3', 'text_right']\n", + "df_detailed" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "id": "16a4bd24-b5e8-4762-98b5-62c38ca5f72e", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "3" + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "total_K_models = len(model2folder)\n", + "total_K_models" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "b1184636-00f8-4ab7-a9d3-629095c56876", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "1350" + ] + }, + "execution_count": 11, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "total_wavs_per_model = int(len(df_map) / 2)\n", + "total_wavs_per_model" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "85b862ab-fd48-45cf-af1e-78e26c9183e4", + "metadata": {}, + "outputs": [], + "source": [ + "x_range = np.array(list(range(total_wavs_per_model)))\n", + "x_indices = x_range * 2\n", + "y_indices = x_range * 2 + 1" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "id": "9bd825c9-5b4e-4e62-a1b3-63c1208a78ae", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0 id_1\n", + "2 id_4\n", + "4 id_7\n", + "6 id_10\n", + "8 id_13\n", + " ... \n", + "2690 id_4036\n", + "2692 id_4039\n", + "2694 id_4042\n", + "2696 id_4045\n", + "2698 id_4048\n", + "Name: m1, Length: 1350, dtype: object" + ] + }, + "execution_count": 13, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "m1_indices = df_detailed['m1'].iloc[x_indices]\n", + "m2_indices = df_detailed['m2'].iloc[x_indices]\n", + "m3_indices = df_detailed['m3'].iloc[x_indices]\n", + "m1_indices" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "id": "bbac06d5-fcb6-457c-ac87-557c9634bd1e", + "metadata": { + "scrolled": true, + "tags": [] + }, + "outputs": [ + { + "data": { + "text/plain": [ + "{'id_1': {'model': 'm2', 'sent_id': 1, 'speaker': '0011', 'accent': None},\n", + " 'id_4': {'model': 'm2', 'sent_id': 10, 'speaker': '0011', 'accent': None},\n", + " 'id_7': {'model': 'm1', 'sent_id': 11, 'speaker': '0011', 'accent': None},\n", + " 'id_10': {'model': 'm1', 'sent_id': 12, 'speaker': '0011', 'accent': None},\n", + " 'id_13': {'model': 'm3', 'sent_id': 13, 'speaker': '0011', 'accent': None},\n", + " 'id_16': {'model': 'm3', 'sent_id': 14, 'speaker': '0011', 'accent': None},\n", + " 'id_19': {'model': 'm1', 'sent_id': 15, 'speaker': '0011', 'accent': None},\n", + " 'id_22': {'model': 'm3', 'sent_id': 16, 'speaker': '0011', 'accent': None},\n", + " 'id_25': {'model': 'm1', 'sent_id': 17, 'speaker': '0011', 'accent': None},\n", + " 'id_28': {'model': 'm3', 'sent_id': 18, 'speaker': '0011', 'accent': None},\n", + " 'id_31': {'model': 'm1', 'sent_id': 19, 'speaker': '0011', 'accent': None},\n", + " 'id_34': {'model': 'm3', 'sent_id': 2, 'speaker': '0011', 'accent': None},\n", + " 'id_37': {'model': 'm3', 'sent_id': 20, 'speaker': '0011', 'accent': None},\n", + " 'id_40': {'model': 'm3', 'sent_id': 21, 'speaker': '0011', 'accent': None},\n", + " 'id_43': {'model': 'm3', 'sent_id': 22, 'speaker': '0011', 'accent': None},\n", + " 'id_46': {'model': 'm2', 'sent_id': 23, 'speaker': '0011', 'accent': None},\n", + " 'id_49': {'model': 'm3', 'sent_id': 24, 'speaker': '0011', 'accent': None},\n", + " 'id_52': {'model': 'm2', 'sent_id': 25, 'speaker': '0011', 'accent': None},\n", + " 'id_55': {'model': 'm3', 'sent_id': 26, 'speaker': '0011', 'accent': None},\n", + " 'id_58': {'model': 'm1', 'sent_id': 27, 'speaker': '0011', 'accent': None},\n", + " 'id_61': {'model': 'm1', 'sent_id': 28, 'speaker': '0011', 'accent': None},\n", + " 'id_64': {'model': 'm2', 'sent_id': 29, 'speaker': '0011', 'accent': None},\n", + " 'id_67': {'model': 'm3', 'sent_id': 3, 'speaker': '0011', 'accent': None},\n", + " 'id_70': {'model': 'm2', 'sent_id': 30, 'speaker': '0011', 'accent': None},\n", + " 'id_73': {'model': 'm3', 'sent_id': 4, 'speaker': '0011', 'accent': None},\n", + " 'id_76': {'model': 'm3', 'sent_id': 5, 'speaker': '0011', 'accent': None},\n", + " 'id_79': {'model': 'm1', 'sent_id': 6, 'speaker': '0011', 'accent': None},\n", + " 'id_82': {'model': 'm1', 'sent_id': 7, 'speaker': '0011', 'accent': None},\n", + " 'id_85': {'model': 'm3', 'sent_id': 8, 'speaker': '0011', 'accent': None},\n", + " 'id_88': {'model': 'm1', 'sent_id': 9, 'speaker': '0011', 'accent': None},\n", + " 'id_91': {'model': 'm2', 'sent_id': 1, 'speaker': '0011', 'accent': None},\n", + " 'id_94': {'model': 'm1', 'sent_id': 10, 'speaker': '0011', 'accent': None},\n", + " 'id_97': {'model': 'm3', 'sent_id': 11, 'speaker': '0011', 'accent': None},\n", + " 'id_100': {'model': 'm3', 'sent_id': 12, 'speaker': '0011', 'accent': None},\n", + " 'id_103': {'model': 'm3', 'sent_id': 13, 'speaker': '0011', 'accent': None},\n", + " 'id_106': {'model': 'm1', 'sent_id': 14, 'speaker': '0011', 'accent': None},\n", + " 'id_109': {'model': 'm2', 'sent_id': 15, 'speaker': '0011', 'accent': None},\n", + " 'id_112': {'model': 'm1', 'sent_id': 16, 'speaker': '0011', 'accent': None},\n", + " 'id_115': {'model': 'm3', 'sent_id': 17, 'speaker': '0011', 'accent': None},\n", + " 'id_118': {'model': 'm2', 'sent_id': 18, 'speaker': '0011', 'accent': None},\n", + " 'id_121': {'model': 'm2', 'sent_id': 19, 'speaker': '0011', 'accent': None},\n", + " 'id_124': {'model': 'm3', 'sent_id': 2, 'speaker': '0011', 'accent': None},\n", + " 'id_127': {'model': 'm1', 'sent_id': 20, 'speaker': '0011', 'accent': None},\n", + " 'id_130': {'model': 'm3', 'sent_id': 21, 'speaker': '0011', 'accent': None},\n", + " 'id_133': {'model': 'm3', 'sent_id': 22, 'speaker': '0011', 'accent': None},\n", + " 'id_136': {'model': 'm2', 'sent_id': 23, 'speaker': '0011', 'accent': None},\n", + " 'id_139': {'model': 'm1', 'sent_id': 24, 'speaker': '0011', 'accent': None},\n", + " 'id_142': {'model': 'm1', 'sent_id': 25, 'speaker': '0011', 'accent': None},\n", + " 'id_145': {'model': 'm2', 'sent_id': 26, 'speaker': '0011', 'accent': None},\n", + " 'id_148': {'model': 'm2', 'sent_id': 27, 'speaker': '0011', 'accent': None},\n", + " 'id_151': {'model': 'm2', 'sent_id': 28, 'speaker': '0011', 'accent': None},\n", + " 'id_154': {'model': 'm1', 'sent_id': 29, 'speaker': '0011', 'accent': None},\n", + " 'id_157': {'model': 'm2', 'sent_id': 3, 'speaker': '0011', 'accent': None},\n", + " 'id_160': {'model': 'm3', 'sent_id': 30, 'speaker': '0011', 'accent': None},\n", + " 'id_163': {'model': 'm3', 'sent_id': 4, 'speaker': '0011', 'accent': None},\n", + " 'id_166': {'model': 'm1', 'sent_id': 5, 'speaker': '0011', 'accent': None},\n", + " 'id_169': {'model': 'm2', 'sent_id': 6, 'speaker': '0011', 'accent': None},\n", + " 'id_172': {'model': 'm1', 'sent_id': 7, 'speaker': '0011', 'accent': None},\n", + " 'id_175': {'model': 'm3', 'sent_id': 8, 'speaker': '0011', 'accent': None},\n", + " 'id_178': {'model': 'm3', 'sent_id': 9, 'speaker': '0011', 'accent': None},\n", + " 'id_181': {'model': 'm3', 'sent_id': 1, 'speaker': '0011', 'accent': None},\n", + " 'id_184': {'model': 'm2', 'sent_id': 10, 'speaker': '0011', 'accent': None},\n", + " 'id_187': {'model': 'm2', 'sent_id': 11, 'speaker': '0011', 'accent': None},\n", + " 'id_190': {'model': 'm2', 'sent_id': 12, 'speaker': '0011', 'accent': None},\n", + " 'id_193': {'model': 'm3', 'sent_id': 13, 'speaker': '0011', 'accent': None},\n", + " 'id_196': {'model': 'm2', 'sent_id': 14, 'speaker': '0011', 'accent': None},\n", + " 'id_199': {'model': 'm1', 'sent_id': 15, 'speaker': '0011', 'accent': None},\n", + " 'id_202': {'model': 'm1', 'sent_id': 16, 'speaker': '0011', 'accent': None},\n", + " 'id_205': {'model': 'm2', 'sent_id': 17, 'speaker': '0011', 'accent': None},\n", + " 'id_208': {'model': 'm3', 'sent_id': 18, 'speaker': '0011', 'accent': None},\n", + " 'id_211': {'model': 'm2', 'sent_id': 19, 'speaker': '0011', 'accent': None},\n", + " 'id_214': {'model': 'm3', 'sent_id': 2, 'speaker': '0011', 'accent': None},\n", + " 'id_217': {'model': 'm3', 'sent_id': 20, 'speaker': '0011', 'accent': None},\n", + " 'id_220': {'model': 'm2', 'sent_id': 21, 'speaker': '0011', 'accent': None},\n", + " 'id_223': {'model': 'm3', 'sent_id': 22, 'speaker': '0011', 'accent': None},\n", + " 'id_226': {'model': 'm3', 'sent_id': 23, 'speaker': '0011', 'accent': None},\n", + " 'id_229': {'model': 'm1', 'sent_id': 24, 'speaker': '0011', 'accent': None},\n", + " 'id_232': {'model': 'm1', 'sent_id': 25, 'speaker': '0011', 'accent': None},\n", + " 'id_235': {'model': 'm1', 'sent_id': 26, 'speaker': '0011', 'accent': None},\n", + " 'id_238': {'model': 'm1', 'sent_id': 27, 'speaker': '0011', 'accent': None},\n", + " 'id_241': {'model': 'm3', 'sent_id': 28, 'speaker': '0011', 'accent': None},\n", + " 'id_244': {'model': 'm2', 'sent_id': 29, 'speaker': '0011', 'accent': None},\n", + " 'id_247': {'model': 'm1', 'sent_id': 3, 'speaker': '0011', 'accent': None},\n", + " 'id_250': {'model': 'm2', 'sent_id': 30, 'speaker': '0011', 'accent': None},\n", + " 'id_253': {'model': 'm3', 'sent_id': 4, 'speaker': '0011', 'accent': None},\n", + " 'id_256': {'model': 'm3', 'sent_id': 5, 'speaker': '0011', 'accent': None},\n", + " 'id_259': {'model': 'm3', 'sent_id': 6, 'speaker': '0011', 'accent': None},\n", + " 'id_262': {'model': 'm1', 'sent_id': 7, 'speaker': '0011', 'accent': None},\n", + " 'id_265': {'model': 'm1', 'sent_id': 8, 'speaker': '0011', 'accent': None},\n", + " 'id_268': {'model': 'm2', 'sent_id': 9, 'speaker': '0011', 'accent': None},\n", + " 'id_271': {'model': 'm2', 'sent_id': 1, 'speaker': '0011', 'accent': None},\n", + " 'id_274': {'model': 'm3', 'sent_id': 10, 'speaker': '0011', 'accent': None},\n", + " 'id_277': {'model': 'm3', 'sent_id': 11, 'speaker': '0011', 'accent': None},\n", + " 'id_280': {'model': 'm1', 'sent_id': 12, 'speaker': '0011', 'accent': None},\n", + " 'id_283': {'model': 'm1', 'sent_id': 13, 'speaker': '0011', 'accent': None},\n", + " 'id_286': {'model': 'm1', 'sent_id': 14, 'speaker': '0011', 'accent': None},\n", + " 'id_289': {'model': 'm1', 'sent_id': 15, 'speaker': '0011', 'accent': None},\n", + " 'id_292': {'model': 'm3', 'sent_id': 16, 'speaker': '0011', 'accent': None},\n", + " 'id_295': {'model': 'm3', 'sent_id': 17, 'speaker': '0011', 'accent': None},\n", + " 'id_298': {'model': 'm1', 'sent_id': 18, 'speaker': '0011', 'accent': None},\n", + " 'id_301': {'model': 'm2', 'sent_id': 19, 'speaker': '0011', 'accent': None},\n", + " 'id_304': {'model': 'm2', 'sent_id': 2, 'speaker': '0011', 'accent': None},\n", + " 'id_307': {'model': 'm2', 'sent_id': 20, 'speaker': '0011', 'accent': None},\n", + " 'id_310': {'model': 'm3', 'sent_id': 21, 'speaker': '0011', 'accent': None},\n", + " 'id_313': {'model': 'm3', 'sent_id': 22, 'speaker': '0011', 'accent': None},\n", + " 'id_316': {'model': 'm3', 'sent_id': 23, 'speaker': '0011', 'accent': None},\n", + " 'id_319': {'model': 'm1', 'sent_id': 24, 'speaker': '0011', 'accent': None},\n", + " 'id_322': {'model': 'm2', 'sent_id': 25, 'speaker': '0011', 'accent': None},\n", + " 'id_325': {'model': 'm2', 'sent_id': 26, 'speaker': '0011', 'accent': None},\n", + " 'id_328': {'model': 'm2', 'sent_id': 27, 'speaker': '0011', 'accent': None},\n", + " 'id_331': {'model': 'm2', 'sent_id': 28, 'speaker': '0011', 'accent': None},\n", + " 'id_334': {'model': 'm1', 'sent_id': 29, 'speaker': '0011', 'accent': None},\n", + " 'id_337': {'model': 'm3', 'sent_id': 3, 'speaker': '0011', 'accent': None},\n", + " 'id_340': {'model': 'm3', 'sent_id': 30, 'speaker': '0011', 'accent': None},\n", + " 'id_343': {'model': 'm3', 'sent_id': 4, 'speaker': '0011', 'accent': None},\n", + " 'id_346': {'model': 'm1', 'sent_id': 5, 'speaker': '0011', 'accent': None},\n", + " 'id_349': {'model': 'm3', 'sent_id': 6, 'speaker': '0011', 'accent': None},\n", + " 'id_352': {'model': 'm2', 'sent_id': 7, 'speaker': '0011', 'accent': None},\n", + " 'id_355': {'model': 'm1', 'sent_id': 8, 'speaker': '0011', 'accent': None},\n", + " 'id_358': {'model': 'm2', 'sent_id': 9, 'speaker': '0011', 'accent': None},\n", + " 'id_361': {'model': 'm2', 'sent_id': 1, 'speaker': '0011', 'accent': None},\n", + " 'id_364': {'model': 'm3', 'sent_id': 10, 'speaker': '0011', 'accent': None},\n", + " 'id_367': {'model': 'm3', 'sent_id': 11, 'speaker': '0011', 'accent': None},\n", + " 'id_370': {'model': 'm2', 'sent_id': 12, 'speaker': '0011', 'accent': None},\n", + " 'id_373': {'model': 'm1', 'sent_id': 13, 'speaker': '0011', 'accent': None},\n", + " 'id_376': {'model': 'm3', 'sent_id': 14, 'speaker': '0011', 'accent': None},\n", + " 'id_379': {'model': 'm1', 'sent_id': 15, 'speaker': '0011', 'accent': None},\n", + " 'id_382': {'model': 'm2', 'sent_id': 16, 'speaker': '0011', 'accent': None},\n", + " 'id_385': {'model': 'm2', 'sent_id': 17, 'speaker': '0011', 'accent': None},\n", + " 'id_388': {'model': 'm3', 'sent_id': 18, 'speaker': '0011', 'accent': None},\n", + " 'id_391': {'model': 'm2', 'sent_id': 19, 'speaker': '0011', 'accent': None},\n", + " 'id_394': {'model': 'm3', 'sent_id': 2, 'speaker': '0011', 'accent': None},\n", + " 'id_397': {'model': 'm3', 'sent_id': 20, 'speaker': '0011', 'accent': None},\n", + " 'id_400': {'model': 'm2', 'sent_id': 21, 'speaker': '0011', 'accent': None},\n", + " 'id_403': {'model': 'm2', 'sent_id': 22, 'speaker': '0011', 'accent': None},\n", + " 'id_406': {'model': 'm2', 'sent_id': 23, 'speaker': '0011', 'accent': None},\n", + " 'id_409': {'model': 'm3', 'sent_id': 24, 'speaker': '0011', 'accent': None},\n", + " 'id_412': {'model': 'm1', 'sent_id': 25, 'speaker': '0011', 'accent': None},\n", + " 'id_415': {'model': 'm2', 'sent_id': 26, 'speaker': '0011', 'accent': None},\n", + " 'id_418': {'model': 'm1', 'sent_id': 27, 'speaker': '0011', 'accent': None},\n", + " 'id_421': {'model': 'm2', 'sent_id': 28, 'speaker': '0011', 'accent': None},\n", + " 'id_424': {'model': 'm2', 'sent_id': 29, 'speaker': '0011', 'accent': None},\n", + " 'id_427': {'model': 'm2', 'sent_id': 3, 'speaker': '0011', 'accent': None},\n", + " 'id_430': {'model': 'm3', 'sent_id': 30, 'speaker': '0011', 'accent': None},\n", + " 'id_433': {'model': 'm2', 'sent_id': 4, 'speaker': '0011', 'accent': None},\n", + " 'id_436': {'model': 'm3', 'sent_id': 5, 'speaker': '0011', 'accent': None},\n", + " 'id_439': {'model': 'm1', 'sent_id': 6, 'speaker': '0011', 'accent': None},\n", + " 'id_442': {'model': 'm3', 'sent_id': 7, 'speaker': '0011', 'accent': None},\n", + " 'id_445': {'model': 'm1', 'sent_id': 8, 'speaker': '0011', 'accent': None},\n", + " 'id_448': {'model': 'm3', 'sent_id': 9, 'speaker': '0011', 'accent': None},\n", + " 'id_451': {'model': 'm3', 'sent_id': 1, 'speaker': '0012', 'accent': None},\n", + " 'id_454': {'model': 'm3', 'sent_id': 10, 'speaker': '0012', 'accent': None},\n", + " 'id_457': {'model': 'm3', 'sent_id': 11, 'speaker': '0012', 'accent': None},\n", + " 'id_460': {'model': 'm2', 'sent_id': 12, 'speaker': '0012', 'accent': None},\n", + " 'id_463': {'model': 'm3', 'sent_id': 13, 'speaker': '0012', 'accent': None},\n", + " 'id_466': {'model': 'm2', 'sent_id': 14, 'speaker': '0012', 'accent': None},\n", + " 'id_469': {'model': 'm3', 'sent_id': 15, 'speaker': '0012', 'accent': None},\n", + " 'id_472': {'model': 'm2', 'sent_id': 16, 'speaker': '0012', 'accent': None},\n", + " 'id_475': {'model': 'm2', 'sent_id': 17, 'speaker': '0012', 'accent': None},\n", + " 'id_478': {'model': 'm2', 'sent_id': 18, 'speaker': '0012', 'accent': None},\n", + " 'id_481': {'model': 'm1', 'sent_id': 19, 'speaker': '0012', 'accent': None},\n", + " 'id_484': {'model': 'm2', 'sent_id': 2, 'speaker': '0012', 'accent': None},\n", + " 'id_487': {'model': 'm1', 'sent_id': 20, 'speaker': '0012', 'accent': None},\n", + " 'id_490': {'model': 'm2', 'sent_id': 21, 'speaker': '0012', 'accent': None},\n", + " 'id_493': {'model': 'm2', 'sent_id': 22, 'speaker': '0012', 'accent': None},\n", + " 'id_496': {'model': 'm3', 'sent_id': 23, 'speaker': '0012', 'accent': None},\n", + " 'id_499': {'model': 'm1', 'sent_id': 24, 'speaker': '0012', 'accent': None},\n", + " 'id_502': {'model': 'm2', 'sent_id': 25, 'speaker': '0012', 'accent': None},\n", + " 'id_505': {'model': 'm3', 'sent_id': 26, 'speaker': '0012', 'accent': None},\n", + " 'id_508': {'model': 'm2', 'sent_id': 27, 'speaker': '0012', 'accent': None},\n", + " 'id_511': {'model': 'm2', 'sent_id': 28, 'speaker': '0012', 'accent': None},\n", + " 'id_514': {'model': 'm2', 'sent_id': 29, 'speaker': '0012', 'accent': None},\n", + " 'id_517': {'model': 'm3', 'sent_id': 3, 'speaker': '0012', 'accent': None},\n", + " 'id_520': {'model': 'm3', 'sent_id': 30, 'speaker': '0012', 'accent': None},\n", + " 'id_523': {'model': 'm3', 'sent_id': 4, 'speaker': '0012', 'accent': None},\n", + " 'id_526': {'model': 'm1', 'sent_id': 5, 'speaker': '0012', 'accent': None},\n", + " 'id_529': {'model': 'm2', 'sent_id': 6, 'speaker': '0012', 'accent': None},\n", + " 'id_532': {'model': 'm3', 'sent_id': 7, 'speaker': '0012', 'accent': None},\n", + " 'id_535': {'model': 'm3', 'sent_id': 8, 'speaker': '0012', 'accent': None},\n", + " 'id_538': {'model': 'm3', 'sent_id': 9, 'speaker': '0012', 'accent': None},\n", + " 'id_541': {'model': 'm3', 'sent_id': 1, 'speaker': '0012', 'accent': None},\n", + " 'id_544': {'model': 'm3', 'sent_id': 10, 'speaker': '0012', 'accent': None},\n", + " 'id_547': {'model': 'm2', 'sent_id': 11, 'speaker': '0012', 'accent': None},\n", + " 'id_550': {'model': 'm3', 'sent_id': 12, 'speaker': '0012', 'accent': None},\n", + " 'id_553': {'model': 'm2', 'sent_id': 13, 'speaker': '0012', 'accent': None},\n", + " 'id_556': {'model': 'm1', 'sent_id': 14, 'speaker': '0012', 'accent': None},\n", + " 'id_559': {'model': 'm3', 'sent_id': 15, 'speaker': '0012', 'accent': None},\n", + " 'id_562': {'model': 'm3', 'sent_id': 16, 'speaker': '0012', 'accent': None},\n", + " 'id_565': {'model': 'm1', 'sent_id': 17, 'speaker': '0012', 'accent': None},\n", + " 'id_568': {'model': 'm2', 'sent_id': 18, 'speaker': '0012', 'accent': None},\n", + " 'id_571': {'model': 'm3', 'sent_id': 19, 'speaker': '0012', 'accent': None},\n", + " 'id_574': {'model': 'm1', 'sent_id': 2, 'speaker': '0012', 'accent': None},\n", + " 'id_577': {'model': 'm1', 'sent_id': 20, 'speaker': '0012', 'accent': None},\n", + " 'id_580': {'model': 'm2', 'sent_id': 21, 'speaker': '0012', 'accent': None},\n", + " 'id_583': {'model': 'm3', 'sent_id': 22, 'speaker': '0012', 'accent': None},\n", + " 'id_586': {'model': 'm2', 'sent_id': 23, 'speaker': '0012', 'accent': None},\n", + " 'id_589': {'model': 'm3', 'sent_id': 24, 'speaker': '0012', 'accent': None},\n", + " 'id_592': {'model': 'm2', 'sent_id': 25, 'speaker': '0012', 'accent': None},\n", + " 'id_595': {'model': 'm3', 'sent_id': 26, 'speaker': '0012', 'accent': None},\n", + " 'id_598': {'model': 'm3', 'sent_id': 27, 'speaker': '0012', 'accent': None},\n", + " 'id_601': {'model': 'm2', 'sent_id': 28, 'speaker': '0012', 'accent': None},\n", + " 'id_604': {'model': 'm2', 'sent_id': 29, 'speaker': '0012', 'accent': None},\n", + " 'id_607': {'model': 'm2', 'sent_id': 3, 'speaker': '0012', 'accent': None},\n", + " 'id_610': {'model': 'm2', 'sent_id': 30, 'speaker': '0012', 'accent': None},\n", + " 'id_613': {'model': 'm2', 'sent_id': 4, 'speaker': '0012', 'accent': None},\n", + " 'id_616': {'model': 'm3', 'sent_id': 5, 'speaker': '0012', 'accent': None},\n", + " 'id_619': {'model': 'm2', 'sent_id': 6, 'speaker': '0012', 'accent': None},\n", + " 'id_622': {'model': 'm2', 'sent_id': 7, 'speaker': '0012', 'accent': None},\n", + " 'id_625': {'model': 'm2', 'sent_id': 8, 'speaker': '0012', 'accent': None},\n", + " 'id_628': {'model': 'm2', 'sent_id': 9, 'speaker': '0012', 'accent': None},\n", + " 'id_631': {'model': 'm1', 'sent_id': 1, 'speaker': '0012', 'accent': None},\n", + " 'id_634': {'model': 'm1', 'sent_id': 10, 'speaker': '0012', 'accent': None},\n", + " 'id_637': {'model': 'm2', 'sent_id': 11, 'speaker': '0012', 'accent': None},\n", + " 'id_640': {'model': 'm3', 'sent_id': 12, 'speaker': '0012', 'accent': None},\n", + " 'id_643': {'model': 'm2', 'sent_id': 13, 'speaker': '0012', 'accent': None},\n", + " 'id_646': {'model': 'm2', 'sent_id': 14, 'speaker': '0012', 'accent': None},\n", + " 'id_649': {'model': 'm2', 'sent_id': 15, 'speaker': '0012', 'accent': None},\n", + " 'id_652': {'model': 'm1', 'sent_id': 16, 'speaker': '0012', 'accent': None},\n", + " 'id_655': {'model': 'm1', 'sent_id': 17, 'speaker': '0012', 'accent': None},\n", + " 'id_658': {'model': 'm2', 'sent_id': 18, 'speaker': '0012', 'accent': None},\n", + " 'id_661': {'model': 'm2', 'sent_id': 19, 'speaker': '0012', 'accent': None},\n", + " 'id_664': {'model': 'm3', 'sent_id': 2, 'speaker': '0012', 'accent': None},\n", + " 'id_667': {'model': 'm3', 'sent_id': 20, 'speaker': '0012', 'accent': None},\n", + " 'id_670': {'model': 'm3', 'sent_id': 21, 'speaker': '0012', 'accent': None},\n", + " 'id_673': {'model': 'm3', 'sent_id': 22, 'speaker': '0012', 'accent': None},\n", + " 'id_676': {'model': 'm2', 'sent_id': 23, 'speaker': '0012', 'accent': None},\n", + " 'id_679': {'model': 'm1', 'sent_id': 24, 'speaker': '0012', 'accent': None},\n", + " 'id_682': {'model': 'm2', 'sent_id': 25, 'speaker': '0012', 'accent': None},\n", + " 'id_685': {'model': 'm3', 'sent_id': 26, 'speaker': '0012', 'accent': None},\n", + " 'id_688': {'model': 'm1', 'sent_id': 27, 'speaker': '0012', 'accent': None},\n", + " 'id_691': {'model': 'm3', 'sent_id': 28, 'speaker': '0012', 'accent': None},\n", + " 'id_694': {'model': 'm2', 'sent_id': 29, 'speaker': '0012', 'accent': None},\n", + " 'id_697': {'model': 'm3', 'sent_id': 3, 'speaker': '0012', 'accent': None},\n", + " 'id_700': {'model': 'm3', 'sent_id': 30, 'speaker': '0012', 'accent': None},\n", + " 'id_703': {'model': 'm1', 'sent_id': 4, 'speaker': '0012', 'accent': None},\n", + " 'id_706': {'model': 'm1', 'sent_id': 5, 'speaker': '0012', 'accent': None},\n", + " 'id_709': {'model': 'm2', 'sent_id': 6, 'speaker': '0012', 'accent': None},\n", + " 'id_712': {'model': 'm2', 'sent_id': 7, 'speaker': '0012', 'accent': None},\n", + " 'id_715': {'model': 'm3', 'sent_id': 8, 'speaker': '0012', 'accent': None},\n", + " 'id_718': {'model': 'm3', 'sent_id': 9, 'speaker': '0012', 'accent': None},\n", + " 'id_721': {'model': 'm3', 'sent_id': 1, 'speaker': '0012', 'accent': None},\n", + " 'id_724': {'model': 'm1', 'sent_id': 10, 'speaker': '0012', 'accent': None},\n", + " 'id_727': {'model': 'm2', 'sent_id': 11, 'speaker': '0012', 'accent': None},\n", + " 'id_730': {'model': 'm2', 'sent_id': 12, 'speaker': '0012', 'accent': None},\n", + " 'id_733': {'model': 'm1', 'sent_id': 13, 'speaker': '0012', 'accent': None},\n", + " 'id_736': {'model': 'm1', 'sent_id': 14, 'speaker': '0012', 'accent': None},\n", + " 'id_739': {'model': 'm1', 'sent_id': 15, 'speaker': '0012', 'accent': None},\n", + " 'id_742': {'model': 'm3', 'sent_id': 16, 'speaker': '0012', 'accent': None},\n", + " 'id_745': {'model': 'm2', 'sent_id': 17, 'speaker': '0012', 'accent': None},\n", + " 'id_748': {'model': 'm3', 'sent_id': 18, 'speaker': '0012', 'accent': None},\n", + " 'id_751': {'model': 'm1', 'sent_id': 19, 'speaker': '0012', 'accent': None},\n", + " 'id_754': {'model': 'm1', 'sent_id': 2, 'speaker': '0012', 'accent': None},\n", + " 'id_757': {'model': 'm1', 'sent_id': 20, 'speaker': '0012', 'accent': None},\n", + " 'id_760': {'model': 'm1', 'sent_id': 21, 'speaker': '0012', 'accent': None},\n", + " 'id_763': {'model': 'm2', 'sent_id': 22, 'speaker': '0012', 'accent': None},\n", + " 'id_766': {'model': 'm1', 'sent_id': 23, 'speaker': '0012', 'accent': None},\n", + " 'id_769': {'model': 'm2', 'sent_id': 24, 'speaker': '0012', 'accent': None},\n", + " 'id_772': {'model': 'm1', 'sent_id': 25, 'speaker': '0012', 'accent': None},\n", + " 'id_775': {'model': 'm2', 'sent_id': 26, 'speaker': '0012', 'accent': None},\n", + " 'id_778': {'model': 'm1', 'sent_id': 27, 'speaker': '0012', 'accent': None},\n", + " 'id_781': {'model': 'm3', 'sent_id': 28, 'speaker': '0012', 'accent': None},\n", + " 'id_784': {'model': 'm3', 'sent_id': 29, 'speaker': '0012', 'accent': None},\n", + " 'id_787': {'model': 'm2', 'sent_id': 3, 'speaker': '0012', 'accent': None},\n", + " 'id_790': {'model': 'm2', 'sent_id': 30, 'speaker': '0012', 'accent': None},\n", + " 'id_793': {'model': 'm1', 'sent_id': 4, 'speaker': '0012', 'accent': None},\n", + " 'id_796': {'model': 'm3', 'sent_id': 5, 'speaker': '0012', 'accent': None},\n", + " 'id_799': {'model': 'm3', 'sent_id': 6, 'speaker': '0012', 'accent': None},\n", + " 'id_802': {'model': 'm2', 'sent_id': 7, 'speaker': '0012', 'accent': None},\n", + " 'id_805': {'model': 'm2', 'sent_id': 8, 'speaker': '0012', 'accent': None},\n", + " 'id_808': {'model': 'm1', 'sent_id': 9, 'speaker': '0012', 'accent': None},\n", + " 'id_811': {'model': 'm1', 'sent_id': 1, 'speaker': '0012', 'accent': None},\n", + " 'id_814': {'model': 'm3', 'sent_id': 10, 'speaker': '0012', 'accent': None},\n", + " 'id_817': {'model': 'm2', 'sent_id': 11, 'speaker': '0012', 'accent': None},\n", + " 'id_820': {'model': 'm1', 'sent_id': 12, 'speaker': '0012', 'accent': None},\n", + " 'id_823': {'model': 'm1', 'sent_id': 13, 'speaker': '0012', 'accent': None},\n", + " 'id_826': {'model': 'm2', 'sent_id': 14, 'speaker': '0012', 'accent': None},\n", + " 'id_829': {'model': 'm1', 'sent_id': 15, 'speaker': '0012', 'accent': None},\n", + " 'id_832': {'model': 'm2', 'sent_id': 16, 'speaker': '0012', 'accent': None},\n", + " 'id_835': {'model': 'm3', 'sent_id': 17, 'speaker': '0012', 'accent': None},\n", + " 'id_838': {'model': 'm3', 'sent_id': 18, 'speaker': '0012', 'accent': None},\n", + " 'id_841': {'model': 'm1', 'sent_id': 19, 'speaker': '0012', 'accent': None},\n", + " 'id_844': {'model': 'm2', 'sent_id': 2, 'speaker': '0012', 'accent': None},\n", + " 'id_847': {'model': 'm1', 'sent_id': 20, 'speaker': '0012', 'accent': None},\n", + " 'id_850': {'model': 'm3', 'sent_id': 21, 'speaker': '0012', 'accent': None},\n", + " 'id_853': {'model': 'm2', 'sent_id': 22, 'speaker': '0012', 'accent': None},\n", + " 'id_856': {'model': 'm1', 'sent_id': 23, 'speaker': '0012', 'accent': None},\n", + " 'id_859': {'model': 'm1', 'sent_id': 24, 'speaker': '0012', 'accent': None},\n", + " 'id_862': {'model': 'm3', 'sent_id': 25, 'speaker': '0012', 'accent': None},\n", + " 'id_865': {'model': 'm1', 'sent_id': 26, 'speaker': '0012', 'accent': None},\n", + " 'id_868': {'model': 'm3', 'sent_id': 27, 'speaker': '0012', 'accent': None},\n", + " 'id_871': {'model': 'm3', 'sent_id': 28, 'speaker': '0012', 'accent': None},\n", + " 'id_874': {'model': 'm2', 'sent_id': 29, 'speaker': '0012', 'accent': None},\n", + " 'id_877': {'model': 'm1', 'sent_id': 3, 'speaker': '0012', 'accent': None},\n", + " 'id_880': {'model': 'm1', 'sent_id': 30, 'speaker': '0012', 'accent': None},\n", + " 'id_883': {'model': 'm1', 'sent_id': 4, 'speaker': '0012', 'accent': None},\n", + " 'id_886': {'model': 'm3', 'sent_id': 5, 'speaker': '0012', 'accent': None},\n", + " 'id_889': {'model': 'm1', 'sent_id': 6, 'speaker': '0012', 'accent': None},\n", + " 'id_892': {'model': 'm2', 'sent_id': 7, 'speaker': '0012', 'accent': None},\n", + " 'id_895': {'model': 'm2', 'sent_id': 8, 'speaker': '0012', 'accent': None},\n", + " 'id_898': {'model': 'm3', 'sent_id': 9, 'speaker': '0012', 'accent': None},\n", + " 'id_901': {'model': 'm2', 'sent_id': 1, 'speaker': '0013', 'accent': None},\n", + " 'id_904': {'model': 'm2', 'sent_id': 10, 'speaker': '0013', 'accent': None},\n", + " 'id_907': {'model': 'm2', 'sent_id': 11, 'speaker': '0013', 'accent': None},\n", + " 'id_910': {'model': 'm1', 'sent_id': 12, 'speaker': '0013', 'accent': None},\n", + " 'id_913': {'model': 'm3', 'sent_id': 13, 'speaker': '0013', 'accent': None},\n", + " 'id_916': {'model': 'm3', 'sent_id': 14, 'speaker': '0013', 'accent': None},\n", + " 'id_919': {'model': 'm2', 'sent_id': 15, 'speaker': '0013', 'accent': None},\n", + " 'id_922': {'model': 'm2', 'sent_id': 16, 'speaker': '0013', 'accent': None},\n", + " 'id_925': {'model': 'm1', 'sent_id': 17, 'speaker': '0013', 'accent': None},\n", + " 'id_928': {'model': 'm3', 'sent_id': 18, 'speaker': '0013', 'accent': None},\n", + " 'id_931': {'model': 'm2', 'sent_id': 19, 'speaker': '0013', 'accent': None},\n", + " 'id_934': {'model': 'm3', 'sent_id': 2, 'speaker': '0013', 'accent': None},\n", + " 'id_937': {'model': 'm3', 'sent_id': 20, 'speaker': '0013', 'accent': None},\n", + " 'id_940': {'model': 'm3', 'sent_id': 21, 'speaker': '0013', 'accent': None},\n", + " 'id_943': {'model': 'm3', 'sent_id': 22, 'speaker': '0013', 'accent': None},\n", + " 'id_946': {'model': 'm3', 'sent_id': 23, 'speaker': '0013', 'accent': None},\n", + " 'id_949': {'model': 'm1', 'sent_id': 24, 'speaker': '0013', 'accent': None},\n", + " 'id_952': {'model': 'm2', 'sent_id': 25, 'speaker': '0013', 'accent': None},\n", + " 'id_955': {'model': 'm3', 'sent_id': 26, 'speaker': '0013', 'accent': None},\n", + " 'id_958': {'model': 'm1', 'sent_id': 27, 'speaker': '0013', 'accent': None},\n", + " 'id_961': {'model': 'm1', 'sent_id': 28, 'speaker': '0013', 'accent': None},\n", + " 'id_964': {'model': 'm1', 'sent_id': 29, 'speaker': '0013', 'accent': None},\n", + " 'id_967': {'model': 'm1', 'sent_id': 3, 'speaker': '0013', 'accent': None},\n", + " 'id_970': {'model': 'm3', 'sent_id': 30, 'speaker': '0013', 'accent': None},\n", + " 'id_973': {'model': 'm3', 'sent_id': 4, 'speaker': '0013', 'accent': None},\n", + " 'id_976': {'model': 'm1', 'sent_id': 5, 'speaker': '0013', 'accent': None},\n", + " 'id_979': {'model': 'm3', 'sent_id': 6, 'speaker': '0013', 'accent': None},\n", + " 'id_982': {'model': 'm1', 'sent_id': 7, 'speaker': '0013', 'accent': None},\n", + " 'id_985': {'model': 'm2', 'sent_id': 8, 'speaker': '0013', 'accent': None},\n", + " 'id_988': {'model': 'm2', 'sent_id': 9, 'speaker': '0013', 'accent': None},\n", + " 'id_991': {'model': 'm3', 'sent_id': 1, 'speaker': '0013', 'accent': None},\n", + " 'id_994': {'model': 'm1', 'sent_id': 10, 'speaker': '0013', 'accent': None},\n", + " 'id_997': {'model': 'm3', 'sent_id': 11, 'speaker': '0013', 'accent': None},\n", + " 'id_1000': {'model': 'm3', 'sent_id': 12, 'speaker': '0013', 'accent': None},\n", + " 'id_1003': {'model': 'm2', 'sent_id': 13, 'speaker': '0013', 'accent': None},\n", + " 'id_1006': {'model': 'm2', 'sent_id': 14, 'speaker': '0013', 'accent': None},\n", + " 'id_1009': {'model': 'm3', 'sent_id': 15, 'speaker': '0013', 'accent': None},\n", + " 'id_1012': {'model': 'm2', 'sent_id': 16, 'speaker': '0013', 'accent': None},\n", + " 'id_1015': {'model': 'm3', 'sent_id': 17, 'speaker': '0013', 'accent': None},\n", + " 'id_1018': {'model': 'm3', 'sent_id': 18, 'speaker': '0013', 'accent': None},\n", + " 'id_1021': {'model': 'm3', 'sent_id': 19, 'speaker': '0013', 'accent': None},\n", + " 'id_1024': {'model': 'm1', 'sent_id': 2, 'speaker': '0013', 'accent': None},\n", + " 'id_1027': {'model': 'm2', 'sent_id': 20, 'speaker': '0013', 'accent': None},\n", + " 'id_1030': {'model': 'm2', 'sent_id': 21, 'speaker': '0013', 'accent': None},\n", + " 'id_1033': {'model': 'm1', 'sent_id': 22, 'speaker': '0013', 'accent': None},\n", + " 'id_1036': {'model': 'm3', 'sent_id': 23, 'speaker': '0013', 'accent': None},\n", + " 'id_1039': {'model': 'm2', 'sent_id': 24, 'speaker': '0013', 'accent': None},\n", + " 'id_1042': {'model': 'm1', 'sent_id': 25, 'speaker': '0013', 'accent': None},\n", + " 'id_1045': {'model': 'm3', 'sent_id': 26, 'speaker': '0013', 'accent': None},\n", + " 'id_1048': {'model': 'm3', 'sent_id': 27, 'speaker': '0013', 'accent': None},\n", + " 'id_1051': {'model': 'm2', 'sent_id': 28, 'speaker': '0013', 'accent': None},\n", + " 'id_1054': {'model': 'm1', 'sent_id': 29, 'speaker': '0013', 'accent': None},\n", + " 'id_1057': {'model': 'm3', 'sent_id': 3, 'speaker': '0013', 'accent': None},\n", + " 'id_1060': {'model': 'm3', 'sent_id': 30, 'speaker': '0013', 'accent': None},\n", + " 'id_1063': {'model': 'm2', 'sent_id': 4, 'speaker': '0013', 'accent': None},\n", + " 'id_1066': {'model': 'm3', 'sent_id': 5, 'speaker': '0013', 'accent': None},\n", + " 'id_1069': {'model': 'm1', 'sent_id': 6, 'speaker': '0013', 'accent': None},\n", + " 'id_1072': {'model': 'm3', 'sent_id': 7, 'speaker': '0013', 'accent': None},\n", + " 'id_1075': {'model': 'm2', 'sent_id': 8, 'speaker': '0013', 'accent': None},\n", + " 'id_1078': {'model': 'm2', 'sent_id': 9, 'speaker': '0013', 'accent': None},\n", + " 'id_1081': {'model': 'm3', 'sent_id': 1, 'speaker': '0013', 'accent': None},\n", + " 'id_1084': {'model': 'm3', 'sent_id': 10, 'speaker': '0013', 'accent': None},\n", + " 'id_1087': {'model': 'm1', 'sent_id': 11, 'speaker': '0013', 'accent': None},\n", + " 'id_1090': {'model': 'm2', 'sent_id': 12, 'speaker': '0013', 'accent': None},\n", + " 'id_1093': {'model': 'm3', 'sent_id': 13, 'speaker': '0013', 'accent': None},\n", + " 'id_1096': {'model': 'm2', 'sent_id': 14, 'speaker': '0013', 'accent': None},\n", + " 'id_1099': {'model': 'm3', 'sent_id': 15, 'speaker': '0013', 'accent': None},\n", + " 'id_1102': {'model': 'm1', 'sent_id': 16, 'speaker': '0013', 'accent': None},\n", + " 'id_1105': {'model': 'm3', 'sent_id': 17, 'speaker': '0013', 'accent': None},\n", + " 'id_1108': {'model': 'm3', 'sent_id': 18, 'speaker': '0013', 'accent': None},\n", + " 'id_1111': {'model': 'm2', 'sent_id': 19, 'speaker': '0013', 'accent': None},\n", + " 'id_1114': {'model': 'm3', 'sent_id': 2, 'speaker': '0013', 'accent': None},\n", + " 'id_1117': {'model': 'm2', 'sent_id': 20, 'speaker': '0013', 'accent': None},\n", + " 'id_1120': {'model': 'm1', 'sent_id': 21, 'speaker': '0013', 'accent': None},\n", + " 'id_1123': {'model': 'm2', 'sent_id': 22, 'speaker': '0013', 'accent': None},\n", + " 'id_1126': {'model': 'm1', 'sent_id': 23, 'speaker': '0013', 'accent': None},\n", + " 'id_1129': {'model': 'm1', 'sent_id': 24, 'speaker': '0013', 'accent': None},\n", + " 'id_1132': {'model': 'm2', 'sent_id': 25, 'speaker': '0013', 'accent': None},\n", + " 'id_1135': {'model': 'm1', 'sent_id': 26, 'speaker': '0013', 'accent': None},\n", + " 'id_1138': {'model': 'm3', 'sent_id': 27, 'speaker': '0013', 'accent': None},\n", + " 'id_1141': {'model': 'm3', 'sent_id': 28, 'speaker': '0013', 'accent': None},\n", + " 'id_1144': {'model': 'm3', 'sent_id': 29, 'speaker': '0013', 'accent': None},\n", + " 'id_1147': {'model': 'm3', 'sent_id': 3, 'speaker': '0013', 'accent': None},\n", + " 'id_1150': {'model': 'm1', 'sent_id': 30, 'speaker': '0013', 'accent': None},\n", + " 'id_1153': {'model': 'm2', 'sent_id': 4, 'speaker': '0013', 'accent': None},\n", + " 'id_1156': {'model': 'm3', 'sent_id': 5, 'speaker': '0013', 'accent': None},\n", + " 'id_1159': {'model': 'm1', 'sent_id': 6, 'speaker': '0013', 'accent': None},\n", + " 'id_1162': {'model': 'm1', 'sent_id': 7, 'speaker': '0013', 'accent': None},\n", + " 'id_1165': {'model': 'm2', 'sent_id': 8, 'speaker': '0013', 'accent': None},\n", + " 'id_1168': {'model': 'm3', 'sent_id': 9, 'speaker': '0013', 'accent': None},\n", + " 'id_1171': {'model': 'm2', 'sent_id': 1, 'speaker': '0013', 'accent': None},\n", + " 'id_1174': {'model': 'm3', 'sent_id': 10, 'speaker': '0013', 'accent': None},\n", + " 'id_1177': {'model': 'm2', 'sent_id': 11, 'speaker': '0013', 'accent': None},\n", + " 'id_1180': {'model': 'm3', 'sent_id': 12, 'speaker': '0013', 'accent': None},\n", + " 'id_1183': {'model': 'm3', 'sent_id': 13, 'speaker': '0013', 'accent': None},\n", + " 'id_1186': {'model': 'm2', 'sent_id': 14, 'speaker': '0013', 'accent': None},\n", + " 'id_1189': {'model': 'm1', 'sent_id': 15, 'speaker': '0013', 'accent': None},\n", + " 'id_1192': {'model': 'm2', 'sent_id': 16, 'speaker': '0013', 'accent': None},\n", + " 'id_1195': {'model': 'm2', 'sent_id': 17, 'speaker': '0013', 'accent': None},\n", + " 'id_1198': {'model': 'm2', 'sent_id': 18, 'speaker': '0013', 'accent': None},\n", + " 'id_1201': {'model': 'm3', 'sent_id': 19, 'speaker': '0013', 'accent': None},\n", + " 'id_1204': {'model': 'm1', 'sent_id': 2, 'speaker': '0013', 'accent': None},\n", + " 'id_1207': {'model': 'm2', 'sent_id': 20, 'speaker': '0013', 'accent': None},\n", + " 'id_1210': {'model': 'm1', 'sent_id': 21, 'speaker': '0013', 'accent': None},\n", + " 'id_1213': {'model': 'm1', 'sent_id': 22, 'speaker': '0013', 'accent': None},\n", + " 'id_1216': {'model': 'm2', 'sent_id': 23, 'speaker': '0013', 'accent': None},\n", + " 'id_1219': {'model': 'm1', 'sent_id': 24, 'speaker': '0013', 'accent': None},\n", + " 'id_1222': {'model': 'm3', 'sent_id': 25, 'speaker': '0013', 'accent': None},\n", + " 'id_1225': {'model': 'm3', 'sent_id': 26, 'speaker': '0013', 'accent': None},\n", + " 'id_1228': {'model': 'm3', 'sent_id': 27, 'speaker': '0013', 'accent': None},\n", + " 'id_1231': {'model': 'm1', 'sent_id': 28, 'speaker': '0013', 'accent': None},\n", + " 'id_1234': {'model': 'm1', 'sent_id': 29, 'speaker': '0013', 'accent': None},\n", + " 'id_1237': {'model': 'm2', 'sent_id': 3, 'speaker': '0013', 'accent': None},\n", + " 'id_1240': {'model': 'm2', 'sent_id': 30, 'speaker': '0013', 'accent': None},\n", + " 'id_1243': {'model': 'm2', 'sent_id': 4, 'speaker': '0013', 'accent': None},\n", + " 'id_1246': {'model': 'm2', 'sent_id': 5, 'speaker': '0013', 'accent': None},\n", + " 'id_1249': {'model': 'm2', 'sent_id': 6, 'speaker': '0013', 'accent': None},\n", + " 'id_1252': {'model': 'm3', 'sent_id': 7, 'speaker': '0013', 'accent': None},\n", + " 'id_1255': {'model': 'm1', 'sent_id': 8, 'speaker': '0013', 'accent': None},\n", + " 'id_1258': {'model': 'm3', 'sent_id': 9, 'speaker': '0013', 'accent': None},\n", + " 'id_1261': {'model': 'm2', 'sent_id': 1, 'speaker': '0013', 'accent': None},\n", + " 'id_1264': {'model': 'm3', 'sent_id': 10, 'speaker': '0013', 'accent': None},\n", + " 'id_1267': {'model': 'm3', 'sent_id': 11, 'speaker': '0013', 'accent': None},\n", + " 'id_1270': {'model': 'm3', 'sent_id': 12, 'speaker': '0013', 'accent': None},\n", + " 'id_1273': {'model': 'm3', 'sent_id': 13, 'speaker': '0013', 'accent': None},\n", + " 'id_1276': {'model': 'm2', 'sent_id': 14, 'speaker': '0013', 'accent': None},\n", + " 'id_1279': {'model': 'm1', 'sent_id': 15, 'speaker': '0013', 'accent': None},\n", + " 'id_1282': {'model': 'm3', 'sent_id': 16, 'speaker': '0013', 'accent': None},\n", + " 'id_1285': {'model': 'm1', 'sent_id': 17, 'speaker': '0013', 'accent': None},\n", + " 'id_1288': {'model': 'm1', 'sent_id': 18, 'speaker': '0013', 'accent': None},\n", + " 'id_1291': {'model': 'm1', 'sent_id': 19, 'speaker': '0013', 'accent': None},\n", + " 'id_1294': {'model': 'm3', 'sent_id': 2, 'speaker': '0013', 'accent': None},\n", + " 'id_1297': {'model': 'm1', 'sent_id': 20, 'speaker': '0013', 'accent': None},\n", + " 'id_1300': {'model': 'm2', 'sent_id': 21, 'speaker': '0013', 'accent': None},\n", + " 'id_1303': {'model': 'm3', 'sent_id': 22, 'speaker': '0013', 'accent': None},\n", + " 'id_1306': {'model': 'm1', 'sent_id': 23, 'speaker': '0013', 'accent': None},\n", + " 'id_1309': {'model': 'm3', 'sent_id': 24, 'speaker': '0013', 'accent': None},\n", + " 'id_1312': {'model': 'm2', 'sent_id': 25, 'speaker': '0013', 'accent': None},\n", + " 'id_1315': {'model': 'm2', 'sent_id': 26, 'speaker': '0013', 'accent': None},\n", + " 'id_1318': {'model': 'm1', 'sent_id': 27, 'speaker': '0013', 'accent': None},\n", + " 'id_1321': {'model': 'm1', 'sent_id': 28, 'speaker': '0013', 'accent': None},\n", + " 'id_1324': {'model': 'm1', 'sent_id': 29, 'speaker': '0013', 'accent': None},\n", + " 'id_1327': {'model': 'm2', 'sent_id': 3, 'speaker': '0013', 'accent': None},\n", + " 'id_1330': {'model': 'm3', 'sent_id': 30, 'speaker': '0013', 'accent': None},\n", + " 'id_1333': {'model': 'm1', 'sent_id': 4, 'speaker': '0013', 'accent': None},\n", + " 'id_1336': {'model': 'm1', 'sent_id': 5, 'speaker': '0013', 'accent': None},\n", + " 'id_1339': {'model': 'm2', 'sent_id': 6, 'speaker': '0013', 'accent': None},\n", + " 'id_1342': {'model': 'm1', 'sent_id': 7, 'speaker': '0013', 'accent': None},\n", + " 'id_1345': {'model': 'm2', 'sent_id': 8, 'speaker': '0013', 'accent': None},\n", + " 'id_1348': {'model': 'm3', 'sent_id': 9, 'speaker': '0013', 'accent': None},\n", + " 'id_1351': {'model': 'm2', 'sent_id': 1, 'speaker': '0014', 'accent': None},\n", + " 'id_1354': {'model': 'm1', 'sent_id': 10, 'speaker': '0014', 'accent': None},\n", + " 'id_1357': {'model': 'm1', 'sent_id': 11, 'speaker': '0014', 'accent': None},\n", + " 'id_1360': {'model': 'm2', 'sent_id': 12, 'speaker': '0014', 'accent': None},\n", + " 'id_1363': {'model': 'm1', 'sent_id': 13, 'speaker': '0014', 'accent': None},\n", + " 'id_1366': {'model': 'm1', 'sent_id': 14, 'speaker': '0014', 'accent': None},\n", + " 'id_1369': {'model': 'm2', 'sent_id': 15, 'speaker': '0014', 'accent': None},\n", + " 'id_1372': {'model': 'm3', 'sent_id': 16, 'speaker': '0014', 'accent': None},\n", + " 'id_1375': {'model': 'm3', 'sent_id': 17, 'speaker': '0014', 'accent': None},\n", + " 'id_1378': {'model': 'm3', 'sent_id': 18, 'speaker': '0014', 'accent': None},\n", + " 'id_1381': {'model': 'm3', 'sent_id': 19, 'speaker': '0014', 'accent': None},\n", + " 'id_1384': {'model': 'm2', 'sent_id': 2, 'speaker': '0014', 'accent': None},\n", + " 'id_1387': {'model': 'm2', 'sent_id': 20, 'speaker': '0014', 'accent': None},\n", + " 'id_1390': {'model': 'm1', 'sent_id': 21, 'speaker': '0014', 'accent': None},\n", + " 'id_1393': {'model': 'm3', 'sent_id': 22, 'speaker': '0014', 'accent': None},\n", + " 'id_1396': {'model': 'm1', 'sent_id': 23, 'speaker': '0014', 'accent': None},\n", + " 'id_1399': {'model': 'm1', 'sent_id': 24, 'speaker': '0014', 'accent': None},\n", + " 'id_1402': {'model': 'm1', 'sent_id': 25, 'speaker': '0014', 'accent': None},\n", + " 'id_1405': {'model': 'm2', 'sent_id': 26, 'speaker': '0014', 'accent': None},\n", + " 'id_1408': {'model': 'm2', 'sent_id': 27, 'speaker': '0014', 'accent': None},\n", + " 'id_1411': {'model': 'm1', 'sent_id': 28, 'speaker': '0014', 'accent': None},\n", + " 'id_1414': {'model': 'm1', 'sent_id': 29, 'speaker': '0014', 'accent': None},\n", + " 'id_1417': {'model': 'm2', 'sent_id': 3, 'speaker': '0014', 'accent': None},\n", + " 'id_1420': {'model': 'm3', 'sent_id': 30, 'speaker': '0014', 'accent': None},\n", + " 'id_1423': {'model': 'm2', 'sent_id': 4, 'speaker': '0014', 'accent': None},\n", + " 'id_1426': {'model': 'm3', 'sent_id': 5, 'speaker': '0014', 'accent': None},\n", + " 'id_1429': {'model': 'm3', 'sent_id': 6, 'speaker': '0014', 'accent': None},\n", + " 'id_1432': {'model': 'm1', 'sent_id': 7, 'speaker': '0014', 'accent': None},\n", + " 'id_1435': {'model': 'm1', 'sent_id': 8, 'speaker': '0014', 'accent': None},\n", + " 'id_1438': {'model': 'm1', 'sent_id': 9, 'speaker': '0014', 'accent': None},\n", + " 'id_1441': {'model': 'm1', 'sent_id': 1, 'speaker': '0014', 'accent': None},\n", + " 'id_1444': {'model': 'm2', 'sent_id': 10, 'speaker': '0014', 'accent': None},\n", + " 'id_1447': {'model': 'm2', 'sent_id': 11, 'speaker': '0014', 'accent': None},\n", + " 'id_1450': {'model': 'm2', 'sent_id': 12, 'speaker': '0014', 'accent': None},\n", + " 'id_1453': {'model': 'm1', 'sent_id': 13, 'speaker': '0014', 'accent': None},\n", + " 'id_1456': {'model': 'm1', 'sent_id': 14, 'speaker': '0014', 'accent': None},\n", + " 'id_1459': {'model': 'm1', 'sent_id': 15, 'speaker': '0014', 'accent': None},\n", + " 'id_1462': {'model': 'm2', 'sent_id': 16, 'speaker': '0014', 'accent': None},\n", + " 'id_1465': {'model': 'm2', 'sent_id': 17, 'speaker': '0014', 'accent': None},\n", + " 'id_1468': {'model': 'm2', 'sent_id': 18, 'speaker': '0014', 'accent': None},\n", + " 'id_1471': {'model': 'm1', 'sent_id': 19, 'speaker': '0014', 'accent': None},\n", + " 'id_1474': {'model': 'm3', 'sent_id': 2, 'speaker': '0014', 'accent': None},\n", + " 'id_1477': {'model': 'm1', 'sent_id': 20, 'speaker': '0014', 'accent': None},\n", + " 'id_1480': {'model': 'm1', 'sent_id': 21, 'speaker': '0014', 'accent': None},\n", + " 'id_1483': {'model': 'm2', 'sent_id': 22, 'speaker': '0014', 'accent': None},\n", + " 'id_1486': {'model': 'm3', 'sent_id': 23, 'speaker': '0014', 'accent': None},\n", + " 'id_1489': {'model': 'm1', 'sent_id': 24, 'speaker': '0014', 'accent': None},\n", + " 'id_1492': {'model': 'm2', 'sent_id': 25, 'speaker': '0014', 'accent': None},\n", + " 'id_1495': {'model': 'm2', 'sent_id': 26, 'speaker': '0014', 'accent': None},\n", + " 'id_1498': {'model': 'm2', 'sent_id': 27, 'speaker': '0014', 'accent': None},\n", + " 'id_1501': {'model': 'm1', 'sent_id': 28, 'speaker': '0014', 'accent': None},\n", + " 'id_1504': {'model': 'm1', 'sent_id': 29, 'speaker': '0014', 'accent': None},\n", + " 'id_1507': {'model': 'm3', 'sent_id': 3, 'speaker': '0014', 'accent': None},\n", + " 'id_1510': {'model': 'm1', 'sent_id': 30, 'speaker': '0014', 'accent': None},\n", + " 'id_1513': {'model': 'm2', 'sent_id': 4, 'speaker': '0014', 'accent': None},\n", + " 'id_1516': {'model': 'm2', 'sent_id': 5, 'speaker': '0014', 'accent': None},\n", + " 'id_1519': {'model': 'm2', 'sent_id': 6, 'speaker': '0014', 'accent': None},\n", + " 'id_1522': {'model': 'm3', 'sent_id': 7, 'speaker': '0014', 'accent': None},\n", + " 'id_1525': {'model': 'm1', 'sent_id': 8, 'speaker': '0014', 'accent': None},\n", + " 'id_1528': {'model': 'm2', 'sent_id': 9, 'speaker': '0014', 'accent': None},\n", + " 'id_1531': {'model': 'm1', 'sent_id': 1, 'speaker': '0014', 'accent': None},\n", + " 'id_1534': {'model': 'm1', 'sent_id': 10, 'speaker': '0014', 'accent': None},\n", + " 'id_1537': {'model': 'm1', 'sent_id': 11, 'speaker': '0014', 'accent': None},\n", + " 'id_1540': {'model': 'm3', 'sent_id': 12, 'speaker': '0014', 'accent': None},\n", + " 'id_1543': {'model': 'm3', 'sent_id': 13, 'speaker': '0014', 'accent': None},\n", + " 'id_1546': {'model': 'm1', 'sent_id': 14, 'speaker': '0014', 'accent': None},\n", + " 'id_1549': {'model': 'm1', 'sent_id': 15, 'speaker': '0014', 'accent': None},\n", + " 'id_1552': {'model': 'm3', 'sent_id': 16, 'speaker': '0014', 'accent': None},\n", + " 'id_1555': {'model': 'm2', 'sent_id': 17, 'speaker': '0014', 'accent': None},\n", + " 'id_1558': {'model': 'm2', 'sent_id': 18, 'speaker': '0014', 'accent': None},\n", + " 'id_1561': {'model': 'm1', 'sent_id': 19, 'speaker': '0014', 'accent': None},\n", + " 'id_1564': {'model': 'm3', 'sent_id': 2, 'speaker': '0014', 'accent': None},\n", + " 'id_1567': {'model': 'm3', 'sent_id': 20, 'speaker': '0014', 'accent': None},\n", + " 'id_1570': {'model': 'm3', 'sent_id': 21, 'speaker': '0014', 'accent': None},\n", + " 'id_1573': {'model': 'm2', 'sent_id': 22, 'speaker': '0014', 'accent': None},\n", + " 'id_1576': {'model': 'm1', 'sent_id': 23, 'speaker': '0014', 'accent': None},\n", + " 'id_1579': {'model': 'm3', 'sent_id': 24, 'speaker': '0014', 'accent': None},\n", + " 'id_1582': {'model': 'm3', 'sent_id': 25, 'speaker': '0014', 'accent': None},\n", + " 'id_1585': {'model': 'm1', 'sent_id': 26, 'speaker': '0014', 'accent': None},\n", + " 'id_1588': {'model': 'm2', 'sent_id': 27, 'speaker': '0014', 'accent': None},\n", + " 'id_1591': {'model': 'm1', 'sent_id': 28, 'speaker': '0014', 'accent': None},\n", + " 'id_1594': {'model': 'm1', 'sent_id': 29, 'speaker': '0014', 'accent': None},\n", + " 'id_1597': {'model': 'm1', 'sent_id': 3, 'speaker': '0014', 'accent': None},\n", + " 'id_1600': {'model': 'm2', 'sent_id': 30, 'speaker': '0014', 'accent': None},\n", + " 'id_1603': {'model': 'm3', 'sent_id': 4, 'speaker': '0014', 'accent': None},\n", + " 'id_1606': {'model': 'm3', 'sent_id': 5, 'speaker': '0014', 'accent': None},\n", + " 'id_1609': {'model': 'm1', 'sent_id': 6, 'speaker': '0014', 'accent': None},\n", + " 'id_1612': {'model': 'm1', 'sent_id': 7, 'speaker': '0014', 'accent': None},\n", + " 'id_1615': {'model': 'm3', 'sent_id': 8, 'speaker': '0014', 'accent': None},\n", + " 'id_1618': {'model': 'm2', 'sent_id': 9, 'speaker': '0014', 'accent': None},\n", + " 'id_1621': {'model': 'm2', 'sent_id': 1, 'speaker': '0014', 'accent': None},\n", + " 'id_1624': {'model': 'm1', 'sent_id': 10, 'speaker': '0014', 'accent': None},\n", + " 'id_1627': {'model': 'm1', 'sent_id': 11, 'speaker': '0014', 'accent': None},\n", + " 'id_1630': {'model': 'm2', 'sent_id': 12, 'speaker': '0014', 'accent': None},\n", + " 'id_1633': {'model': 'm1', 'sent_id': 13, 'speaker': '0014', 'accent': None},\n", + " 'id_1636': {'model': 'm1', 'sent_id': 14, 'speaker': '0014', 'accent': None},\n", + " 'id_1639': {'model': 'm2', 'sent_id': 15, 'speaker': '0014', 'accent': None},\n", + " 'id_1642': {'model': 'm2', 'sent_id': 16, 'speaker': '0014', 'accent': None},\n", + " 'id_1645': {'model': 'm1', 'sent_id': 17, 'speaker': '0014', 'accent': None},\n", + " 'id_1648': {'model': 'm2', 'sent_id': 18, 'speaker': '0014', 'accent': None},\n", + " 'id_1651': {'model': 'm3', 'sent_id': 19, 'speaker': '0014', 'accent': None},\n", + " 'id_1654': {'model': 'm1', 'sent_id': 2, 'speaker': '0014', 'accent': None},\n", + " 'id_1657': {'model': 'm2', 'sent_id': 20, 'speaker': '0014', 'accent': None},\n", + " 'id_1660': {'model': 'm2', 'sent_id': 21, 'speaker': '0014', 'accent': None},\n", + " 'id_1663': {'model': 'm2', 'sent_id': 22, 'speaker': '0014', 'accent': None},\n", + " 'id_1666': {'model': 'm1', 'sent_id': 23, 'speaker': '0014', 'accent': None},\n", + " 'id_1669': {'model': 'm3', 'sent_id': 24, 'speaker': '0014', 'accent': None},\n", + " 'id_1672': {'model': 'm3', 'sent_id': 25, 'speaker': '0014', 'accent': None},\n", + " 'id_1675': {'model': 'm1', 'sent_id': 26, 'speaker': '0014', 'accent': None},\n", + " 'id_1678': {'model': 'm1', 'sent_id': 27, 'speaker': '0014', 'accent': None},\n", + " 'id_1681': {'model': 'm2', 'sent_id': 28, 'speaker': '0014', 'accent': None},\n", + " 'id_1684': {'model': 'm1', 'sent_id': 29, 'speaker': '0014', 'accent': None},\n", + " 'id_1687': {'model': 'm2', 'sent_id': 3, 'speaker': '0014', 'accent': None},\n", + " 'id_1690': {'model': 'm2', 'sent_id': 30, 'speaker': '0014', 'accent': None},\n", + " 'id_1693': {'model': 'm2', 'sent_id': 4, 'speaker': '0014', 'accent': None},\n", + " 'id_1696': {'model': 'm1', 'sent_id': 5, 'speaker': '0014', 'accent': None},\n", + " 'id_1699': {'model': 'm2', 'sent_id': 6, 'speaker': '0014', 'accent': None},\n", + " 'id_1702': {'model': 'm1', 'sent_id': 7, 'speaker': '0014', 'accent': None},\n", + " 'id_1705': {'model': 'm3', 'sent_id': 8, 'speaker': '0014', 'accent': None},\n", + " 'id_1708': {'model': 'm3', 'sent_id': 9, 'speaker': '0014', 'accent': None},\n", + " 'id_1711': {'model': 'm1', 'sent_id': 1, 'speaker': '0014', 'accent': None},\n", + " 'id_1714': {'model': 'm3', 'sent_id': 10, 'speaker': '0014', 'accent': None},\n", + " 'id_1717': {'model': 'm1', 'sent_id': 11, 'speaker': '0014', 'accent': None},\n", + " 'id_1720': {'model': 'm1', 'sent_id': 12, 'speaker': '0014', 'accent': None},\n", + " 'id_1723': {'model': 'm2', 'sent_id': 13, 'speaker': '0014', 'accent': None},\n", + " 'id_1726': {'model': 'm3', 'sent_id': 14, 'speaker': '0014', 'accent': None},\n", + " 'id_1729': {'model': 'm2', 'sent_id': 15, 'speaker': '0014', 'accent': None},\n", + " 'id_1732': {'model': 'm1', 'sent_id': 16, 'speaker': '0014', 'accent': None},\n", + " 'id_1735': {'model': 'm3', 'sent_id': 17, 'speaker': '0014', 'accent': None},\n", + " 'id_1738': {'model': 'm2', 'sent_id': 18, 'speaker': '0014', 'accent': None},\n", + " 'id_1741': {'model': 'm1', 'sent_id': 19, 'speaker': '0014', 'accent': None},\n", + " 'id_1744': {'model': 'm3', 'sent_id': 2, 'speaker': '0014', 'accent': None},\n", + " 'id_1747': {'model': 'm2', 'sent_id': 20, 'speaker': '0014', 'accent': None},\n", + " 'id_1750': {'model': 'm2', 'sent_id': 21, 'speaker': '0014', 'accent': None},\n", + " 'id_1753': {'model': 'm1', 'sent_id': 22, 'speaker': '0014', 'accent': None},\n", + " 'id_1756': {'model': 'm2', 'sent_id': 23, 'speaker': '0014', 'accent': None},\n", + " 'id_1759': {'model': 'm3', 'sent_id': 24, 'speaker': '0014', 'accent': None},\n", + " 'id_1762': {'model': 'm1', 'sent_id': 25, 'speaker': '0014', 'accent': None},\n", + " 'id_1765': {'model': 'm3', 'sent_id': 26, 'speaker': '0014', 'accent': None},\n", + " 'id_1768': {'model': 'm2', 'sent_id': 27, 'speaker': '0014', 'accent': None},\n", + " 'id_1771': {'model': 'm2', 'sent_id': 28, 'speaker': '0014', 'accent': None},\n", + " 'id_1774': {'model': 'm3', 'sent_id': 29, 'speaker': '0014', 'accent': None},\n", + " 'id_1777': {'model': 'm2', 'sent_id': 3, 'speaker': '0014', 'accent': None},\n", + " 'id_1780': {'model': 'm3', 'sent_id': 30, 'speaker': '0014', 'accent': None},\n", + " 'id_1783': {'model': 'm2', 'sent_id': 4, 'speaker': '0014', 'accent': None},\n", + " 'id_1786': {'model': 'm2', 'sent_id': 5, 'speaker': '0014', 'accent': None},\n", + " 'id_1789': {'model': 'm2', 'sent_id': 6, 'speaker': '0014', 'accent': None},\n", + " 'id_1792': {'model': 'm3', 'sent_id': 7, 'speaker': '0014', 'accent': None},\n", + " 'id_1795': {'model': 'm1', 'sent_id': 8, 'speaker': '0014', 'accent': None},\n", + " 'id_1798': {'model': 'm2', 'sent_id': 9, 'speaker': '0014', 'accent': None},\n", + " 'id_1801': {'model': 'm2', 'sent_id': 1, 'speaker': '0015', 'accent': None},\n", + " 'id_1804': {'model': 'm1', 'sent_id': 10, 'speaker': '0015', 'accent': None},\n", + " 'id_1807': {'model': 'm2', 'sent_id': 11, 'speaker': '0015', 'accent': None},\n", + " 'id_1810': {'model': 'm1', 'sent_id': 12, 'speaker': '0015', 'accent': None},\n", + " 'id_1813': {'model': 'm3', 'sent_id': 13, 'speaker': '0015', 'accent': None},\n", + " 'id_1816': {'model': 'm3', 'sent_id': 14, 'speaker': '0015', 'accent': None},\n", + " 'id_1819': {'model': 'm3', 'sent_id': 15, 'speaker': '0015', 'accent': None},\n", + " 'id_1822': {'model': 'm1', 'sent_id': 16, 'speaker': '0015', 'accent': None},\n", + " 'id_1825': {'model': 'm2', 'sent_id': 17, 'speaker': '0015', 'accent': None},\n", + " 'id_1828': {'model': 'm1', 'sent_id': 18, 'speaker': '0015', 'accent': None},\n", + " 'id_1831': {'model': 'm3', 'sent_id': 19, 'speaker': '0015', 'accent': None},\n", + " 'id_1834': {'model': 'm3', 'sent_id': 2, 'speaker': '0015', 'accent': None},\n", + " 'id_1837': {'model': 'm1', 'sent_id': 20, 'speaker': '0015', 'accent': None},\n", + " 'id_1840': {'model': 'm2', 'sent_id': 21, 'speaker': '0015', 'accent': None},\n", + " 'id_1843': {'model': 'm1', 'sent_id': 22, 'speaker': '0015', 'accent': None},\n", + " 'id_1846': {'model': 'm1', 'sent_id': 23, 'speaker': '0015', 'accent': None},\n", + " 'id_1849': {'model': 'm1', 'sent_id': 24, 'speaker': '0015', 'accent': None},\n", + " 'id_1852': {'model': 'm2', 'sent_id': 25, 'speaker': '0015', 'accent': None},\n", + " 'id_1855': {'model': 'm3', 'sent_id': 26, 'speaker': '0015', 'accent': None},\n", + " 'id_1858': {'model': 'm3', 'sent_id': 27, 'speaker': '0015', 'accent': None},\n", + " 'id_1861': {'model': 'm2', 'sent_id': 28, 'speaker': '0015', 'accent': None},\n", + " 'id_1864': {'model': 'm1', 'sent_id': 29, 'speaker': '0015', 'accent': None},\n", + " 'id_1867': {'model': 'm1', 'sent_id': 3, 'speaker': '0015', 'accent': None},\n", + " 'id_1870': {'model': 'm1', 'sent_id': 30, 'speaker': '0015', 'accent': None},\n", + " 'id_1873': {'model': 'm3', 'sent_id': 4, 'speaker': '0015', 'accent': None},\n", + " 'id_1876': {'model': 'm1', 'sent_id': 5, 'speaker': '0015', 'accent': None},\n", + " 'id_1879': {'model': 'm3', 'sent_id': 6, 'speaker': '0015', 'accent': None},\n", + " 'id_1882': {'model': 'm1', 'sent_id': 7, 'speaker': '0015', 'accent': None},\n", + " 'id_1885': {'model': 'm3', 'sent_id': 8, 'speaker': '0015', 'accent': None},\n", + " 'id_1888': {'model': 'm2', 'sent_id': 9, 'speaker': '0015', 'accent': None},\n", + " 'id_1891': {'model': 'm1', 'sent_id': 1, 'speaker': '0015', 'accent': None},\n", + " 'id_1894': {'model': 'm1', 'sent_id': 10, 'speaker': '0015', 'accent': None},\n", + " 'id_1897': {'model': 'm1', 'sent_id': 11, 'speaker': '0015', 'accent': None},\n", + " 'id_1900': {'model': 'm2', 'sent_id': 12, 'speaker': '0015', 'accent': None},\n", + " 'id_1903': {'model': 'm3', 'sent_id': 13, 'speaker': '0015', 'accent': None},\n", + " 'id_1906': {'model': 'm2', 'sent_id': 14, 'speaker': '0015', 'accent': None},\n", + " 'id_1909': {'model': 'm3', 'sent_id': 15, 'speaker': '0015', 'accent': None},\n", + " 'id_1912': {'model': 'm1', 'sent_id': 16, 'speaker': '0015', 'accent': None},\n", + " 'id_1915': {'model': 'm3', 'sent_id': 17, 'speaker': '0015', 'accent': None},\n", + " 'id_1918': {'model': 'm1', 'sent_id': 18, 'speaker': '0015', 'accent': None},\n", + " 'id_1921': {'model': 'm2', 'sent_id': 19, 'speaker': '0015', 'accent': None},\n", + " 'id_1924': {'model': 'm1', 'sent_id': 2, 'speaker': '0015', 'accent': None},\n", + " 'id_1927': {'model': 'm3', 'sent_id': 20, 'speaker': '0015', 'accent': None},\n", + " 'id_1930': {'model': 'm3', 'sent_id': 21, 'speaker': '0015', 'accent': None},\n", + " 'id_1933': {'model': 'm1', 'sent_id': 22, 'speaker': '0015', 'accent': None},\n", + " 'id_1936': {'model': 'm3', 'sent_id': 23, 'speaker': '0015', 'accent': None},\n", + " 'id_1939': {'model': 'm2', 'sent_id': 24, 'speaker': '0015', 'accent': None},\n", + " 'id_1942': {'model': 'm3', 'sent_id': 25, 'speaker': '0015', 'accent': None},\n", + " 'id_1945': {'model': 'm3', 'sent_id': 26, 'speaker': '0015', 'accent': None},\n", + " 'id_1948': {'model': 'm2', 'sent_id': 27, 'speaker': '0015', 'accent': None},\n", + " 'id_1951': {'model': 'm3', 'sent_id': 28, 'speaker': '0015', 'accent': None},\n", + " 'id_1954': {'model': 'm2', 'sent_id': 29, 'speaker': '0015', 'accent': None},\n", + " 'id_1957': {'model': 'm3', 'sent_id': 3, 'speaker': '0015', 'accent': None},\n", + " 'id_1960': {'model': 'm2', 'sent_id': 30, 'speaker': '0015', 'accent': None},\n", + " 'id_1963': {'model': 'm2', 'sent_id': 4, 'speaker': '0015', 'accent': None},\n", + " 'id_1966': {'model': 'm3', 'sent_id': 5, 'speaker': '0015', 'accent': None},\n", + " 'id_1969': {'model': 'm1', 'sent_id': 6, 'speaker': '0015', 'accent': None},\n", + " 'id_1972': {'model': 'm1', 'sent_id': 7, 'speaker': '0015', 'accent': None},\n", + " 'id_1975': {'model': 'm3', 'sent_id': 8, 'speaker': '0015', 'accent': None},\n", + " 'id_1978': {'model': 'm1', 'sent_id': 9, 'speaker': '0015', 'accent': None},\n", + " 'id_1981': {'model': 'm1', 'sent_id': 1, 'speaker': '0015', 'accent': None},\n", + " 'id_1984': {'model': 'm2', 'sent_id': 10, 'speaker': '0015', 'accent': None},\n", + " 'id_1987': {'model': 'm1', 'sent_id': 11, 'speaker': '0015', 'accent': None},\n", + " 'id_1990': {'model': 'm1', 'sent_id': 12, 'speaker': '0015', 'accent': None},\n", + " 'id_1993': {'model': 'm1', 'sent_id': 13, 'speaker': '0015', 'accent': None},\n", + " 'id_1996': {'model': 'm2', 'sent_id': 14, 'speaker': '0015', 'accent': None},\n", + " 'id_1999': {'model': 'm3', 'sent_id': 15, 'speaker': '0015', 'accent': None},\n", + " 'id_2002': {'model': 'm1', 'sent_id': 16, 'speaker': '0015', 'accent': None},\n", + " 'id_2005': {'model': 'm2', 'sent_id': 17, 'speaker': '0015', 'accent': None},\n", + " 'id_2008': {'model': 'm2', 'sent_id': 18, 'speaker': '0015', 'accent': None},\n", + " 'id_2011': {'model': 'm1', 'sent_id': 19, 'speaker': '0015', 'accent': None},\n", + " 'id_2014': {'model': 'm1', 'sent_id': 2, 'speaker': '0015', 'accent': None},\n", + " 'id_2017': {'model': 'm1', 'sent_id': 20, 'speaker': '0015', 'accent': None},\n", + " 'id_2020': {'model': 'm1', 'sent_id': 21, 'speaker': '0015', 'accent': None},\n", + " 'id_2023': {'model': 'm1', 'sent_id': 22, 'speaker': '0015', 'accent': None},\n", + " 'id_2026': {'model': 'm2', 'sent_id': 23, 'speaker': '0015', 'accent': None},\n", + " 'id_2029': {'model': 'm1', 'sent_id': 24, 'speaker': '0015', 'accent': None},\n", + " 'id_2032': {'model': 'm2', 'sent_id': 25, 'speaker': '0015', 'accent': None},\n", + " 'id_2035': {'model': 'm3', 'sent_id': 26, 'speaker': '0015', 'accent': None},\n", + " 'id_2038': {'model': 'm3', 'sent_id': 27, 'speaker': '0015', 'accent': None},\n", + " 'id_2041': {'model': 'm3', 'sent_id': 28, 'speaker': '0015', 'accent': None},\n", + " 'id_2044': {'model': 'm1', 'sent_id': 29, 'speaker': '0015', 'accent': None},\n", + " 'id_2047': {'model': 'm2', 'sent_id': 3, 'speaker': '0015', 'accent': None},\n", + " 'id_2050': {'model': 'm1', 'sent_id': 30, 'speaker': '0015', 'accent': None},\n", + " 'id_2053': {'model': 'm2', 'sent_id': 4, 'speaker': '0015', 'accent': None},\n", + " 'id_2056': {'model': 'm2', 'sent_id': 5, 'speaker': '0015', 'accent': None},\n", + " 'id_2059': {'model': 'm3', 'sent_id': 6, 'speaker': '0015', 'accent': None},\n", + " 'id_2062': {'model': 'm2', 'sent_id': 7, 'speaker': '0015', 'accent': None},\n", + " 'id_2065': {'model': 'm1', 'sent_id': 8, 'speaker': '0015', 'accent': None},\n", + " 'id_2068': {'model': 'm2', 'sent_id': 9, 'speaker': '0015', 'accent': None},\n", + " 'id_2071': {'model': 'm2', 'sent_id': 1, 'speaker': '0015', 'accent': None},\n", + " 'id_2074': {'model': 'm1', 'sent_id': 10, 'speaker': '0015', 'accent': None},\n", + " 'id_2077': {'model': 'm3', 'sent_id': 11, 'speaker': '0015', 'accent': None},\n", + " 'id_2080': {'model': 'm3', 'sent_id': 12, 'speaker': '0015', 'accent': None},\n", + " 'id_2083': {'model': 'm2', 'sent_id': 13, 'speaker': '0015', 'accent': None},\n", + " 'id_2086': {'model': 'm1', 'sent_id': 14, 'speaker': '0015', 'accent': None},\n", + " 'id_2089': {'model': 'm1', 'sent_id': 15, 'speaker': '0015', 'accent': None},\n", + " 'id_2092': {'model': 'm2', 'sent_id': 16, 'speaker': '0015', 'accent': None},\n", + " 'id_2095': {'model': 'm2', 'sent_id': 17, 'speaker': '0015', 'accent': None},\n", + " 'id_2098': {'model': 'm2', 'sent_id': 18, 'speaker': '0015', 'accent': None},\n", + " 'id_2101': {'model': 'm3', 'sent_id': 19, 'speaker': '0015', 'accent': None},\n", + " 'id_2104': {'model': 'm1', 'sent_id': 2, 'speaker': '0015', 'accent': None},\n", + " 'id_2107': {'model': 'm3', 'sent_id': 20, 'speaker': '0015', 'accent': None},\n", + " 'id_2110': {'model': 'm2', 'sent_id': 21, 'speaker': '0015', 'accent': None},\n", + " 'id_2113': {'model': 'm2', 'sent_id': 22, 'speaker': '0015', 'accent': None},\n", + " 'id_2116': {'model': 'm1', 'sent_id': 23, 'speaker': '0015', 'accent': None},\n", + " 'id_2119': {'model': 'm3', 'sent_id': 24, 'speaker': '0015', 'accent': None},\n", + " 'id_2122': {'model': 'm1', 'sent_id': 25, 'speaker': '0015', 'accent': None},\n", + " 'id_2125': {'model': 'm1', 'sent_id': 26, 'speaker': '0015', 'accent': None},\n", + " 'id_2128': {'model': 'm2', 'sent_id': 27, 'speaker': '0015', 'accent': None},\n", + " 'id_2131': {'model': 'm2', 'sent_id': 28, 'speaker': '0015', 'accent': None},\n", + " 'id_2134': {'model': 'm1', 'sent_id': 29, 'speaker': '0015', 'accent': None},\n", + " 'id_2137': {'model': 'm2', 'sent_id': 3, 'speaker': '0015', 'accent': None},\n", + " 'id_2140': {'model': 'm3', 'sent_id': 30, 'speaker': '0015', 'accent': None},\n", + " 'id_2143': {'model': 'm1', 'sent_id': 4, 'speaker': '0015', 'accent': None},\n", + " 'id_2146': {'model': 'm1', 'sent_id': 5, 'speaker': '0015', 'accent': None},\n", + " 'id_2149': {'model': 'm2', 'sent_id': 6, 'speaker': '0015', 'accent': None},\n", + " 'id_2152': {'model': 'm2', 'sent_id': 7, 'speaker': '0015', 'accent': None},\n", + " 'id_2155': {'model': 'm1', 'sent_id': 8, 'speaker': '0015', 'accent': None},\n", + " 'id_2158': {'model': 'm2', 'sent_id': 9, 'speaker': '0015', 'accent': None},\n", + " 'id_2161': {'model': 'm1', 'sent_id': 1, 'speaker': '0015', 'accent': None},\n", + " 'id_2164': {'model': 'm2', 'sent_id': 10, 'speaker': '0015', 'accent': None},\n", + " 'id_2167': {'model': 'm3', 'sent_id': 11, 'speaker': '0015', 'accent': None},\n", + " 'id_2170': {'model': 'm2', 'sent_id': 12, 'speaker': '0015', 'accent': None},\n", + " 'id_2173': {'model': 'm1', 'sent_id': 13, 'speaker': '0015', 'accent': None},\n", + " 'id_2176': {'model': 'm3', 'sent_id': 14, 'speaker': '0015', 'accent': None},\n", + " 'id_2179': {'model': 'm1', 'sent_id': 15, 'speaker': '0015', 'accent': None},\n", + " 'id_2182': {'model': 'm3', 'sent_id': 16, 'speaker': '0015', 'accent': None},\n", + " 'id_2185': {'model': 'm1', 'sent_id': 17, 'speaker': '0015', 'accent': None},\n", + " 'id_2188': {'model': 'm1', 'sent_id': 18, 'speaker': '0015', 'accent': None},\n", + " 'id_2191': {'model': 'm2', 'sent_id': 19, 'speaker': '0015', 'accent': None},\n", + " 'id_2194': {'model': 'm2', 'sent_id': 2, 'speaker': '0015', 'accent': None},\n", + " 'id_2197': {'model': 'm2', 'sent_id': 20, 'speaker': '0015', 'accent': None},\n", + " 'id_2200': {'model': 'm1', 'sent_id': 21, 'speaker': '0015', 'accent': None},\n", + " 'id_2203': {'model': 'm3', 'sent_id': 22, 'speaker': '0015', 'accent': None},\n", + " 'id_2206': {'model': 'm2', 'sent_id': 23, 'speaker': '0015', 'accent': None},\n", + " 'id_2209': {'model': 'm2', 'sent_id': 24, 'speaker': '0015', 'accent': None},\n", + " 'id_2212': {'model': 'm3', 'sent_id': 25, 'speaker': '0015', 'accent': None},\n", + " 'id_2215': {'model': 'm3', 'sent_id': 26, 'speaker': '0015', 'accent': None},\n", + " 'id_2218': {'model': 'm2', 'sent_id': 27, 'speaker': '0015', 'accent': None},\n", + " 'id_2221': {'model': 'm2', 'sent_id': 28, 'speaker': '0015', 'accent': None},\n", + " 'id_2224': {'model': 'm3', 'sent_id': 29, 'speaker': '0015', 'accent': None},\n", + " 'id_2227': {'model': 'm2', 'sent_id': 3, 'speaker': '0015', 'accent': None},\n", + " 'id_2230': {'model': 'm3', 'sent_id': 30, 'speaker': '0015', 'accent': None},\n", + " 'id_2233': {'model': 'm2', 'sent_id': 4, 'speaker': '0015', 'accent': None},\n", + " 'id_2236': {'model': 'm2', 'sent_id': 5, 'speaker': '0015', 'accent': None},\n", + " 'id_2239': {'model': 'm3', 'sent_id': 6, 'speaker': '0015', 'accent': None},\n", + " 'id_2242': {'model': 'm1', 'sent_id': 7, 'speaker': '0015', 'accent': None},\n", + " 'id_2245': {'model': 'm1', 'sent_id': 8, 'speaker': '0015', 'accent': None},\n", + " 'id_2248': {'model': 'm2', 'sent_id': 9, 'speaker': '0015', 'accent': None},\n", + " 'id_2251': {'model': 'm2', 'sent_id': 1, 'speaker': '0016', 'accent': None},\n", + " 'id_2254': {'model': 'm3', 'sent_id': 10, 'speaker': '0016', 'accent': None},\n", + " 'id_2257': {'model': 'm1', 'sent_id': 11, 'speaker': '0016', 'accent': None},\n", + " 'id_2260': {'model': 'm1', 'sent_id': 12, 'speaker': '0016', 'accent': None},\n", + " 'id_2263': {'model': 'm1', 'sent_id': 13, 'speaker': '0016', 'accent': None},\n", + " 'id_2266': {'model': 'm3', 'sent_id': 14, 'speaker': '0016', 'accent': None},\n", + " 'id_2269': {'model': 'm1', 'sent_id': 15, 'speaker': '0016', 'accent': None},\n", + " 'id_2272': {'model': 'm3', 'sent_id': 16, 'speaker': '0016', 'accent': None},\n", + " 'id_2275': {'model': 'm1', 'sent_id': 17, 'speaker': '0016', 'accent': None},\n", + " 'id_2278': {'model': 'm1', 'sent_id': 18, 'speaker': '0016', 'accent': None},\n", + " 'id_2281': {'model': 'm2', 'sent_id': 19, 'speaker': '0016', 'accent': None},\n", + " 'id_2284': {'model': 'm2', 'sent_id': 2, 'speaker': '0016', 'accent': None},\n", + " 'id_2287': {'model': 'm3', 'sent_id': 20, 'speaker': '0016', 'accent': None},\n", + " 'id_2290': {'model': 'm2', 'sent_id': 21, 'speaker': '0016', 'accent': None},\n", + " 'id_2293': {'model': 'm2', 'sent_id': 22, 'speaker': '0016', 'accent': None},\n", + " 'id_2296': {'model': 'm2', 'sent_id': 23, 'speaker': '0016', 'accent': None},\n", + " 'id_2299': {'model': 'm2', 'sent_id': 24, 'speaker': '0016', 'accent': None},\n", + " 'id_2302': {'model': 'm1', 'sent_id': 25, 'speaker': '0016', 'accent': None},\n", + " 'id_2305': {'model': 'm1', 'sent_id': 26, 'speaker': '0016', 'accent': None},\n", + " 'id_2308': {'model': 'm3', 'sent_id': 27, 'speaker': '0016', 'accent': None},\n", + " 'id_2311': {'model': 'm2', 'sent_id': 28, 'speaker': '0016', 'accent': None},\n", + " 'id_2314': {'model': 'm2', 'sent_id': 29, 'speaker': '0016', 'accent': None},\n", + " 'id_2317': {'model': 'm2', 'sent_id': 3, 'speaker': '0016', 'accent': None},\n", + " 'id_2320': {'model': 'm1', 'sent_id': 30, 'speaker': '0016', 'accent': None},\n", + " 'id_2323': {'model': 'm1', 'sent_id': 4, 'speaker': '0016', 'accent': None},\n", + " 'id_2326': {'model': 'm2', 'sent_id': 5, 'speaker': '0016', 'accent': None},\n", + " 'id_2329': {'model': 'm1', 'sent_id': 6, 'speaker': '0016', 'accent': None},\n", + " 'id_2332': {'model': 'm2', 'sent_id': 7, 'speaker': '0016', 'accent': None},\n", + " 'id_2335': {'model': 'm1', 'sent_id': 8, 'speaker': '0016', 'accent': None},\n", + " 'id_2338': {'model': 'm2', 'sent_id': 9, 'speaker': '0016', 'accent': None},\n", + " 'id_2341': {'model': 'm3', 'sent_id': 1, 'speaker': '0016', 'accent': None},\n", + " 'id_2344': {'model': 'm2', 'sent_id': 10, 'speaker': '0016', 'accent': None},\n", + " 'id_2347': {'model': 'm3', 'sent_id': 11, 'speaker': '0016', 'accent': None},\n", + " 'id_2350': {'model': 'm2', 'sent_id': 12, 'speaker': '0016', 'accent': None},\n", + " 'id_2353': {'model': 'm1', 'sent_id': 13, 'speaker': '0016', 'accent': None},\n", + " 'id_2356': {'model': 'm3', 'sent_id': 14, 'speaker': '0016', 'accent': None},\n", + " 'id_2359': {'model': 'm1', 'sent_id': 15, 'speaker': '0016', 'accent': None},\n", + " 'id_2362': {'model': 'm2', 'sent_id': 16, 'speaker': '0016', 'accent': None},\n", + " 'id_2365': {'model': 'm1', 'sent_id': 17, 'speaker': '0016', 'accent': None},\n", + " 'id_2368': {'model': 'm3', 'sent_id': 18, 'speaker': '0016', 'accent': None},\n", + " 'id_2371': {'model': 'm2', 'sent_id': 19, 'speaker': '0016', 'accent': None},\n", + " 'id_2374': {'model': 'm3', 'sent_id': 2, 'speaker': '0016', 'accent': None},\n", + " 'id_2377': {'model': 'm3', 'sent_id': 20, 'speaker': '0016', 'accent': None},\n", + " 'id_2380': {'model': 'm3', 'sent_id': 21, 'speaker': '0016', 'accent': None},\n", + " 'id_2383': {'model': 'm1', 'sent_id': 22, 'speaker': '0016', 'accent': None},\n", + " 'id_2386': {'model': 'm1', 'sent_id': 23, 'speaker': '0016', 'accent': None},\n", + " 'id_2389': {'model': 'm2', 'sent_id': 24, 'speaker': '0016', 'accent': None},\n", + " 'id_2392': {'model': 'm3', 'sent_id': 25, 'speaker': '0016', 'accent': None},\n", + " 'id_2395': {'model': 'm2', 'sent_id': 26, 'speaker': '0016', 'accent': None},\n", + " 'id_2398': {'model': 'm2', 'sent_id': 27, 'speaker': '0016', 'accent': None},\n", + " 'id_2401': {'model': 'm3', 'sent_id': 28, 'speaker': '0016', 'accent': None},\n", + " 'id_2404': {'model': 'm3', 'sent_id': 29, 'speaker': '0016', 'accent': None},\n", + " 'id_2407': {'model': 'm2', 'sent_id': 3, 'speaker': '0016', 'accent': None},\n", + " 'id_2410': {'model': 'm3', 'sent_id': 30, 'speaker': '0016', 'accent': None},\n", + " 'id_2413': {'model': 'm2', 'sent_id': 4, 'speaker': '0016', 'accent': None},\n", + " 'id_2416': {'model': 'm2', 'sent_id': 5, 'speaker': '0016', 'accent': None},\n", + " 'id_2419': {'model': 'm3', 'sent_id': 6, 'speaker': '0016', 'accent': None},\n", + " 'id_2422': {'model': 'm2', 'sent_id': 7, 'speaker': '0016', 'accent': None},\n", + " 'id_2425': {'model': 'm3', 'sent_id': 8, 'speaker': '0016', 'accent': None},\n", + " 'id_2428': {'model': 'm2', 'sent_id': 9, 'speaker': '0016', 'accent': None},\n", + " 'id_2431': {'model': 'm3', 'sent_id': 1, 'speaker': '0016', 'accent': None},\n", + " 'id_2434': {'model': 'm3', 'sent_id': 10, 'speaker': '0016', 'accent': None},\n", + " 'id_2437': {'model': 'm3', 'sent_id': 11, 'speaker': '0016', 'accent': None},\n", + " 'id_2440': {'model': 'm1', 'sent_id': 12, 'speaker': '0016', 'accent': None},\n", + " 'id_2443': {'model': 'm1', 'sent_id': 13, 'speaker': '0016', 'accent': None},\n", + " 'id_2446': {'model': 'm3', 'sent_id': 14, 'speaker': '0016', 'accent': None},\n", + " 'id_2449': {'model': 'm3', 'sent_id': 15, 'speaker': '0016', 'accent': None},\n", + " 'id_2452': {'model': 'm3', 'sent_id': 16, 'speaker': '0016', 'accent': None},\n", + " 'id_2455': {'model': 'm2', 'sent_id': 17, 'speaker': '0016', 'accent': None},\n", + " 'id_2458': {'model': 'm3', 'sent_id': 18, 'speaker': '0016', 'accent': None},\n", + " 'id_2461': {'model': 'm1', 'sent_id': 19, 'speaker': '0016', 'accent': None},\n", + " 'id_2464': {'model': 'm1', 'sent_id': 2, 'speaker': '0016', 'accent': None},\n", + " 'id_2467': {'model': 'm3', 'sent_id': 20, 'speaker': '0016', 'accent': None},\n", + " 'id_2470': {'model': 'm1', 'sent_id': 21, 'speaker': '0016', 'accent': None},\n", + " 'id_2473': {'model': 'm1', 'sent_id': 22, 'speaker': '0016', 'accent': None},\n", + " 'id_2476': {'model': 'm2', 'sent_id': 23, 'speaker': '0016', 'accent': None},\n", + " 'id_2479': {'model': 'm2', 'sent_id': 24, 'speaker': '0016', 'accent': None},\n", + " 'id_2482': {'model': 'm3', 'sent_id': 25, 'speaker': '0016', 'accent': None},\n", + " 'id_2485': {'model': 'm2', 'sent_id': 26, 'speaker': '0016', 'accent': None},\n", + " 'id_2488': {'model': 'm3', 'sent_id': 27, 'speaker': '0016', 'accent': None},\n", + " 'id_2491': {'model': 'm1', 'sent_id': 28, 'speaker': '0016', 'accent': None},\n", + " 'id_2494': {'model': 'm1', 'sent_id': 29, 'speaker': '0016', 'accent': None},\n", + " 'id_2497': {'model': 'm2', 'sent_id': 3, 'speaker': '0016', 'accent': None},\n", + " 'id_2500': {'model': 'm3', 'sent_id': 30, 'speaker': '0016', 'accent': None},\n", + " 'id_2503': {'model': 'm1', 'sent_id': 4, 'speaker': '0016', 'accent': None},\n", + " 'id_2506': {'model': 'm1', 'sent_id': 5, 'speaker': '0016', 'accent': None},\n", + " 'id_2509': {'model': 'm1', 'sent_id': 6, 'speaker': '0016', 'accent': None},\n", + " 'id_2512': {'model': 'm2', 'sent_id': 7, 'speaker': '0016', 'accent': None},\n", + " 'id_2515': {'model': 'm2', 'sent_id': 8, 'speaker': '0016', 'accent': None},\n", + " 'id_2518': {'model': 'm3', 'sent_id': 9, 'speaker': '0016', 'accent': None},\n", + " 'id_2521': {'model': 'm1', 'sent_id': 1, 'speaker': '0016', 'accent': None},\n", + " 'id_2524': {'model': 'm1', 'sent_id': 10, 'speaker': '0016', 'accent': None},\n", + " 'id_2527': {'model': 'm2', 'sent_id': 11, 'speaker': '0016', 'accent': None},\n", + " 'id_2530': {'model': 'm2', 'sent_id': 12, 'speaker': '0016', 'accent': None},\n", + " 'id_2533': {'model': 'm1', 'sent_id': 13, 'speaker': '0016', 'accent': None},\n", + " 'id_2536': {'model': 'm1', 'sent_id': 14, 'speaker': '0016', 'accent': None},\n", + " 'id_2539': {'model': 'm3', 'sent_id': 15, 'speaker': '0016', 'accent': None},\n", + " 'id_2542': {'model': 'm3', 'sent_id': 16, 'speaker': '0016', 'accent': None},\n", + " 'id_2545': {'model': 'm1', 'sent_id': 17, 'speaker': '0016', 'accent': None},\n", + " 'id_2548': {'model': 'm2', 'sent_id': 18, 'speaker': '0016', 'accent': None},\n", + " 'id_2551': {'model': 'm3', 'sent_id': 19, 'speaker': '0016', 'accent': None},\n", + " 'id_2554': {'model': 'm3', 'sent_id': 2, 'speaker': '0016', 'accent': None},\n", + " 'id_2557': {'model': 'm3', 'sent_id': 20, 'speaker': '0016', 'accent': None},\n", + " 'id_2560': {'model': 'm3', 'sent_id': 21, 'speaker': '0016', 'accent': None},\n", + " 'id_2563': {'model': 'm3', 'sent_id': 22, 'speaker': '0016', 'accent': None},\n", + " 'id_2566': {'model': 'm2', 'sent_id': 23, 'speaker': '0016', 'accent': None},\n", + " 'id_2569': {'model': 'm2', 'sent_id': 24, 'speaker': '0016', 'accent': None},\n", + " 'id_2572': {'model': 'm3', 'sent_id': 25, 'speaker': '0016', 'accent': None},\n", + " 'id_2575': {'model': 'm2', 'sent_id': 26, 'speaker': '0016', 'accent': None},\n", + " 'id_2578': {'model': 'm1', 'sent_id': 27, 'speaker': '0016', 'accent': None},\n", + " 'id_2581': {'model': 'm1', 'sent_id': 28, 'speaker': '0016', 'accent': None},\n", + " 'id_2584': {'model': 'm3', 'sent_id': 29, 'speaker': '0016', 'accent': None},\n", + " 'id_2587': {'model': 'm2', 'sent_id': 3, 'speaker': '0016', 'accent': None},\n", + " 'id_2590': {'model': 'm2', 'sent_id': 30, 'speaker': '0016', 'accent': None},\n", + " 'id_2593': {'model': 'm3', 'sent_id': 4, 'speaker': '0016', 'accent': None},\n", + " 'id_2596': {'model': 'm3', 'sent_id': 5, 'speaker': '0016', 'accent': None},\n", + " 'id_2599': {'model': 'm1', 'sent_id': 6, 'speaker': '0016', 'accent': None},\n", + " 'id_2602': {'model': 'm2', 'sent_id': 7, 'speaker': '0016', 'accent': None},\n", + " 'id_2605': {'model': 'm2', 'sent_id': 8, 'speaker': '0016', 'accent': None},\n", + " 'id_2608': {'model': 'm3', 'sent_id': 9, 'speaker': '0016', 'accent': None},\n", + " 'id_2611': {'model': 'm1', 'sent_id': 1, 'speaker': '0016', 'accent': None},\n", + " 'id_2614': {'model': 'm2', 'sent_id': 10, 'speaker': '0016', 'accent': None},\n", + " 'id_2617': {'model': 'm2', 'sent_id': 11, 'speaker': '0016', 'accent': None},\n", + " 'id_2620': {'model': 'm2', 'sent_id': 12, 'speaker': '0016', 'accent': None},\n", + " 'id_2623': {'model': 'm1', 'sent_id': 13, 'speaker': '0016', 'accent': None},\n", + " 'id_2626': {'model': 'm2', 'sent_id': 14, 'speaker': '0016', 'accent': None},\n", + " 'id_2629': {'model': 'm3', 'sent_id': 15, 'speaker': '0016', 'accent': None},\n", + " 'id_2632': {'model': 'm2', 'sent_id': 16, 'speaker': '0016', 'accent': None},\n", + " 'id_2635': {'model': 'm2', 'sent_id': 17, 'speaker': '0016', 'accent': None},\n", + " 'id_2638': {'model': 'm1', 'sent_id': 18, 'speaker': '0016', 'accent': None},\n", + " 'id_2641': {'model': 'm2', 'sent_id': 19, 'speaker': '0016', 'accent': None},\n", + " 'id_2644': {'model': 'm1', 'sent_id': 2, 'speaker': '0016', 'accent': None},\n", + " 'id_2647': {'model': 'm2', 'sent_id': 20, 'speaker': '0016', 'accent': None},\n", + " 'id_2650': {'model': 'm3', 'sent_id': 21, 'speaker': '0016', 'accent': None},\n", + " 'id_2653': {'model': 'm1', 'sent_id': 22, 'speaker': '0016', 'accent': None},\n", + " 'id_2656': {'model': 'm2', 'sent_id': 23, 'speaker': '0016', 'accent': None},\n", + " 'id_2659': {'model': 'm3', 'sent_id': 24, 'speaker': '0016', 'accent': None},\n", + " 'id_2662': {'model': 'm3', 'sent_id': 25, 'speaker': '0016', 'accent': None},\n", + " 'id_2665': {'model': 'm1', 'sent_id': 26, 'speaker': '0016', 'accent': None},\n", + " 'id_2668': {'model': 'm2', 'sent_id': 27, 'speaker': '0016', 'accent': None},\n", + " 'id_2671': {'model': 'm2', 'sent_id': 28, 'speaker': '0016', 'accent': None},\n", + " 'id_2674': {'model': 'm3', 'sent_id': 29, 'speaker': '0016', 'accent': None},\n", + " 'id_2677': {'model': 'm1', 'sent_id': 3, 'speaker': '0016', 'accent': None},\n", + " 'id_2680': {'model': 'm3', 'sent_id': 30, 'speaker': '0016', 'accent': None},\n", + " 'id_2683': {'model': 'm2', 'sent_id': 4, 'speaker': '0016', 'accent': None},\n", + " 'id_2686': {'model': 'm1', 'sent_id': 5, 'speaker': '0016', 'accent': None},\n", + " 'id_2689': {'model': 'm1', 'sent_id': 6, 'speaker': '0016', 'accent': None},\n", + " 'id_2692': {'model': 'm2', 'sent_id': 7, 'speaker': '0016', 'accent': None},\n", + " 'id_2695': {'model': 'm2', 'sent_id': 8, 'speaker': '0016', 'accent': None},\n", + " 'id_2698': {'model': 'm1', 'sent_id': 9, 'speaker': '0016', 'accent': None},\n", + " 'id_2701': {'model': 'm1', 'sent_id': 1, 'speaker': '0017', 'accent': None},\n", + " 'id_2704': {'model': 'm2', 'sent_id': 10, 'speaker': '0017', 'accent': None},\n", + " 'id_2707': {'model': 'm3', 'sent_id': 11, 'speaker': '0017', 'accent': None},\n", + " 'id_2710': {'model': 'm1', 'sent_id': 12, 'speaker': '0017', 'accent': None},\n", + " 'id_2713': {'model': 'm1', 'sent_id': 13, 'speaker': '0017', 'accent': None},\n", + " 'id_2716': {'model': 'm3', 'sent_id': 14, 'speaker': '0017', 'accent': None},\n", + " 'id_2719': {'model': 'm3', 'sent_id': 15, 'speaker': '0017', 'accent': None},\n", + " 'id_2722': {'model': 'm3', 'sent_id': 16, 'speaker': '0017', 'accent': None},\n", + " 'id_2725': {'model': 'm2', 'sent_id': 17, 'speaker': '0017', 'accent': None},\n", + " 'id_2728': {'model': 'm3', 'sent_id': 18, 'speaker': '0017', 'accent': None},\n", + " 'id_2731': {'model': 'm2', 'sent_id': 19, 'speaker': '0017', 'accent': None},\n", + " 'id_2734': {'model': 'm1', 'sent_id': 2, 'speaker': '0017', 'accent': None},\n", + " 'id_2737': {'model': 'm3', 'sent_id': 20, 'speaker': '0017', 'accent': None},\n", + " 'id_2740': {'model': 'm3', 'sent_id': 21, 'speaker': '0017', 'accent': None},\n", + " 'id_2743': {'model': 'm1', 'sent_id': 22, 'speaker': '0017', 'accent': None},\n", + " 'id_2746': {'model': 'm3', 'sent_id': 23, 'speaker': '0017', 'accent': None},\n", + " 'id_2749': {'model': 'm2', 'sent_id': 24, 'speaker': '0017', 'accent': None},\n", + " 'id_2752': {'model': 'm3', 'sent_id': 25, 'speaker': '0017', 'accent': None},\n", + " 'id_2755': {'model': 'm3', 'sent_id': 26, 'speaker': '0017', 'accent': None},\n", + " 'id_2758': {'model': 'm3', 'sent_id': 27, 'speaker': '0017', 'accent': None},\n", + " 'id_2761': {'model': 'm2', 'sent_id': 28, 'speaker': '0017', 'accent': None},\n", + " 'id_2764': {'model': 'm1', 'sent_id': 29, 'speaker': '0017', 'accent': None},\n", + " 'id_2767': {'model': 'm3', 'sent_id': 3, 'speaker': '0017', 'accent': None},\n", + " 'id_2770': {'model': 'm3', 'sent_id': 30, 'speaker': '0017', 'accent': None},\n", + " 'id_2773': {'model': 'm2', 'sent_id': 4, 'speaker': '0017', 'accent': None},\n", + " 'id_2776': {'model': 'm1', 'sent_id': 5, 'speaker': '0017', 'accent': None},\n", + " 'id_2779': {'model': 'm3', 'sent_id': 6, 'speaker': '0017', 'accent': None},\n", + " 'id_2782': {'model': 'm2', 'sent_id': 7, 'speaker': '0017', 'accent': None},\n", + " 'id_2785': {'model': 'm1', 'sent_id': 8, 'speaker': '0017', 'accent': None},\n", + " 'id_2788': {'model': 'm2', 'sent_id': 9, 'speaker': '0017', 'accent': None},\n", + " 'id_2791': {'model': 'm1', 'sent_id': 1, 'speaker': '0017', 'accent': None},\n", + " 'id_2794': {'model': 'm3', 'sent_id': 10, 'speaker': '0017', 'accent': None},\n", + " 'id_2797': {'model': 'm1', 'sent_id': 11, 'speaker': '0017', 'accent': None},\n", + " 'id_2800': {'model': 'm2', 'sent_id': 12, 'speaker': '0017', 'accent': None},\n", + " 'id_2803': {'model': 'm1', 'sent_id': 13, 'speaker': '0017', 'accent': None},\n", + " 'id_2806': {'model': 'm3', 'sent_id': 14, 'speaker': '0017', 'accent': None},\n", + " 'id_2809': {'model': 'm3', 'sent_id': 15, 'speaker': '0017', 'accent': None},\n", + " 'id_2812': {'model': 'm1', 'sent_id': 16, 'speaker': '0017', 'accent': None},\n", + " 'id_2815': {'model': 'm1', 'sent_id': 17, 'speaker': '0017', 'accent': None},\n", + " 'id_2818': {'model': 'm1', 'sent_id': 18, 'speaker': '0017', 'accent': None},\n", + " 'id_2821': {'model': 'm1', 'sent_id': 19, 'speaker': '0017', 'accent': None},\n", + " 'id_2824': {'model': 'm3', 'sent_id': 2, 'speaker': '0017', 'accent': None},\n", + " 'id_2827': {'model': 'm2', 'sent_id': 20, 'speaker': '0017', 'accent': None},\n", + " 'id_2830': {'model': 'm2', 'sent_id': 21, 'speaker': '0017', 'accent': None},\n", + " 'id_2833': {'model': 'm3', 'sent_id': 22, 'speaker': '0017', 'accent': None},\n", + " 'id_2836': {'model': 'm2', 'sent_id': 23, 'speaker': '0017', 'accent': None},\n", + " 'id_2839': {'model': 'm2', 'sent_id': 24, 'speaker': '0017', 'accent': None},\n", + " 'id_2842': {'model': 'm3', 'sent_id': 25, 'speaker': '0017', 'accent': None},\n", + " 'id_2845': {'model': 'm2', 'sent_id': 26, 'speaker': '0017', 'accent': None},\n", + " 'id_2848': {'model': 'm2', 'sent_id': 27, 'speaker': '0017', 'accent': None},\n", + " 'id_2851': {'model': 'm1', 'sent_id': 28, 'speaker': '0017', 'accent': None},\n", + " 'id_2854': {'model': 'm3', 'sent_id': 29, 'speaker': '0017', 'accent': None},\n", + " 'id_2857': {'model': 'm1', 'sent_id': 3, 'speaker': '0017', 'accent': None},\n", + " 'id_2860': {'model': 'm3', 'sent_id': 30, 'speaker': '0017', 'accent': None},\n", + " 'id_2863': {'model': 'm1', 'sent_id': 4, 'speaker': '0017', 'accent': None},\n", + " 'id_2866': {'model': 'm2', 'sent_id': 5, 'speaker': '0017', 'accent': None},\n", + " 'id_2869': {'model': 'm3', 'sent_id': 6, 'speaker': '0017', 'accent': None},\n", + " 'id_2872': {'model': 'm2', 'sent_id': 7, 'speaker': '0017', 'accent': None},\n", + " 'id_2875': {'model': 'm1', 'sent_id': 8, 'speaker': '0017', 'accent': None},\n", + " 'id_2878': {'model': 'm2', 'sent_id': 9, 'speaker': '0017', 'accent': None},\n", + " 'id_2881': {'model': 'm1', 'sent_id': 1, 'speaker': '0017', 'accent': None},\n", + " 'id_2884': {'model': 'm2', 'sent_id': 10, 'speaker': '0017', 'accent': None},\n", + " 'id_2887': {'model': 'm1', 'sent_id': 11, 'speaker': '0017', 'accent': None},\n", + " 'id_2890': {'model': 'm3', 'sent_id': 12, 'speaker': '0017', 'accent': None},\n", + " 'id_2893': {'model': 'm3', 'sent_id': 13, 'speaker': '0017', 'accent': None},\n", + " 'id_2896': {'model': 'm3', 'sent_id': 14, 'speaker': '0017', 'accent': None},\n", + " 'id_2899': {'model': 'm3', 'sent_id': 15, 'speaker': '0017', 'accent': None},\n", + " 'id_2902': {'model': 'm1', 'sent_id': 16, 'speaker': '0017', 'accent': None},\n", + " 'id_2905': {'model': 'm2', 'sent_id': 17, 'speaker': '0017', 'accent': None},\n", + " 'id_2908': {'model': 'm3', 'sent_id': 18, 'speaker': '0017', 'accent': None},\n", + " 'id_2911': {'model': 'm2', 'sent_id': 19, 'speaker': '0017', 'accent': None},\n", + " 'id_2914': {'model': 'm3', 'sent_id': 2, 'speaker': '0017', 'accent': None},\n", + " 'id_2917': {'model': 'm2', 'sent_id': 20, 'speaker': '0017', 'accent': None},\n", + " 'id_2920': {'model': 'm2', 'sent_id': 21, 'speaker': '0017', 'accent': None},\n", + " 'id_2923': {'model': 'm1', 'sent_id': 22, 'speaker': '0017', 'accent': None},\n", + " 'id_2926': {'model': 'm2', 'sent_id': 23, 'speaker': '0017', 'accent': None},\n", + " 'id_2929': {'model': 'm2', 'sent_id': 24, 'speaker': '0017', 'accent': None},\n", + " 'id_2932': {'model': 'm3', 'sent_id': 25, 'speaker': '0017', 'accent': None},\n", + " 'id_2935': {'model': 'm3', 'sent_id': 26, 'speaker': '0017', 'accent': None},\n", + " 'id_2938': {'model': 'm2', 'sent_id': 27, 'speaker': '0017', 'accent': None},\n", + " 'id_2941': {'model': 'm3', 'sent_id': 28, 'speaker': '0017', 'accent': None},\n", + " 'id_2944': {'model': 'm1', 'sent_id': 29, 'speaker': '0017', 'accent': None},\n", + " 'id_2947': {'model': 'm1', 'sent_id': 3, 'speaker': '0017', 'accent': None},\n", + " 'id_2950': {'model': 'm2', 'sent_id': 30, 'speaker': '0017', 'accent': None},\n", + " 'id_2953': {'model': 'm1', 'sent_id': 4, 'speaker': '0017', 'accent': None},\n", + " 'id_2956': {'model': 'm3', 'sent_id': 5, 'speaker': '0017', 'accent': None},\n", + " 'id_2959': {'model': 'm3', 'sent_id': 6, 'speaker': '0017', 'accent': None},\n", + " 'id_2962': {'model': 'm3', 'sent_id': 7, 'speaker': '0017', 'accent': None},\n", + " 'id_2965': {'model': 'm2', 'sent_id': 8, 'speaker': '0017', 'accent': None},\n", + " 'id_2968': {'model': 'm2', 'sent_id': 9, 'speaker': '0017', 'accent': None},\n", + " 'id_2971': {'model': 'm1', 'sent_id': 1, 'speaker': '0017', 'accent': None},\n", + " 'id_2974': {'model': 'm3', 'sent_id': 10, 'speaker': '0017', 'accent': None},\n", + " 'id_2977': {'model': 'm3', 'sent_id': 11, 'speaker': '0017', 'accent': None},\n", + " 'id_2980': {'model': 'm2', 'sent_id': 12, 'speaker': '0017', 'accent': None},\n", + " 'id_2983': {'model': 'm3', 'sent_id': 13, 'speaker': '0017', 'accent': None},\n", + " 'id_2986': {'model': 'm3', 'sent_id': 14, 'speaker': '0017', 'accent': None},\n", + " 'id_2989': {'model': 'm1', 'sent_id': 15, 'speaker': '0017', 'accent': None},\n", + " 'id_2992': {'model': 'm1', 'sent_id': 16, 'speaker': '0017', 'accent': None},\n", + " 'id_2995': {'model': 'm1', 'sent_id': 17, 'speaker': '0017', 'accent': None},\n", + " 'id_2998': {'model': 'm1', 'sent_id': 18, 'speaker': '0017', 'accent': None},\n", + " ...}" + ] + }, + "execution_count": 14, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "meta = {}\n", + "\n", + "for model_ in folder2model.values():\n", + " meta.update(\n", + " dict(zip(df_detailed[model_].iloc[x_indices], df_detailed[model_].iloc[y_indices]))\n", + " )\n", + "\n", + "meta" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "id": "cd459e48-9aa1-4f8d-bad3-17e55340344a", + "metadata": {}, + "outputs": [], + "source": [ + "assert(len(meta) == total_K_models*total_wavs_per_model)" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "id": "bef6f710-8aa1-4422-b5c4-711497388ec9", + "metadata": { + "scrolled": true, + "tags": [] + }, + "outputs": [ + { + "data": { + "text/plain": [ + "{'id_1': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_4': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_7': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_10': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_13': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_16': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_19': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_22': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_25': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_28': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_31': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_34': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_37': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_40': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_43': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_46': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_49': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_52': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_55': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_58': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_61': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_64': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_67': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_70': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_73': {'text': 'The journey was continued at dawn .'},\n", + " 'id_76': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_79': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_82': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_85': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_88': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_91': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_94': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_97': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_100': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_103': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_106': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_109': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_112': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_115': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_118': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_121': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_124': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_127': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_130': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_133': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_136': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_139': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_142': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_145': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_148': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_151': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_154': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_157': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_160': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_163': {'text': 'The journey was continued at dawn .'},\n", + " 'id_166': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_169': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_172': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_175': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_178': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_181': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_184': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_187': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_190': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_193': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_196': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_199': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_202': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_205': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_208': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_211': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_214': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_217': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_220': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_223': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_226': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_229': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_232': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_235': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_238': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_241': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_244': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_247': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_250': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_253': {'text': 'The journey was continued at dawn .'},\n", + " 'id_256': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_259': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_262': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_265': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_268': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_271': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_274': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_277': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_280': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_283': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_286': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_289': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_292': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_295': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_298': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_301': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_304': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_307': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_310': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_313': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_316': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_319': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_322': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_325': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_328': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_331': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_334': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_337': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_340': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_343': {'text': 'The journey was continued at dawn .'},\n", + " 'id_346': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_349': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_352': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_355': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_358': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_361': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_364': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_367': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_370': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_373': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_376': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_379': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_382': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_385': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_388': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_391': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_394': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_397': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_400': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_403': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_406': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_409': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_412': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_415': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_418': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_421': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_424': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_427': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_430': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_433': {'text': 'The journey was continued at dawn .'},\n", + " 'id_436': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_439': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_442': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_445': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_448': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_451': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_454': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_457': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_460': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_463': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_466': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_469': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_472': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_475': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_478': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_481': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_484': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_487': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_490': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_493': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_496': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_499': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_502': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_505': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_508': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_511': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_514': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_517': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_520': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_523': {'text': 'The journey was continued at dawn .'},\n", + " 'id_526': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_529': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_532': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_535': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_538': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_541': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_544': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_547': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_550': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_553': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_556': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_559': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_562': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_565': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_568': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_571': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_574': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_577': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_580': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_583': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_586': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_589': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_592': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_595': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_598': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_601': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_604': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_607': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_610': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_613': {'text': 'The journey was continued at dawn .'},\n", + " 'id_616': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_619': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_622': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_625': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_628': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_631': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_634': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_637': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_640': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_643': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_646': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_649': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_652': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_655': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_658': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_661': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_664': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_667': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_670': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_673': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_676': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_679': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_682': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_685': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_688': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_691': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_694': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_697': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_700': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_703': {'text': 'The journey was continued at dawn .'},\n", + " 'id_706': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_709': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_712': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_715': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_718': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_721': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_724': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_727': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_730': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_733': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_736': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_739': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_742': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_745': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_748': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_751': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_754': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_757': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_760': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_763': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_766': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_769': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_772': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_775': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_778': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_781': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_784': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_787': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_790': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_793': {'text': 'The journey was continued at dawn .'},\n", + " 'id_796': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_799': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_802': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_805': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_808': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_811': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_814': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_817': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_820': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_823': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_826': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_829': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_832': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_835': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_838': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_841': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_844': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_847': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_850': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_853': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_856': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_859': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_862': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_865': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_868': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_871': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_874': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_877': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_880': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_883': {'text': 'The journey was continued at dawn .'},\n", + " 'id_886': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_889': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_892': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_895': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_898': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_901': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_904': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_907': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_910': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_913': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_916': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_919': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_922': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_925': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_928': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_931': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_934': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_937': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_940': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_943': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_946': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_949': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_952': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_955': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_958': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_961': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_964': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_967': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_970': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_973': {'text': 'The journey was continued at dawn .'},\n", + " 'id_976': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_979': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_982': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_985': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_988': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_991': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_994': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_997': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_1000': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_1003': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_1006': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_1009': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_1012': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_1015': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_1018': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_1021': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_1024': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_1027': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_1030': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_1033': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_1036': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_1039': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_1042': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_1045': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_1048': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_1051': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_1054': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_1057': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_1060': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_1063': {'text': 'The journey was continued at dawn .'},\n", + " 'id_1066': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_1069': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_1072': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_1075': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_1078': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_1081': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_1084': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_1087': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_1090': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_1093': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_1096': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_1099': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_1102': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_1105': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_1108': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_1111': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_1114': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_1117': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_1120': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_1123': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_1126': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_1129': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_1132': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_1135': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_1138': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_1141': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_1144': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_1147': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_1150': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_1153': {'text': 'The journey was continued at dawn .'},\n", + " 'id_1156': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_1159': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_1162': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_1165': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_1168': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_1171': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_1174': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_1177': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_1180': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_1183': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_1186': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_1189': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_1192': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_1195': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_1198': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_1201': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_1204': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_1207': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_1210': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_1213': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_1216': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_1219': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_1222': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_1225': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_1228': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_1231': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_1234': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_1237': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_1240': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_1243': {'text': 'The journey was continued at dawn .'},\n", + " 'id_1246': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_1249': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_1252': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_1255': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_1258': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_1261': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_1264': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_1267': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_1270': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_1273': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_1276': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_1279': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_1282': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_1285': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_1288': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_1291': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_1294': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_1297': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_1300': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_1303': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_1306': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_1309': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_1312': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_1315': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_1318': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_1321': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_1324': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_1327': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_1330': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_1333': {'text': 'The journey was continued at dawn .'},\n", + " 'id_1336': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_1339': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_1342': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_1345': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_1348': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_1351': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_1354': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_1357': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_1360': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_1363': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_1366': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_1369': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_1372': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_1375': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_1378': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_1381': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_1384': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_1387': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_1390': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_1393': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_1396': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_1399': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_1402': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_1405': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_1408': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_1411': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_1414': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_1417': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_1420': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_1423': {'text': 'The journey was continued at dawn .'},\n", + " 'id_1426': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_1429': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_1432': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_1435': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_1438': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_1441': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_1444': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_1447': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_1450': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_1453': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_1456': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_1459': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_1462': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_1465': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_1468': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_1471': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_1474': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_1477': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_1480': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_1483': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_1486': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_1489': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_1492': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_1495': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_1498': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_1501': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_1504': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_1507': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_1510': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_1513': {'text': 'The journey was continued at dawn .'},\n", + " 'id_1516': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_1519': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_1522': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_1525': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_1528': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_1531': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_1534': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_1537': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_1540': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_1543': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_1546': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_1549': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_1552': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_1555': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_1558': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_1561': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_1564': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_1567': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_1570': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_1573': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_1576': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_1579': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_1582': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_1585': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_1588': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_1591': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_1594': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_1597': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_1600': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_1603': {'text': 'The journey was continued at dawn .'},\n", + " 'id_1606': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_1609': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_1612': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_1615': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_1618': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_1621': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_1624': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_1627': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_1630': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_1633': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_1636': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_1639': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_1642': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_1645': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_1648': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_1651': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_1654': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_1657': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_1660': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_1663': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_1666': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_1669': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_1672': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_1675': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_1678': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_1681': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_1684': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_1687': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_1690': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_1693': {'text': 'The journey was continued at dawn .'},\n", + " 'id_1696': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_1699': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_1702': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_1705': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_1708': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_1711': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_1714': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_1717': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_1720': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_1723': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_1726': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_1729': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_1732': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_1735': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_1738': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_1741': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_1744': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_1747': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_1750': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_1753': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_1756': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_1759': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_1762': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_1765': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_1768': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_1771': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_1774': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_1777': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_1780': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_1783': {'text': 'The journey was continued at dawn .'},\n", + " 'id_1786': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_1789': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_1792': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_1795': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_1798': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_1801': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_1804': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_1807': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_1810': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_1813': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_1816': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_1819': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_1822': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_1825': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_1828': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_1831': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_1834': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_1837': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_1840': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_1843': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_1846': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_1849': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_1852': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_1855': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_1858': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_1861': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_1864': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_1867': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_1870': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_1873': {'text': 'The journey was continued at dawn .'},\n", + " 'id_1876': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_1879': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_1882': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_1885': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_1888': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_1891': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_1894': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_1897': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_1900': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_1903': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_1906': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_1909': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_1912': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_1915': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_1918': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_1921': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_1924': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_1927': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_1930': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_1933': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_1936': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_1939': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_1942': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_1945': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_1948': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_1951': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_1954': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_1957': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_1960': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_1963': {'text': 'The journey was continued at dawn .'},\n", + " 'id_1966': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_1969': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_1972': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_1975': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_1978': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_1981': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_1984': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_1987': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_1990': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_1993': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_1996': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_1999': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_2002': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_2005': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_2008': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_2011': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_2014': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_2017': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_2020': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_2023': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_2026': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_2029': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_2032': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_2035': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_2038': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_2041': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_2044': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_2047': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_2050': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_2053': {'text': 'The journey was continued at dawn .'},\n", + " 'id_2056': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_2059': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_2062': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_2065': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_2068': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_2071': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_2074': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_2077': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_2080': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_2083': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_2086': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_2089': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_2092': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_2095': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_2098': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_2101': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_2104': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_2107': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_2110': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_2113': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_2116': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_2119': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_2122': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_2125': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_2128': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_2131': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_2134': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_2137': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_2140': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_2143': {'text': 'The journey was continued at dawn .'},\n", + " 'id_2146': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_2149': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_2152': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_2155': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_2158': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_2161': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_2164': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_2167': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_2170': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_2173': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_2176': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_2179': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_2182': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_2185': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_2188': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_2191': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_2194': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_2197': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_2200': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_2203': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_2206': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_2209': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_2212': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_2215': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_2218': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_2221': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_2224': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_2227': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_2230': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_2233': {'text': 'The journey was continued at dawn .'},\n", + " 'id_2236': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_2239': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_2242': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_2245': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_2248': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_2251': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_2254': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_2257': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_2260': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_2263': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_2266': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_2269': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_2272': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_2275': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_2278': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_2281': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_2284': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_2287': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_2290': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_2293': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_2296': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_2299': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_2302': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_2305': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_2308': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_2311': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_2314': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_2317': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_2320': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_2323': {'text': 'The journey was continued at dawn .'},\n", + " 'id_2326': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_2329': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_2332': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_2335': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_2338': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_2341': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_2344': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_2347': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_2350': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_2353': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_2356': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_2359': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_2362': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_2365': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_2368': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_2371': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_2374': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_2377': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_2380': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_2383': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_2386': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_2389': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_2392': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_2395': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_2398': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_2401': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_2404': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_2407': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_2410': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_2413': {'text': 'The journey was continued at dawn .'},\n", + " 'id_2416': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_2419': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_2422': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_2425': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_2428': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_2431': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_2434': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_2437': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_2440': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_2443': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_2446': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_2449': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_2452': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_2455': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_2458': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_2461': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_2464': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_2467': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_2470': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_2473': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_2476': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_2479': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_2482': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_2485': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_2488': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_2491': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_2494': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_2497': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_2500': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_2503': {'text': 'The journey was continued at dawn .'},\n", + " 'id_2506': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_2509': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_2512': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_2515': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_2518': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_2521': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_2524': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_2527': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_2530': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_2533': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_2536': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_2539': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_2542': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_2545': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_2548': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_2551': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_2554': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_2557': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_2560': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_2563': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_2566': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_2569': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_2572': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_2575': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_2578': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_2581': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_2584': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_2587': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_2590': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_2593': {'text': 'The journey was continued at dawn .'},\n", + " 'id_2596': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_2599': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_2602': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_2605': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_2608': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_2611': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_2614': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_2617': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_2620': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_2623': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_2626': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_2629': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_2632': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_2635': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_2638': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_2641': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_2644': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_2647': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_2650': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_2653': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_2656': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_2659': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_2662': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_2665': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_2668': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_2671': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_2674': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_2677': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_2680': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_2683': {'text': 'The journey was continued at dawn .'},\n", + " 'id_2686': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_2689': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_2692': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_2695': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_2698': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_2701': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_2704': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_2707': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_2710': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_2713': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_2716': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_2719': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_2722': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_2725': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_2728': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_2731': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_2734': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_2737': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_2740': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_2743': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_2746': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_2749': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_2752': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_2755': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_2758': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_2761': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_2764': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_2767': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_2770': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_2773': {'text': 'The journey was continued at dawn .'},\n", + " 'id_2776': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_2779': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_2782': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_2785': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_2788': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_2791': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_2794': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_2797': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_2800': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_2803': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_2806': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_2809': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_2812': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_2815': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_2818': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_2821': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_2824': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_2827': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_2830': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_2833': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_2836': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_2839': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_2842': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_2845': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_2848': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_2851': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_2854': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_2857': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_2860': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_2863': {'text': 'The journey was continued at dawn .'},\n", + " 'id_2866': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_2869': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_2872': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_2875': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_2878': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_2881': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_2884': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_2887': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_2890': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_2893': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_2896': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_2899': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_2902': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_2905': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_2908': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " 'id_2911': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n", + " 'id_2914': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n", + " 'id_2917': {'text': 'Was it using language that caused their brains to develop?'},\n", + " 'id_2920': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n", + " 'id_2923': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n", + " 'id_2926': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n", + " 'id_2929': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n", + " 'id_2932': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n", + " 'id_2935': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n", + " 'id_2938': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n", + " 'id_2941': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n", + " 'id_2944': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n", + " 'id_2947': {'text': 'It seemed the ordained order of things that dogs should work .'},\n", + " 'id_2950': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n", + " 'id_2953': {'text': 'The journey was continued at dawn .'},\n", + " 'id_2956': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n", + " 'id_2959': {'text': 'A dead man is of no use on a plantation .'},\n", + " 'id_2962': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n", + " 'id_2965': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n", + " 'id_2968': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n", + " 'id_2971': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n", + " 'id_2974': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n", + " 'id_2977': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n", + " 'id_2980': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n", + " 'id_2983': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n", + " 'id_2986': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n", + " 'id_2989': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n", + " 'id_2992': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n", + " 'id_2995': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n", + " 'id_2998': {'text': 'Earthquakes damage all structures, including bridges.'},\n", + " ...}" + ] + }, + "execution_count": 16, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "sentences = {}\n", + "\n", + "for model_ in folder2model.values():\n", + " sentences.update(\n", + " dict(zip(df_detailed[model_].iloc[x_indices], df_detailed['text_left'].iloc[y_indices]))\n", + " )\n", + "\n", + "for k, v in sentences.items():\n", + " sentences[k] = {'text': v}\n", + "\n", + "sentences" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "id": "d6d927dd-c249-47e1-836c-fc6951d1dffd", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Unnamed: 0m1_textm1_accent_speakerm1m2m3m2_text
00--id_1id_2id_3-
11We got few vegetables and fruits , and became fish eaters .0011221We got few vegetables and fruits , and became fish eaters .
22--id_4id_5id_6-
33Humans also judge distance by using the relative sizes of objects.0011333Humans also judge distance by using the relative sizes of objects.
44--id_7id_8id_9-
........................
26952695The Claudine was leaving next morning for Honolulu .0020223The Claudine was leaving next morning for Honolulu .
26962696--id_4045id_4046id_4047-
26972697Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.0020123Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.
26982698--id_4048id_4049id_4050-
26992699Different telescope designs perform differently, and have different strengths and weaknesses.0020112Different telescope designs perform differently, and have different strengths and weaknesses.
\n", + "

2700 rows × 7 columns

\n", + "
" + ], + "text/plain": [ + " Unnamed: 0 \\\n", + "0 0 \n", + "1 1 \n", + "2 2 \n", + "3 3 \n", + "4 4 \n", + "... ... \n", + "2695 2695 \n", + "2696 2696 \n", + "2697 2697 \n", + "2698 2698 \n", + "2699 2699 \n", + "\n", + " m1_text \\\n", + "0 - \n", + "1 We got few vegetables and fruits , and became fish eaters . \n", + "2 - \n", + "3 Humans also judge distance by using the relative sizes of objects. \n", + "4 - \n", + "... ... \n", + "2695 The Claudine was leaving next morning for Honolulu . \n", + "2696 - \n", + "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n", + "2698 - \n", + "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n", + "\n", + " m1_accent_speaker m1 m2 m3 \\\n", + "0 - id_1 id_2 id_3 \n", + "1 0011 2 2 1 \n", + "2 - id_4 id_5 id_6 \n", + "3 0011 3 3 3 \n", + "4 - id_7 id_8 id_9 \n", + "... ... ... ... ... \n", + "2695 0020 2 2 3 \n", + "2696 - id_4045 id_4046 id_4047 \n", + "2697 0020 1 2 3 \n", + "2698 - id_4048 id_4049 id_4050 \n", + "2699 0020 1 1 2 \n", + "\n", + " m2_text \n", + "0 - \n", + "1 We got few vegetables and fruits , and became fish eaters . \n", + "2 - \n", + "3 Humans also judge distance by using the relative sizes of objects. \n", + "4 - \n", + "... ... \n", + "2695 The Claudine was leaving next morning for Honolulu . \n", + "2696 - \n", + "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n", + "2698 - \n", + "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n", + "\n", + "[2700 rows x 7 columns]" + ] + }, + "execution_count": 17, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "def fillna_with_random_scores(df):\n", + " val_range = [1, 2, 3]\n", + " ranval_array = np.random.choice(val_range, size=(df.shape[0], df.shape[1]))\n", + " ranval_df = pd.DataFrame(ranval_array, columns=df.columns, index=df.index)\n", + " return df.fillna(ranval_df)\n", + "\n", + "\n", + "df_scores = pd.read_excel(SCORES_PATH)\n", + "df_scores = fillna_with_random_scores(df_scores) # If scores are unfilled\n", + "df_scores" + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "id": "31e816a7-214b-479a-bdb7-d2d6652f135e", + "metadata": { + "scrolled": true, + "tags": [] + }, + "outputs": [ + { + "data": { + "text/plain": [ + "{'id_1': {'nmistakes': 2},\n", + " 'id_4': {'nmistakes': 3},\n", + " 'id_7': {'nmistakes': 3},\n", + " 'id_10': {'nmistakes': 3},\n", + " 'id_13': {'nmistakes': 2},\n", + " 'id_16': {'nmistakes': 3},\n", + " 'id_19': {'nmistakes': 1},\n", + " 'id_22': {'nmistakes': 2},\n", + " 'id_25': {'nmistakes': 3},\n", + " 'id_28': {'nmistakes': 2},\n", + " 'id_31': {'nmistakes': 3},\n", + " 'id_34': {'nmistakes': 1},\n", + " 'id_37': {'nmistakes': 2},\n", + " 'id_40': {'nmistakes': 2},\n", + " 'id_43': {'nmistakes': 3},\n", + " 'id_46': {'nmistakes': 3},\n", + " 'id_49': {'nmistakes': 1},\n", + " 'id_52': {'nmistakes': 1},\n", + " 'id_55': {'nmistakes': 2},\n", + " 'id_58': {'nmistakes': 2},\n", + " 'id_61': {'nmistakes': 2},\n", + " 'id_64': {'nmistakes': 1},\n", + " 'id_67': {'nmistakes': 3},\n", + " 'id_70': {'nmistakes': 3},\n", + " 'id_73': {'nmistakes': 3},\n", + " 'id_76': {'nmistakes': 1},\n", + " 'id_79': {'nmistakes': 2},\n", + " 'id_82': {'nmistakes': 1},\n", + " 'id_85': {'nmistakes': 2},\n", + " 'id_88': {'nmistakes': 2},\n", + " 'id_91': {'nmistakes': 2},\n", + " 'id_94': {'nmistakes': 1},\n", + " 'id_97': {'nmistakes': 1},\n", + " 'id_100': {'nmistakes': 2},\n", + " 'id_103': {'nmistakes': 2},\n", + " 'id_106': {'nmistakes': 3},\n", + " 'id_109': {'nmistakes': 2},\n", + " 'id_112': {'nmistakes': 2},\n", + " 'id_115': {'nmistakes': 1},\n", + " 'id_118': {'nmistakes': 1},\n", + " 'id_121': {'nmistakes': 1},\n", + " 'id_124': {'nmistakes': 1},\n", + " 'id_127': {'nmistakes': 2},\n", + " 'id_130': {'nmistakes': 3},\n", + " 'id_133': {'nmistakes': 1},\n", + " 'id_136': {'nmistakes': 1},\n", + " 'id_139': {'nmistakes': 1},\n", + " 'id_142': {'nmistakes': 1},\n", + " 'id_145': {'nmistakes': 3},\n", + " 'id_148': {'nmistakes': 3},\n", + " 'id_151': {'nmistakes': 3},\n", + " 'id_154': {'nmistakes': 2},\n", + " 'id_157': {'nmistakes': 1},\n", + " 'id_160': {'nmistakes': 2},\n", + " 'id_163': {'nmistakes': 3},\n", + " 'id_166': {'nmistakes': 3},\n", + " 'id_169': {'nmistakes': 1},\n", + " 'id_172': {'nmistakes': 1},\n", + " 'id_175': {'nmistakes': 1},\n", + " 'id_178': {'nmistakes': 2},\n", + " 'id_181': {'nmistakes': 3},\n", + " 'id_184': {'nmistakes': 2},\n", + " 'id_187': {'nmistakes': 1},\n", + " 'id_190': {'nmistakes': 2},\n", + " 'id_193': {'nmistakes': 1},\n", + " 'id_196': {'nmistakes': 1},\n", + " 'id_199': {'nmistakes': 3},\n", + " 'id_202': {'nmistakes': 1},\n", + " 'id_205': {'nmistakes': 2},\n", + " 'id_208': {'nmistakes': 3},\n", + " 'id_211': {'nmistakes': 2},\n", + " 'id_214': {'nmistakes': 1},\n", + " 'id_217': {'nmistakes': 3},\n", + " 'id_220': {'nmistakes': 1},\n", + " 'id_223': {'nmistakes': 2},\n", + " 'id_226': {'nmistakes': 1},\n", + " 'id_229': {'nmistakes': 3},\n", + " 'id_232': {'nmistakes': 1},\n", + " 'id_235': {'nmistakes': 1},\n", + " 'id_238': {'nmistakes': 3},\n", + " 'id_241': {'nmistakes': 3},\n", + " 'id_244': {'nmistakes': 2},\n", + " 'id_247': {'nmistakes': 1},\n", + " 'id_250': {'nmistakes': 2},\n", + " 'id_253': {'nmistakes': 1},\n", + " 'id_256': {'nmistakes': 1},\n", + " 'id_259': {'nmistakes': 1},\n", + " 'id_262': {'nmistakes': 1},\n", + " 'id_265': {'nmistakes': 2},\n", + " 'id_268': {'nmistakes': 1},\n", + " 'id_271': {'nmistakes': 2},\n", + " 'id_274': {'nmistakes': 1},\n", + " 'id_277': {'nmistakes': 1},\n", + " 'id_280': {'nmistakes': 3},\n", + " 'id_283': {'nmistakes': 3},\n", + " 'id_286': {'nmistakes': 2},\n", + " 'id_289': {'nmistakes': 1},\n", + " 'id_292': {'nmistakes': 2},\n", + " 'id_295': {'nmistakes': 2},\n", + " 'id_298': {'nmistakes': 1},\n", + " 'id_301': {'nmistakes': 2},\n", + " 'id_304': {'nmistakes': 3},\n", + " 'id_307': {'nmistakes': 1},\n", + " 'id_310': {'nmistakes': 3},\n", + " 'id_313': {'nmistakes': 3},\n", + " 'id_316': {'nmistakes': 1},\n", + " 'id_319': {'nmistakes': 3},\n", + " 'id_322': {'nmistakes': 3},\n", + " 'id_325': {'nmistakes': 3},\n", + " 'id_328': {'nmistakes': 1},\n", + " 'id_331': {'nmistakes': 1},\n", + " 'id_334': {'nmistakes': 3},\n", + " 'id_337': {'nmistakes': 2},\n", + " 'id_340': {'nmistakes': 1},\n", + " 'id_343': {'nmistakes': 1},\n", + " 'id_346': {'nmistakes': 3},\n", + " 'id_349': {'nmistakes': 2},\n", + " 'id_352': {'nmistakes': 1},\n", + " 'id_355': {'nmistakes': 2},\n", + " 'id_358': {'nmistakes': 3},\n", + " 'id_361': {'nmistakes': 3},\n", + " 'id_364': {'nmistakes': 3},\n", + " 'id_367': {'nmistakes': 2},\n", + " 'id_370': {'nmistakes': 3},\n", + " 'id_373': {'nmistakes': 3},\n", + " 'id_376': {'nmistakes': 3},\n", + " 'id_379': {'nmistakes': 3},\n", + " 'id_382': {'nmistakes': 1},\n", + " 'id_385': {'nmistakes': 1},\n", + " 'id_388': {'nmistakes': 1},\n", + " 'id_391': {'nmistakes': 2},\n", + " 'id_394': {'nmistakes': 2},\n", + " 'id_397': {'nmistakes': 1},\n", + " 'id_400': {'nmistakes': 1},\n", + " 'id_403': {'nmistakes': 2},\n", + " 'id_406': {'nmistakes': 1},\n", + " 'id_409': {'nmistakes': 3},\n", + " 'id_412': {'nmistakes': 2},\n", + " 'id_415': {'nmistakes': 2},\n", + " 'id_418': {'nmistakes': 3},\n", + " 'id_421': {'nmistakes': 3},\n", + " 'id_424': {'nmistakes': 1},\n", + " 'id_427': {'nmistakes': 2},\n", + " 'id_430': {'nmistakes': 2},\n", + " 'id_433': {'nmistakes': 3},\n", + " 'id_436': {'nmistakes': 3},\n", + " 'id_439': {'nmistakes': 2},\n", + " 'id_442': {'nmistakes': 1},\n", + " 'id_445': {'nmistakes': 3},\n", + " 'id_448': {'nmistakes': 2},\n", + " 'id_451': {'nmistakes': 1},\n", + " 'id_454': {'nmistakes': 3},\n", + " 'id_457': {'nmistakes': 3},\n", + " 'id_460': {'nmistakes': 3},\n", + " 'id_463': {'nmistakes': 1},\n", + " 'id_466': {'nmistakes': 1},\n", + " 'id_469': {'nmistakes': 2},\n", + " 'id_472': {'nmistakes': 2},\n", + " 'id_475': {'nmistakes': 3},\n", + " 'id_478': {'nmistakes': 3},\n", + " 'id_481': {'nmistakes': 2},\n", + " 'id_484': {'nmistakes': 3},\n", + " 'id_487': {'nmistakes': 1},\n", + " 'id_490': {'nmistakes': 2},\n", + " 'id_493': {'nmistakes': 3},\n", + " 'id_496': {'nmistakes': 1},\n", + " 'id_499': {'nmistakes': 1},\n", + " 'id_502': {'nmistakes': 2},\n", + " 'id_505': {'nmistakes': 3},\n", + " 'id_508': {'nmistakes': 3},\n", + " 'id_511': {'nmistakes': 1},\n", + " 'id_514': {'nmistakes': 1},\n", + " 'id_517': {'nmistakes': 3},\n", + " 'id_520': {'nmistakes': 3},\n", + " 'id_523': {'nmistakes': 3},\n", + " 'id_526': {'nmistakes': 1},\n", + " 'id_529': {'nmistakes': 3},\n", + " 'id_532': {'nmistakes': 2},\n", + " 'id_535': {'nmistakes': 1},\n", + " 'id_538': {'nmistakes': 2},\n", + " 'id_541': {'nmistakes': 3},\n", + " 'id_544': {'nmistakes': 3},\n", + " 'id_547': {'nmistakes': 3},\n", + " 'id_550': {'nmistakes': 1},\n", + " 'id_553': {'nmistakes': 3},\n", + " 'id_556': {'nmistakes': 2},\n", + " 'id_559': {'nmistakes': 1},\n", + " 'id_562': {'nmistakes': 2},\n", + " 'id_565': {'nmistakes': 3},\n", + " 'id_568': {'nmistakes': 1},\n", + " 'id_571': {'nmistakes': 2},\n", + " 'id_574': {'nmistakes': 2},\n", + " 'id_577': {'nmistakes': 3},\n", + " 'id_580': {'nmistakes': 2},\n", + " 'id_583': {'nmistakes': 3},\n", + " 'id_586': {'nmistakes': 3},\n", + " 'id_589': {'nmistakes': 3},\n", + " 'id_592': {'nmistakes': 3},\n", + " 'id_595': {'nmistakes': 3},\n", + " 'id_598': {'nmistakes': 2},\n", + " 'id_601': {'nmistakes': 1},\n", + " 'id_604': {'nmistakes': 1},\n", + " 'id_607': {'nmistakes': 2},\n", + " 'id_610': {'nmistakes': 1},\n", + " 'id_613': {'nmistakes': 3},\n", + " 'id_616': {'nmistakes': 3},\n", + " 'id_619': {'nmistakes': 1},\n", + " 'id_622': {'nmistakes': 1},\n", + " 'id_625': {'nmistakes': 1},\n", + " 'id_628': {'nmistakes': 1},\n", + " 'id_631': {'nmistakes': 2},\n", + " 'id_634': {'nmistakes': 1},\n", + " 'id_637': {'nmistakes': 3},\n", + " 'id_640': {'nmistakes': 1},\n", + " 'id_643': {'nmistakes': 3},\n", + " 'id_646': {'nmistakes': 2},\n", + " 'id_649': {'nmistakes': 3},\n", + " 'id_652': {'nmistakes': 3},\n", + " 'id_655': {'nmistakes': 3},\n", + " 'id_658': {'nmistakes': 3},\n", + " 'id_661': {'nmistakes': 3},\n", + " 'id_664': {'nmistakes': 1},\n", + " 'id_667': {'nmistakes': 1},\n", + " 'id_670': {'nmistakes': 1},\n", + " 'id_673': {'nmistakes': 2},\n", + " 'id_676': {'nmistakes': 2},\n", + " 'id_679': {'nmistakes': 1},\n", + " 'id_682': {'nmistakes': 1},\n", + " 'id_685': {'nmistakes': 3},\n", + " 'id_688': {'nmistakes': 3},\n", + " 'id_691': {'nmistakes': 1},\n", + " 'id_694': {'nmistakes': 3},\n", + " 'id_697': {'nmistakes': 2},\n", + " 'id_700': {'nmistakes': 1},\n", + " 'id_703': {'nmistakes': 1},\n", + " 'id_706': {'nmistakes': 2},\n", + " 'id_709': {'nmistakes': 1},\n", + " 'id_712': {'nmistakes': 1},\n", + " 'id_715': {'nmistakes': 2},\n", + " 'id_718': {'nmistakes': 1},\n", + " 'id_721': {'nmistakes': 3},\n", + " 'id_724': {'nmistakes': 3},\n", + " 'id_727': {'nmistakes': 2},\n", + " 'id_730': {'nmistakes': 3},\n", + " 'id_733': {'nmistakes': 2},\n", + " 'id_736': {'nmistakes': 1},\n", + " 'id_739': {'nmistakes': 3},\n", + " 'id_742': {'nmistakes': 2},\n", + " 'id_745': {'nmistakes': 1},\n", + " 'id_748': {'nmistakes': 2},\n", + " 'id_751': {'nmistakes': 1},\n", + " 'id_754': {'nmistakes': 3},\n", + " 'id_757': {'nmistakes': 2},\n", + " 'id_760': {'nmistakes': 3},\n", + " 'id_763': {'nmistakes': 3},\n", + " 'id_766': {'nmistakes': 2},\n", + " 'id_769': {'nmistakes': 3},\n", + " 'id_772': {'nmistakes': 3},\n", + " 'id_775': {'nmistakes': 3},\n", + " 'id_778': {'nmistakes': 3},\n", + " 'id_781': {'nmistakes': 3},\n", + " 'id_784': {'nmistakes': 3},\n", + " 'id_787': {'nmistakes': 1},\n", + " 'id_790': {'nmistakes': 1},\n", + " 'id_793': {'nmistakes': 2},\n", + " 'id_796': {'nmistakes': 1},\n", + " 'id_799': {'nmistakes': 3},\n", + " 'id_802': {'nmistakes': 3},\n", + " 'id_805': {'nmistakes': 1},\n", + " 'id_808': {'nmistakes': 3},\n", + " 'id_811': {'nmistakes': 1},\n", + " 'id_814': {'nmistakes': 1},\n", + " 'id_817': {'nmistakes': 1},\n", + " 'id_820': {'nmistakes': 1},\n", + " 'id_823': {'nmistakes': 2},\n", + " 'id_826': {'nmistakes': 3},\n", + " 'id_829': {'nmistakes': 2},\n", + " 'id_832': {'nmistakes': 3},\n", + " 'id_835': {'nmistakes': 2},\n", + " 'id_838': {'nmistakes': 1},\n", + " 'id_841': {'nmistakes': 2},\n", + " 'id_844': {'nmistakes': 1},\n", + " 'id_847': {'nmistakes': 1},\n", + " 'id_850': {'nmistakes': 2},\n", + " 'id_853': {'nmistakes': 3},\n", + " 'id_856': {'nmistakes': 3},\n", + " 'id_859': {'nmistakes': 2},\n", + " 'id_862': {'nmistakes': 3},\n", + " 'id_865': {'nmistakes': 3},\n", + " 'id_868': {'nmistakes': 3},\n", + " 'id_871': {'nmistakes': 3},\n", + " 'id_874': {'nmistakes': 3},\n", + " 'id_877': {'nmistakes': 1},\n", + " 'id_880': {'nmistakes': 2},\n", + " 'id_883': {'nmistakes': 1},\n", + " 'id_886': {'nmistakes': 1},\n", + " 'id_889': {'nmistakes': 3},\n", + " 'id_892': {'nmistakes': 3},\n", + " 'id_895': {'nmistakes': 1},\n", + " 'id_898': {'nmistakes': 3},\n", + " 'id_901': {'nmistakes': 1},\n", + " 'id_904': {'nmistakes': 2},\n", + " 'id_907': {'nmistakes': 2},\n", + " 'id_910': {'nmistakes': 2},\n", + " 'id_913': {'nmistakes': 1},\n", + " 'id_916': {'nmistakes': 2},\n", + " 'id_919': {'nmistakes': 2},\n", + " 'id_922': {'nmistakes': 1},\n", + " 'id_925': {'nmistakes': 3},\n", + " 'id_928': {'nmistakes': 2},\n", + " 'id_931': {'nmistakes': 2},\n", + " 'id_934': {'nmistakes': 3},\n", + " 'id_937': {'nmistakes': 1},\n", + " 'id_940': {'nmistakes': 2},\n", + " 'id_943': {'nmistakes': 1},\n", + " 'id_946': {'nmistakes': 2},\n", + " 'id_949': {'nmistakes': 3},\n", + " 'id_952': {'nmistakes': 2},\n", + " 'id_955': {'nmistakes': 1},\n", + " 'id_958': {'nmistakes': 3},\n", + " 'id_961': {'nmistakes': 3},\n", + " 'id_964': {'nmistakes': 2},\n", + " 'id_967': {'nmistakes': 3},\n", + " 'id_970': {'nmistakes': 1},\n", + " 'id_973': {'nmistakes': 2},\n", + " 'id_976': {'nmistakes': 1},\n", + " 'id_979': {'nmistakes': 2},\n", + " 'id_982': {'nmistakes': 3},\n", + " 'id_985': {'nmistakes': 2},\n", + " 'id_988': {'nmistakes': 3},\n", + " 'id_991': {'nmistakes': 3},\n", + " 'id_994': {'nmistakes': 2},\n", + " 'id_997': {'nmistakes': 1},\n", + " 'id_1000': {'nmistakes': 1},\n", + " 'id_1003': {'nmistakes': 3},\n", + " 'id_1006': {'nmistakes': 2},\n", + " 'id_1009': {'nmistakes': 3},\n", + " 'id_1012': {'nmistakes': 1},\n", + " 'id_1015': {'nmistakes': 2},\n", + " 'id_1018': {'nmistakes': 1},\n", + " 'id_1021': {'nmistakes': 3},\n", + " 'id_1024': {'nmistakes': 2},\n", + " 'id_1027': {'nmistakes': 2},\n", + " 'id_1030': {'nmistakes': 3},\n", + " 'id_1033': {'nmistakes': 1},\n", + " 'id_1036': {'nmistakes': 1},\n", + " 'id_1039': {'nmistakes': 2},\n", + " 'id_1042': {'nmistakes': 2},\n", + " 'id_1045': {'nmistakes': 1},\n", + " 'id_1048': {'nmistakes': 1},\n", + " 'id_1051': {'nmistakes': 2},\n", + " 'id_1054': {'nmistakes': 3},\n", + " 'id_1057': {'nmistakes': 3},\n", + " 'id_1060': {'nmistakes': 3},\n", + " 'id_1063': {'nmistakes': 3},\n", + " 'id_1066': {'nmistakes': 2},\n", + " 'id_1069': {'nmistakes': 2},\n", + " 'id_1072': {'nmistakes': 1},\n", + " 'id_1075': {'nmistakes': 3},\n", + " 'id_1078': {'nmistakes': 2},\n", + " 'id_1081': {'nmistakes': 2},\n", + " 'id_1084': {'nmistakes': 2},\n", + " 'id_1087': {'nmistakes': 2},\n", + " 'id_1090': {'nmistakes': 2},\n", + " 'id_1093': {'nmistakes': 3},\n", + " 'id_1096': {'nmistakes': 2},\n", + " 'id_1099': {'nmistakes': 2},\n", + " 'id_1102': {'nmistakes': 1},\n", + " 'id_1105': {'nmistakes': 1},\n", + " 'id_1108': {'nmistakes': 3},\n", + " 'id_1111': {'nmistakes': 2},\n", + " 'id_1114': {'nmistakes': 2},\n", + " 'id_1117': {'nmistakes': 1},\n", + " 'id_1120': {'nmistakes': 2},\n", + " 'id_1123': {'nmistakes': 2},\n", + " 'id_1126': {'nmistakes': 3},\n", + " 'id_1129': {'nmistakes': 2},\n", + " 'id_1132': {'nmistakes': 1},\n", + " 'id_1135': {'nmistakes': 2},\n", + " 'id_1138': {'nmistakes': 2},\n", + " 'id_1141': {'nmistakes': 1},\n", + " 'id_1144': {'nmistakes': 1},\n", + " 'id_1147': {'nmistakes': 3},\n", + " 'id_1150': {'nmistakes': 1},\n", + " 'id_1153': {'nmistakes': 1},\n", + " 'id_1156': {'nmistakes': 3},\n", + " 'id_1159': {'nmistakes': 1},\n", + " 'id_1162': {'nmistakes': 1},\n", + " 'id_1165': {'nmistakes': 3},\n", + " 'id_1168': {'nmistakes': 1},\n", + " 'id_1171': {'nmistakes': 2},\n", + " 'id_1174': {'nmistakes': 3},\n", + " 'id_1177': {'nmistakes': 2},\n", + " 'id_1180': {'nmistakes': 2},\n", + " 'id_1183': {'nmistakes': 1},\n", + " 'id_1186': {'nmistakes': 2},\n", + " 'id_1189': {'nmistakes': 1},\n", + " 'id_1192': {'nmistakes': 1},\n", + " 'id_1195': {'nmistakes': 2},\n", + " 'id_1198': {'nmistakes': 1},\n", + " 'id_1201': {'nmistakes': 3},\n", + " 'id_1204': {'nmistakes': 1},\n", + " 'id_1207': {'nmistakes': 1},\n", + " 'id_1210': {'nmistakes': 1},\n", + " 'id_1213': {'nmistakes': 1},\n", + " 'id_1216': {'nmistakes': 3},\n", + " 'id_1219': {'nmistakes': 1},\n", + " 'id_1222': {'nmistakes': 3},\n", + " 'id_1225': {'nmistakes': 3},\n", + " 'id_1228': {'nmistakes': 2},\n", + " 'id_1231': {'nmistakes': 2},\n", + " 'id_1234': {'nmistakes': 3},\n", + " 'id_1237': {'nmistakes': 1},\n", + " 'id_1240': {'nmistakes': 2},\n", + " 'id_1243': {'nmistakes': 2},\n", + " 'id_1246': {'nmistakes': 2},\n", + " 'id_1249': {'nmistakes': 3},\n", + " 'id_1252': {'nmistakes': 2},\n", + " 'id_1255': {'nmistakes': 2},\n", + " 'id_1258': {'nmistakes': 1},\n", + " 'id_1261': {'nmistakes': 2},\n", + " 'id_1264': {'nmistakes': 3},\n", + " 'id_1267': {'nmistakes': 3},\n", + " 'id_1270': {'nmistakes': 1},\n", + " 'id_1273': {'nmistakes': 2},\n", + " 'id_1276': {'nmistakes': 3},\n", + " 'id_1279': {'nmistakes': 3},\n", + " 'id_1282': {'nmistakes': 2},\n", + " 'id_1285': {'nmistakes': 3},\n", + " 'id_1288': {'nmistakes': 2},\n", + " 'id_1291': {'nmistakes': 3},\n", + " 'id_1294': {'nmistakes': 2},\n", + " 'id_1297': {'nmistakes': 2},\n", + " 'id_1300': {'nmistakes': 2},\n", + " 'id_1303': {'nmistakes': 3},\n", + " 'id_1306': {'nmistakes': 1},\n", + " 'id_1309': {'nmistakes': 1},\n", + " 'id_1312': {'nmistakes': 2},\n", + " 'id_1315': {'nmistakes': 3},\n", + " 'id_1318': {'nmistakes': 2},\n", + " 'id_1321': {'nmistakes': 3},\n", + " 'id_1324': {'nmistakes': 3},\n", + " 'id_1327': {'nmistakes': 2},\n", + " 'id_1330': {'nmistakes': 2},\n", + " 'id_1333': {'nmistakes': 1},\n", + " 'id_1336': {'nmistakes': 2},\n", + " 'id_1339': {'nmistakes': 3},\n", + " 'id_1342': {'nmistakes': 3},\n", + " 'id_1345': {'nmistakes': 2},\n", + " 'id_1348': {'nmistakes': 3},\n", + " 'id_1351': {'nmistakes': 3},\n", + " 'id_1354': {'nmistakes': 1},\n", + " 'id_1357': {'nmistakes': 2},\n", + " 'id_1360': {'nmistakes': 1},\n", + " 'id_1363': {'nmistakes': 3},\n", + " 'id_1366': {'nmistakes': 2},\n", + " 'id_1369': {'nmistakes': 3},\n", + " 'id_1372': {'nmistakes': 3},\n", + " 'id_1375': {'nmistakes': 2},\n", + " 'id_1378': {'nmistakes': 2},\n", + " 'id_1381': {'nmistakes': 3},\n", + " 'id_1384': {'nmistakes': 3},\n", + " 'id_1387': {'nmistakes': 2},\n", + " 'id_1390': {'nmistakes': 1},\n", + " 'id_1393': {'nmistakes': 1},\n", + " 'id_1396': {'nmistakes': 2},\n", + " 'id_1399': {'nmistakes': 2},\n", + " 'id_1402': {'nmistakes': 3},\n", + " 'id_1405': {'nmistakes': 1},\n", + " 'id_1408': {'nmistakes': 3},\n", + " 'id_1411': {'nmistakes': 3},\n", + " 'id_1414': {'nmistakes': 3},\n", + " 'id_1417': {'nmistakes': 1},\n", + " 'id_1420': {'nmistakes': 1},\n", + " 'id_1423': {'nmistakes': 1},\n", + " 'id_1426': {'nmistakes': 2},\n", + " 'id_1429': {'nmistakes': 2},\n", + " 'id_1432': {'nmistakes': 1},\n", + " 'id_1435': {'nmistakes': 2},\n", + " 'id_1438': {'nmistakes': 3},\n", + " 'id_1441': {'nmistakes': 3},\n", + " 'id_1444': {'nmistakes': 3},\n", + " 'id_1447': {'nmistakes': 3},\n", + " 'id_1450': {'nmistakes': 1},\n", + " 'id_1453': {'nmistakes': 2},\n", + " 'id_1456': {'nmistakes': 2},\n", + " 'id_1459': {'nmistakes': 1},\n", + " 'id_1462': {'nmistakes': 1},\n", + " 'id_1465': {'nmistakes': 2},\n", + " 'id_1468': {'nmistakes': 1},\n", + " 'id_1471': {'nmistakes': 1},\n", + " 'id_1474': {'nmistakes': 2},\n", + " 'id_1477': {'nmistakes': 3},\n", + " 'id_1480': {'nmistakes': 2},\n", + " 'id_1483': {'nmistakes': 3},\n", + " 'id_1486': {'nmistakes': 1},\n", + " 'id_1489': {'nmistakes': 3},\n", + " 'id_1492': {'nmistakes': 3},\n", + " 'id_1495': {'nmistakes': 1},\n", + " 'id_1498': {'nmistakes': 1},\n", + " 'id_1501': {'nmistakes': 2},\n", + " 'id_1504': {'nmistakes': 1},\n", + " 'id_1507': {'nmistakes': 3},\n", + " 'id_1510': {'nmistakes': 2},\n", + " 'id_1513': {'nmistakes': 3},\n", + " 'id_1516': {'nmistakes': 2},\n", + " 'id_1519': {'nmistakes': 3},\n", + " 'id_1522': {'nmistakes': 2},\n", + " 'id_1525': {'nmistakes': 3},\n", + " 'id_1528': {'nmistakes': 1},\n", + " 'id_1531': {'nmistakes': 2},\n", + " 'id_1534': {'nmistakes': 2},\n", + " 'id_1537': {'nmistakes': 3},\n", + " 'id_1540': {'nmistakes': 1},\n", + " 'id_1543': {'nmistakes': 2},\n", + " 'id_1546': {'nmistakes': 3},\n", + " 'id_1549': {'nmistakes': 1},\n", + " 'id_1552': {'nmistakes': 2},\n", + " 'id_1555': {'nmistakes': 1},\n", + " 'id_1558': {'nmistakes': 2},\n", + " 'id_1561': {'nmistakes': 1},\n", + " 'id_1564': {'nmistakes': 2},\n", + " 'id_1567': {'nmistakes': 2},\n", + " 'id_1570': {'nmistakes': 3},\n", + " 'id_1573': {'nmistakes': 2},\n", + " 'id_1576': {'nmistakes': 1},\n", + " 'id_1579': {'nmistakes': 1},\n", + " 'id_1582': {'nmistakes': 1},\n", + " 'id_1585': {'nmistakes': 1},\n", + " 'id_1588': {'nmistakes': 2},\n", + " 'id_1591': {'nmistakes': 3},\n", + " 'id_1594': {'nmistakes': 1},\n", + " 'id_1597': {'nmistakes': 3},\n", + " 'id_1600': {'nmistakes': 2},\n", + " 'id_1603': {'nmistakes': 1},\n", + " 'id_1606': {'nmistakes': 3},\n", + " 'id_1609': {'nmistakes': 1},\n", + " 'id_1612': {'nmistakes': 3},\n", + " 'id_1615': {'nmistakes': 2},\n", + " 'id_1618': {'nmistakes': 1},\n", + " 'id_1621': {'nmistakes': 2},\n", + " 'id_1624': {'nmistakes': 1},\n", + " 'id_1627': {'nmistakes': 1},\n", + " 'id_1630': {'nmistakes': 3},\n", + " 'id_1633': {'nmistakes': 3},\n", + " 'id_1636': {'nmistakes': 2},\n", + " 'id_1639': {'nmistakes': 2},\n", + " 'id_1642': {'nmistakes': 2},\n", + " 'id_1645': {'nmistakes': 2},\n", + " 'id_1648': {'nmistakes': 1},\n", + " 'id_1651': {'nmistakes': 3},\n", + " 'id_1654': {'nmistakes': 3},\n", + " 'id_1657': {'nmistakes': 2},\n", + " 'id_1660': {'nmistakes': 1},\n", + " 'id_1663': {'nmistakes': 3},\n", + " 'id_1666': {'nmistakes': 3},\n", + " 'id_1669': {'nmistakes': 2},\n", + " 'id_1672': {'nmistakes': 2},\n", + " 'id_1675': {'nmistakes': 2},\n", + " 'id_1678': {'nmistakes': 2},\n", + " 'id_1681': {'nmistakes': 2},\n", + " 'id_1684': {'nmistakes': 1},\n", + " 'id_1687': {'nmistakes': 2},\n", + " 'id_1690': {'nmistakes': 2},\n", + " 'id_1693': {'nmistakes': 1},\n", + " 'id_1696': {'nmistakes': 3},\n", + " 'id_1699': {'nmistakes': 3},\n", + " 'id_1702': {'nmistakes': 3},\n", + " 'id_1705': {'nmistakes': 1},\n", + " 'id_1708': {'nmistakes': 2},\n", + " 'id_1711': {'nmistakes': 1},\n", + " 'id_1714': {'nmistakes': 1},\n", + " 'id_1717': {'nmistakes': 3},\n", + " 'id_1720': {'nmistakes': 1},\n", + " 'id_1723': {'nmistakes': 2},\n", + " 'id_1726': {'nmistakes': 1},\n", + " 'id_1729': {'nmistakes': 3},\n", + " 'id_1732': {'nmistakes': 1},\n", + " 'id_1735': {'nmistakes': 2},\n", + " 'id_1738': {'nmistakes': 1},\n", + " 'id_1741': {'nmistakes': 1},\n", + " 'id_1744': {'nmistakes': 3},\n", + " 'id_1747': {'nmistakes': 1},\n", + " 'id_1750': {'nmistakes': 2},\n", + " 'id_1753': {'nmistakes': 1},\n", + " 'id_1756': {'nmistakes': 2},\n", + " 'id_1759': {'nmistakes': 2},\n", + " 'id_1762': {'nmistakes': 3},\n", + " 'id_1765': {'nmistakes': 2},\n", + " 'id_1768': {'nmistakes': 3},\n", + " 'id_1771': {'nmistakes': 1},\n", + " 'id_1774': {'nmistakes': 3},\n", + " 'id_1777': {'nmistakes': 3},\n", + " 'id_1780': {'nmistakes': 3},\n", + " 'id_1783': {'nmistakes': 2},\n", + " 'id_1786': {'nmistakes': 1},\n", + " 'id_1789': {'nmistakes': 1},\n", + " 'id_1792': {'nmistakes': 2},\n", + " 'id_1795': {'nmistakes': 3},\n", + " 'id_1798': {'nmistakes': 2},\n", + " 'id_1801': {'nmistakes': 1},\n", + " 'id_1804': {'nmistakes': 3},\n", + " 'id_1807': {'nmistakes': 3},\n", + " 'id_1810': {'nmistakes': 3},\n", + " 'id_1813': {'nmistakes': 2},\n", + " 'id_1816': {'nmistakes': 1},\n", + " 'id_1819': {'nmistakes': 2},\n", + " 'id_1822': {'nmistakes': 1},\n", + " 'id_1825': {'nmistakes': 1},\n", + " 'id_1828': {'nmistakes': 1},\n", + " 'id_1831': {'nmistakes': 3},\n", + " 'id_1834': {'nmistakes': 2},\n", + " 'id_1837': {'nmistakes': 3},\n", + " 'id_1840': {'nmistakes': 1},\n", + " 'id_1843': {'nmistakes': 1},\n", + " 'id_1846': {'nmistakes': 3},\n", + " 'id_1849': {'nmistakes': 2},\n", + " 'id_1852': {'nmistakes': 2},\n", + " 'id_1855': {'nmistakes': 1},\n", + " 'id_1858': {'nmistakes': 1},\n", + " 'id_1861': {'nmistakes': 3},\n", + " 'id_1864': {'nmistakes': 3},\n", + " 'id_1867': {'nmistakes': 2},\n", + " 'id_1870': {'nmistakes': 3},\n", + " 'id_1873': {'nmistakes': 2},\n", + " 'id_1876': {'nmistakes': 2},\n", + " 'id_1879': {'nmistakes': 3},\n", + " 'id_1882': {'nmistakes': 2},\n", + " 'id_1885': {'nmistakes': 3},\n", + " 'id_1888': {'nmistakes': 3},\n", + " 'id_1891': {'nmistakes': 1},\n", + " 'id_1894': {'nmistakes': 2},\n", + " 'id_1897': {'nmistakes': 1},\n", + " 'id_1900': {'nmistakes': 1},\n", + " 'id_1903': {'nmistakes': 1},\n", + " 'id_1906': {'nmistakes': 3},\n", + " 'id_1909': {'nmistakes': 3},\n", + " 'id_1912': {'nmistakes': 1},\n", + " 'id_1915': {'nmistakes': 3},\n", + " 'id_1918': {'nmistakes': 2},\n", + " 'id_1921': {'nmistakes': 3},\n", + " 'id_1924': {'nmistakes': 3},\n", + " 'id_1927': {'nmistakes': 2},\n", + " 'id_1930': {'nmistakes': 3},\n", + " 'id_1933': {'nmistakes': 1},\n", + " 'id_1936': {'nmistakes': 3},\n", + " 'id_1939': {'nmistakes': 1},\n", + " 'id_1942': {'nmistakes': 2},\n", + " 'id_1945': {'nmistakes': 2},\n", + " 'id_1948': {'nmistakes': 3},\n", + " 'id_1951': {'nmistakes': 2},\n", + " 'id_1954': {'nmistakes': 1},\n", + " 'id_1957': {'nmistakes': 2},\n", + " 'id_1960': {'nmistakes': 1},\n", + " 'id_1963': {'nmistakes': 1},\n", + " 'id_1966': {'nmistakes': 1},\n", + " 'id_1969': {'nmistakes': 3},\n", + " 'id_1972': {'nmistakes': 3},\n", + " 'id_1975': {'nmistakes': 1},\n", + " 'id_1978': {'nmistakes': 3},\n", + " 'id_1981': {'nmistakes': 1},\n", + " 'id_1984': {'nmistakes': 1},\n", + " 'id_1987': {'nmistakes': 3},\n", + " 'id_1990': {'nmistakes': 3},\n", + " 'id_1993': {'nmistakes': 1},\n", + " 'id_1996': {'nmistakes': 1},\n", + " 'id_1999': {'nmistakes': 2},\n", + " 'id_2002': {'nmistakes': 1},\n", + " 'id_2005': {'nmistakes': 2},\n", + " 'id_2008': {'nmistakes': 1},\n", + " 'id_2011': {'nmistakes': 2},\n", + " 'id_2014': {'nmistakes': 1},\n", + " 'id_2017': {'nmistakes': 1},\n", + " 'id_2020': {'nmistakes': 1},\n", + " 'id_2023': {'nmistakes': 2},\n", + " 'id_2026': {'nmistakes': 1},\n", + " 'id_2029': {'nmistakes': 2},\n", + " 'id_2032': {'nmistakes': 1},\n", + " 'id_2035': {'nmistakes': 1},\n", + " 'id_2038': {'nmistakes': 3},\n", + " 'id_2041': {'nmistakes': 1},\n", + " 'id_2044': {'nmistakes': 2},\n", + " 'id_2047': {'nmistakes': 3},\n", + " 'id_2050': {'nmistakes': 2},\n", + " 'id_2053': {'nmistakes': 1},\n", + " 'id_2056': {'nmistakes': 1},\n", + " 'id_2059': {'nmistakes': 3},\n", + " 'id_2062': {'nmistakes': 1},\n", + " 'id_2065': {'nmistakes': 2},\n", + " 'id_2068': {'nmistakes': 3},\n", + " 'id_2071': {'nmistakes': 2},\n", + " 'id_2074': {'nmistakes': 1},\n", + " 'id_2077': {'nmistakes': 1},\n", + " 'id_2080': {'nmistakes': 1},\n", + " 'id_2083': {'nmistakes': 3},\n", + " 'id_2086': {'nmistakes': 1},\n", + " 'id_2089': {'nmistakes': 1},\n", + " 'id_2092': {'nmistakes': 2},\n", + " 'id_2095': {'nmistakes': 3},\n", + " 'id_2098': {'nmistakes': 2},\n", + " 'id_2101': {'nmistakes': 1},\n", + " 'id_2104': {'nmistakes': 1},\n", + " 'id_2107': {'nmistakes': 2},\n", + " 'id_2110': {'nmistakes': 2},\n", + " 'id_2113': {'nmistakes': 2},\n", + " 'id_2116': {'nmistakes': 3},\n", + " 'id_2119': {'nmistakes': 1},\n", + " 'id_2122': {'nmistakes': 1},\n", + " 'id_2125': {'nmistakes': 2},\n", + " 'id_2128': {'nmistakes': 3},\n", + " 'id_2131': {'nmistakes': 1},\n", + " 'id_2134': {'nmistakes': 3},\n", + " 'id_2137': {'nmistakes': 2},\n", + " 'id_2140': {'nmistakes': 2},\n", + " 'id_2143': {'nmistakes': 3},\n", + " 'id_2146': {'nmistakes': 1},\n", + " 'id_2149': {'nmistakes': 1},\n", + " 'id_2152': {'nmistakes': 3},\n", + " 'id_2155': {'nmistakes': 3},\n", + " 'id_2158': {'nmistakes': 2},\n", + " 'id_2161': {'nmistakes': 2},\n", + " 'id_2164': {'nmistakes': 1},\n", + " 'id_2167': {'nmistakes': 2},\n", + " 'id_2170': {'nmistakes': 2},\n", + " 'id_2173': {'nmistakes': 3},\n", + " 'id_2176': {'nmistakes': 3},\n", + " 'id_2179': {'nmistakes': 2},\n", + " 'id_2182': {'nmistakes': 1},\n", + " 'id_2185': {'nmistakes': 3},\n", + " 'id_2188': {'nmistakes': 2},\n", + " 'id_2191': {'nmistakes': 3},\n", + " 'id_2194': {'nmistakes': 2},\n", + " 'id_2197': {'nmistakes': 2},\n", + " 'id_2200': {'nmistakes': 2},\n", + " 'id_2203': {'nmistakes': 2},\n", + " 'id_2206': {'nmistakes': 2},\n", + " 'id_2209': {'nmistakes': 3},\n", + " 'id_2212': {'nmistakes': 1},\n", + " 'id_2215': {'nmistakes': 2},\n", + " 'id_2218': {'nmistakes': 1},\n", + " 'id_2221': {'nmistakes': 1},\n", + " 'id_2224': {'nmistakes': 2},\n", + " 'id_2227': {'nmistakes': 2},\n", + " 'id_2230': {'nmistakes': 2},\n", + " 'id_2233': {'nmistakes': 2},\n", + " 'id_2236': {'nmistakes': 3},\n", + " 'id_2239': {'nmistakes': 2},\n", + " 'id_2242': {'nmistakes': 2},\n", + " 'id_2245': {'nmistakes': 3},\n", + " 'id_2248': {'nmistakes': 2},\n", + " 'id_2251': {'nmistakes': 3},\n", + " 'id_2254': {'nmistakes': 1},\n", + " 'id_2257': {'nmistakes': 2},\n", + " 'id_2260': {'nmistakes': 1},\n", + " 'id_2263': {'nmistakes': 2},\n", + " 'id_2266': {'nmistakes': 3},\n", + " 'id_2269': {'nmistakes': 3},\n", + " 'id_2272': {'nmistakes': 3},\n", + " 'id_2275': {'nmistakes': 1},\n", + " 'id_2278': {'nmistakes': 3},\n", + " 'id_2281': {'nmistakes': 2},\n", + " 'id_2284': {'nmistakes': 1},\n", + " 'id_2287': {'nmistakes': 2},\n", + " 'id_2290': {'nmistakes': 1},\n", + " 'id_2293': {'nmistakes': 3},\n", + " 'id_2296': {'nmistakes': 3},\n", + " 'id_2299': {'nmistakes': 2},\n", + " 'id_2302': {'nmistakes': 2},\n", + " 'id_2305': {'nmistakes': 1},\n", + " 'id_2308': {'nmistakes': 3},\n", + " 'id_2311': {'nmistakes': 2},\n", + " 'id_2314': {'nmistakes': 2},\n", + " 'id_2317': {'nmistakes': 1},\n", + " 'id_2320': {'nmistakes': 1},\n", + " 'id_2323': {'nmistakes': 3},\n", + " 'id_2326': {'nmistakes': 1},\n", + " 'id_2329': {'nmistakes': 1},\n", + " 'id_2332': {'nmistakes': 3},\n", + " 'id_2335': {'nmistakes': 2},\n", + " 'id_2338': {'nmistakes': 1},\n", + " 'id_2341': {'nmistakes': 3},\n", + " 'id_2344': {'nmistakes': 1},\n", + " 'id_2347': {'nmistakes': 1},\n", + " 'id_2350': {'nmistakes': 1},\n", + " 'id_2353': {'nmistakes': 1},\n", + " 'id_2356': {'nmistakes': 1},\n", + " 'id_2359': {'nmistakes': 1},\n", + " 'id_2362': {'nmistakes': 3},\n", + " 'id_2365': {'nmistakes': 3},\n", + " 'id_2368': {'nmistakes': 3},\n", + " 'id_2371': {'nmistakes': 2},\n", + " 'id_2374': {'nmistakes': 3},\n", + " 'id_2377': {'nmistakes': 1},\n", + " 'id_2380': {'nmistakes': 3},\n", + " 'id_2383': {'nmistakes': 2},\n", + " 'id_2386': {'nmistakes': 2},\n", + " 'id_2389': {'nmistakes': 3},\n", + " 'id_2392': {'nmistakes': 3},\n", + " 'id_2395': {'nmistakes': 2},\n", + " 'id_2398': {'nmistakes': 3},\n", + " 'id_2401': {'nmistakes': 2},\n", + " 'id_2404': {'nmistakes': 1},\n", + " 'id_2407': {'nmistakes': 1},\n", + " 'id_2410': {'nmistakes': 1},\n", + " 'id_2413': {'nmistakes': 2},\n", + " 'id_2416': {'nmistakes': 3},\n", + " 'id_2419': {'nmistakes': 3},\n", + " 'id_2422': {'nmistakes': 1},\n", + " 'id_2425': {'nmistakes': 1},\n", + " 'id_2428': {'nmistakes': 2},\n", + " 'id_2431': {'nmistakes': 2},\n", + " 'id_2434': {'nmistakes': 2},\n", + " 'id_2437': {'nmistakes': 2},\n", + " 'id_2440': {'nmistakes': 1},\n", + " 'id_2443': {'nmistakes': 3},\n", + " 'id_2446': {'nmistakes': 2},\n", + " 'id_2449': {'nmistakes': 1},\n", + " 'id_2452': {'nmistakes': 3},\n", + " 'id_2455': {'nmistakes': 2},\n", + " 'id_2458': {'nmistakes': 3},\n", + " 'id_2461': {'nmistakes': 1},\n", + " 'id_2464': {'nmistakes': 1},\n", + " 'id_2467': {'nmistakes': 2},\n", + " 'id_2470': {'nmistakes': 1},\n", + " 'id_2473': {'nmistakes': 3},\n", + " 'id_2476': {'nmistakes': 2},\n", + " 'id_2479': {'nmistakes': 3},\n", + " 'id_2482': {'nmistakes': 3},\n", + " 'id_2485': {'nmistakes': 3},\n", + " 'id_2488': {'nmistakes': 3},\n", + " 'id_2491': {'nmistakes': 1},\n", + " 'id_2494': {'nmistakes': 2},\n", + " 'id_2497': {'nmistakes': 2},\n", + " 'id_2500': {'nmistakes': 2},\n", + " 'id_2503': {'nmistakes': 1},\n", + " 'id_2506': {'nmistakes': 3},\n", + " 'id_2509': {'nmistakes': 2},\n", + " 'id_2512': {'nmistakes': 1},\n", + " 'id_2515': {'nmistakes': 1},\n", + " 'id_2518': {'nmistakes': 3},\n", + " 'id_2521': {'nmistakes': 3},\n", + " 'id_2524': {'nmistakes': 2},\n", + " 'id_2527': {'nmistakes': 2},\n", + " 'id_2530': {'nmistakes': 3},\n", + " 'id_2533': {'nmistakes': 3},\n", + " 'id_2536': {'nmistakes': 2},\n", + " 'id_2539': {'nmistakes': 3},\n", + " 'id_2542': {'nmistakes': 3},\n", + " 'id_2545': {'nmistakes': 3},\n", + " 'id_2548': {'nmistakes': 1},\n", + " 'id_2551': {'nmistakes': 1},\n", + " 'id_2554': {'nmistakes': 1},\n", + " 'id_2557': {'nmistakes': 2},\n", + " 'id_2560': {'nmistakes': 1},\n", + " 'id_2563': {'nmistakes': 1},\n", + " 'id_2566': {'nmistakes': 2},\n", + " 'id_2569': {'nmistakes': 1},\n", + " 'id_2572': {'nmistakes': 2},\n", + " 'id_2575': {'nmistakes': 2},\n", + " 'id_2578': {'nmistakes': 3},\n", + " 'id_2581': {'nmistakes': 2},\n", + " 'id_2584': {'nmistakes': 1},\n", + " 'id_2587': {'nmistakes': 2},\n", + " 'id_2590': {'nmistakes': 2},\n", + " 'id_2593': {'nmistakes': 3},\n", + " 'id_2596': {'nmistakes': 3},\n", + " 'id_2599': {'nmistakes': 3},\n", + " 'id_2602': {'nmistakes': 2},\n", + " 'id_2605': {'nmistakes': 3},\n", + " 'id_2608': {'nmistakes': 2},\n", + " 'id_2611': {'nmistakes': 1},\n", + " 'id_2614': {'nmistakes': 2},\n", + " 'id_2617': {'nmistakes': 2},\n", + " 'id_2620': {'nmistakes': 2},\n", + " 'id_2623': {'nmistakes': 3},\n", + " 'id_2626': {'nmistakes': 2},\n", + " 'id_2629': {'nmistakes': 3},\n", + " 'id_2632': {'nmistakes': 3},\n", + " 'id_2635': {'nmistakes': 2},\n", + " 'id_2638': {'nmistakes': 1},\n", + " 'id_2641': {'nmistakes': 3},\n", + " 'id_2644': {'nmistakes': 2},\n", + " 'id_2647': {'nmistakes': 3},\n", + " 'id_2650': {'nmistakes': 1},\n", + " 'id_2653': {'nmistakes': 3},\n", + " 'id_2656': {'nmistakes': 1},\n", + " 'id_2659': {'nmistakes': 1},\n", + " 'id_2662': {'nmistakes': 3},\n", + " 'id_2665': {'nmistakes': 1},\n", + " 'id_2668': {'nmistakes': 2},\n", + " 'id_2671': {'nmistakes': 2},\n", + " 'id_2674': {'nmistakes': 2},\n", + " 'id_2677': {'nmistakes': 1},\n", + " 'id_2680': {'nmistakes': 2},\n", + " 'id_2683': {'nmistakes': 2},\n", + " 'id_2686': {'nmistakes': 1},\n", + " 'id_2689': {'nmistakes': 1},\n", + " 'id_2692': {'nmistakes': 3},\n", + " 'id_2695': {'nmistakes': 3},\n", + " 'id_2698': {'nmistakes': 2},\n", + " 'id_2701': {'nmistakes': 3},\n", + " 'id_2704': {'nmistakes': 1},\n", + " 'id_2707': {'nmistakes': 3},\n", + " 'id_2710': {'nmistakes': 2},\n", + " 'id_2713': {'nmistakes': 3},\n", + " 'id_2716': {'nmistakes': 1},\n", + " 'id_2719': {'nmistakes': 2},\n", + " 'id_2722': {'nmistakes': 2},\n", + " 'id_2725': {'nmistakes': 3},\n", + " 'id_2728': {'nmistakes': 1},\n", + " 'id_2731': {'nmistakes': 3},\n", + " 'id_2734': {'nmistakes': 1},\n", + " 'id_2737': {'nmistakes': 1},\n", + " 'id_2740': {'nmistakes': 3},\n", + " 'id_2743': {'nmistakes': 1},\n", + " 'id_2746': {'nmistakes': 2},\n", + " 'id_2749': {'nmistakes': 2},\n", + " 'id_2752': {'nmistakes': 2},\n", + " 'id_2755': {'nmistakes': 2},\n", + " 'id_2758': {'nmistakes': 1},\n", + " 'id_2761': {'nmistakes': 3},\n", + " 'id_2764': {'nmistakes': 1},\n", + " 'id_2767': {'nmistakes': 1},\n", + " 'id_2770': {'nmistakes': 2},\n", + " 'id_2773': {'nmistakes': 2},\n", + " 'id_2776': {'nmistakes': 1},\n", + " 'id_2779': {'nmistakes': 1},\n", + " 'id_2782': {'nmistakes': 2},\n", + " 'id_2785': {'nmistakes': 3},\n", + " 'id_2788': {'nmistakes': 3},\n", + " 'id_2791': {'nmistakes': 1},\n", + " 'id_2794': {'nmistakes': 1},\n", + " 'id_2797': {'nmistakes': 2},\n", + " 'id_2800': {'nmistakes': 1},\n", + " 'id_2803': {'nmistakes': 3},\n", + " 'id_2806': {'nmistakes': 1},\n", + " 'id_2809': {'nmistakes': 3},\n", + " 'id_2812': {'nmistakes': 1},\n", + " 'id_2815': {'nmistakes': 1},\n", + " 'id_2818': {'nmistakes': 2},\n", + " 'id_2821': {'nmistakes': 1},\n", + " 'id_2824': {'nmistakes': 1},\n", + " 'id_2827': {'nmistakes': 1},\n", + " 'id_2830': {'nmistakes': 1},\n", + " 'id_2833': {'nmistakes': 2},\n", + " 'id_2836': {'nmistakes': 2},\n", + " 'id_2839': {'nmistakes': 2},\n", + " 'id_2842': {'nmistakes': 3},\n", + " 'id_2845': {'nmistakes': 2},\n", + " 'id_2848': {'nmistakes': 1},\n", + " 'id_2851': {'nmistakes': 3},\n", + " 'id_2854': {'nmistakes': 3},\n", + " 'id_2857': {'nmistakes': 3},\n", + " 'id_2860': {'nmistakes': 2},\n", + " 'id_2863': {'nmistakes': 3},\n", + " 'id_2866': {'nmistakes': 3},\n", + " 'id_2869': {'nmistakes': 3},\n", + " 'id_2872': {'nmistakes': 1},\n", + " 'id_2875': {'nmistakes': 3},\n", + " 'id_2878': {'nmistakes': 1},\n", + " 'id_2881': {'nmistakes': 3},\n", + " 'id_2884': {'nmistakes': 3},\n", + " 'id_2887': {'nmistakes': 3},\n", + " 'id_2890': {'nmistakes': 2},\n", + " 'id_2893': {'nmistakes': 2},\n", + " 'id_2896': {'nmistakes': 1},\n", + " 'id_2899': {'nmistakes': 2},\n", + " 'id_2902': {'nmistakes': 2},\n", + " 'id_2905': {'nmistakes': 1},\n", + " 'id_2908': {'nmistakes': 1},\n", + " 'id_2911': {'nmistakes': 3},\n", + " 'id_2914': {'nmistakes': 2},\n", + " 'id_2917': {'nmistakes': 1},\n", + " 'id_2920': {'nmistakes': 2},\n", + " 'id_2923': {'nmistakes': 3},\n", + " 'id_2926': {'nmistakes': 2},\n", + " 'id_2929': {'nmistakes': 3},\n", + " 'id_2932': {'nmistakes': 2},\n", + " 'id_2935': {'nmistakes': 3},\n", + " 'id_2938': {'nmistakes': 3},\n", + " 'id_2941': {'nmistakes': 1},\n", + " 'id_2944': {'nmistakes': 1},\n", + " 'id_2947': {'nmistakes': 1},\n", + " 'id_2950': {'nmistakes': 2},\n", + " 'id_2953': {'nmistakes': 1},\n", + " 'id_2956': {'nmistakes': 2},\n", + " 'id_2959': {'nmistakes': 1},\n", + " 'id_2962': {'nmistakes': 3},\n", + " 'id_2965': {'nmistakes': 1},\n", + " 'id_2968': {'nmistakes': 2},\n", + " 'id_2971': {'nmistakes': 1},\n", + " 'id_2974': {'nmistakes': 3},\n", + " 'id_2977': {'nmistakes': 2},\n", + " 'id_2980': {'nmistakes': 3},\n", + " 'id_2983': {'nmistakes': 2},\n", + " 'id_2986': {'nmistakes': 3},\n", + " 'id_2989': {'nmistakes': 2},\n", + " 'id_2992': {'nmistakes': 1},\n", + " 'id_2995': {'nmistakes': 1},\n", + " 'id_2998': {'nmistakes': 2},\n", + " ...}" + ] + }, + "execution_count": 18, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "scores = {}\n", + "\n", + "for model_ in folder2model.values():\n", + " scores.update(\n", + " dict(zip(df_scores[model_].iloc[x_indices], df_scores[model_].iloc[y_indices]))\n", + " )\n", + "\n", + "for k,v in scores.items():\n", + " scores[k] = {'nmistakes': v}\n", + "\n", + "scores" + ] + }, + { + "cell_type": "code", + "execution_count": 19, + "id": "48e415a6-8a43-47d9-95e3-c4deb7dfe604", + "metadata": { + "scrolled": true, + "tags": [] + }, + "outputs": [ + { + "data": { + "text/plain": [ + "{'id_1': {'pref_rank': 2},\n", + " 'id_4': {'pref_rank': 3},\n", + " 'id_7': {'pref_rank': 3},\n", + " 'id_10': {'pref_rank': 3},\n", + " 'id_13': {'pref_rank': 2},\n", + " 'id_16': {'pref_rank': 3},\n", + " 'id_19': {'pref_rank': 1},\n", + " 'id_22': {'pref_rank': 2},\n", + " 'id_25': {'pref_rank': 3},\n", + " 'id_28': {'pref_rank': 2},\n", + " 'id_31': {'pref_rank': 3},\n", + " 'id_34': {'pref_rank': 1},\n", + " 'id_37': {'pref_rank': 2},\n", + " 'id_40': {'pref_rank': 2},\n", + " 'id_43': {'pref_rank': 3},\n", + " 'id_46': {'pref_rank': 3},\n", + " 'id_49': {'pref_rank': 1},\n", + " 'id_52': {'pref_rank': 1},\n", + " 'id_55': {'pref_rank': 2},\n", + " 'id_58': {'pref_rank': 2},\n", + " 'id_61': {'pref_rank': 2},\n", + " 'id_64': {'pref_rank': 1},\n", + " 'id_67': {'pref_rank': 3},\n", + " 'id_70': {'pref_rank': 3},\n", + " 'id_73': {'pref_rank': 3},\n", + " 'id_76': {'pref_rank': 1},\n", + " 'id_79': {'pref_rank': 2},\n", + " 'id_82': {'pref_rank': 1},\n", + " 'id_85': {'pref_rank': 2},\n", + " 'id_88': {'pref_rank': 2},\n", + " 'id_91': {'pref_rank': 2},\n", + " 'id_94': {'pref_rank': 1},\n", + " 'id_97': {'pref_rank': 1},\n", + " 'id_100': {'pref_rank': 2},\n", + " 'id_103': {'pref_rank': 2},\n", + " 'id_106': {'pref_rank': 3},\n", + " 'id_109': {'pref_rank': 2},\n", + " 'id_112': {'pref_rank': 2},\n", + " 'id_115': {'pref_rank': 1},\n", + " 'id_118': {'pref_rank': 1},\n", + " 'id_121': {'pref_rank': 1},\n", + " 'id_124': {'pref_rank': 1},\n", + " 'id_127': {'pref_rank': 2},\n", + " 'id_130': {'pref_rank': 3},\n", + " 'id_133': {'pref_rank': 1},\n", + " 'id_136': {'pref_rank': 1},\n", + " 'id_139': {'pref_rank': 1},\n", + " 'id_142': {'pref_rank': 1},\n", + " 'id_145': {'pref_rank': 3},\n", + " 'id_148': {'pref_rank': 3},\n", + " 'id_151': {'pref_rank': 3},\n", + " 'id_154': {'pref_rank': 2},\n", + " 'id_157': {'pref_rank': 1},\n", + " 'id_160': {'pref_rank': 2},\n", + " 'id_163': {'pref_rank': 3},\n", + " 'id_166': {'pref_rank': 3},\n", + " 'id_169': {'pref_rank': 1},\n", + " 'id_172': {'pref_rank': 1},\n", + " 'id_175': {'pref_rank': 1},\n", + " 'id_178': {'pref_rank': 2},\n", + " 'id_181': {'pref_rank': 3},\n", + " 'id_184': {'pref_rank': 2},\n", + " 'id_187': {'pref_rank': 1},\n", + " 'id_190': {'pref_rank': 2},\n", + " 'id_193': {'pref_rank': 1},\n", + " 'id_196': {'pref_rank': 1},\n", + " 'id_199': {'pref_rank': 3},\n", + " 'id_202': {'pref_rank': 1},\n", + " 'id_205': {'pref_rank': 2},\n", + " 'id_208': {'pref_rank': 3},\n", + " 'id_211': {'pref_rank': 2},\n", + " 'id_214': {'pref_rank': 1},\n", + " 'id_217': {'pref_rank': 3},\n", + " 'id_220': {'pref_rank': 1},\n", + " 'id_223': {'pref_rank': 2},\n", + " 'id_226': {'pref_rank': 1},\n", + " 'id_229': {'pref_rank': 3},\n", + " 'id_232': {'pref_rank': 1},\n", + " 'id_235': {'pref_rank': 1},\n", + " 'id_238': {'pref_rank': 3},\n", + " 'id_241': {'pref_rank': 3},\n", + " 'id_244': {'pref_rank': 2},\n", + " 'id_247': {'pref_rank': 1},\n", + " 'id_250': {'pref_rank': 2},\n", + " 'id_253': {'pref_rank': 1},\n", + " 'id_256': {'pref_rank': 1},\n", + " 'id_259': {'pref_rank': 1},\n", + " 'id_262': {'pref_rank': 1},\n", + " 'id_265': {'pref_rank': 2},\n", + " 'id_268': {'pref_rank': 1},\n", + " 'id_271': {'pref_rank': 2},\n", + " 'id_274': {'pref_rank': 1},\n", + " 'id_277': {'pref_rank': 1},\n", + " 'id_280': {'pref_rank': 3},\n", + " 'id_283': {'pref_rank': 3},\n", + " 'id_286': {'pref_rank': 2},\n", + " 'id_289': {'pref_rank': 1},\n", + " 'id_292': {'pref_rank': 2},\n", + " 'id_295': {'pref_rank': 2},\n", + " 'id_298': {'pref_rank': 1},\n", + " 'id_301': {'pref_rank': 2},\n", + " 'id_304': {'pref_rank': 3},\n", + " 'id_307': {'pref_rank': 1},\n", + " 'id_310': {'pref_rank': 3},\n", + " 'id_313': {'pref_rank': 3},\n", + " 'id_316': {'pref_rank': 1},\n", + " 'id_319': {'pref_rank': 3},\n", + " 'id_322': {'pref_rank': 3},\n", + " 'id_325': {'pref_rank': 3},\n", + " 'id_328': {'pref_rank': 1},\n", + " 'id_331': {'pref_rank': 1},\n", + " 'id_334': {'pref_rank': 3},\n", + " 'id_337': {'pref_rank': 2},\n", + " 'id_340': {'pref_rank': 1},\n", + " 'id_343': {'pref_rank': 1},\n", + " 'id_346': {'pref_rank': 3},\n", + " 'id_349': {'pref_rank': 2},\n", + " 'id_352': {'pref_rank': 1},\n", + " 'id_355': {'pref_rank': 2},\n", + " 'id_358': {'pref_rank': 3},\n", + " 'id_361': {'pref_rank': 3},\n", + " 'id_364': {'pref_rank': 3},\n", + " 'id_367': {'pref_rank': 2},\n", + " 'id_370': {'pref_rank': 3},\n", + " 'id_373': {'pref_rank': 3},\n", + " 'id_376': {'pref_rank': 3},\n", + " 'id_379': {'pref_rank': 3},\n", + " 'id_382': {'pref_rank': 1},\n", + " 'id_385': {'pref_rank': 1},\n", + " 'id_388': {'pref_rank': 1},\n", + " 'id_391': {'pref_rank': 2},\n", + " 'id_394': {'pref_rank': 2},\n", + " 'id_397': {'pref_rank': 1},\n", + " 'id_400': {'pref_rank': 1},\n", + " 'id_403': {'pref_rank': 2},\n", + " 'id_406': {'pref_rank': 1},\n", + " 'id_409': {'pref_rank': 3},\n", + " 'id_412': {'pref_rank': 2},\n", + " 'id_415': {'pref_rank': 2},\n", + " 'id_418': {'pref_rank': 3},\n", + " 'id_421': {'pref_rank': 3},\n", + " 'id_424': {'pref_rank': 1},\n", + " 'id_427': {'pref_rank': 2},\n", + " 'id_430': {'pref_rank': 2},\n", + " 'id_433': {'pref_rank': 3},\n", + " 'id_436': {'pref_rank': 3},\n", + " 'id_439': {'pref_rank': 2},\n", + " 'id_442': {'pref_rank': 1},\n", + " 'id_445': {'pref_rank': 3},\n", + " 'id_448': {'pref_rank': 2},\n", + " 'id_451': {'pref_rank': 1},\n", + " 'id_454': {'pref_rank': 3},\n", + " 'id_457': {'pref_rank': 3},\n", + " 'id_460': {'pref_rank': 3},\n", + " 'id_463': {'pref_rank': 1},\n", + " 'id_466': {'pref_rank': 1},\n", + " 'id_469': {'pref_rank': 2},\n", + " 'id_472': {'pref_rank': 2},\n", + " 'id_475': {'pref_rank': 3},\n", + " 'id_478': {'pref_rank': 3},\n", + " 'id_481': {'pref_rank': 2},\n", + " 'id_484': {'pref_rank': 3},\n", + " 'id_487': {'pref_rank': 1},\n", + " 'id_490': {'pref_rank': 2},\n", + " 'id_493': {'pref_rank': 3},\n", + " 'id_496': {'pref_rank': 1},\n", + " 'id_499': {'pref_rank': 1},\n", + " 'id_502': {'pref_rank': 2},\n", + " 'id_505': {'pref_rank': 3},\n", + " 'id_508': {'pref_rank': 3},\n", + " 'id_511': {'pref_rank': 1},\n", + " 'id_514': {'pref_rank': 1},\n", + " 'id_517': {'pref_rank': 3},\n", + " 'id_520': {'pref_rank': 3},\n", + " 'id_523': {'pref_rank': 3},\n", + " 'id_526': {'pref_rank': 1},\n", + " 'id_529': {'pref_rank': 3},\n", + " 'id_532': {'pref_rank': 2},\n", + " 'id_535': {'pref_rank': 1},\n", + " 'id_538': {'pref_rank': 2},\n", + " 'id_541': {'pref_rank': 3},\n", + " 'id_544': {'pref_rank': 3},\n", + " 'id_547': {'pref_rank': 3},\n", + " 'id_550': {'pref_rank': 1},\n", + " 'id_553': {'pref_rank': 3},\n", + " 'id_556': {'pref_rank': 2},\n", + " 'id_559': {'pref_rank': 1},\n", + " 'id_562': {'pref_rank': 2},\n", + " 'id_565': {'pref_rank': 3},\n", + " 'id_568': {'pref_rank': 1},\n", + " 'id_571': {'pref_rank': 2},\n", + " 'id_574': {'pref_rank': 2},\n", + " 'id_577': {'pref_rank': 3},\n", + " 'id_580': {'pref_rank': 2},\n", + " 'id_583': {'pref_rank': 3},\n", + " 'id_586': {'pref_rank': 3},\n", + " 'id_589': {'pref_rank': 3},\n", + " 'id_592': {'pref_rank': 3},\n", + " 'id_595': {'pref_rank': 3},\n", + " 'id_598': {'pref_rank': 2},\n", + " 'id_601': {'pref_rank': 1},\n", + " 'id_604': {'pref_rank': 1},\n", + " 'id_607': {'pref_rank': 2},\n", + " 'id_610': {'pref_rank': 1},\n", + " 'id_613': {'pref_rank': 3},\n", + " 'id_616': {'pref_rank': 3},\n", + " 'id_619': {'pref_rank': 1},\n", + " 'id_622': {'pref_rank': 1},\n", + " 'id_625': {'pref_rank': 1},\n", + " 'id_628': {'pref_rank': 1},\n", + " 'id_631': {'pref_rank': 2},\n", + " 'id_634': {'pref_rank': 1},\n", + " 'id_637': {'pref_rank': 3},\n", + " 'id_640': {'pref_rank': 1},\n", + " 'id_643': {'pref_rank': 3},\n", + " 'id_646': {'pref_rank': 2},\n", + " 'id_649': {'pref_rank': 3},\n", + " 'id_652': {'pref_rank': 3},\n", + " 'id_655': {'pref_rank': 3},\n", + " 'id_658': {'pref_rank': 3},\n", + " 'id_661': {'pref_rank': 3},\n", + " 'id_664': {'pref_rank': 1},\n", + " 'id_667': {'pref_rank': 1},\n", + " 'id_670': {'pref_rank': 1},\n", + " 'id_673': {'pref_rank': 2},\n", + " 'id_676': {'pref_rank': 2},\n", + " 'id_679': {'pref_rank': 1},\n", + " 'id_682': {'pref_rank': 1},\n", + " 'id_685': {'pref_rank': 3},\n", + " 'id_688': {'pref_rank': 3},\n", + " 'id_691': {'pref_rank': 1},\n", + " 'id_694': {'pref_rank': 3},\n", + " 'id_697': {'pref_rank': 2},\n", + " 'id_700': {'pref_rank': 1},\n", + " 'id_703': {'pref_rank': 1},\n", + " 'id_706': {'pref_rank': 2},\n", + " 'id_709': {'pref_rank': 1},\n", + " 'id_712': {'pref_rank': 1},\n", + " 'id_715': {'pref_rank': 2},\n", + " 'id_718': {'pref_rank': 1},\n", + " 'id_721': {'pref_rank': 3},\n", + " 'id_724': {'pref_rank': 3},\n", + " 'id_727': {'pref_rank': 2},\n", + " 'id_730': {'pref_rank': 3},\n", + " 'id_733': {'pref_rank': 2},\n", + " 'id_736': {'pref_rank': 1},\n", + " 'id_739': {'pref_rank': 3},\n", + " 'id_742': {'pref_rank': 2},\n", + " 'id_745': {'pref_rank': 1},\n", + " 'id_748': {'pref_rank': 2},\n", + " 'id_751': {'pref_rank': 1},\n", + " 'id_754': {'pref_rank': 3},\n", + " 'id_757': {'pref_rank': 2},\n", + " 'id_760': {'pref_rank': 3},\n", + " 'id_763': {'pref_rank': 3},\n", + " 'id_766': {'pref_rank': 2},\n", + " 'id_769': {'pref_rank': 3},\n", + " 'id_772': {'pref_rank': 3},\n", + " 'id_775': {'pref_rank': 3},\n", + " 'id_778': {'pref_rank': 3},\n", + " 'id_781': {'pref_rank': 3},\n", + " 'id_784': {'pref_rank': 3},\n", + " 'id_787': {'pref_rank': 1},\n", + " 'id_790': {'pref_rank': 1},\n", + " 'id_793': {'pref_rank': 2},\n", + " 'id_796': {'pref_rank': 1},\n", + " 'id_799': {'pref_rank': 3},\n", + " 'id_802': {'pref_rank': 3},\n", + " 'id_805': {'pref_rank': 1},\n", + " 'id_808': {'pref_rank': 3},\n", + " 'id_811': {'pref_rank': 1},\n", + " 'id_814': {'pref_rank': 1},\n", + " 'id_817': {'pref_rank': 1},\n", + " 'id_820': {'pref_rank': 1},\n", + " 'id_823': {'pref_rank': 2},\n", + " 'id_826': {'pref_rank': 3},\n", + " 'id_829': {'pref_rank': 2},\n", + " 'id_832': {'pref_rank': 3},\n", + " 'id_835': {'pref_rank': 2},\n", + " 'id_838': {'pref_rank': 1},\n", + " 'id_841': {'pref_rank': 2},\n", + " 'id_844': {'pref_rank': 1},\n", + " 'id_847': {'pref_rank': 1},\n", + " 'id_850': {'pref_rank': 2},\n", + " 'id_853': {'pref_rank': 3},\n", + " 'id_856': {'pref_rank': 3},\n", + " 'id_859': {'pref_rank': 2},\n", + " 'id_862': {'pref_rank': 3},\n", + " 'id_865': {'pref_rank': 3},\n", + " 'id_868': {'pref_rank': 3},\n", + " 'id_871': {'pref_rank': 3},\n", + " 'id_874': {'pref_rank': 3},\n", + " 'id_877': {'pref_rank': 1},\n", + " 'id_880': {'pref_rank': 2},\n", + " 'id_883': {'pref_rank': 1},\n", + " 'id_886': {'pref_rank': 1},\n", + " 'id_889': {'pref_rank': 3},\n", + " 'id_892': {'pref_rank': 3},\n", + " 'id_895': {'pref_rank': 1},\n", + " 'id_898': {'pref_rank': 3},\n", + " 'id_901': {'pref_rank': 1},\n", + " 'id_904': {'pref_rank': 2},\n", + " 'id_907': {'pref_rank': 2},\n", + " 'id_910': {'pref_rank': 2},\n", + " 'id_913': {'pref_rank': 1},\n", + " 'id_916': {'pref_rank': 2},\n", + " 'id_919': {'pref_rank': 2},\n", + " 'id_922': {'pref_rank': 1},\n", + " 'id_925': {'pref_rank': 3},\n", + " 'id_928': {'pref_rank': 2},\n", + " 'id_931': {'pref_rank': 2},\n", + " 'id_934': {'pref_rank': 3},\n", + " 'id_937': {'pref_rank': 1},\n", + " 'id_940': {'pref_rank': 2},\n", + " 'id_943': {'pref_rank': 1},\n", + " 'id_946': {'pref_rank': 2},\n", + " 'id_949': {'pref_rank': 3},\n", + " 'id_952': {'pref_rank': 2},\n", + " 'id_955': {'pref_rank': 1},\n", + " 'id_958': {'pref_rank': 3},\n", + " 'id_961': {'pref_rank': 3},\n", + " 'id_964': {'pref_rank': 2},\n", + " 'id_967': {'pref_rank': 3},\n", + " 'id_970': {'pref_rank': 1},\n", + " 'id_973': {'pref_rank': 2},\n", + " 'id_976': {'pref_rank': 1},\n", + " 'id_979': {'pref_rank': 2},\n", + " 'id_982': {'pref_rank': 3},\n", + " 'id_985': {'pref_rank': 2},\n", + " 'id_988': {'pref_rank': 3},\n", + " 'id_991': {'pref_rank': 3},\n", + " 'id_994': {'pref_rank': 2},\n", + " 'id_997': {'pref_rank': 1},\n", + " 'id_1000': {'pref_rank': 1},\n", + " 'id_1003': {'pref_rank': 3},\n", + " 'id_1006': {'pref_rank': 2},\n", + " 'id_1009': {'pref_rank': 3},\n", + " 'id_1012': {'pref_rank': 1},\n", + " 'id_1015': {'pref_rank': 2},\n", + " 'id_1018': {'pref_rank': 1},\n", + " 'id_1021': {'pref_rank': 3},\n", + " 'id_1024': {'pref_rank': 2},\n", + " 'id_1027': {'pref_rank': 2},\n", + " 'id_1030': {'pref_rank': 3},\n", + " 'id_1033': {'pref_rank': 1},\n", + " 'id_1036': {'pref_rank': 1},\n", + " 'id_1039': {'pref_rank': 2},\n", + " 'id_1042': {'pref_rank': 2},\n", + " 'id_1045': {'pref_rank': 1},\n", + " 'id_1048': {'pref_rank': 1},\n", + " 'id_1051': {'pref_rank': 2},\n", + " 'id_1054': {'pref_rank': 3},\n", + " 'id_1057': {'pref_rank': 3},\n", + " 'id_1060': {'pref_rank': 3},\n", + " 'id_1063': {'pref_rank': 3},\n", + " 'id_1066': {'pref_rank': 2},\n", + " 'id_1069': {'pref_rank': 2},\n", + " 'id_1072': {'pref_rank': 1},\n", + " 'id_1075': {'pref_rank': 3},\n", + " 'id_1078': {'pref_rank': 2},\n", + " 'id_1081': {'pref_rank': 2},\n", + " 'id_1084': {'pref_rank': 2},\n", + " 'id_1087': {'pref_rank': 2},\n", + " 'id_1090': {'pref_rank': 2},\n", + " 'id_1093': {'pref_rank': 3},\n", + " 'id_1096': {'pref_rank': 2},\n", + " 'id_1099': {'pref_rank': 2},\n", + " 'id_1102': {'pref_rank': 1},\n", + " 'id_1105': {'pref_rank': 1},\n", + " 'id_1108': {'pref_rank': 3},\n", + " 'id_1111': {'pref_rank': 2},\n", + " 'id_1114': {'pref_rank': 2},\n", + " 'id_1117': {'pref_rank': 1},\n", + " 'id_1120': {'pref_rank': 2},\n", + " 'id_1123': {'pref_rank': 2},\n", + " 'id_1126': {'pref_rank': 3},\n", + " 'id_1129': {'pref_rank': 2},\n", + " 'id_1132': {'pref_rank': 1},\n", + " 'id_1135': {'pref_rank': 2},\n", + " 'id_1138': {'pref_rank': 2},\n", + " 'id_1141': {'pref_rank': 1},\n", + " 'id_1144': {'pref_rank': 1},\n", + " 'id_1147': {'pref_rank': 3},\n", + " 'id_1150': {'pref_rank': 1},\n", + " 'id_1153': {'pref_rank': 1},\n", + " 'id_1156': {'pref_rank': 3},\n", + " 'id_1159': {'pref_rank': 1},\n", + " 'id_1162': {'pref_rank': 1},\n", + " 'id_1165': {'pref_rank': 3},\n", + " 'id_1168': {'pref_rank': 1},\n", + " 'id_1171': {'pref_rank': 2},\n", + " 'id_1174': {'pref_rank': 3},\n", + " 'id_1177': {'pref_rank': 2},\n", + " 'id_1180': {'pref_rank': 2},\n", + " 'id_1183': {'pref_rank': 1},\n", + " 'id_1186': {'pref_rank': 2},\n", + " 'id_1189': {'pref_rank': 1},\n", + " 'id_1192': {'pref_rank': 1},\n", + " 'id_1195': {'pref_rank': 2},\n", + " 'id_1198': {'pref_rank': 1},\n", + " 'id_1201': {'pref_rank': 3},\n", + " 'id_1204': {'pref_rank': 1},\n", + " 'id_1207': {'pref_rank': 1},\n", + " 'id_1210': {'pref_rank': 1},\n", + " 'id_1213': {'pref_rank': 1},\n", + " 'id_1216': {'pref_rank': 3},\n", + " 'id_1219': {'pref_rank': 1},\n", + " 'id_1222': {'pref_rank': 3},\n", + " 'id_1225': {'pref_rank': 3},\n", + " 'id_1228': {'pref_rank': 2},\n", + " 'id_1231': {'pref_rank': 2},\n", + " 'id_1234': {'pref_rank': 3},\n", + " 'id_1237': {'pref_rank': 1},\n", + " 'id_1240': {'pref_rank': 2},\n", + " 'id_1243': {'pref_rank': 2},\n", + " 'id_1246': {'pref_rank': 2},\n", + " 'id_1249': {'pref_rank': 3},\n", + " 'id_1252': {'pref_rank': 2},\n", + " 'id_1255': {'pref_rank': 2},\n", + " 'id_1258': {'pref_rank': 1},\n", + " 'id_1261': {'pref_rank': 2},\n", + " 'id_1264': {'pref_rank': 3},\n", + " 'id_1267': {'pref_rank': 3},\n", + " 'id_1270': {'pref_rank': 1},\n", + " 'id_1273': {'pref_rank': 2},\n", + " 'id_1276': {'pref_rank': 3},\n", + " 'id_1279': {'pref_rank': 3},\n", + " 'id_1282': {'pref_rank': 2},\n", + " 'id_1285': {'pref_rank': 3},\n", + " 'id_1288': {'pref_rank': 2},\n", + " 'id_1291': {'pref_rank': 3},\n", + " 'id_1294': {'pref_rank': 2},\n", + " 'id_1297': {'pref_rank': 2},\n", + " 'id_1300': {'pref_rank': 2},\n", + " 'id_1303': {'pref_rank': 3},\n", + " 'id_1306': {'pref_rank': 1},\n", + " 'id_1309': {'pref_rank': 1},\n", + " 'id_1312': {'pref_rank': 2},\n", + " 'id_1315': {'pref_rank': 3},\n", + " 'id_1318': {'pref_rank': 2},\n", + " 'id_1321': {'pref_rank': 3},\n", + " 'id_1324': {'pref_rank': 3},\n", + " 'id_1327': {'pref_rank': 2},\n", + " 'id_1330': {'pref_rank': 2},\n", + " 'id_1333': {'pref_rank': 1},\n", + " 'id_1336': {'pref_rank': 2},\n", + " 'id_1339': {'pref_rank': 3},\n", + " 'id_1342': {'pref_rank': 3},\n", + " 'id_1345': {'pref_rank': 2},\n", + " 'id_1348': {'pref_rank': 3},\n", + " 'id_1351': {'pref_rank': 3},\n", + " 'id_1354': {'pref_rank': 1},\n", + " 'id_1357': {'pref_rank': 2},\n", + " 'id_1360': {'pref_rank': 1},\n", + " 'id_1363': {'pref_rank': 3},\n", + " 'id_1366': {'pref_rank': 2},\n", + " 'id_1369': {'pref_rank': 3},\n", + " 'id_1372': {'pref_rank': 3},\n", + " 'id_1375': {'pref_rank': 2},\n", + " 'id_1378': {'pref_rank': 2},\n", + " 'id_1381': {'pref_rank': 3},\n", + " 'id_1384': {'pref_rank': 3},\n", + " 'id_1387': {'pref_rank': 2},\n", + " 'id_1390': {'pref_rank': 1},\n", + " 'id_1393': {'pref_rank': 1},\n", + " 'id_1396': {'pref_rank': 2},\n", + " 'id_1399': {'pref_rank': 2},\n", + " 'id_1402': {'pref_rank': 3},\n", + " 'id_1405': {'pref_rank': 1},\n", + " 'id_1408': {'pref_rank': 3},\n", + " 'id_1411': {'pref_rank': 3},\n", + " 'id_1414': {'pref_rank': 3},\n", + " 'id_1417': {'pref_rank': 1},\n", + " 'id_1420': {'pref_rank': 1},\n", + " 'id_1423': {'pref_rank': 1},\n", + " 'id_1426': {'pref_rank': 2},\n", + " 'id_1429': {'pref_rank': 2},\n", + " 'id_1432': {'pref_rank': 1},\n", + " 'id_1435': {'pref_rank': 2},\n", + " 'id_1438': {'pref_rank': 3},\n", + " 'id_1441': {'pref_rank': 3},\n", + " 'id_1444': {'pref_rank': 3},\n", + " 'id_1447': {'pref_rank': 3},\n", + " 'id_1450': {'pref_rank': 1},\n", + " 'id_1453': {'pref_rank': 2},\n", + " 'id_1456': {'pref_rank': 2},\n", + " 'id_1459': {'pref_rank': 1},\n", + " 'id_1462': {'pref_rank': 1},\n", + " 'id_1465': {'pref_rank': 2},\n", + " 'id_1468': {'pref_rank': 1},\n", + " 'id_1471': {'pref_rank': 1},\n", + " 'id_1474': {'pref_rank': 2},\n", + " 'id_1477': {'pref_rank': 3},\n", + " 'id_1480': {'pref_rank': 2},\n", + " 'id_1483': {'pref_rank': 3},\n", + " 'id_1486': {'pref_rank': 1},\n", + " 'id_1489': {'pref_rank': 3},\n", + " 'id_1492': {'pref_rank': 3},\n", + " 'id_1495': {'pref_rank': 1},\n", + " 'id_1498': {'pref_rank': 1},\n", + " 'id_1501': {'pref_rank': 2},\n", + " 'id_1504': {'pref_rank': 1},\n", + " 'id_1507': {'pref_rank': 3},\n", + " 'id_1510': {'pref_rank': 2},\n", + " 'id_1513': {'pref_rank': 3},\n", + " 'id_1516': {'pref_rank': 2},\n", + " 'id_1519': {'pref_rank': 3},\n", + " 'id_1522': {'pref_rank': 2},\n", + " 'id_1525': {'pref_rank': 3},\n", + " 'id_1528': {'pref_rank': 1},\n", + " 'id_1531': {'pref_rank': 2},\n", + " 'id_1534': {'pref_rank': 2},\n", + " 'id_1537': {'pref_rank': 3},\n", + " 'id_1540': {'pref_rank': 1},\n", + " 'id_1543': {'pref_rank': 2},\n", + " 'id_1546': {'pref_rank': 3},\n", + " 'id_1549': {'pref_rank': 1},\n", + " 'id_1552': {'pref_rank': 2},\n", + " 'id_1555': {'pref_rank': 1},\n", + " 'id_1558': {'pref_rank': 2},\n", + " 'id_1561': {'pref_rank': 1},\n", + " 'id_1564': {'pref_rank': 2},\n", + " 'id_1567': {'pref_rank': 2},\n", + " 'id_1570': {'pref_rank': 3},\n", + " 'id_1573': {'pref_rank': 2},\n", + " 'id_1576': {'pref_rank': 1},\n", + " 'id_1579': {'pref_rank': 1},\n", + " 'id_1582': {'pref_rank': 1},\n", + " 'id_1585': {'pref_rank': 1},\n", + " 'id_1588': {'pref_rank': 2},\n", + " 'id_1591': {'pref_rank': 3},\n", + " 'id_1594': {'pref_rank': 1},\n", + " 'id_1597': {'pref_rank': 3},\n", + " 'id_1600': {'pref_rank': 2},\n", + " 'id_1603': {'pref_rank': 1},\n", + " 'id_1606': {'pref_rank': 3},\n", + " 'id_1609': {'pref_rank': 1},\n", + " 'id_1612': {'pref_rank': 3},\n", + " 'id_1615': {'pref_rank': 2},\n", + " 'id_1618': {'pref_rank': 1},\n", + " 'id_1621': {'pref_rank': 2},\n", + " 'id_1624': {'pref_rank': 1},\n", + " 'id_1627': {'pref_rank': 1},\n", + " 'id_1630': {'pref_rank': 3},\n", + " 'id_1633': {'pref_rank': 3},\n", + " 'id_1636': {'pref_rank': 2},\n", + " 'id_1639': {'pref_rank': 2},\n", + " 'id_1642': {'pref_rank': 2},\n", + " 'id_1645': {'pref_rank': 2},\n", + " 'id_1648': {'pref_rank': 1},\n", + " 'id_1651': {'pref_rank': 3},\n", + " 'id_1654': {'pref_rank': 3},\n", + " 'id_1657': {'pref_rank': 2},\n", + " 'id_1660': {'pref_rank': 1},\n", + " 'id_1663': {'pref_rank': 3},\n", + " 'id_1666': {'pref_rank': 3},\n", + " 'id_1669': {'pref_rank': 2},\n", + " 'id_1672': {'pref_rank': 2},\n", + " 'id_1675': {'pref_rank': 2},\n", + " 'id_1678': {'pref_rank': 2},\n", + " 'id_1681': {'pref_rank': 2},\n", + " 'id_1684': {'pref_rank': 1},\n", + " 'id_1687': {'pref_rank': 2},\n", + " 'id_1690': {'pref_rank': 2},\n", + " 'id_1693': {'pref_rank': 1},\n", + " 'id_1696': {'pref_rank': 3},\n", + " 'id_1699': {'pref_rank': 3},\n", + " 'id_1702': {'pref_rank': 3},\n", + " 'id_1705': {'pref_rank': 1},\n", + " 'id_1708': {'pref_rank': 2},\n", + " 'id_1711': {'pref_rank': 1},\n", + " 'id_1714': {'pref_rank': 1},\n", + " 'id_1717': {'pref_rank': 3},\n", + " 'id_1720': {'pref_rank': 1},\n", + " 'id_1723': {'pref_rank': 2},\n", + " 'id_1726': {'pref_rank': 1},\n", + " 'id_1729': {'pref_rank': 3},\n", + " 'id_1732': {'pref_rank': 1},\n", + " 'id_1735': {'pref_rank': 2},\n", + " 'id_1738': {'pref_rank': 1},\n", + " 'id_1741': {'pref_rank': 1},\n", + " 'id_1744': {'pref_rank': 3},\n", + " 'id_1747': {'pref_rank': 1},\n", + " 'id_1750': {'pref_rank': 2},\n", + " 'id_1753': {'pref_rank': 1},\n", + " 'id_1756': {'pref_rank': 2},\n", + " 'id_1759': {'pref_rank': 2},\n", + " 'id_1762': {'pref_rank': 3},\n", + " 'id_1765': {'pref_rank': 2},\n", + " 'id_1768': {'pref_rank': 3},\n", + " 'id_1771': {'pref_rank': 1},\n", + " 'id_1774': {'pref_rank': 3},\n", + " 'id_1777': {'pref_rank': 3},\n", + " 'id_1780': {'pref_rank': 3},\n", + " 'id_1783': {'pref_rank': 2},\n", + " 'id_1786': {'pref_rank': 1},\n", + " 'id_1789': {'pref_rank': 1},\n", + " 'id_1792': {'pref_rank': 2},\n", + " 'id_1795': {'pref_rank': 3},\n", + " 'id_1798': {'pref_rank': 2},\n", + " 'id_1801': {'pref_rank': 1},\n", + " 'id_1804': {'pref_rank': 3},\n", + " 'id_1807': {'pref_rank': 3},\n", + " 'id_1810': {'pref_rank': 3},\n", + " 'id_1813': {'pref_rank': 2},\n", + " 'id_1816': {'pref_rank': 1},\n", + " 'id_1819': {'pref_rank': 2},\n", + " 'id_1822': {'pref_rank': 1},\n", + " 'id_1825': {'pref_rank': 1},\n", + " 'id_1828': {'pref_rank': 1},\n", + " 'id_1831': {'pref_rank': 3},\n", + " 'id_1834': {'pref_rank': 2},\n", + " 'id_1837': {'pref_rank': 3},\n", + " 'id_1840': {'pref_rank': 1},\n", + " 'id_1843': {'pref_rank': 1},\n", + " 'id_1846': {'pref_rank': 3},\n", + " 'id_1849': {'pref_rank': 2},\n", + " 'id_1852': {'pref_rank': 2},\n", + " 'id_1855': {'pref_rank': 1},\n", + " 'id_1858': {'pref_rank': 1},\n", + " 'id_1861': {'pref_rank': 3},\n", + " 'id_1864': {'pref_rank': 3},\n", + " 'id_1867': {'pref_rank': 2},\n", + " 'id_1870': {'pref_rank': 3},\n", + " 'id_1873': {'pref_rank': 2},\n", + " 'id_1876': {'pref_rank': 2},\n", + " 'id_1879': {'pref_rank': 3},\n", + " 'id_1882': {'pref_rank': 2},\n", + " 'id_1885': {'pref_rank': 3},\n", + " 'id_1888': {'pref_rank': 3},\n", + " 'id_1891': {'pref_rank': 1},\n", + " 'id_1894': {'pref_rank': 2},\n", + " 'id_1897': {'pref_rank': 1},\n", + " 'id_1900': {'pref_rank': 1},\n", + " 'id_1903': {'pref_rank': 1},\n", + " 'id_1906': {'pref_rank': 3},\n", + " 'id_1909': {'pref_rank': 3},\n", + " 'id_1912': {'pref_rank': 1},\n", + " 'id_1915': {'pref_rank': 3},\n", + " 'id_1918': {'pref_rank': 2},\n", + " 'id_1921': {'pref_rank': 3},\n", + " 'id_1924': {'pref_rank': 3},\n", + " 'id_1927': {'pref_rank': 2},\n", + " 'id_1930': {'pref_rank': 3},\n", + " 'id_1933': {'pref_rank': 1},\n", + " 'id_1936': {'pref_rank': 3},\n", + " 'id_1939': {'pref_rank': 1},\n", + " 'id_1942': {'pref_rank': 2},\n", + " 'id_1945': {'pref_rank': 2},\n", + " 'id_1948': {'pref_rank': 3},\n", + " 'id_1951': {'pref_rank': 2},\n", + " 'id_1954': {'pref_rank': 1},\n", + " 'id_1957': {'pref_rank': 2},\n", + " 'id_1960': {'pref_rank': 1},\n", + " 'id_1963': {'pref_rank': 1},\n", + " 'id_1966': {'pref_rank': 1},\n", + " 'id_1969': {'pref_rank': 3},\n", + " 'id_1972': {'pref_rank': 3},\n", + " 'id_1975': {'pref_rank': 1},\n", + " 'id_1978': {'pref_rank': 3},\n", + " 'id_1981': {'pref_rank': 1},\n", + " 'id_1984': {'pref_rank': 1},\n", + " 'id_1987': {'pref_rank': 3},\n", + " 'id_1990': {'pref_rank': 3},\n", + " 'id_1993': {'pref_rank': 1},\n", + " 'id_1996': {'pref_rank': 1},\n", + " 'id_1999': {'pref_rank': 2},\n", + " 'id_2002': {'pref_rank': 1},\n", + " 'id_2005': {'pref_rank': 2},\n", + " 'id_2008': {'pref_rank': 1},\n", + " 'id_2011': {'pref_rank': 2},\n", + " 'id_2014': {'pref_rank': 1},\n", + " 'id_2017': {'pref_rank': 1},\n", + " 'id_2020': {'pref_rank': 1},\n", + " 'id_2023': {'pref_rank': 2},\n", + " 'id_2026': {'pref_rank': 1},\n", + " 'id_2029': {'pref_rank': 2},\n", + " 'id_2032': {'pref_rank': 1},\n", + " 'id_2035': {'pref_rank': 1},\n", + " 'id_2038': {'pref_rank': 3},\n", + " 'id_2041': {'pref_rank': 1},\n", + " 'id_2044': {'pref_rank': 2},\n", + " 'id_2047': {'pref_rank': 3},\n", + " 'id_2050': {'pref_rank': 2},\n", + " 'id_2053': {'pref_rank': 1},\n", + " 'id_2056': {'pref_rank': 1},\n", + " 'id_2059': {'pref_rank': 3},\n", + " 'id_2062': {'pref_rank': 1},\n", + " 'id_2065': {'pref_rank': 2},\n", + " 'id_2068': {'pref_rank': 3},\n", + " 'id_2071': {'pref_rank': 2},\n", + " 'id_2074': {'pref_rank': 1},\n", + " 'id_2077': {'pref_rank': 1},\n", + " 'id_2080': {'pref_rank': 1},\n", + " 'id_2083': {'pref_rank': 3},\n", + " 'id_2086': {'pref_rank': 1},\n", + " 'id_2089': {'pref_rank': 1},\n", + " 'id_2092': {'pref_rank': 2},\n", + " 'id_2095': {'pref_rank': 3},\n", + " 'id_2098': {'pref_rank': 2},\n", + " 'id_2101': {'pref_rank': 1},\n", + " 'id_2104': {'pref_rank': 1},\n", + " 'id_2107': {'pref_rank': 2},\n", + " 'id_2110': {'pref_rank': 2},\n", + " 'id_2113': {'pref_rank': 2},\n", + " 'id_2116': {'pref_rank': 3},\n", + " 'id_2119': {'pref_rank': 1},\n", + " 'id_2122': {'pref_rank': 1},\n", + " 'id_2125': {'pref_rank': 2},\n", + " 'id_2128': {'pref_rank': 3},\n", + " 'id_2131': {'pref_rank': 1},\n", + " 'id_2134': {'pref_rank': 3},\n", + " 'id_2137': {'pref_rank': 2},\n", + " 'id_2140': {'pref_rank': 2},\n", + " 'id_2143': {'pref_rank': 3},\n", + " 'id_2146': {'pref_rank': 1},\n", + " 'id_2149': {'pref_rank': 1},\n", + " 'id_2152': {'pref_rank': 3},\n", + " 'id_2155': {'pref_rank': 3},\n", + " 'id_2158': {'pref_rank': 2},\n", + " 'id_2161': {'pref_rank': 2},\n", + " 'id_2164': {'pref_rank': 1},\n", + " 'id_2167': {'pref_rank': 2},\n", + " 'id_2170': {'pref_rank': 2},\n", + " 'id_2173': {'pref_rank': 3},\n", + " 'id_2176': {'pref_rank': 3},\n", + " 'id_2179': {'pref_rank': 2},\n", + " 'id_2182': {'pref_rank': 1},\n", + " 'id_2185': {'pref_rank': 3},\n", + " 'id_2188': {'pref_rank': 2},\n", + " 'id_2191': {'pref_rank': 3},\n", + " 'id_2194': {'pref_rank': 2},\n", + " 'id_2197': {'pref_rank': 2},\n", + " 'id_2200': {'pref_rank': 2},\n", + " 'id_2203': {'pref_rank': 2},\n", + " 'id_2206': {'pref_rank': 2},\n", + " 'id_2209': {'pref_rank': 3},\n", + " 'id_2212': {'pref_rank': 1},\n", + " 'id_2215': {'pref_rank': 2},\n", + " 'id_2218': {'pref_rank': 1},\n", + " 'id_2221': {'pref_rank': 1},\n", + " 'id_2224': {'pref_rank': 2},\n", + " 'id_2227': {'pref_rank': 2},\n", + " 'id_2230': {'pref_rank': 2},\n", + " 'id_2233': {'pref_rank': 2},\n", + " 'id_2236': {'pref_rank': 3},\n", + " 'id_2239': {'pref_rank': 2},\n", + " 'id_2242': {'pref_rank': 2},\n", + " 'id_2245': {'pref_rank': 3},\n", + " 'id_2248': {'pref_rank': 2},\n", + " 'id_2251': {'pref_rank': 3},\n", + " 'id_2254': {'pref_rank': 1},\n", + " 'id_2257': {'pref_rank': 2},\n", + " 'id_2260': {'pref_rank': 1},\n", + " 'id_2263': {'pref_rank': 2},\n", + " 'id_2266': {'pref_rank': 3},\n", + " 'id_2269': {'pref_rank': 3},\n", + " 'id_2272': {'pref_rank': 3},\n", + " 'id_2275': {'pref_rank': 1},\n", + " 'id_2278': {'pref_rank': 3},\n", + " 'id_2281': {'pref_rank': 2},\n", + " 'id_2284': {'pref_rank': 1},\n", + " 'id_2287': {'pref_rank': 2},\n", + " 'id_2290': {'pref_rank': 1},\n", + " 'id_2293': {'pref_rank': 3},\n", + " 'id_2296': {'pref_rank': 3},\n", + " 'id_2299': {'pref_rank': 2},\n", + " 'id_2302': {'pref_rank': 2},\n", + " 'id_2305': {'pref_rank': 1},\n", + " 'id_2308': {'pref_rank': 3},\n", + " 'id_2311': {'pref_rank': 2},\n", + " 'id_2314': {'pref_rank': 2},\n", + " 'id_2317': {'pref_rank': 1},\n", + " 'id_2320': {'pref_rank': 1},\n", + " 'id_2323': {'pref_rank': 3},\n", + " 'id_2326': {'pref_rank': 1},\n", + " 'id_2329': {'pref_rank': 1},\n", + " 'id_2332': {'pref_rank': 3},\n", + " 'id_2335': {'pref_rank': 2},\n", + " 'id_2338': {'pref_rank': 1},\n", + " 'id_2341': {'pref_rank': 3},\n", + " 'id_2344': {'pref_rank': 1},\n", + " 'id_2347': {'pref_rank': 1},\n", + " 'id_2350': {'pref_rank': 1},\n", + " 'id_2353': {'pref_rank': 1},\n", + " 'id_2356': {'pref_rank': 1},\n", + " 'id_2359': {'pref_rank': 1},\n", + " 'id_2362': {'pref_rank': 3},\n", + " 'id_2365': {'pref_rank': 3},\n", + " 'id_2368': {'pref_rank': 3},\n", + " 'id_2371': {'pref_rank': 2},\n", + " 'id_2374': {'pref_rank': 3},\n", + " 'id_2377': {'pref_rank': 1},\n", + " 'id_2380': {'pref_rank': 3},\n", + " 'id_2383': {'pref_rank': 2},\n", + " 'id_2386': {'pref_rank': 2},\n", + " 'id_2389': {'pref_rank': 3},\n", + " 'id_2392': {'pref_rank': 3},\n", + " 'id_2395': {'pref_rank': 2},\n", + " 'id_2398': {'pref_rank': 3},\n", + " 'id_2401': {'pref_rank': 2},\n", + " 'id_2404': {'pref_rank': 1},\n", + " 'id_2407': {'pref_rank': 1},\n", + " 'id_2410': {'pref_rank': 1},\n", + " 'id_2413': {'pref_rank': 2},\n", + " 'id_2416': {'pref_rank': 3},\n", + " 'id_2419': {'pref_rank': 3},\n", + " 'id_2422': {'pref_rank': 1},\n", + " 'id_2425': {'pref_rank': 1},\n", + " 'id_2428': {'pref_rank': 2},\n", + " 'id_2431': {'pref_rank': 2},\n", + " 'id_2434': {'pref_rank': 2},\n", + " 'id_2437': {'pref_rank': 2},\n", + " 'id_2440': {'pref_rank': 1},\n", + " 'id_2443': {'pref_rank': 3},\n", + " 'id_2446': {'pref_rank': 2},\n", + " 'id_2449': {'pref_rank': 1},\n", + " 'id_2452': {'pref_rank': 3},\n", + " 'id_2455': {'pref_rank': 2},\n", + " 'id_2458': {'pref_rank': 3},\n", + " 'id_2461': {'pref_rank': 1},\n", + " 'id_2464': {'pref_rank': 1},\n", + " 'id_2467': {'pref_rank': 2},\n", + " 'id_2470': {'pref_rank': 1},\n", + " 'id_2473': {'pref_rank': 3},\n", + " 'id_2476': {'pref_rank': 2},\n", + " 'id_2479': {'pref_rank': 3},\n", + " 'id_2482': {'pref_rank': 3},\n", + " 'id_2485': {'pref_rank': 3},\n", + " 'id_2488': {'pref_rank': 3},\n", + " 'id_2491': {'pref_rank': 1},\n", + " 'id_2494': {'pref_rank': 2},\n", + " 'id_2497': {'pref_rank': 2},\n", + " 'id_2500': {'pref_rank': 2},\n", + " 'id_2503': {'pref_rank': 1},\n", + " 'id_2506': {'pref_rank': 3},\n", + " 'id_2509': {'pref_rank': 2},\n", + " 'id_2512': {'pref_rank': 1},\n", + " 'id_2515': {'pref_rank': 1},\n", + " 'id_2518': {'pref_rank': 3},\n", + " 'id_2521': {'pref_rank': 3},\n", + " 'id_2524': {'pref_rank': 2},\n", + " 'id_2527': {'pref_rank': 2},\n", + " 'id_2530': {'pref_rank': 3},\n", + " 'id_2533': {'pref_rank': 3},\n", + " 'id_2536': {'pref_rank': 2},\n", + " 'id_2539': {'pref_rank': 3},\n", + " 'id_2542': {'pref_rank': 3},\n", + " 'id_2545': {'pref_rank': 3},\n", + " 'id_2548': {'pref_rank': 1},\n", + " 'id_2551': {'pref_rank': 1},\n", + " 'id_2554': {'pref_rank': 1},\n", + " 'id_2557': {'pref_rank': 2},\n", + " 'id_2560': {'pref_rank': 1},\n", + " 'id_2563': {'pref_rank': 1},\n", + " 'id_2566': {'pref_rank': 2},\n", + " 'id_2569': {'pref_rank': 1},\n", + " 'id_2572': {'pref_rank': 2},\n", + " 'id_2575': {'pref_rank': 2},\n", + " 'id_2578': {'pref_rank': 3},\n", + " 'id_2581': {'pref_rank': 2},\n", + " 'id_2584': {'pref_rank': 1},\n", + " 'id_2587': {'pref_rank': 2},\n", + " 'id_2590': {'pref_rank': 2},\n", + " 'id_2593': {'pref_rank': 3},\n", + " 'id_2596': {'pref_rank': 3},\n", + " 'id_2599': {'pref_rank': 3},\n", + " 'id_2602': {'pref_rank': 2},\n", + " 'id_2605': {'pref_rank': 3},\n", + " 'id_2608': {'pref_rank': 2},\n", + " 'id_2611': {'pref_rank': 1},\n", + " 'id_2614': {'pref_rank': 2},\n", + " 'id_2617': {'pref_rank': 2},\n", + " 'id_2620': {'pref_rank': 2},\n", + " 'id_2623': {'pref_rank': 3},\n", + " 'id_2626': {'pref_rank': 2},\n", + " 'id_2629': {'pref_rank': 3},\n", + " 'id_2632': {'pref_rank': 3},\n", + " 'id_2635': {'pref_rank': 2},\n", + " 'id_2638': {'pref_rank': 1},\n", + " 'id_2641': {'pref_rank': 3},\n", + " 'id_2644': {'pref_rank': 2},\n", + " 'id_2647': {'pref_rank': 3},\n", + " 'id_2650': {'pref_rank': 1},\n", + " 'id_2653': {'pref_rank': 3},\n", + " 'id_2656': {'pref_rank': 1},\n", + " 'id_2659': {'pref_rank': 1},\n", + " 'id_2662': {'pref_rank': 3},\n", + " 'id_2665': {'pref_rank': 1},\n", + " 'id_2668': {'pref_rank': 2},\n", + " 'id_2671': {'pref_rank': 2},\n", + " 'id_2674': {'pref_rank': 2},\n", + " 'id_2677': {'pref_rank': 1},\n", + " 'id_2680': {'pref_rank': 2},\n", + " 'id_2683': {'pref_rank': 2},\n", + " 'id_2686': {'pref_rank': 1},\n", + " 'id_2689': {'pref_rank': 1},\n", + " 'id_2692': {'pref_rank': 3},\n", + " 'id_2695': {'pref_rank': 3},\n", + " 'id_2698': {'pref_rank': 2},\n", + " 'id_2701': {'pref_rank': 3},\n", + " 'id_2704': {'pref_rank': 1},\n", + " 'id_2707': {'pref_rank': 3},\n", + " 'id_2710': {'pref_rank': 2},\n", + " 'id_2713': {'pref_rank': 3},\n", + " 'id_2716': {'pref_rank': 1},\n", + " 'id_2719': {'pref_rank': 2},\n", + " 'id_2722': {'pref_rank': 2},\n", + " 'id_2725': {'pref_rank': 3},\n", + " 'id_2728': {'pref_rank': 1},\n", + " 'id_2731': {'pref_rank': 3},\n", + " 'id_2734': {'pref_rank': 1},\n", + " 'id_2737': {'pref_rank': 1},\n", + " 'id_2740': {'pref_rank': 3},\n", + " 'id_2743': {'pref_rank': 1},\n", + " 'id_2746': {'pref_rank': 2},\n", + " 'id_2749': {'pref_rank': 2},\n", + " 'id_2752': {'pref_rank': 2},\n", + " 'id_2755': {'pref_rank': 2},\n", + " 'id_2758': {'pref_rank': 1},\n", + " 'id_2761': {'pref_rank': 3},\n", + " 'id_2764': {'pref_rank': 1},\n", + " 'id_2767': {'pref_rank': 1},\n", + " 'id_2770': {'pref_rank': 2},\n", + " 'id_2773': {'pref_rank': 2},\n", + " 'id_2776': {'pref_rank': 1},\n", + " 'id_2779': {'pref_rank': 1},\n", + " 'id_2782': {'pref_rank': 2},\n", + " 'id_2785': {'pref_rank': 3},\n", + " 'id_2788': {'pref_rank': 3},\n", + " 'id_2791': {'pref_rank': 1},\n", + " 'id_2794': {'pref_rank': 1},\n", + " 'id_2797': {'pref_rank': 2},\n", + " 'id_2800': {'pref_rank': 1},\n", + " 'id_2803': {'pref_rank': 3},\n", + " 'id_2806': {'pref_rank': 1},\n", + " 'id_2809': {'pref_rank': 3},\n", + " 'id_2812': {'pref_rank': 1},\n", + " 'id_2815': {'pref_rank': 1},\n", + " 'id_2818': {'pref_rank': 2},\n", + " 'id_2821': {'pref_rank': 1},\n", + " 'id_2824': {'pref_rank': 1},\n", + " 'id_2827': {'pref_rank': 1},\n", + " 'id_2830': {'pref_rank': 1},\n", + " 'id_2833': {'pref_rank': 2},\n", + " 'id_2836': {'pref_rank': 2},\n", + " 'id_2839': {'pref_rank': 2},\n", + " 'id_2842': {'pref_rank': 3},\n", + " 'id_2845': {'pref_rank': 2},\n", + " 'id_2848': {'pref_rank': 1},\n", + " 'id_2851': {'pref_rank': 3},\n", + " 'id_2854': {'pref_rank': 3},\n", + " 'id_2857': {'pref_rank': 3},\n", + " 'id_2860': {'pref_rank': 2},\n", + " 'id_2863': {'pref_rank': 3},\n", + " 'id_2866': {'pref_rank': 3},\n", + " 'id_2869': {'pref_rank': 3},\n", + " 'id_2872': {'pref_rank': 1},\n", + " 'id_2875': {'pref_rank': 3},\n", + " 'id_2878': {'pref_rank': 1},\n", + " 'id_2881': {'pref_rank': 3},\n", + " 'id_2884': {'pref_rank': 3},\n", + " 'id_2887': {'pref_rank': 3},\n", + " 'id_2890': {'pref_rank': 2},\n", + " 'id_2893': {'pref_rank': 2},\n", + " 'id_2896': {'pref_rank': 1},\n", + " 'id_2899': {'pref_rank': 2},\n", + " 'id_2902': {'pref_rank': 2},\n", + " 'id_2905': {'pref_rank': 1},\n", + " 'id_2908': {'pref_rank': 1},\n", + " 'id_2911': {'pref_rank': 3},\n", + " 'id_2914': {'pref_rank': 2},\n", + " 'id_2917': {'pref_rank': 1},\n", + " 'id_2920': {'pref_rank': 2},\n", + " 'id_2923': {'pref_rank': 3},\n", + " 'id_2926': {'pref_rank': 2},\n", + " 'id_2929': {'pref_rank': 3},\n", + " 'id_2932': {'pref_rank': 2},\n", + " 'id_2935': {'pref_rank': 3},\n", + " 'id_2938': {'pref_rank': 3},\n", + " 'id_2941': {'pref_rank': 1},\n", + " 'id_2944': {'pref_rank': 1},\n", + " 'id_2947': {'pref_rank': 1},\n", + " 'id_2950': {'pref_rank': 2},\n", + " 'id_2953': {'pref_rank': 1},\n", + " 'id_2956': {'pref_rank': 2},\n", + " 'id_2959': {'pref_rank': 1},\n", + " 'id_2962': {'pref_rank': 3},\n", + " 'id_2965': {'pref_rank': 1},\n", + " 'id_2968': {'pref_rank': 2},\n", + " 'id_2971': {'pref_rank': 1},\n", + " 'id_2974': {'pref_rank': 3},\n", + " 'id_2977': {'pref_rank': 2},\n", + " 'id_2980': {'pref_rank': 3},\n", + " 'id_2983': {'pref_rank': 2},\n", + " 'id_2986': {'pref_rank': 3},\n", + " 'id_2989': {'pref_rank': 2},\n", + " 'id_2992': {'pref_rank': 1},\n", + " 'id_2995': {'pref_rank': 1},\n", + " 'id_2998': {'pref_rank': 2},\n", + " ...}" + ] + }, + "execution_count": 19, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "pref = {}\n", + "\n", + "for model_ in folder2model.values():\n", + " pref.update(\n", + " dict(zip(df_scores[model_].iloc[x_indices], df_scores[model_].iloc[y_indices]))\n", + " )\n", + "\n", + "for k,v in pref.items():\n", + " pref[k] = {'pref_rank': v}\n", + "\n", + "pref" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "id": "4f73823c-a3d2-4cb8-bbe3-317acbf2e4c7", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "['id_1', 'id_4', 'id_7', 'id_10', 'id_13']" + ] + }, + "execution_count": 20, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "list(df_scores['m1'].iloc[x_indices])[:5]" + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "id": "871152a6-5809-4815-91d3-285123b5a80b", + "metadata": { + "scrolled": true, + "tags": [] + }, + "outputs": [ + { + "data": { + "text/plain": [ + "{'id_1': {'model': 'm2',\n", + " 'sent_id': 1,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_4': {'model': 'm2',\n", + " 'sent_id': 10,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_7': {'model': 'm1',\n", + " 'sent_id': 11,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_10': {'model': 'm1',\n", + " 'sent_id': 12,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_13': {'model': 'm3',\n", + " 'sent_id': 13,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_16': {'model': 'm3',\n", + " 'sent_id': 14,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_19': {'model': 'm1',\n", + " 'sent_id': 15,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_22': {'model': 'm3',\n", + " 'sent_id': 16,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_25': {'model': 'm1',\n", + " 'sent_id': 17,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_28': {'model': 'm3',\n", + " 'sent_id': 18,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_31': {'model': 'm1',\n", + " 'sent_id': 19,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_34': {'model': 'm3',\n", + " 'sent_id': 2,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_37': {'model': 'm3',\n", + " 'sent_id': 20,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_40': {'model': 'm3',\n", + " 'sent_id': 21,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_43': {'model': 'm3',\n", + " 'sent_id': 22,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_46': {'model': 'm2',\n", + " 'sent_id': 23,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_49': {'model': 'm3',\n", + " 'sent_id': 24,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_52': {'model': 'm2',\n", + " 'sent_id': 25,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_55': {'model': 'm3',\n", + " 'sent_id': 26,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_58': {'model': 'm1',\n", + " 'sent_id': 27,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_61': {'model': 'm1',\n", + " 'sent_id': 28,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_64': {'model': 'm2',\n", + " 'sent_id': 29,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_67': {'model': 'm3',\n", + " 'sent_id': 3,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_70': {'model': 'm2',\n", + " 'sent_id': 30,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_73': {'model': 'm3',\n", + " 'sent_id': 4,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_76': {'model': 'm3',\n", + " 'sent_id': 5,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_79': {'model': 'm1',\n", + " 'sent_id': 6,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_82': {'model': 'm1',\n", + " 'sent_id': 7,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_85': {'model': 'm3',\n", + " 'sent_id': 8,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_88': {'model': 'm1',\n", + " 'sent_id': 9,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_91': {'model': 'm2',\n", + " 'sent_id': 1,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_94': {'model': 'm1',\n", + " 'sent_id': 10,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_97': {'model': 'm3',\n", + " 'sent_id': 11,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_100': {'model': 'm3',\n", + " 'sent_id': 12,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_103': {'model': 'm3',\n", + " 'sent_id': 13,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_106': {'model': 'm1',\n", + " 'sent_id': 14,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_109': {'model': 'm2',\n", + " 'sent_id': 15,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_112': {'model': 'm1',\n", + " 'sent_id': 16,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_115': {'model': 'm3',\n", + " 'sent_id': 17,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_118': {'model': 'm2',\n", + " 'sent_id': 18,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_121': {'model': 'm2',\n", + " 'sent_id': 19,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_124': {'model': 'm3',\n", + " 'sent_id': 2,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_127': {'model': 'm1',\n", + " 'sent_id': 20,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_130': {'model': 'm3',\n", + " 'sent_id': 21,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_133': {'model': 'm3',\n", + " 'sent_id': 22,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_136': {'model': 'm2',\n", + " 'sent_id': 23,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_139': {'model': 'm1',\n", + " 'sent_id': 24,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_142': {'model': 'm1',\n", + " 'sent_id': 25,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_145': {'model': 'm2',\n", + " 'sent_id': 26,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_148': {'model': 'm2',\n", + " 'sent_id': 27,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_151': {'model': 'm2',\n", + " 'sent_id': 28,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_154': {'model': 'm1',\n", + " 'sent_id': 29,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_157': {'model': 'm2',\n", + " 'sent_id': 3,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_160': {'model': 'm3',\n", + " 'sent_id': 30,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_163': {'model': 'm3',\n", + " 'sent_id': 4,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_166': {'model': 'm1',\n", + " 'sent_id': 5,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_169': {'model': 'm2',\n", + " 'sent_id': 6,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_172': {'model': 'm1',\n", + " 'sent_id': 7,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_175': {'model': 'm3',\n", + " 'sent_id': 8,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_178': {'model': 'm3',\n", + " 'sent_id': 9,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_181': {'model': 'm3',\n", + " 'sent_id': 1,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_184': {'model': 'm2',\n", + " 'sent_id': 10,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_187': {'model': 'm2',\n", + " 'sent_id': 11,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_190': {'model': 'm2',\n", + " 'sent_id': 12,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_193': {'model': 'm3',\n", + " 'sent_id': 13,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_196': {'model': 'm2',\n", + " 'sent_id': 14,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_199': {'model': 'm1',\n", + " 'sent_id': 15,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_202': {'model': 'm1',\n", + " 'sent_id': 16,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_205': {'model': 'm2',\n", + " 'sent_id': 17,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_208': {'model': 'm3',\n", + " 'sent_id': 18,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_211': {'model': 'm2',\n", + " 'sent_id': 19,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_214': {'model': 'm3',\n", + " 'sent_id': 2,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_217': {'model': 'm3',\n", + " 'sent_id': 20,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_220': {'model': 'm2',\n", + " 'sent_id': 21,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_223': {'model': 'm3',\n", + " 'sent_id': 22,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_226': {'model': 'm3',\n", + " 'sent_id': 23,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_229': {'model': 'm1',\n", + " 'sent_id': 24,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_232': {'model': 'm1',\n", + " 'sent_id': 25,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_235': {'model': 'm1',\n", + " 'sent_id': 26,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_238': {'model': 'm1',\n", + " 'sent_id': 27,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_241': {'model': 'm3',\n", + " 'sent_id': 28,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_244': {'model': 'm2',\n", + " 'sent_id': 29,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_247': {'model': 'm1',\n", + " 'sent_id': 3,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_250': {'model': 'm2',\n", + " 'sent_id': 30,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_253': {'model': 'm3',\n", + " 'sent_id': 4,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_256': {'model': 'm3',\n", + " 'sent_id': 5,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_259': {'model': 'm3',\n", + " 'sent_id': 6,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_262': {'model': 'm1',\n", + " 'sent_id': 7,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_265': {'model': 'm1',\n", + " 'sent_id': 8,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_268': {'model': 'm2',\n", + " 'sent_id': 9,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_271': {'model': 'm2',\n", + " 'sent_id': 1,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_274': {'model': 'm3',\n", + " 'sent_id': 10,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_277': {'model': 'm3',\n", + " 'sent_id': 11,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_280': {'model': 'm1',\n", + " 'sent_id': 12,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_283': {'model': 'm1',\n", + " 'sent_id': 13,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_286': {'model': 'm1',\n", + " 'sent_id': 14,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_289': {'model': 'm1',\n", + " 'sent_id': 15,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_292': {'model': 'm3',\n", + " 'sent_id': 16,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_295': {'model': 'm3',\n", + " 'sent_id': 17,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_298': {'model': 'm1',\n", + " 'sent_id': 18,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_301': {'model': 'm2',\n", + " 'sent_id': 19,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_304': {'model': 'm2',\n", + " 'sent_id': 2,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_307': {'model': 'm2',\n", + " 'sent_id': 20,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_310': {'model': 'm3',\n", + " 'sent_id': 21,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_313': {'model': 'm3',\n", + " 'sent_id': 22,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_316': {'model': 'm3',\n", + " 'sent_id': 23,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_319': {'model': 'm1',\n", + " 'sent_id': 24,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_322': {'model': 'm2',\n", + " 'sent_id': 25,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_325': {'model': 'm2',\n", + " 'sent_id': 26,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_328': {'model': 'm2',\n", + " 'sent_id': 27,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_331': {'model': 'm2',\n", + " 'sent_id': 28,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_334': {'model': 'm1',\n", + " 'sent_id': 29,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_337': {'model': 'm3',\n", + " 'sent_id': 3,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_340': {'model': 'm3',\n", + " 'sent_id': 30,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_343': {'model': 'm3',\n", + " 'sent_id': 4,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_346': {'model': 'm1',\n", + " 'sent_id': 5,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_349': {'model': 'm3',\n", + " 'sent_id': 6,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_352': {'model': 'm2',\n", + " 'sent_id': 7,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_355': {'model': 'm1',\n", + " 'sent_id': 8,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_358': {'model': 'm2',\n", + " 'sent_id': 9,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_361': {'model': 'm2',\n", + " 'sent_id': 1,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_364': {'model': 'm3',\n", + " 'sent_id': 10,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_367': {'model': 'm3',\n", + " 'sent_id': 11,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_370': {'model': 'm2',\n", + " 'sent_id': 12,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_373': {'model': 'm1',\n", + " 'sent_id': 13,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_376': {'model': 'm3',\n", + " 'sent_id': 14,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_379': {'model': 'm1',\n", + " 'sent_id': 15,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_382': {'model': 'm2',\n", + " 'sent_id': 16,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_385': {'model': 'm2',\n", + " 'sent_id': 17,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_388': {'model': 'm3',\n", + " 'sent_id': 18,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_391': {'model': 'm2',\n", + " 'sent_id': 19,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_394': {'model': 'm3',\n", + " 'sent_id': 2,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_397': {'model': 'm3',\n", + " 'sent_id': 20,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_400': {'model': 'm2',\n", + " 'sent_id': 21,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_403': {'model': 'm2',\n", + " 'sent_id': 22,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_406': {'model': 'm2',\n", + " 'sent_id': 23,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_409': {'model': 'm3',\n", + " 'sent_id': 24,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_412': {'model': 'm1',\n", + " 'sent_id': 25,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_415': {'model': 'm2',\n", + " 'sent_id': 26,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_418': {'model': 'm1',\n", + " 'sent_id': 27,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_421': {'model': 'm2',\n", + " 'sent_id': 28,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_424': {'model': 'm2',\n", + " 'sent_id': 29,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_427': {'model': 'm2',\n", + " 'sent_id': 3,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_430': {'model': 'm3',\n", + " 'sent_id': 30,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_433': {'model': 'm2',\n", + " 'sent_id': 4,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_436': {'model': 'm3',\n", + " 'sent_id': 5,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_439': {'model': 'm1',\n", + " 'sent_id': 6,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_442': {'model': 'm3',\n", + " 'sent_id': 7,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_445': {'model': 'm1',\n", + " 'sent_id': 8,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_448': {'model': 'm3',\n", + " 'sent_id': 9,\n", + " 'speaker': '0011',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_451': {'model': 'm3',\n", + " 'sent_id': 1,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_454': {'model': 'm3',\n", + " 'sent_id': 10,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_457': {'model': 'm3',\n", + " 'sent_id': 11,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_460': {'model': 'm2',\n", + " 'sent_id': 12,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_463': {'model': 'm3',\n", + " 'sent_id': 13,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_466': {'model': 'm2',\n", + " 'sent_id': 14,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_469': {'model': 'm3',\n", + " 'sent_id': 15,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_472': {'model': 'm2',\n", + " 'sent_id': 16,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_475': {'model': 'm2',\n", + " 'sent_id': 17,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_478': {'model': 'm2',\n", + " 'sent_id': 18,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_481': {'model': 'm1',\n", + " 'sent_id': 19,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_484': {'model': 'm2',\n", + " 'sent_id': 2,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_487': {'model': 'm1',\n", + " 'sent_id': 20,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_490': {'model': 'm2',\n", + " 'sent_id': 21,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_493': {'model': 'm2',\n", + " 'sent_id': 22,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_496': {'model': 'm3',\n", + " 'sent_id': 23,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_499': {'model': 'm1',\n", + " 'sent_id': 24,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_502': {'model': 'm2',\n", + " 'sent_id': 25,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_505': {'model': 'm3',\n", + " 'sent_id': 26,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_508': {'model': 'm2',\n", + " 'sent_id': 27,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_511': {'model': 'm2',\n", + " 'sent_id': 28,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_514': {'model': 'm2',\n", + " 'sent_id': 29,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_517': {'model': 'm3',\n", + " 'sent_id': 3,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_520': {'model': 'm3',\n", + " 'sent_id': 30,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_523': {'model': 'm3',\n", + " 'sent_id': 4,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_526': {'model': 'm1',\n", + " 'sent_id': 5,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_529': {'model': 'm2',\n", + " 'sent_id': 6,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_532': {'model': 'm3',\n", + " 'sent_id': 7,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_535': {'model': 'm3',\n", + " 'sent_id': 8,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_538': {'model': 'm3',\n", + " 'sent_id': 9,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_541': {'model': 'm3',\n", + " 'sent_id': 1,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_544': {'model': 'm3',\n", + " 'sent_id': 10,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_547': {'model': 'm2',\n", + " 'sent_id': 11,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_550': {'model': 'm3',\n", + " 'sent_id': 12,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_553': {'model': 'm2',\n", + " 'sent_id': 13,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_556': {'model': 'm1',\n", + " 'sent_id': 14,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_559': {'model': 'm3',\n", + " 'sent_id': 15,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_562': {'model': 'm3',\n", + " 'sent_id': 16,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_565': {'model': 'm1',\n", + " 'sent_id': 17,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_568': {'model': 'm2',\n", + " 'sent_id': 18,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_571': {'model': 'm3',\n", + " 'sent_id': 19,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_574': {'model': 'm1',\n", + " 'sent_id': 2,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_577': {'model': 'm1',\n", + " 'sent_id': 20,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_580': {'model': 'm2',\n", + " 'sent_id': 21,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_583': {'model': 'm3',\n", + " 'sent_id': 22,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_586': {'model': 'm2',\n", + " 'sent_id': 23,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_589': {'model': 'm3',\n", + " 'sent_id': 24,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_592': {'model': 'm2',\n", + " 'sent_id': 25,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_595': {'model': 'm3',\n", + " 'sent_id': 26,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_598': {'model': 'm3',\n", + " 'sent_id': 27,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_601': {'model': 'm2',\n", + " 'sent_id': 28,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_604': {'model': 'm2',\n", + " 'sent_id': 29,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_607': {'model': 'm2',\n", + " 'sent_id': 3,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_610': {'model': 'm2',\n", + " 'sent_id': 30,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_613': {'model': 'm2',\n", + " 'sent_id': 4,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_616': {'model': 'm3',\n", + " 'sent_id': 5,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_619': {'model': 'm2',\n", + " 'sent_id': 6,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_622': {'model': 'm2',\n", + " 'sent_id': 7,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_625': {'model': 'm2',\n", + " 'sent_id': 8,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_628': {'model': 'm2',\n", + " 'sent_id': 9,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_631': {'model': 'm1',\n", + " 'sent_id': 1,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_634': {'model': 'm1',\n", + " 'sent_id': 10,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_637': {'model': 'm2',\n", + " 'sent_id': 11,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_640': {'model': 'm3',\n", + " 'sent_id': 12,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_643': {'model': 'm2',\n", + " 'sent_id': 13,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_646': {'model': 'm2',\n", + " 'sent_id': 14,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_649': {'model': 'm2',\n", + " 'sent_id': 15,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_652': {'model': 'm1',\n", + " 'sent_id': 16,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_655': {'model': 'm1',\n", + " 'sent_id': 17,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_658': {'model': 'm2',\n", + " 'sent_id': 18,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_661': {'model': 'm2',\n", + " 'sent_id': 19,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_664': {'model': 'm3',\n", + " 'sent_id': 2,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_667': {'model': 'm3',\n", + " 'sent_id': 20,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_670': {'model': 'm3',\n", + " 'sent_id': 21,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_673': {'model': 'm3',\n", + " 'sent_id': 22,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_676': {'model': 'm2',\n", + " 'sent_id': 23,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_679': {'model': 'm1',\n", + " 'sent_id': 24,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_682': {'model': 'm2',\n", + " 'sent_id': 25,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_685': {'model': 'm3',\n", + " 'sent_id': 26,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_688': {'model': 'm1',\n", + " 'sent_id': 27,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_691': {'model': 'm3',\n", + " 'sent_id': 28,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_694': {'model': 'm2',\n", + " 'sent_id': 29,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_697': {'model': 'm3',\n", + " 'sent_id': 3,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_700': {'model': 'm3',\n", + " 'sent_id': 30,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_703': {'model': 'm1',\n", + " 'sent_id': 4,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_706': {'model': 'm1',\n", + " 'sent_id': 5,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_709': {'model': 'm2',\n", + " 'sent_id': 6,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_712': {'model': 'm2',\n", + " 'sent_id': 7,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_715': {'model': 'm3',\n", + " 'sent_id': 8,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_718': {'model': 'm3',\n", + " 'sent_id': 9,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_721': {'model': 'm3',\n", + " 'sent_id': 1,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_724': {'model': 'm1',\n", + " 'sent_id': 10,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_727': {'model': 'm2',\n", + " 'sent_id': 11,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_730': {'model': 'm2',\n", + " 'sent_id': 12,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_733': {'model': 'm1',\n", + " 'sent_id': 13,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_736': {'model': 'm1',\n", + " 'sent_id': 14,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_739': {'model': 'm1',\n", + " 'sent_id': 15,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_742': {'model': 'm3',\n", + " 'sent_id': 16,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_745': {'model': 'm2',\n", + " 'sent_id': 17,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_748': {'model': 'm3',\n", + " 'sent_id': 18,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_751': {'model': 'm1',\n", + " 'sent_id': 19,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_754': {'model': 'm1',\n", + " 'sent_id': 2,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_757': {'model': 'm1',\n", + " 'sent_id': 20,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_760': {'model': 'm1',\n", + " 'sent_id': 21,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_763': {'model': 'm2',\n", + " 'sent_id': 22,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_766': {'model': 'm1',\n", + " 'sent_id': 23,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_769': {'model': 'm2',\n", + " 'sent_id': 24,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_772': {'model': 'm1',\n", + " 'sent_id': 25,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_775': {'model': 'm2',\n", + " 'sent_id': 26,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_778': {'model': 'm1',\n", + " 'sent_id': 27,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_781': {'model': 'm3',\n", + " 'sent_id': 28,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_784': {'model': 'm3',\n", + " 'sent_id': 29,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_787': {'model': 'm2',\n", + " 'sent_id': 3,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_790': {'model': 'm2',\n", + " 'sent_id': 30,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_793': {'model': 'm1',\n", + " 'sent_id': 4,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_796': {'model': 'm3',\n", + " 'sent_id': 5,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_799': {'model': 'm3',\n", + " 'sent_id': 6,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_802': {'model': 'm2',\n", + " 'sent_id': 7,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_805': {'model': 'm2',\n", + " 'sent_id': 8,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_808': {'model': 'm1',\n", + " 'sent_id': 9,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_811': {'model': 'm1',\n", + " 'sent_id': 1,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_814': {'model': 'm3',\n", + " 'sent_id': 10,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_817': {'model': 'm2',\n", + " 'sent_id': 11,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_820': {'model': 'm1',\n", + " 'sent_id': 12,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_823': {'model': 'm1',\n", + " 'sent_id': 13,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_826': {'model': 'm2',\n", + " 'sent_id': 14,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_829': {'model': 'm1',\n", + " 'sent_id': 15,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_832': {'model': 'm2',\n", + " 'sent_id': 16,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_835': {'model': 'm3',\n", + " 'sent_id': 17,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_838': {'model': 'm3',\n", + " 'sent_id': 18,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_841': {'model': 'm1',\n", + " 'sent_id': 19,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_844': {'model': 'm2',\n", + " 'sent_id': 2,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_847': {'model': 'm1',\n", + " 'sent_id': 20,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_850': {'model': 'm3',\n", + " 'sent_id': 21,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_853': {'model': 'm2',\n", + " 'sent_id': 22,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_856': {'model': 'm1',\n", + " 'sent_id': 23,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_859': {'model': 'm1',\n", + " 'sent_id': 24,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_862': {'model': 'm3',\n", + " 'sent_id': 25,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_865': {'model': 'm1',\n", + " 'sent_id': 26,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_868': {'model': 'm3',\n", + " 'sent_id': 27,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_871': {'model': 'm3',\n", + " 'sent_id': 28,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_874': {'model': 'm2',\n", + " 'sent_id': 29,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_877': {'model': 'm1',\n", + " 'sent_id': 3,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_880': {'model': 'm1',\n", + " 'sent_id': 30,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_883': {'model': 'm1',\n", + " 'sent_id': 4,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_886': {'model': 'm3',\n", + " 'sent_id': 5,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_889': {'model': 'm1',\n", + " 'sent_id': 6,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_892': {'model': 'm2',\n", + " 'sent_id': 7,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_895': {'model': 'm2',\n", + " 'sent_id': 8,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_898': {'model': 'm3',\n", + " 'sent_id': 9,\n", + " 'speaker': '0012',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_901': {'model': 'm2',\n", + " 'sent_id': 1,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_904': {'model': 'm2',\n", + " 'sent_id': 10,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_907': {'model': 'm2',\n", + " 'sent_id': 11,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_910': {'model': 'm1',\n", + " 'sent_id': 12,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_913': {'model': 'm3',\n", + " 'sent_id': 13,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_916': {'model': 'm3',\n", + " 'sent_id': 14,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_919': {'model': 'm2',\n", + " 'sent_id': 15,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_922': {'model': 'm2',\n", + " 'sent_id': 16,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_925': {'model': 'm1',\n", + " 'sent_id': 17,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_928': {'model': 'm3',\n", + " 'sent_id': 18,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_931': {'model': 'm2',\n", + " 'sent_id': 19,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_934': {'model': 'm3',\n", + " 'sent_id': 2,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_937': {'model': 'm3',\n", + " 'sent_id': 20,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_940': {'model': 'm3',\n", + " 'sent_id': 21,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_943': {'model': 'm3',\n", + " 'sent_id': 22,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_946': {'model': 'm3',\n", + " 'sent_id': 23,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_949': {'model': 'm1',\n", + " 'sent_id': 24,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_952': {'model': 'm2',\n", + " 'sent_id': 25,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_955': {'model': 'm3',\n", + " 'sent_id': 26,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_958': {'model': 'm1',\n", + " 'sent_id': 27,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_961': {'model': 'm1',\n", + " 'sent_id': 28,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_964': {'model': 'm1',\n", + " 'sent_id': 29,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_967': {'model': 'm1',\n", + " 'sent_id': 3,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_970': {'model': 'm3',\n", + " 'sent_id': 30,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_973': {'model': 'm3',\n", + " 'sent_id': 4,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_976': {'model': 'm1',\n", + " 'sent_id': 5,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_979': {'model': 'm3',\n", + " 'sent_id': 6,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_982': {'model': 'm1',\n", + " 'sent_id': 7,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_985': {'model': 'm2',\n", + " 'sent_id': 8,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_988': {'model': 'm2',\n", + " 'sent_id': 9,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_991': {'model': 'm3',\n", + " 'sent_id': 1,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_994': {'model': 'm1',\n", + " 'sent_id': 10,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_997': {'model': 'm3',\n", + " 'sent_id': 11,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1000': {'model': 'm3',\n", + " 'sent_id': 12,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1003': {'model': 'm2',\n", + " 'sent_id': 13,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1006': {'model': 'm2',\n", + " 'sent_id': 14,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1009': {'model': 'm3',\n", + " 'sent_id': 15,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1012': {'model': 'm2',\n", + " 'sent_id': 16,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1015': {'model': 'm3',\n", + " 'sent_id': 17,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1018': {'model': 'm3',\n", + " 'sent_id': 18,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1021': {'model': 'm3',\n", + " 'sent_id': 19,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1024': {'model': 'm1',\n", + " 'sent_id': 2,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1027': {'model': 'm2',\n", + " 'sent_id': 20,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1030': {'model': 'm2',\n", + " 'sent_id': 21,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1033': {'model': 'm1',\n", + " 'sent_id': 22,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1036': {'model': 'm3',\n", + " 'sent_id': 23,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1039': {'model': 'm2',\n", + " 'sent_id': 24,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1042': {'model': 'm1',\n", + " 'sent_id': 25,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1045': {'model': 'm3',\n", + " 'sent_id': 26,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1048': {'model': 'm3',\n", + " 'sent_id': 27,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1051': {'model': 'm2',\n", + " 'sent_id': 28,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1054': {'model': 'm1',\n", + " 'sent_id': 29,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1057': {'model': 'm3',\n", + " 'sent_id': 3,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1060': {'model': 'm3',\n", + " 'sent_id': 30,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1063': {'model': 'm2',\n", + " 'sent_id': 4,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1066': {'model': 'm3',\n", + " 'sent_id': 5,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1069': {'model': 'm1',\n", + " 'sent_id': 6,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1072': {'model': 'm3',\n", + " 'sent_id': 7,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1075': {'model': 'm2',\n", + " 'sent_id': 8,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1078': {'model': 'm2',\n", + " 'sent_id': 9,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1081': {'model': 'm3',\n", + " 'sent_id': 1,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1084': {'model': 'm3',\n", + " 'sent_id': 10,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1087': {'model': 'm1',\n", + " 'sent_id': 11,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1090': {'model': 'm2',\n", + " 'sent_id': 12,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1093': {'model': 'm3',\n", + " 'sent_id': 13,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1096': {'model': 'm2',\n", + " 'sent_id': 14,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1099': {'model': 'm3',\n", + " 'sent_id': 15,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1102': {'model': 'm1',\n", + " 'sent_id': 16,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1105': {'model': 'm3',\n", + " 'sent_id': 17,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1108': {'model': 'm3',\n", + " 'sent_id': 18,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1111': {'model': 'm2',\n", + " 'sent_id': 19,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1114': {'model': 'm3',\n", + " 'sent_id': 2,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1117': {'model': 'm2',\n", + " 'sent_id': 20,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1120': {'model': 'm1',\n", + " 'sent_id': 21,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1123': {'model': 'm2',\n", + " 'sent_id': 22,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1126': {'model': 'm1',\n", + " 'sent_id': 23,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1129': {'model': 'm1',\n", + " 'sent_id': 24,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1132': {'model': 'm2',\n", + " 'sent_id': 25,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1135': {'model': 'm1',\n", + " 'sent_id': 26,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1138': {'model': 'm3',\n", + " 'sent_id': 27,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1141': {'model': 'm3',\n", + " 'sent_id': 28,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1144': {'model': 'm3',\n", + " 'sent_id': 29,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1147': {'model': 'm3',\n", + " 'sent_id': 3,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1150': {'model': 'm1',\n", + " 'sent_id': 30,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1153': {'model': 'm2',\n", + " 'sent_id': 4,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1156': {'model': 'm3',\n", + " 'sent_id': 5,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1159': {'model': 'm1',\n", + " 'sent_id': 6,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1162': {'model': 'm1',\n", + " 'sent_id': 7,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1165': {'model': 'm2',\n", + " 'sent_id': 8,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1168': {'model': 'm3',\n", + " 'sent_id': 9,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1171': {'model': 'm2',\n", + " 'sent_id': 1,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1174': {'model': 'm3',\n", + " 'sent_id': 10,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1177': {'model': 'm2',\n", + " 'sent_id': 11,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1180': {'model': 'm3',\n", + " 'sent_id': 12,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1183': {'model': 'm3',\n", + " 'sent_id': 13,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1186': {'model': 'm2',\n", + " 'sent_id': 14,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1189': {'model': 'm1',\n", + " 'sent_id': 15,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1192': {'model': 'm2',\n", + " 'sent_id': 16,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1195': {'model': 'm2',\n", + " 'sent_id': 17,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1198': {'model': 'm2',\n", + " 'sent_id': 18,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1201': {'model': 'm3',\n", + " 'sent_id': 19,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1204': {'model': 'm1',\n", + " 'sent_id': 2,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1207': {'model': 'm2',\n", + " 'sent_id': 20,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1210': {'model': 'm1',\n", + " 'sent_id': 21,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1213': {'model': 'm1',\n", + " 'sent_id': 22,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1216': {'model': 'm2',\n", + " 'sent_id': 23,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1219': {'model': 'm1',\n", + " 'sent_id': 24,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1222': {'model': 'm3',\n", + " 'sent_id': 25,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1225': {'model': 'm3',\n", + " 'sent_id': 26,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1228': {'model': 'm3',\n", + " 'sent_id': 27,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1231': {'model': 'm1',\n", + " 'sent_id': 28,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1234': {'model': 'm1',\n", + " 'sent_id': 29,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1237': {'model': 'm2',\n", + " 'sent_id': 3,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1240': {'model': 'm2',\n", + " 'sent_id': 30,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1243': {'model': 'm2',\n", + " 'sent_id': 4,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1246': {'model': 'm2',\n", + " 'sent_id': 5,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1249': {'model': 'm2',\n", + " 'sent_id': 6,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1252': {'model': 'm3',\n", + " 'sent_id': 7,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1255': {'model': 'm1',\n", + " 'sent_id': 8,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1258': {'model': 'm3',\n", + " 'sent_id': 9,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1261': {'model': 'm2',\n", + " 'sent_id': 1,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1264': {'model': 'm3',\n", + " 'sent_id': 10,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1267': {'model': 'm3',\n", + " 'sent_id': 11,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1270': {'model': 'm3',\n", + " 'sent_id': 12,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1273': {'model': 'm3',\n", + " 'sent_id': 13,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1276': {'model': 'm2',\n", + " 'sent_id': 14,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1279': {'model': 'm1',\n", + " 'sent_id': 15,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1282': {'model': 'm3',\n", + " 'sent_id': 16,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1285': {'model': 'm1',\n", + " 'sent_id': 17,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1288': {'model': 'm1',\n", + " 'sent_id': 18,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1291': {'model': 'm1',\n", + " 'sent_id': 19,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1294': {'model': 'm3',\n", + " 'sent_id': 2,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1297': {'model': 'm1',\n", + " 'sent_id': 20,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1300': {'model': 'm2',\n", + " 'sent_id': 21,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1303': {'model': 'm3',\n", + " 'sent_id': 22,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1306': {'model': 'm1',\n", + " 'sent_id': 23,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1309': {'model': 'm3',\n", + " 'sent_id': 24,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1312': {'model': 'm2',\n", + " 'sent_id': 25,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1315': {'model': 'm2',\n", + " 'sent_id': 26,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1318': {'model': 'm1',\n", + " 'sent_id': 27,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1321': {'model': 'm1',\n", + " 'sent_id': 28,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1324': {'model': 'm1',\n", + " 'sent_id': 29,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1327': {'model': 'm2',\n", + " 'sent_id': 3,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1330': {'model': 'm3',\n", + " 'sent_id': 30,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1333': {'model': 'm1',\n", + " 'sent_id': 4,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1336': {'model': 'm1',\n", + " 'sent_id': 5,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1339': {'model': 'm2',\n", + " 'sent_id': 6,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1342': {'model': 'm1',\n", + " 'sent_id': 7,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1345': {'model': 'm2',\n", + " 'sent_id': 8,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1348': {'model': 'm3',\n", + " 'sent_id': 9,\n", + " 'speaker': '0013',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1351': {'model': 'm2',\n", + " 'sent_id': 1,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1354': {'model': 'm1',\n", + " 'sent_id': 10,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1357': {'model': 'm1',\n", + " 'sent_id': 11,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1360': {'model': 'm2',\n", + " 'sent_id': 12,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1363': {'model': 'm1',\n", + " 'sent_id': 13,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1366': {'model': 'm1',\n", + " 'sent_id': 14,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1369': {'model': 'm2',\n", + " 'sent_id': 15,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1372': {'model': 'm3',\n", + " 'sent_id': 16,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1375': {'model': 'm3',\n", + " 'sent_id': 17,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1378': {'model': 'm3',\n", + " 'sent_id': 18,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1381': {'model': 'm3',\n", + " 'sent_id': 19,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1384': {'model': 'm2',\n", + " 'sent_id': 2,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1387': {'model': 'm2',\n", + " 'sent_id': 20,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1390': {'model': 'm1',\n", + " 'sent_id': 21,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1393': {'model': 'm3',\n", + " 'sent_id': 22,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1396': {'model': 'm1',\n", + " 'sent_id': 23,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1399': {'model': 'm1',\n", + " 'sent_id': 24,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1402': {'model': 'm1',\n", + " 'sent_id': 25,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1405': {'model': 'm2',\n", + " 'sent_id': 26,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1408': {'model': 'm2',\n", + " 'sent_id': 27,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1411': {'model': 'm1',\n", + " 'sent_id': 28,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1414': {'model': 'm1',\n", + " 'sent_id': 29,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1417': {'model': 'm2',\n", + " 'sent_id': 3,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1420': {'model': 'm3',\n", + " 'sent_id': 30,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1423': {'model': 'm2',\n", + " 'sent_id': 4,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1426': {'model': 'm3',\n", + " 'sent_id': 5,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1429': {'model': 'm3',\n", + " 'sent_id': 6,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1432': {'model': 'm1',\n", + " 'sent_id': 7,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1435': {'model': 'm1',\n", + " 'sent_id': 8,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1438': {'model': 'm1',\n", + " 'sent_id': 9,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1441': {'model': 'm1',\n", + " 'sent_id': 1,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1444': {'model': 'm2',\n", + " 'sent_id': 10,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1447': {'model': 'm2',\n", + " 'sent_id': 11,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1450': {'model': 'm2',\n", + " 'sent_id': 12,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1453': {'model': 'm1',\n", + " 'sent_id': 13,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1456': {'model': 'm1',\n", + " 'sent_id': 14,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1459': {'model': 'm1',\n", + " 'sent_id': 15,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1462': {'model': 'm2',\n", + " 'sent_id': 16,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1465': {'model': 'm2',\n", + " 'sent_id': 17,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1468': {'model': 'm2',\n", + " 'sent_id': 18,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1471': {'model': 'm1',\n", + " 'sent_id': 19,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1474': {'model': 'm3',\n", + " 'sent_id': 2,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1477': {'model': 'm1',\n", + " 'sent_id': 20,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1480': {'model': 'm1',\n", + " 'sent_id': 21,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1483': {'model': 'm2',\n", + " 'sent_id': 22,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1486': {'model': 'm3',\n", + " 'sent_id': 23,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1489': {'model': 'm1',\n", + " 'sent_id': 24,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1492': {'model': 'm2',\n", + " 'sent_id': 25,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1495': {'model': 'm2',\n", + " 'sent_id': 26,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1498': {'model': 'm2',\n", + " 'sent_id': 27,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1501': {'model': 'm1',\n", + " 'sent_id': 28,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1504': {'model': 'm1',\n", + " 'sent_id': 29,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1507': {'model': 'm3',\n", + " 'sent_id': 3,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1510': {'model': 'm1',\n", + " 'sent_id': 30,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1513': {'model': 'm2',\n", + " 'sent_id': 4,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1516': {'model': 'm2',\n", + " 'sent_id': 5,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1519': {'model': 'm2',\n", + " 'sent_id': 6,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1522': {'model': 'm3',\n", + " 'sent_id': 7,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1525': {'model': 'm1',\n", + " 'sent_id': 8,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1528': {'model': 'm2',\n", + " 'sent_id': 9,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1531': {'model': 'm1',\n", + " 'sent_id': 1,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1534': {'model': 'm1',\n", + " 'sent_id': 10,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1537': {'model': 'm1',\n", + " 'sent_id': 11,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1540': {'model': 'm3',\n", + " 'sent_id': 12,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1543': {'model': 'm3',\n", + " 'sent_id': 13,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1546': {'model': 'm1',\n", + " 'sent_id': 14,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1549': {'model': 'm1',\n", + " 'sent_id': 15,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1552': {'model': 'm3',\n", + " 'sent_id': 16,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1555': {'model': 'm2',\n", + " 'sent_id': 17,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1558': {'model': 'm2',\n", + " 'sent_id': 18,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1561': {'model': 'm1',\n", + " 'sent_id': 19,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1564': {'model': 'm3',\n", + " 'sent_id': 2,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1567': {'model': 'm3',\n", + " 'sent_id': 20,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1570': {'model': 'm3',\n", + " 'sent_id': 21,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1573': {'model': 'm2',\n", + " 'sent_id': 22,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1576': {'model': 'm1',\n", + " 'sent_id': 23,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1579': {'model': 'm3',\n", + " 'sent_id': 24,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1582': {'model': 'm3',\n", + " 'sent_id': 25,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1585': {'model': 'm1',\n", + " 'sent_id': 26,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1588': {'model': 'm2',\n", + " 'sent_id': 27,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1591': {'model': 'm1',\n", + " 'sent_id': 28,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1594': {'model': 'm1',\n", + " 'sent_id': 29,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1597': {'model': 'm1',\n", + " 'sent_id': 3,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1600': {'model': 'm2',\n", + " 'sent_id': 30,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1603': {'model': 'm3',\n", + " 'sent_id': 4,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1606': {'model': 'm3',\n", + " 'sent_id': 5,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1609': {'model': 'm1',\n", + " 'sent_id': 6,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1612': {'model': 'm1',\n", + " 'sent_id': 7,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1615': {'model': 'm3',\n", + " 'sent_id': 8,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1618': {'model': 'm2',\n", + " 'sent_id': 9,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1621': {'model': 'm2',\n", + " 'sent_id': 1,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1624': {'model': 'm1',\n", + " 'sent_id': 10,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1627': {'model': 'm1',\n", + " 'sent_id': 11,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1630': {'model': 'm2',\n", + " 'sent_id': 12,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1633': {'model': 'm1',\n", + " 'sent_id': 13,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1636': {'model': 'm1',\n", + " 'sent_id': 14,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1639': {'model': 'm2',\n", + " 'sent_id': 15,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1642': {'model': 'm2',\n", + " 'sent_id': 16,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1645': {'model': 'm1',\n", + " 'sent_id': 17,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1648': {'model': 'm2',\n", + " 'sent_id': 18,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1651': {'model': 'm3',\n", + " 'sent_id': 19,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1654': {'model': 'm1',\n", + " 'sent_id': 2,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1657': {'model': 'm2',\n", + " 'sent_id': 20,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1660': {'model': 'm2',\n", + " 'sent_id': 21,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1663': {'model': 'm2',\n", + " 'sent_id': 22,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1666': {'model': 'm1',\n", + " 'sent_id': 23,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1669': {'model': 'm3',\n", + " 'sent_id': 24,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1672': {'model': 'm3',\n", + " 'sent_id': 25,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1675': {'model': 'm1',\n", + " 'sent_id': 26,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1678': {'model': 'm1',\n", + " 'sent_id': 27,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1681': {'model': 'm2',\n", + " 'sent_id': 28,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1684': {'model': 'm1',\n", + " 'sent_id': 29,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1687': {'model': 'm2',\n", + " 'sent_id': 3,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1690': {'model': 'm2',\n", + " 'sent_id': 30,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1693': {'model': 'm2',\n", + " 'sent_id': 4,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1696': {'model': 'm1',\n", + " 'sent_id': 5,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1699': {'model': 'm2',\n", + " 'sent_id': 6,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1702': {'model': 'm1',\n", + " 'sent_id': 7,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1705': {'model': 'm3',\n", + " 'sent_id': 8,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1708': {'model': 'm3',\n", + " 'sent_id': 9,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1711': {'model': 'm1',\n", + " 'sent_id': 1,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1714': {'model': 'm3',\n", + " 'sent_id': 10,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1717': {'model': 'm1',\n", + " 'sent_id': 11,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1720': {'model': 'm1',\n", + " 'sent_id': 12,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1723': {'model': 'm2',\n", + " 'sent_id': 13,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1726': {'model': 'm3',\n", + " 'sent_id': 14,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1729': {'model': 'm2',\n", + " 'sent_id': 15,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1732': {'model': 'm1',\n", + " 'sent_id': 16,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1735': {'model': 'm3',\n", + " 'sent_id': 17,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1738': {'model': 'm2',\n", + " 'sent_id': 18,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1741': {'model': 'm1',\n", + " 'sent_id': 19,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1744': {'model': 'm3',\n", + " 'sent_id': 2,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1747': {'model': 'm2',\n", + " 'sent_id': 20,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1750': {'model': 'm2',\n", + " 'sent_id': 21,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1753': {'model': 'm1',\n", + " 'sent_id': 22,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1756': {'model': 'm2',\n", + " 'sent_id': 23,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1759': {'model': 'm3',\n", + " 'sent_id': 24,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1762': {'model': 'm1',\n", + " 'sent_id': 25,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1765': {'model': 'm3',\n", + " 'sent_id': 26,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1768': {'model': 'm2',\n", + " 'sent_id': 27,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1771': {'model': 'm2',\n", + " 'sent_id': 28,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1774': {'model': 'm3',\n", + " 'sent_id': 29,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1777': {'model': 'm2',\n", + " 'sent_id': 3,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1780': {'model': 'm3',\n", + " 'sent_id': 30,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1783': {'model': 'm2',\n", + " 'sent_id': 4,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1786': {'model': 'm2',\n", + " 'sent_id': 5,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1789': {'model': 'm2',\n", + " 'sent_id': 6,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1792': {'model': 'm3',\n", + " 'sent_id': 7,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1795': {'model': 'm1',\n", + " 'sent_id': 8,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1798': {'model': 'm2',\n", + " 'sent_id': 9,\n", + " 'speaker': '0014',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1801': {'model': 'm2',\n", + " 'sent_id': 1,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1804': {'model': 'm1',\n", + " 'sent_id': 10,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1807': {'model': 'm2',\n", + " 'sent_id': 11,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1810': {'model': 'm1',\n", + " 'sent_id': 12,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1813': {'model': 'm3',\n", + " 'sent_id': 13,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1816': {'model': 'm3',\n", + " 'sent_id': 14,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1819': {'model': 'm3',\n", + " 'sent_id': 15,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1822': {'model': 'm1',\n", + " 'sent_id': 16,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1825': {'model': 'm2',\n", + " 'sent_id': 17,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1828': {'model': 'm1',\n", + " 'sent_id': 18,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1831': {'model': 'm3',\n", + " 'sent_id': 19,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1834': {'model': 'm3',\n", + " 'sent_id': 2,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1837': {'model': 'm1',\n", + " 'sent_id': 20,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1840': {'model': 'm2',\n", + " 'sent_id': 21,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1843': {'model': 'm1',\n", + " 'sent_id': 22,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1846': {'model': 'm1',\n", + " 'sent_id': 23,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1849': {'model': 'm1',\n", + " 'sent_id': 24,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1852': {'model': 'm2',\n", + " 'sent_id': 25,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1855': {'model': 'm3',\n", + " 'sent_id': 26,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1858': {'model': 'm3',\n", + " 'sent_id': 27,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1861': {'model': 'm2',\n", + " 'sent_id': 28,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1864': {'model': 'm1',\n", + " 'sent_id': 29,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1867': {'model': 'm1',\n", + " 'sent_id': 3,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1870': {'model': 'm1',\n", + " 'sent_id': 30,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1873': {'model': 'm3',\n", + " 'sent_id': 4,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1876': {'model': 'm1',\n", + " 'sent_id': 5,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1879': {'model': 'm3',\n", + " 'sent_id': 6,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1882': {'model': 'm1',\n", + " 'sent_id': 7,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1885': {'model': 'm3',\n", + " 'sent_id': 8,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1888': {'model': 'm2',\n", + " 'sent_id': 9,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1891': {'model': 'm1',\n", + " 'sent_id': 1,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1894': {'model': 'm1',\n", + " 'sent_id': 10,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1897': {'model': 'm1',\n", + " 'sent_id': 11,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1900': {'model': 'm2',\n", + " 'sent_id': 12,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1903': {'model': 'm3',\n", + " 'sent_id': 13,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1906': {'model': 'm2',\n", + " 'sent_id': 14,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1909': {'model': 'm3',\n", + " 'sent_id': 15,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1912': {'model': 'm1',\n", + " 'sent_id': 16,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1915': {'model': 'm3',\n", + " 'sent_id': 17,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1918': {'model': 'm1',\n", + " 'sent_id': 18,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1921': {'model': 'm2',\n", + " 'sent_id': 19,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1924': {'model': 'm1',\n", + " 'sent_id': 2,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1927': {'model': 'm3',\n", + " 'sent_id': 20,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1930': {'model': 'm3',\n", + " 'sent_id': 21,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1933': {'model': 'm1',\n", + " 'sent_id': 22,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1936': {'model': 'm3',\n", + " 'sent_id': 23,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1939': {'model': 'm2',\n", + " 'sent_id': 24,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1942': {'model': 'm3',\n", + " 'sent_id': 25,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1945': {'model': 'm3',\n", + " 'sent_id': 26,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1948': {'model': 'm2',\n", + " 'sent_id': 27,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1951': {'model': 'm3',\n", + " 'sent_id': 28,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1954': {'model': 'm2',\n", + " 'sent_id': 29,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1957': {'model': 'm3',\n", + " 'sent_id': 3,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_1960': {'model': 'm2',\n", + " 'sent_id': 30,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1963': {'model': 'm2',\n", + " 'sent_id': 4,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1966': {'model': 'm3',\n", + " 'sent_id': 5,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1969': {'model': 'm1',\n", + " 'sent_id': 6,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1972': {'model': 'm1',\n", + " 'sent_id': 7,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1975': {'model': 'm3',\n", + " 'sent_id': 8,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1978': {'model': 'm1',\n", + " 'sent_id': 9,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1981': {'model': 'm1',\n", + " 'sent_id': 1,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1984': {'model': 'm2',\n", + " 'sent_id': 10,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1987': {'model': 'm1',\n", + " 'sent_id': 11,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1990': {'model': 'm1',\n", + " 'sent_id': 12,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_1993': {'model': 'm1',\n", + " 'sent_id': 13,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1996': {'model': 'm2',\n", + " 'sent_id': 14,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_1999': {'model': 'm3',\n", + " 'sent_id': 15,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2002': {'model': 'm1',\n", + " 'sent_id': 16,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2005': {'model': 'm2',\n", + " 'sent_id': 17,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2008': {'model': 'm2',\n", + " 'sent_id': 18,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2011': {'model': 'm1',\n", + " 'sent_id': 19,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2014': {'model': 'm1',\n", + " 'sent_id': 2,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2017': {'model': 'm1',\n", + " 'sent_id': 20,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2020': {'model': 'm1',\n", + " 'sent_id': 21,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2023': {'model': 'm1',\n", + " 'sent_id': 22,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2026': {'model': 'm2',\n", + " 'sent_id': 23,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2029': {'model': 'm1',\n", + " 'sent_id': 24,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2032': {'model': 'm2',\n", + " 'sent_id': 25,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2035': {'model': 'm3',\n", + " 'sent_id': 26,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2038': {'model': 'm3',\n", + " 'sent_id': 27,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2041': {'model': 'm3',\n", + " 'sent_id': 28,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2044': {'model': 'm1',\n", + " 'sent_id': 29,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2047': {'model': 'm2',\n", + " 'sent_id': 3,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2050': {'model': 'm1',\n", + " 'sent_id': 30,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2053': {'model': 'm2',\n", + " 'sent_id': 4,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2056': {'model': 'm2',\n", + " 'sent_id': 5,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2059': {'model': 'm3',\n", + " 'sent_id': 6,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2062': {'model': 'm2',\n", + " 'sent_id': 7,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2065': {'model': 'm1',\n", + " 'sent_id': 8,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2068': {'model': 'm2',\n", + " 'sent_id': 9,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2071': {'model': 'm2',\n", + " 'sent_id': 1,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2074': {'model': 'm1',\n", + " 'sent_id': 10,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2077': {'model': 'm3',\n", + " 'sent_id': 11,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2080': {'model': 'm3',\n", + " 'sent_id': 12,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2083': {'model': 'm2',\n", + " 'sent_id': 13,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2086': {'model': 'm1',\n", + " 'sent_id': 14,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2089': {'model': 'm1',\n", + " 'sent_id': 15,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2092': {'model': 'm2',\n", + " 'sent_id': 16,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2095': {'model': 'm2',\n", + " 'sent_id': 17,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2098': {'model': 'm2',\n", + " 'sent_id': 18,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2101': {'model': 'm3',\n", + " 'sent_id': 19,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2104': {'model': 'm1',\n", + " 'sent_id': 2,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2107': {'model': 'm3',\n", + " 'sent_id': 20,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2110': {'model': 'm2',\n", + " 'sent_id': 21,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2113': {'model': 'm2',\n", + " 'sent_id': 22,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2116': {'model': 'm1',\n", + " 'sent_id': 23,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2119': {'model': 'm3',\n", + " 'sent_id': 24,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2122': {'model': 'm1',\n", + " 'sent_id': 25,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2125': {'model': 'm1',\n", + " 'sent_id': 26,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2128': {'model': 'm2',\n", + " 'sent_id': 27,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2131': {'model': 'm2',\n", + " 'sent_id': 28,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2134': {'model': 'm1',\n", + " 'sent_id': 29,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2137': {'model': 'm2',\n", + " 'sent_id': 3,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2140': {'model': 'm3',\n", + " 'sent_id': 30,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2143': {'model': 'm1',\n", + " 'sent_id': 4,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2146': {'model': 'm1',\n", + " 'sent_id': 5,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2149': {'model': 'm2',\n", + " 'sent_id': 6,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2152': {'model': 'm2',\n", + " 'sent_id': 7,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2155': {'model': 'm1',\n", + " 'sent_id': 8,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2158': {'model': 'm2',\n", + " 'sent_id': 9,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2161': {'model': 'm1',\n", + " 'sent_id': 1,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2164': {'model': 'm2',\n", + " 'sent_id': 10,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2167': {'model': 'm3',\n", + " 'sent_id': 11,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2170': {'model': 'm2',\n", + " 'sent_id': 12,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2173': {'model': 'm1',\n", + " 'sent_id': 13,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2176': {'model': 'm3',\n", + " 'sent_id': 14,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2179': {'model': 'm1',\n", + " 'sent_id': 15,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2182': {'model': 'm3',\n", + " 'sent_id': 16,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2185': {'model': 'm1',\n", + " 'sent_id': 17,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2188': {'model': 'm1',\n", + " 'sent_id': 18,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2191': {'model': 'm2',\n", + " 'sent_id': 19,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2194': {'model': 'm2',\n", + " 'sent_id': 2,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2197': {'model': 'm2',\n", + " 'sent_id': 20,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2200': {'model': 'm1',\n", + " 'sent_id': 21,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2203': {'model': 'm3',\n", + " 'sent_id': 22,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2206': {'model': 'm2',\n", + " 'sent_id': 23,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2209': {'model': 'm2',\n", + " 'sent_id': 24,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2212': {'model': 'm3',\n", + " 'sent_id': 25,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2215': {'model': 'm3',\n", + " 'sent_id': 26,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2218': {'model': 'm2',\n", + " 'sent_id': 27,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2221': {'model': 'm2',\n", + " 'sent_id': 28,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2224': {'model': 'm3',\n", + " 'sent_id': 29,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2227': {'model': 'm2',\n", + " 'sent_id': 3,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2230': {'model': 'm3',\n", + " 'sent_id': 30,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2233': {'model': 'm2',\n", + " 'sent_id': 4,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2236': {'model': 'm2',\n", + " 'sent_id': 5,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2239': {'model': 'm3',\n", + " 'sent_id': 6,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2242': {'model': 'm1',\n", + " 'sent_id': 7,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2245': {'model': 'm1',\n", + " 'sent_id': 8,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2248': {'model': 'm2',\n", + " 'sent_id': 9,\n", + " 'speaker': '0015',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2251': {'model': 'm2',\n", + " 'sent_id': 1,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2254': {'model': 'm3',\n", + " 'sent_id': 10,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2257': {'model': 'm1',\n", + " 'sent_id': 11,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2260': {'model': 'm1',\n", + " 'sent_id': 12,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2263': {'model': 'm1',\n", + " 'sent_id': 13,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2266': {'model': 'm3',\n", + " 'sent_id': 14,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2269': {'model': 'm1',\n", + " 'sent_id': 15,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2272': {'model': 'm3',\n", + " 'sent_id': 16,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2275': {'model': 'm1',\n", + " 'sent_id': 17,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2278': {'model': 'm1',\n", + " 'sent_id': 18,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2281': {'model': 'm2',\n", + " 'sent_id': 19,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2284': {'model': 'm2',\n", + " 'sent_id': 2,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2287': {'model': 'm3',\n", + " 'sent_id': 20,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2290': {'model': 'm2',\n", + " 'sent_id': 21,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2293': {'model': 'm2',\n", + " 'sent_id': 22,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2296': {'model': 'm2',\n", + " 'sent_id': 23,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2299': {'model': 'm2',\n", + " 'sent_id': 24,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2302': {'model': 'm1',\n", + " 'sent_id': 25,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2305': {'model': 'm1',\n", + " 'sent_id': 26,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2308': {'model': 'm3',\n", + " 'sent_id': 27,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2311': {'model': 'm2',\n", + " 'sent_id': 28,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2314': {'model': 'm2',\n", + " 'sent_id': 29,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2317': {'model': 'm2',\n", + " 'sent_id': 3,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2320': {'model': 'm1',\n", + " 'sent_id': 30,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2323': {'model': 'm1',\n", + " 'sent_id': 4,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2326': {'model': 'm2',\n", + " 'sent_id': 5,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2329': {'model': 'm1',\n", + " 'sent_id': 6,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2332': {'model': 'm2',\n", + " 'sent_id': 7,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2335': {'model': 'm1',\n", + " 'sent_id': 8,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2338': {'model': 'm2',\n", + " 'sent_id': 9,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2341': {'model': 'm3',\n", + " 'sent_id': 1,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2344': {'model': 'm2',\n", + " 'sent_id': 10,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2347': {'model': 'm3',\n", + " 'sent_id': 11,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2350': {'model': 'm2',\n", + " 'sent_id': 12,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2353': {'model': 'm1',\n", + " 'sent_id': 13,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2356': {'model': 'm3',\n", + " 'sent_id': 14,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2359': {'model': 'm1',\n", + " 'sent_id': 15,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2362': {'model': 'm2',\n", + " 'sent_id': 16,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2365': {'model': 'm1',\n", + " 'sent_id': 17,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2368': {'model': 'm3',\n", + " 'sent_id': 18,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2371': {'model': 'm2',\n", + " 'sent_id': 19,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2374': {'model': 'm3',\n", + " 'sent_id': 2,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2377': {'model': 'm3',\n", + " 'sent_id': 20,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2380': {'model': 'm3',\n", + " 'sent_id': 21,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2383': {'model': 'm1',\n", + " 'sent_id': 22,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2386': {'model': 'm1',\n", + " 'sent_id': 23,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2389': {'model': 'm2',\n", + " 'sent_id': 24,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2392': {'model': 'm3',\n", + " 'sent_id': 25,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2395': {'model': 'm2',\n", + " 'sent_id': 26,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2398': {'model': 'm2',\n", + " 'sent_id': 27,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2401': {'model': 'm3',\n", + " 'sent_id': 28,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2404': {'model': 'm3',\n", + " 'sent_id': 29,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2407': {'model': 'm2',\n", + " 'sent_id': 3,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2410': {'model': 'm3',\n", + " 'sent_id': 30,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2413': {'model': 'm2',\n", + " 'sent_id': 4,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2416': {'model': 'm2',\n", + " 'sent_id': 5,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2419': {'model': 'm3',\n", + " 'sent_id': 6,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2422': {'model': 'm2',\n", + " 'sent_id': 7,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2425': {'model': 'm3',\n", + " 'sent_id': 8,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2428': {'model': 'm2',\n", + " 'sent_id': 9,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2431': {'model': 'm3',\n", + " 'sent_id': 1,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2434': {'model': 'm3',\n", + " 'sent_id': 10,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2437': {'model': 'm3',\n", + " 'sent_id': 11,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2440': {'model': 'm1',\n", + " 'sent_id': 12,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2443': {'model': 'm1',\n", + " 'sent_id': 13,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2446': {'model': 'm3',\n", + " 'sent_id': 14,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2449': {'model': 'm3',\n", + " 'sent_id': 15,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2452': {'model': 'm3',\n", + " 'sent_id': 16,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2455': {'model': 'm2',\n", + " 'sent_id': 17,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2458': {'model': 'm3',\n", + " 'sent_id': 18,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2461': {'model': 'm1',\n", + " 'sent_id': 19,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2464': {'model': 'm1',\n", + " 'sent_id': 2,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2467': {'model': 'm3',\n", + " 'sent_id': 20,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2470': {'model': 'm1',\n", + " 'sent_id': 21,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2473': {'model': 'm1',\n", + " 'sent_id': 22,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2476': {'model': 'm2',\n", + " 'sent_id': 23,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2479': {'model': 'm2',\n", + " 'sent_id': 24,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2482': {'model': 'm3',\n", + " 'sent_id': 25,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2485': {'model': 'm2',\n", + " 'sent_id': 26,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2488': {'model': 'm3',\n", + " 'sent_id': 27,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2491': {'model': 'm1',\n", + " 'sent_id': 28,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2494': {'model': 'm1',\n", + " 'sent_id': 29,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2497': {'model': 'm2',\n", + " 'sent_id': 3,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2500': {'model': 'm3',\n", + " 'sent_id': 30,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2503': {'model': 'm1',\n", + " 'sent_id': 4,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2506': {'model': 'm1',\n", + " 'sent_id': 5,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2509': {'model': 'm1',\n", + " 'sent_id': 6,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2512': {'model': 'm2',\n", + " 'sent_id': 7,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2515': {'model': 'm2',\n", + " 'sent_id': 8,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2518': {'model': 'm3',\n", + " 'sent_id': 9,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2521': {'model': 'm1',\n", + " 'sent_id': 1,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2524': {'model': 'm1',\n", + " 'sent_id': 10,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2527': {'model': 'm2',\n", + " 'sent_id': 11,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2530': {'model': 'm2',\n", + " 'sent_id': 12,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2533': {'model': 'm1',\n", + " 'sent_id': 13,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2536': {'model': 'm1',\n", + " 'sent_id': 14,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2539': {'model': 'm3',\n", + " 'sent_id': 15,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2542': {'model': 'm3',\n", + " 'sent_id': 16,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2545': {'model': 'm1',\n", + " 'sent_id': 17,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2548': {'model': 'm2',\n", + " 'sent_id': 18,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2551': {'model': 'm3',\n", + " 'sent_id': 19,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2554': {'model': 'm3',\n", + " 'sent_id': 2,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2557': {'model': 'm3',\n", + " 'sent_id': 20,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2560': {'model': 'm3',\n", + " 'sent_id': 21,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2563': {'model': 'm3',\n", + " 'sent_id': 22,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2566': {'model': 'm2',\n", + " 'sent_id': 23,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2569': {'model': 'm2',\n", + " 'sent_id': 24,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2572': {'model': 'm3',\n", + " 'sent_id': 25,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2575': {'model': 'm2',\n", + " 'sent_id': 26,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2578': {'model': 'm1',\n", + " 'sent_id': 27,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2581': {'model': 'm1',\n", + " 'sent_id': 28,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2584': {'model': 'm3',\n", + " 'sent_id': 29,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2587': {'model': 'm2',\n", + " 'sent_id': 3,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2590': {'model': 'm2',\n", + " 'sent_id': 30,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2593': {'model': 'm3',\n", + " 'sent_id': 4,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2596': {'model': 'm3',\n", + " 'sent_id': 5,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2599': {'model': 'm1',\n", + " 'sent_id': 6,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2602': {'model': 'm2',\n", + " 'sent_id': 7,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2605': {'model': 'm2',\n", + " 'sent_id': 8,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2608': {'model': 'm3',\n", + " 'sent_id': 9,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2611': {'model': 'm1',\n", + " 'sent_id': 1,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2614': {'model': 'm2',\n", + " 'sent_id': 10,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2617': {'model': 'm2',\n", + " 'sent_id': 11,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2620': {'model': 'm2',\n", + " 'sent_id': 12,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2623': {'model': 'm1',\n", + " 'sent_id': 13,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2626': {'model': 'm2',\n", + " 'sent_id': 14,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2629': {'model': 'm3',\n", + " 'sent_id': 15,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2632': {'model': 'm2',\n", + " 'sent_id': 16,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2635': {'model': 'm2',\n", + " 'sent_id': 17,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2638': {'model': 'm1',\n", + " 'sent_id': 18,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2641': {'model': 'm2',\n", + " 'sent_id': 19,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2644': {'model': 'm1',\n", + " 'sent_id': 2,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2647': {'model': 'm2',\n", + " 'sent_id': 20,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2650': {'model': 'm3',\n", + " 'sent_id': 21,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2653': {'model': 'm1',\n", + " 'sent_id': 22,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2656': {'model': 'm2',\n", + " 'sent_id': 23,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2659': {'model': 'm3',\n", + " 'sent_id': 24,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2662': {'model': 'm3',\n", + " 'sent_id': 25,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2665': {'model': 'm1',\n", + " 'sent_id': 26,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2668': {'model': 'm2',\n", + " 'sent_id': 27,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2671': {'model': 'm2',\n", + " 'sent_id': 28,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2674': {'model': 'm3',\n", + " 'sent_id': 29,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2677': {'model': 'm1',\n", + " 'sent_id': 3,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2680': {'model': 'm3',\n", + " 'sent_id': 30,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2683': {'model': 'm2',\n", + " 'sent_id': 4,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2686': {'model': 'm1',\n", + " 'sent_id': 5,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2689': {'model': 'm1',\n", + " 'sent_id': 6,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2692': {'model': 'm2',\n", + " 'sent_id': 7,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2695': {'model': 'm2',\n", + " 'sent_id': 8,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2698': {'model': 'm1',\n", + " 'sent_id': 9,\n", + " 'speaker': '0016',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2701': {'model': 'm1',\n", + " 'sent_id': 1,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2704': {'model': 'm2',\n", + " 'sent_id': 10,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2707': {'model': 'm3',\n", + " 'sent_id': 11,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2710': {'model': 'm1',\n", + " 'sent_id': 12,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2713': {'model': 'm1',\n", + " 'sent_id': 13,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2716': {'model': 'm3',\n", + " 'sent_id': 14,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2719': {'model': 'm3',\n", + " 'sent_id': 15,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2722': {'model': 'm3',\n", + " 'sent_id': 16,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2725': {'model': 'm2',\n", + " 'sent_id': 17,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2728': {'model': 'm3',\n", + " 'sent_id': 18,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2731': {'model': 'm2',\n", + " 'sent_id': 19,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2734': {'model': 'm1',\n", + " 'sent_id': 2,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2737': {'model': 'm3',\n", + " 'sent_id': 20,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2740': {'model': 'm3',\n", + " 'sent_id': 21,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2743': {'model': 'm1',\n", + " 'sent_id': 22,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2746': {'model': 'm3',\n", + " 'sent_id': 23,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2749': {'model': 'm2',\n", + " 'sent_id': 24,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2752': {'model': 'm3',\n", + " 'sent_id': 25,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2755': {'model': 'm3',\n", + " 'sent_id': 26,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2758': {'model': 'm3',\n", + " 'sent_id': 27,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2761': {'model': 'm2',\n", + " 'sent_id': 28,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2764': {'model': 'm1',\n", + " 'sent_id': 29,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2767': {'model': 'm3',\n", + " 'sent_id': 3,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2770': {'model': 'm3',\n", + " 'sent_id': 30,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2773': {'model': 'm2',\n", + " 'sent_id': 4,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2776': {'model': 'm1',\n", + " 'sent_id': 5,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2779': {'model': 'm3',\n", + " 'sent_id': 6,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2782': {'model': 'm2',\n", + " 'sent_id': 7,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2785': {'model': 'm1',\n", + " 'sent_id': 8,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2788': {'model': 'm2',\n", + " 'sent_id': 9,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2791': {'model': 'm1',\n", + " 'sent_id': 1,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2794': {'model': 'm3',\n", + " 'sent_id': 10,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2797': {'model': 'm1',\n", + " 'sent_id': 11,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2800': {'model': 'm2',\n", + " 'sent_id': 12,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2803': {'model': 'm1',\n", + " 'sent_id': 13,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2806': {'model': 'm3',\n", + " 'sent_id': 14,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2809': {'model': 'm3',\n", + " 'sent_id': 15,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2812': {'model': 'm1',\n", + " 'sent_id': 16,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2815': {'model': 'm1',\n", + " 'sent_id': 17,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2818': {'model': 'm1',\n", + " 'sent_id': 18,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2821': {'model': 'm1',\n", + " 'sent_id': 19,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2824': {'model': 'm3',\n", + " 'sent_id': 2,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2827': {'model': 'm2',\n", + " 'sent_id': 20,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2830': {'model': 'm2',\n", + " 'sent_id': 21,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2833': {'model': 'm3',\n", + " 'sent_id': 22,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2836': {'model': 'm2',\n", + " 'sent_id': 23,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2839': {'model': 'm2',\n", + " 'sent_id': 24,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2842': {'model': 'm3',\n", + " 'sent_id': 25,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2845': {'model': 'm2',\n", + " 'sent_id': 26,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2848': {'model': 'm2',\n", + " 'sent_id': 27,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2851': {'model': 'm1',\n", + " 'sent_id': 28,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2854': {'model': 'm3',\n", + " 'sent_id': 29,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2857': {'model': 'm1',\n", + " 'sent_id': 3,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2860': {'model': 'm3',\n", + " 'sent_id': 30,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2863': {'model': 'm1',\n", + " 'sent_id': 4,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2866': {'model': 'm2',\n", + " 'sent_id': 5,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2869': {'model': 'm3',\n", + " 'sent_id': 6,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2872': {'model': 'm2',\n", + " 'sent_id': 7,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2875': {'model': 'm1',\n", + " 'sent_id': 8,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2878': {'model': 'm2',\n", + " 'sent_id': 9,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2881': {'model': 'm1',\n", + " 'sent_id': 1,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2884': {'model': 'm2',\n", + " 'sent_id': 10,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2887': {'model': 'm1',\n", + " 'sent_id': 11,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2890': {'model': 'm3',\n", + " 'sent_id': 12,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2893': {'model': 'm3',\n", + " 'sent_id': 13,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2896': {'model': 'm3',\n", + " 'sent_id': 14,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2899': {'model': 'm3',\n", + " 'sent_id': 15,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2902': {'model': 'm1',\n", + " 'sent_id': 16,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2905': {'model': 'm2',\n", + " 'sent_id': 17,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2908': {'model': 'm3',\n", + " 'sent_id': 18,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2911': {'model': 'm2',\n", + " 'sent_id': 19,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2914': {'model': 'm3',\n", + " 'sent_id': 2,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2917': {'model': 'm2',\n", + " 'sent_id': 20,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Was it using language that caused their brains to develop?',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2920': {'model': 'm2',\n", + " 'sent_id': 21,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2923': {'model': 'm1',\n", + " 'sent_id': 22,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2926': {'model': 'm2',\n", + " 'sent_id': 23,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2929': {'model': 'm2',\n", + " 'sent_id': 24,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2932': {'model': 'm3',\n", + " 'sent_id': 25,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2935': {'model': 'm3',\n", + " 'sent_id': 26,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2938': {'model': 'm2',\n", + " 'sent_id': 27,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2941': {'model': 'm3',\n", + " 'sent_id': 28,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2944': {'model': 'm1',\n", + " 'sent_id': 29,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2947': {'model': 'm1',\n", + " 'sent_id': 3,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'It seemed the ordained order of things that dogs should work .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2950': {'model': 'm2',\n", + " 'sent_id': 30,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2953': {'model': 'm1',\n", + " 'sent_id': 4,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'The journey was continued at dawn .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2956': {'model': 'm3',\n", + " 'sent_id': 5,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2959': {'model': 'm3',\n", + " 'sent_id': 6,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'A dead man is of no use on a plantation .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2962': {'model': 'm3',\n", + " 'sent_id': 7,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'The Claudine was leaving next morning for Honolulu .',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2965': {'model': 'm2',\n", + " 'sent_id': 8,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2968': {'model': 'm2',\n", + " 'sent_id': 9,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2971': {'model': 'm1',\n", + " 'sent_id': 1,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2974': {'model': 'm3',\n", + " 'sent_id': 10,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2977': {'model': 'm3',\n", + " 'sent_id': 11,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2980': {'model': 'm2',\n", + " 'sent_id': 12,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2983': {'model': 'm3',\n", + " 'sent_id': 13,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2986': {'model': 'm3',\n", + " 'sent_id': 14,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n", + " 'nmistakes': 3,\n", + " 'pref_rank': 3},\n", + " 'id_2989': {'model': 'm1',\n", + " 'sent_id': 15,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " 'id_2992': {'model': 'm1',\n", + " 'sent_id': 16,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2995': {'model': 'm1',\n", + " 'sent_id': 17,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n", + " 'nmistakes': 1,\n", + " 'pref_rank': 1},\n", + " 'id_2998': {'model': 'm1',\n", + " 'sent_id': 18,\n", + " 'speaker': '0017',\n", + " 'accent': None,\n", + " 'text': 'Earthquakes damage all structures, including bridges.',\n", + " 'nmistakes': 2,\n", + " 'pref_rank': 2},\n", + " ...}" + ] + }, + "execution_count": 21, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "for wav_id in meta.keys():\n", + " record_ = meta[wav_id]\n", + " record_.update(sentences[wav_id])\n", + " record_.update(scores[wav_id])\n", + " record_.update(pref[wav_id])\n", + "\n", + "meta" + ] + }, + { + "cell_type": "code", + "execution_count": 22, + "id": "479da0a9-6e49-40af-8e9c-dd6147df0f9f", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "4050" + ] + }, + "execution_count": 22, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "len(pref)" + ] + }, + { + "cell_type": "code", + "execution_count": 23, + "id": "fe728682-e40b-47cb-bc38-6864f7312cc5", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
modelsent_idspeakeraccenttextnmistakespref_ranknwords
id_3994m220020NoneFifty yards ahead of her were the first of the rocks .3312
id_719m190012NoneDifferent telescope designs perform differently, and have different strengths and weaknesses.3311
id_4012m3250020NoneYoung people want to feel supported and appreciated by their company and their superiors.2214
id_3258m3140018NoneWhen I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.3319
id_1331m2300013NoneAll this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.1123
\n", + "
" + ], + "text/plain": [ + " model sent_id speaker accent \\\n", + "id_3994 m2 2 0020 None \n", + "id_719 m1 9 0012 None \n", + "id_4012 m3 25 0020 None \n", + "id_3258 m3 14 0018 None \n", + "id_1331 m2 30 0013 None \n", + "\n", + " text \\\n", + "id_3994 Fifty yards ahead of her were the first of the rocks . \n", + "id_719 Different telescope designs perform differently, and have different strengths and weaknesses. \n", + "id_4012 Young people want to feel supported and appreciated by their company and their superiors. \n", + "id_3258 When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town. \n", + "id_1331 All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart. \n", + "\n", + " nmistakes pref_rank nwords \n", + "id_3994 3 3 12 \n", + "id_719 3 3 11 \n", + "id_4012 2 2 14 \n", + "id_3258 3 3 19 \n", + "id_1331 1 1 23 " + ] + }, + "execution_count": 23, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_meta = pd.DataFrame.from_dict(meta, orient='index')\n", + "df_meta['nwords'] = df_meta['text'].apply(lambda x: len(x.split(' ')))\n", + "df_meta.sample(5)" + ] + }, + { + "cell_type": "code", + "execution_count": 24, + "id": "2d5a228d-2946-41bf-9a3e-ca699453171a", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
modelsent_idspeakeraccenttextnmistakespref_ranknwords
id_3107m1230017NoneFor more than two hundred years the pessimists have been winning the public debate.FAILEDFAILED14
id_3112m1250017NoneYoung people want to feel supported and appreciated by their company and their superiors.FAILEDFAILED14
id_3108m2230017NoneFor more than two hundred years the pessimists have been winning the public debate.FAILEDFAILED14
\n", + "
" + ], + "text/plain": [ + " model sent_id speaker accent \\\n", + "id_3107 m1 23 0017 None \n", + "id_3112 m1 25 0017 None \n", + "id_3108 m2 23 0017 None \n", + "\n", + " text \\\n", + "id_3107 For more than two hundred years the pessimists have been winning the public debate. \n", + "id_3112 Young people want to feel supported and appreciated by their company and their superiors. \n", + "id_3108 For more than two hundred years the pessimists have been winning the public debate. \n", + "\n", + " nmistakes pref_rank nwords \n", + "id_3107 FAILED FAILED 14 \n", + "id_3112 FAILED FAILED 14 \n", + "id_3108 FAILED FAILED 14 " + ] + }, + "execution_count": 24, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_meta.loc[df_meta['nmistakes'] == 'FAILED'].sample(3)" + ] + }, + { + "cell_type": "code", + "execution_count": 25, + "id": "aa54fcc9-7dcb-4371-bcd5-18d850e7e631", + "metadata": {}, + "outputs": [], + "source": [ + "# Filter bad speakers?\n", + "some_bad_speaker = 'scottish__scottish_male__cmu_us_awb_arctic'\n", + "df_failed = df_meta.loc[df_meta['speaker'] == some_bad_speaker]\n", + "df_good = df_meta.loc[df_meta['speaker'] != some_bad_speaker]\n", + "df_good = df_good.loc[df_good['nmistakes'] != \"FAILED\"]" + ] + }, + { + "cell_type": "code", + "execution_count": 26, + "id": "48fdd680-684e-4331-929d-e03ea0519182", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
modelsent_idspeakeraccenttextnmistakespref_ranknwords
\n", + "
" + ], + "text/plain": [ + "Empty DataFrame\n", + "Columns: [model, sent_id, speaker, accent, text, nmistakes, pref_rank, nwords]\n", + "Index: []" + ] + }, + "execution_count": 26, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_failed_good_models = df_failed.loc[df_failed['nmistakes'] != 'FAILED', :]\n", + "df_failed_good_models" + ] + }, + { + "cell_type": "code", + "execution_count": 27, + "id": "b69770ea-64f8-4e59-a1b8-cccbd95dff2d", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
modelsent_idspeakeraccenttextnmistakespref_ranknwordswer
id_682m2250012NoneYoung people want to feel supported and appreciated by their company and their superiors.11140.071429
id_1709m290014NoneDifferent telescope designs perform differently, and have different strengths and weaknesses.22110.181818
id_3289m2240018NoneIt's wearing me out trying to juggle work with looking after my children and my family.22160.125
id_3131m1300017NoneAll this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.22230.086957
id_807m380012NoneProsecutors have opened a massive investigation into allegations of fixing games and illegal betting.22140.142857
\n", + "
" + ], + "text/plain": [ + " model sent_id speaker accent \\\n", + "id_682 m2 25 0012 None \n", + "id_1709 m2 9 0014 None \n", + "id_3289 m2 24 0018 None \n", + "id_3131 m1 30 0017 None \n", + "id_807 m3 8 0012 None \n", + "\n", + " text \\\n", + "id_682 Young people want to feel supported and appreciated by their company and their superiors. \n", + "id_1709 Different telescope designs perform differently, and have different strengths and weaknesses. \n", + "id_3289 It's wearing me out trying to juggle work with looking after my children and my family. \n", + "id_3131 All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart. \n", + "id_807 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n", + "\n", + " nmistakes pref_rank nwords wer \n", + "id_682 1 1 14 0.071429 \n", + "id_1709 2 2 11 0.181818 \n", + "id_3289 2 2 16 0.125 \n", + "id_3131 2 2 23 0.086957 \n", + "id_807 2 2 14 0.142857 " + ] + }, + "execution_count": 27, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_good['wer'] = df_good['nmistakes'] / df_good['nwords']\n", + "df_good.sample(5)" + ] + }, + { + "cell_type": "code", + "execution_count": 28, + "id": "e1bf942e-a3e1-4849-b60f-9a049810aa66", + "metadata": {}, + "outputs": [], + "source": [ + "df_full = df_good" + ] + }, + { + "cell_type": "code", + "execution_count": 29, + "id": "9eb31c09-902d-4628-b298-5ebc5a56d446", + "metadata": {}, + "outputs": [], + "source": [ + "mean_wer = {}\n", + "std_wer = {}\n", + "stats = {}\n", + "for m, df in df_full.groupby('model'):\n", + " mean_wer[m] = df['wer'].mean()\n", + " std_wer[m] = df['wer'].std()\n", + " stats[m] = (mean_wer[m], std_wer[m])" + ] + }, + { + "cell_type": "code", + "execution_count": 30, + "id": "5ef9cbc8-0807-42ff-8a79-6eedb81b4531", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "{'m1': 0.15581893610424408, 'm2': 0.1551033686858993, 'm3': 0.1505934661339411}" + ] + }, + "execution_count": 30, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "mean_wer" + ] + }, + { + "cell_type": "code", + "execution_count": 31, + "id": "cb6ed758-1050-4fb3-a505-6510423d92f5", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "{'m1': (0.15581893610424408, 0.0917370138172076),\n", + " 'm2': (0.1551033686858993, 0.08791329488553278),\n", + " 'm3': (0.1505934661339411, 0.08370192086698483)}" + ] + }, + "execution_count": 31, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "stats" + ] + }, + { + "cell_type": "code", + "execution_count": 32, + "id": "1b749874-5078-49c9-96f1-af75c63998b1", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "{'m1': (0.06408192228703648, 0.2475559499214517),\n", + " 'm2': (0.06719007380036653, 0.2430166635714321),\n", + " 'm3': (0.06689154526695626, 0.23429538700092592)}" + ] + }, + "execution_count": 32, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "conf_int = {}\n", + "for m in stats.keys():\n", + " conf_int[m] = (stats[m][0] - stats[m][1], stats[m][0] + stats[m][1])\n", + "\n", + "conf_int" + ] + }, + { + "cell_type": "code", + "execution_count": 33, + "id": "725bb813-96c7-4779-a2f6-e46b667c0b98", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "{'m1': 'generated_hifi/esd_tune/g_3164999',\n", + " 'm2': 'generated_hifi/esd_tune_reversal/g_3164999',\n", + " 'm3': 'generated_hifi/esd_tune_advloss0/g_3164999'}" + ] + }, + "execution_count": 33, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "model2folder" + ] + }, + { + "cell_type": "code", + "execution_count": 34, + "id": "c49f11ee-55f9-477c-a749-8dffd176015a", + "metadata": { + "scrolled": true, + "tags": [] + }, + "outputs": [ + { + "data": { + "text/plain": [ + "{'0011_m1': {'mean': 0.1649417562959747,\n", + " 'std': 0.09848066669836777,\n", + " 'conf_int': (0.06646108959760694, 0.2634224229943425)},\n", + " '0011_m2': {'mean': 0.15374506591006587,\n", + " 'std': 0.09372400140491297,\n", + " 'conf_int': (0.060021064505152905, 0.24746906731497884)},\n", + " '0011_m3': {'mean': 0.15757343048134242,\n", + " 'std': 0.09647052824930616,\n", + " 'conf_int': (0.061102902232036266, 0.25404395873064856)},\n", + " '0012_m1': {'mean': 0.15808598946517752,\n", + " 'std': 0.08908074500705088,\n", + " 'conf_int': (0.06900524445812664, 0.2471667344722284)},\n", + " '0012_m2': {'mean': 0.15953635163248103,\n", + " 'std': 0.09717079605964918,\n", + " 'conf_int': (0.062365555572831854, 0.2567071476921302)},\n", + " '0012_m3': {'mean': 0.1525969552657367,\n", + " 'std': 0.07814707979240157,\n", + " 'conf_int': (0.07444987547333512, 0.23074403505813826)},\n", + " '0013_m1': {'mean': 0.16239193389292073,\n", + " 'std': 0.09757158871850868,\n", + " 'conf_int': (0.06482034517441204, 0.2599635226114294)},\n", + " '0013_m2': {'mean': 0.16063079414164727,\n", + " 'std': 0.08754696864487832,\n", + " 'conf_int': (0.07308382549676895, 0.2481777627865256)},\n", + " '0013_m3': {'mean': 0.1519149953173421,\n", + " 'std': 0.08349049225936797,\n", + " 'conf_int': (0.06842450305797412, 0.23540548757671007)},\n", + " '0014_m1': {'mean': 0.15330570306335917,\n", + " 'std': 0.08736689982957992,\n", + " 'conf_int': (0.06593880323377925, 0.24067260289293907)},\n", + " '0014_m2': {'mean': 0.1426293068048946,\n", + " 'std': 0.07633868568249282,\n", + " 'conf_int': (0.06629062112240179, 0.2189679924873874)},\n", + " '0014_m3': {'mean': 0.1384163390987707,\n", + " 'std': 0.07469015107914477,\n", + " 'conf_int': (0.06372618801962594, 0.2131064901779155)},\n", + " '0015_m1': {'mean': 0.15765198768178051,\n", + " 'std': 0.09358788188396122,\n", + " 'conf_int': (0.06406410579781929, 0.25123986956574174)},\n", + " '0015_m2': {'mean': 0.1507825603221522,\n", + " 'std': 0.0814955191128956,\n", + " 'conf_int': (0.0692870412092566, 0.2322780794350478)},\n", + " '0015_m3': {'mean': 0.14636983260313963,\n", + " 'std': 0.0764192598427006,\n", + " 'conf_int': (0.06995057276043903, 0.22278909244584022)},\n", + " '0016_m1': {'mean': 0.15037814523110357,\n", + " 'std': 0.0914280222484199,\n", + " 'conf_int': (0.05895012298268368, 0.24180616747952347)},\n", + " '0016_m2': {'mean': 0.15052519785355048,\n", + " 'std': 0.08800983126453843,\n", + " 'conf_int': (0.06251536658901205, 0.2385350291180889)},\n", + " '0016_m3': {'mean': 0.15825089545714013,\n", + " 'std': 0.09284693977917047,\n", + " 'conf_int': (0.06540395567796967, 0.2510978352363106)},\n", + " '0017_m1': {'mean': 0.14841250241957357,\n", + " 'std': 0.08660737038257468,\n", + " 'conf_int': (0.06180513203699889, 0.23501987280214826)},\n", + " '0017_m2': {'mean': 0.16131369102962131,\n", + " 'std': 0.08667879676997356,\n", + " 'conf_int': (0.07463489425964775, 0.24799248779959487)},\n", + " '0017_m3': {'mean': 0.143035627614613,\n", + " 'std': 0.07708385493382297,\n", + " 'conf_int': (0.06595177268079003, 0.22011948254843597)},\n", + " '0018_m1': {'mean': 0.15305746660308842,\n", + " 'std': 0.0875897927244637,\n", + " 'conf_int': (0.06546767387862472, 0.2406472593275521)},\n", + " '0018_m2': {'mean': 0.1522211084782473,\n", + " 'std': 0.08686380874816599,\n", + " 'conf_int': (0.06535729973008131, 0.23908491722641328)},\n", + " '0018_m3': {'mean': 0.1490366761321364,\n", + " 'std': 0.07977764804299615,\n", + " 'conf_int': (0.06925902808914024, 0.22881432417513253)},\n", + " '0020_m1': {'mean': 0.15404618783608884,\n", + " 'std': 0.09415821387808693,\n", + " 'conf_int': (0.05988797395800191, 0.24820440171417577)},\n", + " '0020_m2': {'mean': 0.1645876441493875,\n", + " 'std': 0.09176936660138603,\n", + " 'conf_int': (0.07281827754800148, 0.25635701075077355)},\n", + " '0020_m3': {'mean': 0.15804567205498574,\n", + " 'std': 0.09105011689380604,\n", + " 'conf_int': (0.06699555516117969, 0.24909578894879178)}}" + ] + }, + "execution_count": 34, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "mean_wer = {}\n", + "std_wer = {}\n", + "stats = {}\n", + "conf_int = {}\n", + "meta_speaker = {}\n", + "for speaker, df1 in df_full.groupby('speaker'):\n", + " for m, df in df1.groupby('model'):\n", + " mean_wer[m] = df['wer'].mean()\n", + " std_wer[m] = df['wer'].std()\n", + " stats[m] = (mean_wer[m], std_wer[m])\n", + " conf_int[m] = (stats[m][0] - stats[m][1], stats[m][0] + stats[m][1])\n", + " meta_speaker[speaker + '_' + m] = {\n", + " 'mean': mean_wer[m],\n", + " 'std': std_wer[m],\n", + " 'conf_int': conf_int[m]\n", + " }\n", + "\n", + "meta_speaker" + ] + }, + { + "cell_type": "code", + "execution_count": 35, + "id": "a48e203f-91fb-4018-bd4f-ab6628579def", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
meanstdconf_intspeaker_modelspeaker
0011_m10.1649420.098481(0.06646108959760694, 0.2634224229943425)0011_m10011
0011_m20.1537450.093724(0.060021064505152905, 0.24746906731497884)0011_m20011
0011_m30.1575730.096471(0.061102902232036266, 0.25404395873064856)0011_m30011
0012_m10.1580860.089081(0.06900524445812664, 0.2471667344722284)0012_m10012
0012_m20.1595360.097171(0.062365555572831854, 0.2567071476921302)0012_m20012
0012_m30.1525970.078147(0.07444987547333512, 0.23074403505813826)0012_m30012
0013_m10.1623920.097572(0.06482034517441204, 0.2599635226114294)0013_m10013
0013_m20.1606310.087547(0.07308382549676895, 0.2481777627865256)0013_m20013
0013_m30.1519150.083490(0.06842450305797412, 0.23540548757671007)0013_m30013
0014_m10.1533060.087367(0.06593880323377925, 0.24067260289293907)0014_m10014
0014_m20.1426290.076339(0.06629062112240179, 0.2189679924873874)0014_m20014
0014_m30.1384160.074690(0.06372618801962594, 0.2131064901779155)0014_m30014
0015_m10.1576520.093588(0.06406410579781929, 0.25123986956574174)0015_m10015
0015_m20.1507830.081496(0.0692870412092566, 0.2322780794350478)0015_m20015
0015_m30.1463700.076419(0.06995057276043903, 0.22278909244584022)0015_m30015
0016_m10.1503780.091428(0.05895012298268368, 0.24180616747952347)0016_m10016
0016_m20.1505250.088010(0.06251536658901205, 0.2385350291180889)0016_m20016
0016_m30.1582510.092847(0.06540395567796967, 0.2510978352363106)0016_m30016
0017_m10.1484130.086607(0.06180513203699889, 0.23501987280214826)0017_m10017
0017_m20.1613140.086679(0.07463489425964775, 0.24799248779959487)0017_m20017
0017_m30.1430360.077084(0.06595177268079003, 0.22011948254843597)0017_m30017
0018_m10.1530570.087590(0.06546767387862472, 0.2406472593275521)0018_m10018
0018_m20.1522210.086864(0.06535729973008131, 0.23908491722641328)0018_m20018
0018_m30.1490370.079778(0.06925902808914024, 0.22881432417513253)0018_m30018
0020_m10.1540460.094158(0.05988797395800191, 0.24820440171417577)0020_m10020
0020_m20.1645880.091769(0.07281827754800148, 0.25635701075077355)0020_m20020
0020_m30.1580460.091050(0.06699555516117969, 0.24909578894879178)0020_m30020
\n", + "
" + ], + "text/plain": [ + " mean std conf_int \\\n", + "0011_m1 0.164942 0.098481 (0.06646108959760694, 0.2634224229943425) \n", + "0011_m2 0.153745 0.093724 (0.060021064505152905, 0.24746906731497884) \n", + "0011_m3 0.157573 0.096471 (0.061102902232036266, 0.25404395873064856) \n", + "0012_m1 0.158086 0.089081 (0.06900524445812664, 0.2471667344722284) \n", + "0012_m2 0.159536 0.097171 (0.062365555572831854, 0.2567071476921302) \n", + "0012_m3 0.152597 0.078147 (0.07444987547333512, 0.23074403505813826) \n", + "0013_m1 0.162392 0.097572 (0.06482034517441204, 0.2599635226114294) \n", + "0013_m2 0.160631 0.087547 (0.07308382549676895, 0.2481777627865256) \n", + "0013_m3 0.151915 0.083490 (0.06842450305797412, 0.23540548757671007) \n", + "0014_m1 0.153306 0.087367 (0.06593880323377925, 0.24067260289293907) \n", + "0014_m2 0.142629 0.076339 (0.06629062112240179, 0.2189679924873874) \n", + "0014_m3 0.138416 0.074690 (0.06372618801962594, 0.2131064901779155) \n", + "0015_m1 0.157652 0.093588 (0.06406410579781929, 0.25123986956574174) \n", + "0015_m2 0.150783 0.081496 (0.0692870412092566, 0.2322780794350478) \n", + "0015_m3 0.146370 0.076419 (0.06995057276043903, 0.22278909244584022) \n", + "0016_m1 0.150378 0.091428 (0.05895012298268368, 0.24180616747952347) \n", + "0016_m2 0.150525 0.088010 (0.06251536658901205, 0.2385350291180889) \n", + "0016_m3 0.158251 0.092847 (0.06540395567796967, 0.2510978352363106) \n", + "0017_m1 0.148413 0.086607 (0.06180513203699889, 0.23501987280214826) \n", + "0017_m2 0.161314 0.086679 (0.07463489425964775, 0.24799248779959487) \n", + "0017_m3 0.143036 0.077084 (0.06595177268079003, 0.22011948254843597) \n", + "0018_m1 0.153057 0.087590 (0.06546767387862472, 0.2406472593275521) \n", + "0018_m2 0.152221 0.086864 (0.06535729973008131, 0.23908491722641328) \n", + "0018_m3 0.149037 0.079778 (0.06925902808914024, 0.22881432417513253) \n", + "0020_m1 0.154046 0.094158 (0.05988797395800191, 0.24820440171417577) \n", + "0020_m2 0.164588 0.091769 (0.07281827754800148, 0.25635701075077355) \n", + "0020_m3 0.158046 0.091050 (0.06699555516117969, 0.24909578894879178) \n", + "\n", + " speaker_model speaker \n", + "0011_m1 0011_m1 0011 \n", + "0011_m2 0011_m2 0011 \n", + "0011_m3 0011_m3 0011 \n", + "0012_m1 0012_m1 0012 \n", + "0012_m2 0012_m2 0012 \n", + "0012_m3 0012_m3 0012 \n", + "0013_m1 0013_m1 0013 \n", + "0013_m2 0013_m2 0013 \n", + "0013_m3 0013_m3 0013 \n", + "0014_m1 0014_m1 0014 \n", + "0014_m2 0014_m2 0014 \n", + "0014_m3 0014_m3 0014 \n", + "0015_m1 0015_m1 0015 \n", + "0015_m2 0015_m2 0015 \n", + "0015_m3 0015_m3 0015 \n", + "0016_m1 0016_m1 0016 \n", + "0016_m2 0016_m2 0016 \n", + "0016_m3 0016_m3 0016 \n", + "0017_m1 0017_m1 0017 \n", + "0017_m2 0017_m2 0017 \n", + "0017_m3 0017_m3 0017 \n", + "0018_m1 0018_m1 0018 \n", + "0018_m2 0018_m2 0018 \n", + "0018_m3 0018_m3 0018 \n", + "0020_m1 0020_m1 0020 \n", + "0020_m2 0020_m2 0020 \n", + "0020_m3 0020_m3 0020 " + ] + }, + "execution_count": 35, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df_meta_speakers = pd.DataFrame.from_dict(meta_speaker, orient='index')\n", + "df_meta_speakers['speaker_model'] = df_meta_speakers.index\n", + "df_meta_speakers['speaker'] = df_meta_speakers['speaker_model'].apply(lambda x: x.split('_')[0])\n", + "df_meta_speakers" + ] + }, + { + "cell_type": "code", + "execution_count": 36, + "id": "9c44e9ac-7f96-401a-9e5a-499824ad08a9", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "{'m1': 'generated_hifi/esd_tune/g_3164999',\n", + " 'm2': 'generated_hifi/esd_tune_reversal/g_3164999',\n", + " 'm3': 'generated_hifi/esd_tune_advloss0/g_3164999'}" + ] + }, + "execution_count": 36, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "model2folder" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.8.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/environment.yml b/environment.yml index 037bfc3..f349548 100644 --- a/environment.yml +++ b/environment.yml @@ -18,6 +18,7 @@ dependencies: - matplotlib - montreal-forced-aligner=2.0.0b4 - numpy + - openpyxl - pip - python=3.8 - pytorch=1.11.0+cu113 @@ -29,6 +30,8 @@ dependencies: - unidecode - unzip - uvicorn + - xlrd - pip: + - phonemizer - tgt \ No newline at end of file diff --git a/generate_listener_html.ipynb b/generate_listener_html.ipynb new file mode 100644 index 0000000..3cf7791 --- /dev/null +++ b/generate_listener_html.ipynb @@ -0,0 +1,1615 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "id": "60f2a2f5-75b6-4f29-bfa3-687283fc3edd", + "metadata": {}, + "outputs": [], + "source": [ + "import csv\n", + "from itertools import combinations\n", + "from pathlib import Path\n", + "\n", + "import numpy as np\n", + "import pandas as pd\n", + "from IPython.display import HTML, Audio, display\n", + "\n", + "\n", + "pd.set_option('display.max_colwidth', None)\n", + "pd.set_option('display.colheader_justify', 'center')\n", + "\n", + "\n", + "REPORTS_DIR = Path('reports')\n", + "REPORT_NAME = 'esd_tune_1-2-7'\n", + "OUTPUT_DIR = REPORTS_DIR / REPORT_NAME" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "f0d165ce-a7bb-4e83-b37e-dc0692ed1089", + "metadata": {}, + "outputs": [], + "source": [ + "texts = [\n", + " 'Do you realize what time it is?',\n", + " 'He comes back to the valley.',\n", + " 'This dress does not look worth much!',\n", + " 'What happened tonight has nothing to do with Henry.',\n", + " 'Today, five years later, we are facing a similar situation.',\n", + " 'When I saw you kissing, you looked really happy.',\n", + " 'Only one vehicle may be allowed to park at any given time.',\n", + " 'The deadlines are indeed very tight.',\n", + " \"I'm glad you enjoyed yourself.\",\n", + " 'What are you still doing here?',\n", + " 'This is an animal that is admired for its whiteness and cleanliness. ',\n", + " 'Perhaps there is another way to pose these issues.',\n", + " \"Your students' test scores drop lower and lower every year.\",\n", + " 'Wherever her tears fell, a fruit tree grew.',\n", + " 'I was about to head back to my hotel and go to sleep.',\n", + " 'You said she really helped last time.',\n", + " 'My favorite season, spring, is here.',\n", + " \"He's the rich guy who built the airplanes.\",\n", + " 'Otto and Elizabeth gave it to us, for the wedding - incredibly generous.',\n", + " 'Look, the police said that there was nothing stolen from the house.',\n", + " 'And I suppose we can thank your brother for that.',\n", + " \"That's a pretty dangerous thing you're doing.\",\n", + " 'He arrived in Japan for the first time at the age of twenty six.',\n", + " 'Sam thought we were having fun being together.',\n", + " \"Well, the true value of something isn't always determined by its price.\",\n", + " \"No, it's not polite to discuss a lady's age.\",\n", + " \"Just another quarter-mile and I don't have to be tolerant ever again.\",\n", + " \"But Jones' apartment had only been rented out for a week.\",\n", + " 'What your perfect day would have been like?',\n", + " 'Not a very useful skill, especially when the money runs out.',\n", + "]" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f0871808-7396-4a82-b529-404babb6be8d", + "metadata": {}, + "outputs": [], + "source": [ + "huawei_phones = [\n", + " ' D UW1 Y UW1 R IY1 AH0 L AY2 Z W AH1 T T AY1 M IH1 T IH1 Z ',\n", + " ' HH IY1 K AH1 M Z B AE1 K T UW1 DH AH0 V AE1 L IY0 ',\n", + " ' DH IH1 S D R EH1 S D AH1 Z N AA1 T L UH1 K W ER1 TH M AH1 CH ',\n", + " ' W AH1 T HH AE1 P AH0 N D T AH0 N AY1 T HH AE1 Z N AH1 TH IH0 NG T UW1 D UW1 W IH1 DH HH EH1 N R IY0 ',\n", + " ' T AH0 D EY1 F AY1 V Y IH1 R Z L EY1 T ER0 W IY1 AA1 R F EY1 S IH0 NG AH0 S IH1 M AH0 L ER0 S IH2 CH UW0 EY1 SH AH0 N ',\n", + " ' W EH1 N AY1 S AO1 Y UW1 K IH1 S IH0 NG Y UW1 L UH1 K T R IH1 L IY0 HH AE1 P IY0 ',\n", + " ' OW1 N L IY0 W AH1 N V IY1 HH IH0 K AH0 L M EY1 B IY1 AH0 L AW1 D T UW1 P AA1 R K AE1 T EH1 N IY0 G IH1 V AH0 N T AY1 M ',\n", + " ' DH AH0 D EH1 D L AY2 N Z AA1 R IH2 N D IY1 D V EH1 R IY0 T AY1 T ',\n", + " ' AY1 EH1 M G L AE1 D Y UW1 EH2 N JH OY1 D Y ER0 S EH1 L F ',\n", + " ' W AH1 T AA1 R Y UW1 S T IH1 L D UW1 IH0 NG HH IY1 R ',\n", + " ' DH IH1 S IH1 Z AE1 N AE1 N AH0 M AH0 L DH AE1 T IH1 Z AH0 D M AY1 ER0 D F AO1 R IH1 T S W AY1 T N AH0 S AH0 N D K L EH1 N L IY0 N IH0 S ',\n", + " ' P ER0 HH AE1 P S DH EH1 R IH1 Z AH0 N AH1 DH ER0 W EY1 T UW1 P OW1 Z DH IY1 Z IH1 SH UW0 Z ',\n", + " ' Y AO1 R S T UW1 D AH0 N T S T EH1 S T S K AO1 R Z D R AA1 P L OW1 ER0 AH0 N D L OW1 ER0 EH1 V ER0 IY0 Y IH1 R ',\n", + " ' W EH0 R EH1 V ER0 HH ER1 T IH1 R Z F EH1 L AH0 F R UW1 T T R IY1 G R UW1 ',\n", + " ' AY1 W AA1 Z AH0 B AW1 T T UW1 HH EH1 D B AE1 K T UW1 M AY1 HH OW0 T EH1 L AH0 N D G OW1 T UW1 S L IY1 P ',\n", + " ' Y UW1 S EH1 D SH IY1 R IH1 L IY0 HH EH1 L P T L AE1 S T T AY1 M ',\n", + " ' M AY1 F EY1 V ER0 IH0 T S IY1 Z AH0 N S P R IH1 NG IH1 Z HH IY1 R ',\n", + " ' HH IY1 EH1 S DH AH0 R IH1 CH G AY1 HH UW1 B IH1 L T DH IY0 EH1 R P L EY0 N Z ',\n", + " ' AA1 T OW2 AH0 N D IH0 L IH1 Z AH0 B AH0 TH G EY1 V IH1 T T UW1 AH1 S F AO1 R DH AH0 W EH1 D IH0 NG IH2 N K R EH1 D AH0 B L IY0 JH EH1 N ER0 AH0 S ',\n", + " ' L UH1 K DH AH0 P AH0 L IY1 S S EH1 D DH AE1 T DH EH1 R W AA1 Z N AH1 TH IH0 NG S T OW1 L AH0 N F R AH1 M DH AH0 HH AW1 S ',\n", + " ' AH0 N D AY1 S AH0 P OW1 Z W IY1 K AE1 N TH AE1 NG K Y AO1 R B R AH1 DH ER0 F AO1 R DH AE1 T ',\n", + " ' DH AE1 T EH1 S EY0 P R IH1 T IY0 D EY1 N JH ER0 AH0 S TH IH1 NG Y UW1 R EY1 D UW1 IH0 NG ',\n", + " ' HH IY1 ER0 AY1 V D IH0 N JH AH0 P AE1 N F AO1 R DH AH0 F ER1 S T T AY1 M AE1 T DH IY0 EY1 JH AH1 V T W EH1 N T IY0 S IH1 K S ',\n", + " ' S AE1 M TH AO1 T W IY1 W ER1 HH AE1 V IH0 NG F AH1 N B IY1 IH0 NG T AH0 G EH1 DH ER0 ',\n", + " ' W EH1 L DH AH0 T R UW1 V AE1 L Y UW0 AH1 V S AH1 M TH IH0 NG IH1 S N T IY1 AO1 L W EY2 Z D IH0 T ER1 M AH0 N D B AY1 IH1 T S P R AY1 S ',\n", + " ' N OW1 IH1 T EH1 S N AA1 T P AH0 L AY1 T T UW1 D IH0 S K AH1 S AH0 L EY1 D IY0 EH1 S EY1 JH ',\n", + " ' JH AH1 S T AH0 N AH1 DH ER0 K W AO1 R T ER0 M AY1 L AH0 N D AY1 D AA1 N T IY1 HH AE1 V T UW1 B IY1 T AA1 L ER0 AH0 N T EH1 V ER0 AH0 G EH1 N ',\n", + " ' B AH1 T JH OW1 N Z AH0 P AA1 R T M AH0 N T HH AE1 D OW1 N L IY0 B IH1 N R EH1 N T IH0 D AW1 T F AO1 R AH0 W IY1 K ',\n", + " ' W AH1 T Y AO1 R P ER1 F IH1 K T D EY1 W UH1 D HH AE1 V B IH1 N L AY1 K ',\n", + " ' N AA1 T AH0 V EH1 R IY0 Y UW1 S F AH0 L S K IH1 L AH0 S P EH1 SH L IY0 W EH1 N DH AH0 M AH1 N IY0 R AH1 N Z AW1 T ',\n", + "]" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "d7942da8-a539-4a50-98ef-d93cbdcec403", + "metadata": {}, + "outputs": [], + "source": [ + "## NOTE: all model keys need to be composed of a single letter followed by a number\n", + "model2folder = {\n", + " \"m1\": 'generated_hifi/esd_tune_1/g_2879999',\n", + " \"m2\": 'generated_hifi/esd_tune_2/g_2939999',\n", + " \"m3\": 'generated_hifi/esd_tune_7/g_3059999',\n", + "}" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "d4d44f9e-525a-4e3d-bb5c-679b64bd7861", + "metadata": {}, + "outputs": [], + "source": [ + "total_K_models = len(model2folder)" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "51e4eae6-ea64-4d69-947c-2a0c7b15678b", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "m1: 1350 wav files total\n", + "m2: 1350 wav files total\n", + "m3: 1350 wav files total\n" + ] + } + ], + "source": [ + "wav_files = {}\n", + "total_wavs_per_model = 0\n", + "for ip in model2folder.keys():\n", + " wav_files[ip] = list(Path(model2folder[ip]).rglob(\"*.wav\"))\n", + " total_wavs_per_model = len(wav_files[ip])\n", + " print(f\"{ip}: {total_wavs_per_model} wav files total\")" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "id": "e2031149-e1e8-421f-983c-83833c1b67ad", + "metadata": {}, + "outputs": [], + "source": [ + "x_range = np.array(list(range(total_wavs_per_model)))\n", + "x_indices = x_range * 2\n", + "y_indices = x_range * 2 + 1" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "f60b3404-269a-407e-bedd-898b754c5651", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
m1m2m3m1_wavbasenamem1_accent_speakerm1_textm2_wavbasenamem2_accent_speakerm2_textm3_wavbasenamem3_accent_speakerm3_text
0NoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNone
1NoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNone
2NoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNone
3NoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNone
4NoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNone
.......................................
2695NoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNone
2696NoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNone
2697NoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNone
2698NoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNone
2699NoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNoneNone
\n", + "

2700 rows × 12 columns

\n", + "
" + ], + "text/plain": [ + " m1 m2 m3 m1_wavbasename m1_accent_speaker m1_text \\\n", + "0 None None None None None None \n", + "1 None None None None None None \n", + "2 None None None None None None \n", + "3 None None None None None None \n", + "4 None None None None None None \n", + "... ... ... ... ... ... ... \n", + "2695 None None None None None None \n", + "2696 None None None None None None \n", + "2697 None None None None None None \n", + "2698 None None None None None None \n", + "2699 None None None None None None \n", + "\n", + " m2_wavbasename m2_accent_speaker m2_text m3_wavbasename \\\n", + "0 None None None None \n", + "1 None None None None \n", + "2 None None None None \n", + "3 None None None None \n", + "4 None None None None \n", + "... ... ... ... ... \n", + "2695 None None None None \n", + "2696 None None None None \n", + "2697 None None None None \n", + "2698 None None None None \n", + "2699 None None None None \n", + "\n", + " m3_accent_speaker m3_text \n", + "0 None None \n", + "1 None None \n", + "2 None None \n", + "3 None None \n", + "4 None None \n", + "... ... ... \n", + "2695 None None \n", + "2696 None None \n", + "2697 None None \n", + "2698 None None \n", + "2699 None None \n", + "\n", + "[2700 rows x 12 columns]" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "def allocate_empty_array(alength):\n", + " return [None]*alength\n", + "\n", + "\n", + "def create_empty_dataframe(total_wavs_per_model: int, total_K_models: int):\n", + "\n", + " df = pd.DataFrame({\n", + " 'm' + str(i): allocate_empty_array(2 * total_wavs_per_model)\n", + " for i in range(1, total_K_models + 1, 1)\n", + " })\n", + "\n", + " for i in range(1, total_K_models + 1, 1):\n", + " df['m' + str(i) + '_wavbasename'] = None\n", + " df['m' + str(i) + '_accent_speaker'] = None\n", + " df['m' + str(i) + '_text'] = None\n", + " \n", + " return df\n", + "\n", + "\n", + "df_empty = create_empty_dataframe(total_wavs_per_model, total_K_models)\n", + "df_empty" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "id": "2b88d46e-c3af-43eb-8af7-282492147a1f", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
m1m2m3m1_wavbasenamem1_accent_speakerm1_textm2_wavbasenamem2_accent_speakerm2_textm3_wavbasenamem3_accent_speakerm3_text
0id_1id_2id_3NoneNoneNoneNoneNoneNoneNoneNoneNone
1generated_hifi/esd_tune_1/g_2879999/0011/angry/1.wavgenerated_hifi/esd_tune_2/g_2939999/0011/angry/1.wavgenerated_hifi/esd_tune_7/g_3059999/0011/angry/1.wav1.wav0011Do you realize what time it is?1.wav0011Do you realize what time it is?1.wav0011Do you realize what time it is?
2id_4id_5id_6NoneNoneNoneNoneNoneNoneNoneNoneNone
3generated_hifi/esd_tune_1/g_2879999/0011/angry/10.wavgenerated_hifi/esd_tune_2/g_2939999/0011/angry/10.wavgenerated_hifi/esd_tune_7/g_3059999/0011/angry/10.wav10.wav0011What are you still doing here?10.wav0011What are you still doing here?10.wav0011What are you still doing here?
4id_7id_8id_9NoneNoneNoneNoneNoneNoneNoneNoneNone
.......................................
2695generated_hifi/esd_tune_1/g_2879999/0020/surprise/7.wavgenerated_hifi/esd_tune_2/g_2939999/0020/surprise/7.wavgenerated_hifi/esd_tune_7/g_3059999/0020/surprise/7.wav7.wav0020Only one vehicle may be allowed to park at any given time.7.wav0020Only one vehicle may be allowed to park at any given time.7.wav0020Only one vehicle may be allowed to park at any given time.
2696id_4045id_4046id_4047NoneNoneNoneNoneNoneNoneNoneNoneNone
2697generated_hifi/esd_tune_1/g_2879999/0020/surprise/8.wavgenerated_hifi/esd_tune_2/g_2939999/0020/surprise/8.wavgenerated_hifi/esd_tune_7/g_3059999/0020/surprise/8.wav8.wav0020The deadlines are indeed very tight.8.wav0020The deadlines are indeed very tight.8.wav0020The deadlines are indeed very tight.
2698id_4048id_4049id_4050NoneNoneNoneNoneNoneNoneNoneNoneNone
2699generated_hifi/esd_tune_1/g_2879999/0020/surprise/9.wavgenerated_hifi/esd_tune_2/g_2939999/0020/surprise/9.wavgenerated_hifi/esd_tune_7/g_3059999/0020/surprise/9.wav9.wav0020I'm glad you enjoyed yourself.9.wav0020I'm glad you enjoyed yourself.9.wav0020I'm glad you enjoyed yourself.
\n", + "

2700 rows × 12 columns

\n", + "
" + ], + "text/plain": [ + " m1 \\\n", + "0 id_1 \n", + "1 generated_hifi/esd_tune_1/g_2879999/0011/angry/1.wav \n", + "2 id_4 \n", + "3 generated_hifi/esd_tune_1/g_2879999/0011/angry/10.wav \n", + "4 id_7 \n", + "... ... \n", + "2695 generated_hifi/esd_tune_1/g_2879999/0020/surprise/7.wav \n", + "2696 id_4045 \n", + "2697 generated_hifi/esd_tune_1/g_2879999/0020/surprise/8.wav \n", + "2698 id_4048 \n", + "2699 generated_hifi/esd_tune_1/g_2879999/0020/surprise/9.wav \n", + "\n", + " m2 \\\n", + "0 id_2 \n", + "1 generated_hifi/esd_tune_2/g_2939999/0011/angry/1.wav \n", + "2 id_5 \n", + "3 generated_hifi/esd_tune_2/g_2939999/0011/angry/10.wav \n", + "4 id_8 \n", + "... ... \n", + "2695 generated_hifi/esd_tune_2/g_2939999/0020/surprise/7.wav \n", + "2696 id_4046 \n", + "2697 generated_hifi/esd_tune_2/g_2939999/0020/surprise/8.wav \n", + "2698 id_4049 \n", + "2699 generated_hifi/esd_tune_2/g_2939999/0020/surprise/9.wav \n", + "\n", + " m3 m1_wavbasename \\\n", + "0 id_3 None \n", + "1 generated_hifi/esd_tune_7/g_3059999/0011/angry/1.wav 1.wav \n", + "2 id_6 None \n", + "3 generated_hifi/esd_tune_7/g_3059999/0011/angry/10.wav 10.wav \n", + "4 id_9 None \n", + "... ... ... \n", + "2695 generated_hifi/esd_tune_7/g_3059999/0020/surprise/7.wav 7.wav \n", + "2696 id_4047 None \n", + "2697 generated_hifi/esd_tune_7/g_3059999/0020/surprise/8.wav 8.wav \n", + "2698 id_4050 None \n", + "2699 generated_hifi/esd_tune_7/g_3059999/0020/surprise/9.wav 9.wav \n", + "\n", + " m1_accent_speaker \\\n", + "0 None \n", + "1 0011 \n", + "2 None \n", + "3 0011 \n", + "4 None \n", + "... ... \n", + "2695 0020 \n", + "2696 None \n", + "2697 0020 \n", + "2698 None \n", + "2699 0020 \n", + "\n", + " m1_text \\\n", + "0 None \n", + "1 Do you realize what time it is? \n", + "2 None \n", + "3 What are you still doing here? \n", + "4 None \n", + "... ... \n", + "2695 Only one vehicle may be allowed to park at any given time. \n", + "2696 None \n", + "2697 The deadlines are indeed very tight. \n", + "2698 None \n", + "2699 I'm glad you enjoyed yourself. \n", + "\n", + " m2_wavbasename m2_accent_speaker \\\n", + "0 None None \n", + "1 1.wav 0011 \n", + "2 None None \n", + "3 10.wav 0011 \n", + "4 None None \n", + "... ... ... \n", + "2695 7.wav 0020 \n", + "2696 None None \n", + "2697 8.wav 0020 \n", + "2698 None None \n", + "2699 9.wav 0020 \n", + "\n", + " m2_text \\\n", + "0 None \n", + "1 Do you realize what time it is? \n", + "2 None \n", + "3 What are you still doing here? \n", + "4 None \n", + "... ... \n", + "2695 Only one vehicle may be allowed to park at any given time. \n", + "2696 None \n", + "2697 The deadlines are indeed very tight. \n", + "2698 None \n", + "2699 I'm glad you enjoyed yourself. \n", + "\n", + " m3_wavbasename m3_accent_speaker \\\n", + "0 None None \n", + "1 1.wav 0011 \n", + "2 None None \n", + "3 10.wav 0011 \n", + "4 None None \n", + "... ... ... \n", + "2695 7.wav 0020 \n", + "2696 None None \n", + "2697 8.wav 0020 \n", + "2698 None None \n", + "2699 9.wav 0020 \n", + "\n", + " m3_text \n", + "0 None \n", + "1 Do you realize what time it is? \n", + "2 None \n", + "3 What are you still doing here? \n", + "4 None \n", + "... ... \n", + "2695 Only one vehicle may be allowed to park at any given time. \n", + "2696 None \n", + "2697 The deadlines are indeed very tight. \n", + "2698 None \n", + "2699 I'm glad you enjoyed yourself. \n", + "\n", + "[2700 rows x 12 columns]" + ] + }, + "execution_count": 8, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "def populate_dataframe(df, model2folder, wav_files, total_K_models, total_wavs_per_model):\n", + "\n", + " for model_key in model2folder.keys():\n", + "\n", + " column_name = model_key\n", + " model_index = int(model_key[1:])\n", + " paths_orig_wavs = sorted(wav_files[model_key])\n", + " assert(total_wavs_per_model == len(paths_orig_wavs))\n", + "\n", + " wavids = np.array(list(range(len(paths_orig_wavs)))) * total_K_models + model_index\n", + " wavids = ['id_' + str(x) for x in wavids]\n", + " df[column_name].iloc[x_indices] = wavids\n", + " df[column_name].iloc[y_indices] = paths_orig_wavs\n", + "\n", + " df[column_name + '_wavbasename'].iloc[y_indices] = (\n", + " df[column_name]\n", + " .iloc[y_indices]\n", + " .apply(lambda x: x.name)\n", + " )\n", + " \n", + " df[column_name + '_text'].iloc[y_indices] = (\n", + " df[column_name]\n", + " .iloc[y_indices]\n", + " .apply(lambda x: texts[int(x.stem) - 1])\n", + " )\n", + " \n", + " df[column_name + '_accent_speaker'].iloc[y_indices] = (\n", + " df[column_name]\n", + " .iloc[y_indices]\n", + " .apply(lambda x: x.parent.parent.stem)\n", + " )\n", + " \n", + " return df\n", + "\n", + "\n", + "df_populated = populate_dataframe(df_empty, model2folder, wav_files, total_K_models, total_wavs_per_model)\n", + "df_populated" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "id": "efc3b273-7b7d-4165-aef8-38da88cfc154", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "m1 m2\n", + "m1 m3\n", + "m2 m3\n" + ] + } + ], + "source": [ + "def validate_pairs(df):\n", + " all_possible_pairs = list(combinations(model2folder.keys(), 2))\n", + " for k, v in all_possible_pairs:\n", + " print(k, v)\n", + " assert((df[k + '_text'].iloc[y_indices] == df[v + '_text'].iloc[y_indices]).all())\n", + " assert((df[k + '_accent_speaker'].iloc[y_indices] == df[v + '_accent_speaker'].iloc[y_indices]).all())\n", + " \n", + " \n", + "validate_pairs(df_populated)" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "id": "e3f303a2-0923-4b6a-802c-11c497fe5e58", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "['m1', 'm2', 'm3']" + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "model_columns = ['m' + str(i) for i in range(1, total_K_models + 1, 1)]\n", + "model_columns" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "d1b37dd4-39c3-4956-adf0-22cf45b49f85", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
m1_textm1_accent_speakerm1m2m3m2_text
0NoneNoneid_1id_2id_3None
1Do you realize what time it is?0011generated_hifi/esd_tune_1/g_2879999/0011/angry/1.wavgenerated_hifi/esd_tune_2/g_2939999/0011/angry/1.wavgenerated_hifi/esd_tune_7/g_3059999/0011/angry/1.wavDo you realize what time it is?
2NoneNoneid_4id_5id_6None
3What are you still doing here?0011generated_hifi/esd_tune_1/g_2879999/0011/angry/10.wavgenerated_hifi/esd_tune_2/g_2939999/0011/angry/10.wavgenerated_hifi/esd_tune_7/g_3059999/0011/angry/10.wavWhat are you still doing here?
4NoneNoneid_7id_8id_9None
.....................
2695Only one vehicle may be allowed to park at any given time.0020generated_hifi/esd_tune_1/g_2879999/0020/surprise/7.wavgenerated_hifi/esd_tune_2/g_2939999/0020/surprise/7.wavgenerated_hifi/esd_tune_7/g_3059999/0020/surprise/7.wavOnly one vehicle may be allowed to park at any given time.
2696NoneNoneid_4045id_4046id_4047None
2697The deadlines are indeed very tight.0020generated_hifi/esd_tune_1/g_2879999/0020/surprise/8.wavgenerated_hifi/esd_tune_2/g_2939999/0020/surprise/8.wavgenerated_hifi/esd_tune_7/g_3059999/0020/surprise/8.wavThe deadlines are indeed very tight.
2698NoneNoneid_4048id_4049id_4050None
2699I'm glad you enjoyed yourself.0020generated_hifi/esd_tune_1/g_2879999/0020/surprise/9.wavgenerated_hifi/esd_tune_2/g_2939999/0020/surprise/9.wavgenerated_hifi/esd_tune_7/g_3059999/0020/surprise/9.wavI'm glad you enjoyed yourself.
\n", + "

2700 rows × 6 columns

\n", + "
" + ], + "text/plain": [ + " m1_text \\\n", + "0 None \n", + "1 Do you realize what time it is? \n", + "2 None \n", + "3 What are you still doing here? \n", + "4 None \n", + "... ... \n", + "2695 Only one vehicle may be allowed to park at any given time. \n", + "2696 None \n", + "2697 The deadlines are indeed very tight. \n", + "2698 None \n", + "2699 I'm glad you enjoyed yourself. \n", + "\n", + " m1_accent_speaker \\\n", + "0 None \n", + "1 0011 \n", + "2 None \n", + "3 0011 \n", + "4 None \n", + "... ... \n", + "2695 0020 \n", + "2696 None \n", + "2697 0020 \n", + "2698 None \n", + "2699 0020 \n", + "\n", + " m1 \\\n", + "0 id_1 \n", + "1 generated_hifi/esd_tune_1/g_2879999/0011/angry/1.wav \n", + "2 id_4 \n", + "3 generated_hifi/esd_tune_1/g_2879999/0011/angry/10.wav \n", + "4 id_7 \n", + "... ... \n", + "2695 generated_hifi/esd_tune_1/g_2879999/0020/surprise/7.wav \n", + "2696 id_4045 \n", + "2697 generated_hifi/esd_tune_1/g_2879999/0020/surprise/8.wav \n", + "2698 id_4048 \n", + "2699 generated_hifi/esd_tune_1/g_2879999/0020/surprise/9.wav \n", + "\n", + " m2 \\\n", + "0 id_2 \n", + "1 generated_hifi/esd_tune_2/g_2939999/0011/angry/1.wav \n", + "2 id_5 \n", + "3 generated_hifi/esd_tune_2/g_2939999/0011/angry/10.wav \n", + "4 id_8 \n", + "... ... \n", + "2695 generated_hifi/esd_tune_2/g_2939999/0020/surprise/7.wav \n", + "2696 id_4046 \n", + "2697 generated_hifi/esd_tune_2/g_2939999/0020/surprise/8.wav \n", + "2698 id_4049 \n", + "2699 generated_hifi/esd_tune_2/g_2939999/0020/surprise/9.wav \n", + "\n", + " m3 \\\n", + "0 id_3 \n", + "1 generated_hifi/esd_tune_7/g_3059999/0011/angry/1.wav \n", + "2 id_6 \n", + "3 generated_hifi/esd_tune_7/g_3059999/0011/angry/10.wav \n", + "4 id_9 \n", + "... ... \n", + "2695 generated_hifi/esd_tune_7/g_3059999/0020/surprise/7.wav \n", + "2696 id_4047 \n", + "2697 generated_hifi/esd_tune_7/g_3059999/0020/surprise/8.wav \n", + "2698 id_4050 \n", + "2699 generated_hifi/esd_tune_7/g_3059999/0020/surprise/9.wav \n", + "\n", + " m2_text \n", + "0 None \n", + "1 Do you realize what time it is? \n", + "2 None \n", + "3 What are you still doing here? \n", + "4 None \n", + "... ... \n", + "2695 Only one vehicle may be allowed to park at any given time. \n", + "2696 None \n", + "2697 The deadlines are indeed very tight. \n", + "2698 None \n", + "2699 I'm glad you enjoyed yourself. \n", + "\n", + "[2700 rows x 6 columns]" + ] + }, + "execution_count": 11, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "def choose_columns_to_render(df):\n", + " chosen_columns = ['m1_text', 'm1_accent_speaker'] + model_columns + ['m2_text']\n", + " df = df.loc[:, chosen_columns]\n", + " return df\n", + "\n", + "\n", + "df_filtered = choose_columns_to_render(df_populated)\n", + "df_filtered" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "id": "a9915d2e-01e5-40c0-923b-4bf6bf7389cf", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
m1_textm1_accent_speakerm1m2m3m2_text
0--id_1id_2id_3-
1Do you realize what time it is?0011generated_hifi/esd_tune_2/g_2939999/0011/angry/1.wavgenerated_hifi/esd_tune_7/g_3059999/0011/angry/1.wavgenerated_hifi/esd_tune_1/g_2879999/0011/angry/1.wavDo you realize what time it is?
2--id_4id_5id_6-
3What are you still doing here?0011generated_hifi/esd_tune_7/g_3059999/0011/angry/10.wavgenerated_hifi/esd_tune_2/g_2939999/0011/angry/10.wavgenerated_hifi/esd_tune_1/g_2879999/0011/angry/10.wavWhat are you still doing here?
4--id_7id_8id_9-
.....................
2695Only one vehicle may be allowed to park at any given time.0020generated_hifi/esd_tune_2/g_2939999/0020/surprise/7.wavgenerated_hifi/esd_tune_7/g_3059999/0020/surprise/7.wavgenerated_hifi/esd_tune_1/g_2879999/0020/surprise/7.wavOnly one vehicle may be allowed to park at any given time.
2696--id_4045id_4046id_4047-
2697The deadlines are indeed very tight.0020generated_hifi/esd_tune_7/g_3059999/0020/surprise/8.wavgenerated_hifi/esd_tune_1/g_2879999/0020/surprise/8.wavgenerated_hifi/esd_tune_2/g_2939999/0020/surprise/8.wavThe deadlines are indeed very tight.
2698--id_4048id_4049id_4050-
2699I'm glad you enjoyed yourself.0020generated_hifi/esd_tune_2/g_2939999/0020/surprise/9.wavgenerated_hifi/esd_tune_1/g_2879999/0020/surprise/9.wavgenerated_hifi/esd_tune_7/g_3059999/0020/surprise/9.wavI'm glad you enjoyed yourself.
\n", + "

2700 rows × 6 columns

\n", + "
" + ], + "text/plain": [ + " m1_text \\\n", + "0 - \n", + "1 Do you realize what time it is? \n", + "2 - \n", + "3 What are you still doing here? \n", + "4 - \n", + "... ... \n", + "2695 Only one vehicle may be allowed to park at any given time. \n", + "2696 - \n", + "2697 The deadlines are indeed very tight. \n", + "2698 - \n", + "2699 I'm glad you enjoyed yourself. \n", + "\n", + " m1_accent_speaker \\\n", + "0 - \n", + "1 0011 \n", + "2 - \n", + "3 0011 \n", + "4 - \n", + "... ... \n", + "2695 0020 \n", + "2696 - \n", + "2697 0020 \n", + "2698 - \n", + "2699 0020 \n", + "\n", + " m1 \\\n", + "0 id_1 \n", + "1 generated_hifi/esd_tune_2/g_2939999/0011/angry/1.wav \n", + "2 id_4 \n", + "3 generated_hifi/esd_tune_7/g_3059999/0011/angry/10.wav \n", + "4 id_7 \n", + "... ... \n", + "2695 generated_hifi/esd_tune_2/g_2939999/0020/surprise/7.wav \n", + "2696 id_4045 \n", + "2697 generated_hifi/esd_tune_7/g_3059999/0020/surprise/8.wav \n", + "2698 id_4048 \n", + "2699 generated_hifi/esd_tune_2/g_2939999/0020/surprise/9.wav \n", + "\n", + " m2 \\\n", + "0 id_2 \n", + "1 generated_hifi/esd_tune_7/g_3059999/0011/angry/1.wav \n", + "2 id_5 \n", + "3 generated_hifi/esd_tune_2/g_2939999/0011/angry/10.wav \n", + "4 id_8 \n", + "... ... \n", + "2695 generated_hifi/esd_tune_7/g_3059999/0020/surprise/7.wav \n", + "2696 id_4046 \n", + "2697 generated_hifi/esd_tune_1/g_2879999/0020/surprise/8.wav \n", + "2698 id_4049 \n", + "2699 generated_hifi/esd_tune_1/g_2879999/0020/surprise/9.wav \n", + "\n", + " m3 \\\n", + "0 id_3 \n", + "1 generated_hifi/esd_tune_1/g_2879999/0011/angry/1.wav \n", + "2 id_6 \n", + "3 generated_hifi/esd_tune_1/g_2879999/0011/angry/10.wav \n", + "4 id_9 \n", + "... ... \n", + "2695 generated_hifi/esd_tune_1/g_2879999/0020/surprise/7.wav \n", + "2696 id_4047 \n", + "2697 generated_hifi/esd_tune_2/g_2939999/0020/surprise/8.wav \n", + "2698 id_4050 \n", + "2699 generated_hifi/esd_tune_7/g_3059999/0020/surprise/9.wav \n", + "\n", + " m2_text \n", + "0 - \n", + "1 Do you realize what time it is? \n", + "2 - \n", + "3 What are you still doing here? \n", + "4 - \n", + "... ... \n", + "2695 Only one vehicle may be allowed to park at any given time. \n", + "2696 - \n", + "2697 The deadlines are indeed very tight. \n", + "2698 - \n", + "2699 I'm glad you enjoyed yourself. \n", + "\n", + "[2700 rows x 6 columns]" + ] + }, + "execution_count": 12, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "def permute_wavs_and_fillna(df):\n", + " df1 = df.loc[:,model_columns]\n", + " ## random permutation of each row (independently)\n", + " for i in y_indices:\n", + " df1.iloc[i,:] = np.random.permutation(df1.iloc[i,:])\n", + " df.loc[:,model_columns] = df1\n", + " df = df.fillna('-')\n", + " return df\n", + "\n", + "\n", + "df_permuted = permute_wavs_and_fillna(df_filtered)\n", + "df_permuted" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "id": "eef3b325-c26e-457a-b575-eb6b210aff7f", + "metadata": {}, + "outputs": [], + "source": [ + "OUTPUT_DIR.mkdir(exist_ok=True, parents=True)\n", + "df_permuted.to_csv(\n", + " OUTPUT_DIR / 'eval_map.csv',\n", + " sep = \"\\t\",\n", + " header = False,\n", + " index = False,\n", + " quoting = csv.QUOTE_NONE\n", + ")" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "id": "d32630c2-aca7-4ee9-b44c-a949d0fd17c4", + "metadata": {}, + "outputs": [], + "source": [ + "def columns_from_filenames(df, column_names):\n", + " res = []\n", + " for colname in column_names:\n", + " filenames = df[colname]\n", + " col = [Audio(filename)._repr_html_() if Path(filename).exists() else filename for filename in filenames]\n", + " res.append(col)\n", + " columns = res\n", + " return columns, column_names" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "id": "2c11c3ca-abe4-4bbd-930f-8a4f62c9dc8f", + "metadata": {}, + "outputs": [], + "source": [ + "def make_table(columns, column_names):\n", + " names = \"\\n\".join([f\"{name}\" for name in column_names])\n", + " table = [f\"{names}\"]\n", + " for row in zip(*columns):\n", + " row = \"\\n\".join([f\"{elem}\" for elem in row])\n", + " row = f'{row}'\n", + " table.append(row)\n", + " \n", + " content = \"\\n\".join(table)\n", + " table_html = f'{content}
'\n", + " \n", + " html = HTML(table_html)\n", + " # display(html)\n", + " return html" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "id": "11d84c76-841a-4215-a45f-268076e4ae21", + "metadata": {}, + "outputs": [], + "source": [ + "def make_table_from_df(df, column_names):\n", + " columns, column_names = columns_from_filenames(df, column_names)\n", + " return make_table(columns, column_names)" + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "id": "26b577fe-3957-4902-8758-e5501f5d81a0", + "metadata": {}, + "outputs": [], + "source": [ + "column_names = df_permuted.columns\n", + "chunk_size = 100" + ] + }, + { + "cell_type": "code", + "execution_count": 19, + "id": "f37b7fb3-93eb-448c-a8a3-a23cb0d165ae", + "metadata": {}, + "outputs": [], + "source": [ + "output_folder = OUTPUT_DIR / 'html'\n", + "output_folder.mkdir(parents=True, exist_ok=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "id": "24aef771-215a-4fe6-82cb-1ff375681189", + "metadata": { + "scrolled": true, + "tags": [] + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "0 100\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_1.html\n", + "100 200\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_2.html\n", + "200 300\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_3.html\n", + "300 400\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_4.html\n", + "400 500\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_5.html\n", + "500 600\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_6.html\n", + "600 700\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_7.html\n", + "700 800\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_8.html\n", + "800 900\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_9.html\n", + "900 1000\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_10.html\n", + "1000 1100\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_11.html\n", + "1100 1200\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_12.html\n", + "1200 1300\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_13.html\n", + "1300 1400\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_14.html\n", + "1400 1500\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_15.html\n", + "1500 1600\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_16.html\n", + "1600 1700\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_17.html\n", + "1700 1800\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_18.html\n", + "1800 1900\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_19.html\n", + "1900 2000\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_20.html\n", + "2000 2100\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_21.html\n", + "2100 2200\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_22.html\n", + "2200 2300\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_23.html\n", + "2300 2400\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_24.html\n", + "2400 2500\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_25.html\n", + "2500 2600\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_26.html\n", + "2600 2700\n", + "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_27.html\n" + ] + } + ], + "source": [ + "def create_htmls(df, column_names, chunk_size):\n", + " import os\n", + " chunk_number = 0\n", + " start = 0\n", + " experiment_prefix = \"nat_vctk_esd_tune_test_\"\n", + " while (start < len(df)):\n", + " end = start + chunk_size\n", + " end = min(end, len(df))\n", + " print(start, end)\n", + " chunk_number += 1\n", + " df_chunk = df.iloc[start:end,:]\n", + " final_html = make_table_from_df(df_chunk, column_names)\n", + " f_html = output_folder.joinpath(experiment_prefix + str(chunk_number) + '.html')\n", + " print(f_html)\n", + " with open(f_html, 'w') as f:\n", + " f.write(final_html.data)\n", + " start = end\n", + "\n", + " \n", + "create_htmls(df_permuted, column_names, chunk_size)" + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "id": "49a60285-31bf-4263-9162-c3d928aa9068", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "reports/esd_tune_1-2-7/scores/scores.csv\n", + "reports/esd_tune_1-2-7/scores/scores.xlsx\n" + ] + } + ], + "source": [ + "def create_scores_file(df, output_dir):\n", + " \n", + " output_dir = Path(output_dir)\n", + " output_dir.mkdir(exist_ok=True, parents=True)\n", + " \n", + " for k in model2folder.keys():\n", + " df[k].iloc[y_indices] = ''\n", + " \n", + " csv_path = output_dir / \"scores.csv\"\n", + " df.to_csv(\n", + " csv_path,\n", + " sep = \"\\t\",\n", + " header = True,\n", + " index = False,\n", + " quoting = csv.QUOTE_NONE,\n", + " )\n", + " \n", + " excel_path = output_dir / \"scores.xlsx\" \n", + " df.to_excel(excel_path)\n", + " \n", + " print(csv_path)\n", + " print(excel_path)\n", + "\n", + "\n", + "create_scores_file(df_permuted, OUTPUT_DIR / \"scores\")" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.8.12" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/models/download_g2p.sh b/models/download_g2p.sh index 2e1faf4..3124bf1 100644 --- a/models/download_g2p.sh +++ b/models/download_g2p.sh @@ -1,6 +1,6 @@ -G2P_ENGLISH_URL="https://github.com/MontrealCorpusTools/mfa-models/blob/main/g2p/english_g2p.zip" +G2P_ENGLISH_URL="https://github.com/MontrealCorpusTools/mfa-models/raw/main/g2p/english_g2p.zip" G2P_ENGLISH_PATH="models/en/g2p/english_g2p.zip" -G2P_RUSSIAN_URL="https://github.com/MontrealCorpusTools/mfa-models/blob/main/g2p/russian_g2p.zip" +G2P_RUSSIAN_URL="https://github.com/MontrealCorpusTools/mfa-models/raw/main/g2p/russian_g2p.zip" G2P_RUSSIAN_PATH="models/ru/g2p/russian_g2p.zip" echo Downloading English G2P model... diff --git a/russian_preprocessing/steps.sh b/russian_preprocessing/steps.sh index 4ee2f2e..c7a0595 100644 --- a/russian_preprocessing/steps.sh +++ b/russian_preprocessing/steps.sh @@ -2,42 +2,43 @@ echo -e "\n0) Setup env" conda env create -n emotts -f russian_preprocessing/environment.yaml conda activate emotts conda config --set ssl_verify no -export RUSSIAN_DATASET_PATH=/media/diskB/ruslan_a/data/datasets/EMO/russian -export OUTPUT_DIR=$RUSSIAN_DATASET_PATH/processed -export OUTPUT_DIR=$RUSSIAN_DATASET_PATH/processed_mix +export EMO_DATASET_DIR=/media/diskB/ruslan_a/data/datasets/EMO/russian +export NEUTRAL_DATASET_DIR=/media/diskB/ruslan_a/data/datasets/NEUTRAL/russian +export EMO_OUTPUT_DIR=$EMO_DATASET_DIR/processed_v2 +export NEUTRAL_OUTPUT_DIR=$NEUTRAL_DATASET_DIR/processed_v2 export MFA_PREMADE=/media/diskB/ruslan_a/data/datasets/emo_rus_Olga_v2_processed/mfa_espeak_grids # 16164it [03:36, 74.61it/s] -# 25544it [02:45, 154.48it/s] mix echo -e "\n1) Prep raw files" -# python src/preprocessing/prep_files_russian.py --dataset-dir $RUSSIAN_DATASET_PATH/original --text-output-dir $OUTPUT_DIR/text/raw --audio-output-dir $OUTPUT_DIR/audio/raw -python src/preprocessing/prep_files_russian.py --dataset-dir $RUSSIAN_DATASET_PATH/original_and_neutral --text-output-dir $OUTPUT_DIR/text/raw --audio-output-dir $OUTPUT_DIR/audio/raw +python src/preprocessing/prep_files_russian.py --dataset-dir $EMO_DATASET_DIR/original --text-output-dir $EMO_OUTPUT_DIR/text/raw --audio-output-dir $EMO_OUTPUT_DIR/audio/raw --meta-output-dir $EMO_OUTPUT_DIR/meta +python src/preprocessing/prep_files_russian_neutral.py --dataset-dir $NEUTRAL_DATASET_DIR/original --text-output-dir $NEUTRAL_OUTPUT_DIR/text/raw --audio-output-dir $NEUTRAL_OUTPUT_DIR/audio/raw --meta-output-dir $NEUTRAL_OUTPUT_DIR/meta -# ~1.5-2.0 hours -echo -e "\n2) Pausation cutting with VAD" -python src/preprocessing/pausation_cutting.py --input-dir $OUTPUT_DIR/audio/raw --output-dir $OUTPUT_DIR/audio/no_pause --target-sr 96000 --audio-ext wav +# ~1.5-2.0 hours (Deprecated) +# echo -e "\n2) Pausation cutting with VAD" +# python src/preprocessing/pausation_cutting.py --input-dir $EMO_OUTPUT_DIR/audio/raw --output-dir $EMO_OUTPUT_DIR/audio/no_pause --target-sr 96000 --audio-ext wav # 16071/16071 [02:50<00:00, 94.26it/s] -# 25429/25429 [04:18<00:00, 98.26it/s] mix echo -e "\n3) Resampling and Converting audio to 1-channel" -# python src/preprocessing/resampling.py --input-dir $OUTPUT_DIR/audio/no_pause --output-dir $OUTPUT_DIR/audio/resampled --resample-rate 22050 --audio-ext wav -python src/preprocessing/resampling.py --input-dir $OUTPUT_DIR/audio/raw --output-dir $OUTPUT_DIR/audio/resampled --resample-rate 22050 --audio-ext wav +# python src/preprocessing/resampling.py --input-dir $EMO_OUTPUT_DIR/audio/no_pause --output-dir $EMO_OUTPUT_DIR/audio/resampled --resample-rate 22050 --audio-ext wav +python src/preprocessing/resampling.py --input-dir $EMO_OUTPUT_DIR/audio/raw --output-dir $EMO_OUTPUT_DIR/audio/resampled --resample-rate 22050 --audio-ext wav +python src/preprocessing/resampling.py --input-dir $NEUTRAL_OUTPUT_DIR/audio/raw --output-dir $NEUTRAL_OUTPUT_DIR/audio/resampled --resample-rate 22050 --audio-ext wav conda env config vars set LD_LIBRARY_PATH=$CONDA_PREFIX/lib # link to libopenblas conda deactivate conda activate emotts # 16071/16071 [13:09<00:00, 20.37it/s] -# 25429/25429 [13:11<00:00, 32.15it/s] mix echo -e "\n4) Audio to Mel" -python src/preprocessing/wav_to_mel.py --input-dir $OUTPUT_DIR/audio/resampled --output-dir $OUTPUT_DIR/mels --audio-ext wav +python src/preprocessing/wav_to_mel.py --input-dir $EMO_OUTPUT_DIR/audio/resampled --output-dir $EMO_OUTPUT_DIR/mels --audio-ext wav +python src/preprocessing/wav_to_mel.py --input-dir $NEUTRAL_OUTPUT_DIR/audio/resampled --output-dir $NEUTRAL_OUTPUT_DIR/mels --audio-ext wav # 16069/16069 [31:38<00:00, 8.46it/s] # 16962/16962 [12:22<00:00, 22.85it/s] mix # Model is needed: https://github.com/snakers4/russian_stt_text_normalization/blob/master/jit_s2s.pt # Put model to src/preprocessing/text/russian/ echo -e "\n5) Text normalization" -python src/preprocessing/text_normalization_russian.py --input-dir $OUTPUT_DIR/text/raw --output-dir $OUTPUT_DIR/mfa_inputs +python src/preprocessing/text_normalization_russian.py --input-dir $EMO_OUTPUT_DIR/text/raw --output-dir $EMO_OUTPUT_DIR/mfa_inputs +python src/preprocessing/text_normalization_russian.py --input-dir $NEUTRAL_OUTPUT_DIR/text/raw --output-dir $NEUTRAL_OUTPUT_DIR/mfa_inputs echo -e "\n6) MFA Alignment setup" @@ -52,33 +53,38 @@ export RUS_ESPEAK_LEXICON=/media/diskB/ruslan_a/models/mfa/rus-espeak-mfa/rus-mf # 16069/16069 [00:00<00:00, 21508.15it/s] echo -e "\n6.1) Creating word list from dataset" -python src/preprocessing/create_corpus.py --input-dir $OUTPUT_DIR/text/raw --output-path $OUTPUT_DIR/meta/words.txt +python src/preprocessing/create_corpus.py --input-dir $EMO_OUTPUT_DIR/mfa_inputs --output-path $EMO_OUTPUT_DIR/meta/words.txt +python src/preprocessing/create_corpus.py --input-dir $NEUTRAL_OUTPUT_DIR/mfa_inputs --output-path $NEUTRAL_OUTPUT_DIR/meta/words.txt # 25849/25983 [01:19<00:00, 326.82it/s] -echo -e "\n6.2) Creating G2P lexicon from word list" -mfa g2p -t mfa_tmp -j 32 --clean --overwrite models/g2p/russian_g2p.zip $OUTPUT_DIR/meta/words.txt models/mfa/russian_lexicon.txt +echo -e "\n6.2.a) Creating G2P lexicon from word list with G2P" +mfa g2p -t mfa_tmp -j 32 --clean --overwrite models/g2p/russian_g2p.zip $EMO_OUTPUT_DIR/meta/words.txt models/mfa/russian_lexicon.txt rm -rf mfa_tmp +echo -e "\n6.2.b) Creating G2P lexicon from word list with espeak" +python src/preprocessing/create_lexicon.py -i $EMO_OUTPUT_DIR/meta/words.txt -o $EMO_OUTPUT_DIR/meta/lexicon.txt -l ru +python src/preprocessing/create_lexicon.py -i $NEUTRAL_OUTPUT_DIR/meta/words.txt -o $NEUTRAL_OUTPUT_DIR/meta/lexicon.txt -l ru + # 42it [00:10, 4.01it/s] # 58it [00:12, 4.54it/s] mix echo -e "\n7) MFA Preprocessing" -python src/preprocessing/mfa_preprocessing.py --input-dir $OUTPUT_DIR/audio/resampled --output-dir $OUTPUT_DIR/mfa_inputs +python src/preprocessing/mfa_preprocessing.py --input-dir $EMO_OUTPUT_DIR/audio/resampled --output-dir $EMO_OUTPUT_DIR/mfa_inputs # FINALLY, align phonemes and speech # ~50 min echo -e "\n8) MFA Alignment" -echo $OUTPUT_DIR -mfa align -t mfa_tmp --clean -j 32 $OUTPUT_DIR/mfa_inputs models/mfa/russian_lexicon.txt models/mfa/russian.zip $OUTPUT_DIR/mfa_outputs +echo $EMO_OUTPUT_DIR +mfa align -t mfa_tmp --clean -j 32 $EMO_OUTPUT_DIR/mfa_inputs models/mfa/russian_lexicon.txt models/mfa/russian.zip $EMO_OUTPUT_DIR/mfa_outputs # for mix -mfa align -t mfa_tmp --clean -j 32 $OUTPUT_DIR/mfa_inputs $RUS_ESPEAK_LEXICON $RUS_ESPEAK_ACOUSTIC_MODEL $OUTPUT_DIR/mfa_outputs +mfa align -t mfa_tmp --clean -j 32 $EMO_OUTPUT_DIR/mfa_inputs $RUS_ESPEAK_LEXICON $RUS_ESPEAK_ACOUSTIC_MODEL $EMO_OUTPUT_DIR/mfa_outputs rm -rf mfa_tmp echo -e "\n9) MFA Postprocessing" # Aggregate mels by speakers # 16071it [00:00, 16767.84it/s] # 25429it [00:01, 17870.70it/s] mix -python src/preprocessing/mfa_postprocessing.py --input-dir $OUTPUT_DIR/mels +python src/preprocessing/mfa_postprocessing.py --input-dir $EMO_OUTPUT_DIR/mels # Only for MFA PREMADE case echo -e "\n10) MFA Premade Preprocessing" -python src/preprocessing/mfa_premade_preprocessing.py --input-dir $MFA_PREMADE --output-dir $OUTPUT_DIR/mfa_outputs \ No newline at end of file +python src/preprocessing/mfa_premade_preprocessing.py --input-dir $MFA_PREMADE --output-dir $EMO_OUTPUT_DIR/mfa_outputs \ No newline at end of file diff --git a/src/preprocessing/create_lexicon.py b/src/preprocessing/create_lexicon.py new file mode 100644 index 0000000..12fc223 --- /dev/null +++ b/src/preprocessing/create_lexicon.py @@ -0,0 +1,84 @@ +""" +Util to create phonematic lexicon for given corpus. +Espeak backend must be installed on the system. +""" + +from pathlib import Path + +import click +from phonemizer.phonemize import phonemize +from phonemizer.separator import Separator + +ENCODING = "utf8" +SEPARATOR = Separator(phone=" ", syllable="", word="\n") +CORPUS_STRING_WORD_SEPARATOR = " " + + +@click.command() +@click.option( + "-i", + "--input-path", + type=Path, + help="Path to corpus file (1 word per line).", + required=True, +) +@click.option( + "-o", + "--output-path", + type=Path, + default="russian-lexicon-espeak.txt", + help="Filepath to write lexicon.", + required=False, +) +@click.option( + "-l", + "--language", + type=str, + default="en-us", + help="Language in espeak format. See for more info: https://github.com/espeak-ng/espeak-ng/blob/master/docs/languages.md", + required=False, +) +def main(input_path: Path, output_path: Path, language: str) -> None: + + print("Reading corpus...", end=" ") + with open(input_path, "r", encoding=ENCODING) as corpus_file: + corpus_string = CORPUS_STRING_WORD_SEPARATOR.join( + corpus_file.read().splitlines() + ) + print("Done.") + print(corpus_string[:80], end="\n\n") + + print("Getting phonemizations...", end=" ") + phones_string = phonemize( + corpus_string, + language=language, + backend="espeak", + preserve_punctuation=True, + with_stress=True, + strip=True, + separator=SEPARATOR, + ) + print("Done.") + print(phones_string[:80], end="\n\n") + + print("Creating lexicon...", end=" ") + corpus = corpus_string.split(CORPUS_STRING_WORD_SEPARATOR) + phones = phones_string.split(SEPARATOR.word) + assert len(corpus) == len(phones), ( + f"# of words should match # of phones after phomenization\n" + f"but you have {len(corpus)} words and {len(phones)} phones\n" + f"First 5 words: {corpus[:5]}\n" + f"First 5 phones: {phones[:5]}\n" + ) + lexicon = [f"{word}\t{phon}" for word, phon in zip(corpus, phones)] + lexicon_str = "\n".join(lexicon) + print("Done.", end="\n\n") + + output_path.parent.mkdir(exist_ok=True, parents=True) + with open(output_path, "w", encoding=ENCODING) as lexicon_file: + lexicon_file.write(lexicon_str) + print(f"Lexicon file saved at:\n{output_path}", end="\n\n") + + +if __name__ == "__main__": + main() diff --git a/src/preprocessing/espeak_phon.py b/src/preprocessing/espeak_phon.py new file mode 100644 index 0000000..82a9d1a --- /dev/null +++ b/src/preprocessing/espeak_phon.py @@ -0,0 +1,83 @@ +from phonemizer.phonemize import phonemize +from phonemizer.separator import Separator +import re, regex + + +## from Tacotron (from SIWIS corpus) +punkt_class = "“”„«»!,.:;–?\"'…\[\](){}—\-" ## NOTE: without the whitespace +re_punkt_class = re.compile("([" + punkt_class + "])") + + +def espeak_phon( + text, + lang="ru", + accent=None, + clean=True, + add_punkt=True, + mark_pausation=True, + pausation_symbol="%", + _spec_seq="@@@", + verbose=False, +): + language = lang + if accent: + language += f"-{accent}" + if verbose: + print(f"Original input:\n{text}\n") + + separator = Separator(phone=" ", syllable="", word="\n") + + punkt = None + if add_punkt: + spec_phonseq = phonemize(_spec_seq, language=language, backend="espeak").strip() + assert len(spec_phonseq) > 0 + assert not re.match("\s", spec_phonseq) + punkt = re_punkt_class.finditer(text) + # punkt = re_punkt_class.findall(text) + # punkt = regex.findall('([' + punkt_class + '])', text) + punkt = [x.group(0) for x in punkt] + if verbose: + print(f"Punctuation recognized:\n{punkt}\n") + if len(punkt) > 0: + punkt = iter(punkt) + else: + punkt = None + text = re.sub(re_punkt_class, _spec_seq + r"\1", text) + if verbose: + print(f"Input with marked punctuation:\n{text}\n") + + phoneseq = phonemize(text, language=language, backend="espeak") + if mark_pausation: + phoneseq = re.sub("\n", pausation_symbol, phoneseq) + else: + phoneseq = re.sub("\n", " ", phoneseq) + if verbose: + print(f"Input with marked pausation:\n{phoneseq}\n") + + if clean: + phoneseq = regex.sub( + "\(.+?\)", "", phoneseq + ) ## use regex for non-greedy matching + ## zz = liaison after z + phoneseq = re.sub("z+", "z", phoneseq) + if verbose: + print(f'Input after "cleaning":\n{phoneseq}\n') + + out_phoneseq = "" + if add_punkt and (punkt is not None): + split_phoneseq = [x for x in re.split("(" + spec_phonseq + ")", phoneseq) if x] + for x in split_phoneseq: + if x == spec_phonseq: + out_phoneseq += next(punkt) + else: + out_phoneseq += x + else: + out_phoneseq = phoneseq + out_phoneseq = re.sub(r" %", r"%", out_phoneseq) + out_phoneseq = re.sub(r"([" + punkt_class + "]+)(%)", r"\2\1 ", out_phoneseq) + out_phoneseq = re.sub(r" %", r"%", out_phoneseq) + out_phoneseq = re.sub("\s+", " ", out_phoneseq) + if verbose: + print(f"Output:\n{out_phoneseq}") + + return out_phoneseq diff --git a/src/preprocessing/prep_files_russian.py b/src/preprocessing/prep_files_russian.py index d47900d..04cb3e9 100644 --- a/src/preprocessing/prep_files_russian.py +++ b/src/preprocessing/prep_files_russian.py @@ -1,5 +1,7 @@ #!/usr/bin/env python +import json import shutil +from collections import defaultdict from pathlib import Path from typing import List @@ -8,19 +10,22 @@ from tqdm import tqdm -def process_audio(audio_path: Path, audio_output_dir: Path) -> None: - speaker = audio_path.parent.name.replace("_", "-") +def process_audio(audio_path: Path, audio_output_dir: Path, emo_speaker: defaultdict) -> None: + old_dir = audio_path.parent.name.replace("_", "-") + speaker = "olga" emotion = audio_path.parent.parent.name new_dir = audio_output_dir / speaker new_dir.mkdir(parents=True, exist_ok=True) - new_filename = f"{speaker}_{emotion}_{audio_path.name}" + new_filename = f"{old_dir}-{emotion}_{audio_path.name}" new_audio_path = new_dir / new_filename + emo_speaker[emotion][speaker].add(new_audio_path.stem) shutil.copy(audio_path, new_audio_path) -def process_annotation(annot_path: Path, text_output_dir: Path) -> None: +def process_annotation(annot_path: Path, text_output_dir: Path, emo_speaker: defaultdict) -> None: text_ext = "txt" - speaker = annot_path.parent.name.replace("_", "-") + old_dir = annot_path.parent.name.replace("_", "-") + speaker = "olga" emotion = annot_path.parent.parent.name df: pd.DataFrame = pd.read_excel(annot_path) df = df.iloc[:, :3] @@ -32,11 +37,12 @@ def process_annotation(annot_path: Path, text_output_dir: Path) -> None: except KeyError: print(row) raise - new_filename = f"{speaker}_{emotion}_{filename}.{text_ext}" + new_filename = f"{old_dir}-{emotion}_{filename}.{text_ext}" new_dir = text_output_dir / speaker new_dir.mkdir(parents=True, exist_ok=True) new_filepath = new_dir / new_filename - with open(new_filepath, "w") as text_output_file: + emo_speaker[emotion][speaker].add(new_filepath.stem) + with open(new_filepath, "w", encoding="utf8") as text_output_file: text_output_file.write(content) @@ -56,6 +62,12 @@ def process_annotation(annot_path: Path, text_output_dir: Path) -> None: default="wavs", help="Directory for rearranged audio files.", ) +@click.option( + "--meta-output-dir", + type=Path, + default="meta", + help="Directory for newly created metadata files.", +) @click.option( "--log-path", type=Path, @@ -74,6 +86,7 @@ def main( dataset_dir: Path, text_output_dir: Path, audio_output_dir: Path, + meta_output_dir: Path, log_path: Path, audio_ext: str, annot_ext: List[str], @@ -81,23 +94,32 @@ def main( text_output_dir.mkdir(exist_ok=True, parents=True) audio_output_dir.mkdir(exist_ok=True, parents=True) + meta_output_dir.mkdir(exist_ok=True, parents=True) log_path.parent.mkdir(exist_ok=True, parents=True) log_path.unlink(missing_ok=True) - for path in tqdm(dataset_dir.rglob("*")): + emo_speaker_json = defaultdict(lambda: defaultdict(set)) + for path in tqdm(list(dataset_dir.rglob("*"))): # If audio, get speaker, get emotion and copy it with new name if path.suffix == f".{audio_ext}": - process_audio(path, audio_output_dir) + process_audio(path, audio_output_dir, emo_speaker_json) # If annotation, parse it and rearrange texts elif path.suffix[1:] in annot_ext: - process_annotation(path, text_output_dir) + process_annotation(path, text_output_dir, emo_speaker_json) # else do nothing, log skipped path else: with open(log_path, "a") as logfile: logfile.write(f"{path}\n") continue + emo_speaker_json = dict(emo_speaker_json) + for emotion in emo_speaker_json.keys(): + for speaker in emo_speaker_json[emotion].keys(): + emo_speaker_json[emotion][speaker] = list(emo_speaker_json[emotion][speaker]) + with open(meta_output_dir / "emo_speaker_file.json", "w", encoding="utf8") as f: + json.dump(emo_speaker_json, f) + if __name__ == "__main__": main() diff --git a/src/preprocessing/prep_files_russian_neutral.py b/src/preprocessing/prep_files_russian_neutral.py new file mode 100644 index 0000000..5a8a160 --- /dev/null +++ b/src/preprocessing/prep_files_russian_neutral.py @@ -0,0 +1,116 @@ +#!/usr/bin/env python +import json +import shutil +from collections import defaultdict +from pathlib import Path + +import click +import pandas as pd +from tqdm import tqdm + + +def process_audio(audio_path: Path, audio_output_dir: Path, emo_speaker: defaultdict) -> None: + old_dir = audio_path.parent.name.replace("_", "-") + speaker = "olga" + emotion = "neutral" + new_dir = audio_output_dir / speaker + new_dir.mkdir(parents=True, exist_ok=True) + new_filename = f"{old_dir}-{emotion}_{audio_path.name}" + new_audio_path = new_dir / new_filename + emo_speaker[emotion][speaker].add(new_audio_path.stem) + shutil.copy(audio_path, new_audio_path) + + +def process_metadata(metadata_path: Path, text_output_dir: Path, emo_speaker: defaultdict) -> None: + text_ext = "txt" + speaker = "olga" + emotion = "neutral" + df: pd.DataFrame = pd.read_csv(metadata_path, delimiter="|", header=None, names=["path", "original", "stressed"]) + for (_, path, original, stressed) in df.itertuples(): + old_dir, filename = path.split("/") + old_dir = old_dir.replace("_", "-") + new_filename = f"{old_dir}-{emotion}_{filename}.{text_ext}" + new_dir = text_output_dir / speaker + new_dir.mkdir(parents=True, exist_ok=True) + new_filepath = new_dir / new_filename + emo_speaker[emotion][speaker].add(new_filepath.stem) + with open(new_filepath, "w", encoding="utf8") as text_output_file: + text_output_file.write(original) + + +@click.command() +@click.option( + "--dataset-dir", type=Path, help="Directory with original russian dataset" +) +@click.option( + "--text-output-dir", + type=Path, + default="texts", + help="Directory for text files extracted from annotations.", +) +@click.option( + "--audio-output-dir", + type=Path, + default="wavs", + help="Directory for rearranged audio files.", +) +@click.option( + "--meta-output-dir", + type=Path, + default="meta", + help="Directory for newly created metadata files.", +) +@click.option( + "--log-path", + type=Path, + default="logs/preprocessing/russian-skipped-paths.txt", + help="Path for logging list of skipped items.", +) +@click.option( + "--metadata-filename", + type=str, + default="metadata.csv", + help="Name of metadata file to search in dataset.", +) +@click.option("--audio-ext", type=str, default="wav", help="Extension of audio files.") +def main( + dataset_dir: Path, + text_output_dir: Path, + audio_output_dir: Path, + meta_output_dir: Path, + log_path: Path, + audio_ext: str, + metadata_filename: str, +) -> None: + + text_output_dir.mkdir(exist_ok=True, parents=True) + audio_output_dir.mkdir(exist_ok=True, parents=True) + meta_output_dir.mkdir(exist_ok=True, parents=True) + log_path.parent.mkdir(exist_ok=True, parents=True) + log_path.unlink(missing_ok=True) + + emo_speaker_json = defaultdict(lambda: defaultdict(set)) + + for path in tqdm(list(dataset_dir.rglob("*"))): + # If audio, get speaker, get emotion and copy it with new name + if path.suffix == f".{audio_ext}": + process_audio(path, audio_output_dir, emo_speaker_json) + # If metadata, parse it and rearrange texts + elif path.name == metadata_filename: + process_metadata(path, text_output_dir, emo_speaker_json) + # else do nothing, log skipped path + else: + with open(log_path, "a") as logfile: + logfile.write(f"{path}\n") + continue + + emo_speaker_json = dict(emo_speaker_json) + for emotion in emo_speaker_json.keys(): + for speaker in emo_speaker_json[emotion].keys(): + emo_speaker_json[emotion][speaker] = list(emo_speaker_json[emotion][speaker]) + with open(meta_output_dir / "neutral_speaker_file.json", "w", encoding="utf8") as f: + json.dump(emo_speaker_json, f) + + +if __name__ == "__main__": + main() diff --git a/src/preprocessing/text_normalization_russian.py b/src/preprocessing/text_normalization_russian.py index 946aa5f..591938b 100644 --- a/src/preprocessing/text_normalization_russian.py +++ b/src/preprocessing/text_normalization_russian.py @@ -27,12 +27,13 @@ def main(input_dir: Path, output_dir: Path) -> None: new_dir.mkdir(exist_ok=True) new_file = new_dir / filepath.name - with open(filepath, "r") as fin, open(new_file, "w") as fout: - content = fin.read() - normalized_content = normalizer.norm_text(content) - normalized_content = lowercase(normalized_content) - normalized_content = collapse_whitespace(normalized_content) - fout.write(normalized_content) + with open(filepath, "r", encoding="utf8") as fin: + with open(new_file, "w", encoding="utf8") as fout: + content = fin.read() + normalized_content = normalizer.norm_text(content) + normalized_content = lowercase(normalized_content) + normalized_content = collapse_whitespace(normalized_content) + fout.write(normalized_content) print("Finished successfully.") print(f"Processed files are located at {output_dir}") diff --git a/src/preprocessing/wav_to_mel.py b/src/preprocessing/wav_to_mel.py index 604039c..20ffe2b 100644 --- a/src/preprocessing/wav_to_mel.py +++ b/src/preprocessing/wav_to_mel.py @@ -66,7 +66,9 @@ def main(input_dir: Path, output_dir: Path, audio_ext: str) -> None: print("Transforming audio to mel...") for filepath in tqdm(filepath_list): - new_path = output_dir / filepath.stem + speaker = filepath.parent.stem + new_path = output_dir / speaker / filepath.stem + new_path.parent.mkdir(exist_ok=True, parents=True) wave_tensor, _ = torchaudio.load(filepath) assert wave_tensor.shape[0] == 1, "Audio has more than 1 channel"