From 0089e59187e71ccee22a24e908a95b50408c4ca0 Mon Sep 17 00:00:00 2001
From: ruk0sh <43880105+ruk0sh@users.noreply.github.com>
Date: Fri, 15 Apr 2022 05:28:38 -0700
Subject: [PATCH 01/17] Adapt raw files preprocessing for new loaders, add
emo_speaker_file preparation, add deps for Excel parsing to conda env
---
environment.yml | 2 ++
russian_preprocessing/steps.sh | 7 ++---
src/preprocessing/prep_files_russian.py | 42 +++++++++++++++++++------
3 files changed, 36 insertions(+), 15 deletions(-)
diff --git a/environment.yml b/environment.yml
index 3446865..0379f6c 100644
--- a/environment.yml
+++ b/environment.yml
@@ -18,6 +18,7 @@ dependencies:
- matplotlib
- montreal-forced-aligner=2.0.0b4
- numpy
+ - openpyxl
- pip
- python=3.8
- pytorch=1.10.0
@@ -29,6 +30,7 @@ dependencies:
- unidecode
- unzip
- uvicorn
+ - xlrd
- pip:
- tgt
\ No newline at end of file
diff --git a/russian_preprocessing/steps.sh b/russian_preprocessing/steps.sh
index 4ee2f2e..08b684f 100644
--- a/russian_preprocessing/steps.sh
+++ b/russian_preprocessing/steps.sh
@@ -3,15 +3,12 @@ conda env create -n emotts -f russian_preprocessing/environment.yaml
conda activate emotts
conda config --set ssl_verify no
export RUSSIAN_DATASET_PATH=/media/diskB/ruslan_a/data/datasets/EMO/russian
-export OUTPUT_DIR=$RUSSIAN_DATASET_PATH/processed
-export OUTPUT_DIR=$RUSSIAN_DATASET_PATH/processed_mix
+export OUTPUT_DIR=$RUSSIAN_DATASET_PATH/processed_v2
export MFA_PREMADE=/media/diskB/ruslan_a/data/datasets/emo_rus_Olga_v2_processed/mfa_espeak_grids
# 16164it [03:36, 74.61it/s]
-# 25544it [02:45, 154.48it/s] mix
echo -e "\n1) Prep raw files"
-# python src/preprocessing/prep_files_russian.py --dataset-dir $RUSSIAN_DATASET_PATH/original --text-output-dir $OUTPUT_DIR/text/raw --audio-output-dir $OUTPUT_DIR/audio/raw
-python src/preprocessing/prep_files_russian.py --dataset-dir $RUSSIAN_DATASET_PATH/original_and_neutral --text-output-dir $OUTPUT_DIR/text/raw --audio-output-dir $OUTPUT_DIR/audio/raw
+python src/preprocessing/prep_files_russian.py --dataset-dir $RUSSIAN_DATASET_PATH/original --text-output-dir $OUTPUT_DIR/text/raw --audio-output-dir $OUTPUT_DIR/audio/raw --meta-output-dir $OUTPUT_DIR/meta
# ~1.5-2.0 hours
echo -e "\n2) Pausation cutting with VAD"
diff --git a/src/preprocessing/prep_files_russian.py b/src/preprocessing/prep_files_russian.py
index d47900d..04cb3e9 100644
--- a/src/preprocessing/prep_files_russian.py
+++ b/src/preprocessing/prep_files_russian.py
@@ -1,5 +1,7 @@
#!/usr/bin/env python
+import json
import shutil
+from collections import defaultdict
from pathlib import Path
from typing import List
@@ -8,19 +10,22 @@
from tqdm import tqdm
-def process_audio(audio_path: Path, audio_output_dir: Path) -> None:
- speaker = audio_path.parent.name.replace("_", "-")
+def process_audio(audio_path: Path, audio_output_dir: Path, emo_speaker: defaultdict) -> None:
+ old_dir = audio_path.parent.name.replace("_", "-")
+ speaker = "olga"
emotion = audio_path.parent.parent.name
new_dir = audio_output_dir / speaker
new_dir.mkdir(parents=True, exist_ok=True)
- new_filename = f"{speaker}_{emotion}_{audio_path.name}"
+ new_filename = f"{old_dir}-{emotion}_{audio_path.name}"
new_audio_path = new_dir / new_filename
+ emo_speaker[emotion][speaker].add(new_audio_path.stem)
shutil.copy(audio_path, new_audio_path)
-def process_annotation(annot_path: Path, text_output_dir: Path) -> None:
+def process_annotation(annot_path: Path, text_output_dir: Path, emo_speaker: defaultdict) -> None:
text_ext = "txt"
- speaker = annot_path.parent.name.replace("_", "-")
+ old_dir = annot_path.parent.name.replace("_", "-")
+ speaker = "olga"
emotion = annot_path.parent.parent.name
df: pd.DataFrame = pd.read_excel(annot_path)
df = df.iloc[:, :3]
@@ -32,11 +37,12 @@ def process_annotation(annot_path: Path, text_output_dir: Path) -> None:
except KeyError:
print(row)
raise
- new_filename = f"{speaker}_{emotion}_{filename}.{text_ext}"
+ new_filename = f"{old_dir}-{emotion}_{filename}.{text_ext}"
new_dir = text_output_dir / speaker
new_dir.mkdir(parents=True, exist_ok=True)
new_filepath = new_dir / new_filename
- with open(new_filepath, "w") as text_output_file:
+ emo_speaker[emotion][speaker].add(new_filepath.stem)
+ with open(new_filepath, "w", encoding="utf8") as text_output_file:
text_output_file.write(content)
@@ -56,6 +62,12 @@ def process_annotation(annot_path: Path, text_output_dir: Path) -> None:
default="wavs",
help="Directory for rearranged audio files.",
)
+@click.option(
+ "--meta-output-dir",
+ type=Path,
+ default="meta",
+ help="Directory for newly created metadata files.",
+)
@click.option(
"--log-path",
type=Path,
@@ -74,6 +86,7 @@ def main(
dataset_dir: Path,
text_output_dir: Path,
audio_output_dir: Path,
+ meta_output_dir: Path,
log_path: Path,
audio_ext: str,
annot_ext: List[str],
@@ -81,23 +94,32 @@ def main(
text_output_dir.mkdir(exist_ok=True, parents=True)
audio_output_dir.mkdir(exist_ok=True, parents=True)
+ meta_output_dir.mkdir(exist_ok=True, parents=True)
log_path.parent.mkdir(exist_ok=True, parents=True)
log_path.unlink(missing_ok=True)
- for path in tqdm(dataset_dir.rglob("*")):
+ emo_speaker_json = defaultdict(lambda: defaultdict(set))
+ for path in tqdm(list(dataset_dir.rglob("*"))):
# If audio, get speaker, get emotion and copy it with new name
if path.suffix == f".{audio_ext}":
- process_audio(path, audio_output_dir)
+ process_audio(path, audio_output_dir, emo_speaker_json)
# If annotation, parse it and rearrange texts
elif path.suffix[1:] in annot_ext:
- process_annotation(path, text_output_dir)
+ process_annotation(path, text_output_dir, emo_speaker_json)
# else do nothing, log skipped path
else:
with open(log_path, "a") as logfile:
logfile.write(f"{path}\n")
continue
+ emo_speaker_json = dict(emo_speaker_json)
+ for emotion in emo_speaker_json.keys():
+ for speaker in emo_speaker_json[emotion].keys():
+ emo_speaker_json[emotion][speaker] = list(emo_speaker_json[emotion][speaker])
+ with open(meta_output_dir / "emo_speaker_file.json", "w", encoding="utf8") as f:
+ json.dump(emo_speaker_json, f)
+
if __name__ == "__main__":
main()
From 6c84a209ca8c361b409ee472c5e4f54e3f7b45ac Mon Sep 17 00:00:00 2001
From: ruk0sh <43880105+ruk0sh@users.noreply.github.com>
Date: Fri, 15 Apr 2022 06:09:40 -0700
Subject: [PATCH 02/17] Create per-speaker output directories in wav_to_mel
---
russian_preprocessing/steps.sh | 8 +++-----
src/preprocessing/wav_to_mel.py | 4 +++-
2 files changed, 6 insertions(+), 6 deletions(-)
diff --git a/russian_preprocessing/steps.sh b/russian_preprocessing/steps.sh
index 08b684f..f6a3d4d 100644
--- a/russian_preprocessing/steps.sh
+++ b/russian_preprocessing/steps.sh
@@ -10,12 +10,11 @@ export MFA_PREMADE=/media/diskB/ruslan_a/data/datasets/emo_rus_Olga_v2_processed
echo -e "\n1) Prep raw files"
python src/preprocessing/prep_files_russian.py --dataset-dir $RUSSIAN_DATASET_PATH/original --text-output-dir $OUTPUT_DIR/text/raw --audio-output-dir $OUTPUT_DIR/audio/raw --meta-output-dir $OUTPUT_DIR/meta
-# ~1.5-2.0 hours
-echo -e "\n2) Pausation cutting with VAD"
-python src/preprocessing/pausation_cutting.py --input-dir $OUTPUT_DIR/audio/raw --output-dir $OUTPUT_DIR/audio/no_pause --target-sr 96000 --audio-ext wav
+# ~1.5-2.0 hours (Deprecated)
+# echo -e "\n2) Pausation cutting with VAD"
+# python src/preprocessing/pausation_cutting.py --input-dir $OUTPUT_DIR/audio/raw --output-dir $OUTPUT_DIR/audio/no_pause --target-sr 96000 --audio-ext wav
# 16071/16071 [02:50<00:00, 94.26it/s]
-# 25429/25429 [04:18<00:00, 98.26it/s] mix
echo -e "\n3) Resampling and Converting audio to 1-channel"
# python src/preprocessing/resampling.py --input-dir $OUTPUT_DIR/audio/no_pause --output-dir $OUTPUT_DIR/audio/resampled --resample-rate 22050 --audio-ext wav
python src/preprocessing/resampling.py --input-dir $OUTPUT_DIR/audio/raw --output-dir $OUTPUT_DIR/audio/resampled --resample-rate 22050 --audio-ext wav
@@ -25,7 +24,6 @@ conda deactivate
conda activate emotts
# 16071/16071 [13:09<00:00, 20.37it/s]
-# 25429/25429 [13:11<00:00, 32.15it/s] mix
echo -e "\n4) Audio to Mel"
python src/preprocessing/wav_to_mel.py --input-dir $OUTPUT_DIR/audio/resampled --output-dir $OUTPUT_DIR/mels --audio-ext wav
diff --git a/src/preprocessing/wav_to_mel.py b/src/preprocessing/wav_to_mel.py
index 604039c..20ffe2b 100644
--- a/src/preprocessing/wav_to_mel.py
+++ b/src/preprocessing/wav_to_mel.py
@@ -66,7 +66,9 @@ def main(input_dir: Path, output_dir: Path, audio_ext: str) -> None:
print("Transforming audio to mel...")
for filepath in tqdm(filepath_list):
- new_path = output_dir / filepath.stem
+ speaker = filepath.parent.stem
+ new_path = output_dir / speaker / filepath.stem
+ new_path.parent.mkdir(exist_ok=True, parents=True)
wave_tensor, _ = torchaudio.load(filepath)
assert wave_tensor.shape[0] == 1, "Audio has more than 1 channel"
From aec36e051284986df08c5bf660c54f91511bd5b1 Mon Sep 17 00:00:00 2001
From: ruk0sh <43880105+ruk0sh@users.noreply.github.com>
Date: Fri, 15 Apr 2022 07:15:57 -0700
Subject: [PATCH 03/17] Fix encoding: read and write normalized texts as UTF-8
---
src/preprocessing/text_normalization_russian.py | 13 +++++++------
1 file changed, 7 insertions(+), 6 deletions(-)
diff --git a/src/preprocessing/text_normalization_russian.py b/src/preprocessing/text_normalization_russian.py
index 946aa5f..591938b 100644
--- a/src/preprocessing/text_normalization_russian.py
+++ b/src/preprocessing/text_normalization_russian.py
@@ -27,12 +27,13 @@ def main(input_dir: Path, output_dir: Path) -> None:
new_dir.mkdir(exist_ok=True)
new_file = new_dir / filepath.name
- with open(filepath, "r") as fin, open(new_file, "w") as fout:
- content = fin.read()
- normalized_content = normalizer.norm_text(content)
- normalized_content = lowercase(normalized_content)
- normalized_content = collapse_whitespace(normalized_content)
- fout.write(normalized_content)
+ with open(filepath, "r", encoding="utf8") as fin:
+ with open(new_file, "w", encoding="utf8") as fout:
+ content = fin.read()
+ normalized_content = normalizer.norm_text(content)
+ normalized_content = lowercase(normalized_content)
+ normalized_content = collapse_whitespace(normalized_content)
+ fout.write(normalized_content)
print("Finished successfully.")
print(f"Processed files are located at {output_dir}")
From bfce4462e670b5d869ed478720d6fa48f76f44da Mon Sep 17 00:00:00 2001
From: ruk0sh <43880105+ruk0sh@users.noreply.github.com>
Date: Mon, 18 Apr 2022 04:22:03 -0700
Subject: [PATCH 04/17] Add neutral raw russian data preprocessing
---
russian_preprocessing/steps.sh | 38 +++---
.../prep_files_russian_neutral.py | 115 ++++++++++++++++++
2 files changed, 137 insertions(+), 16 deletions(-)
create mode 100644 src/preprocessing/prep_files_russian_neutral.py
diff --git a/russian_preprocessing/steps.sh b/russian_preprocessing/steps.sh
index f6a3d4d..f10bf8c 100644
--- a/russian_preprocessing/steps.sh
+++ b/russian_preprocessing/steps.sh
@@ -2,22 +2,26 @@ echo -e "\n0) Setup env"
conda env create -n emotts -f russian_preprocessing/environment.yaml
conda activate emotts
conda config --set ssl_verify no
-export RUSSIAN_DATASET_PATH=/media/diskB/ruslan_a/data/datasets/EMO/russian
-export OUTPUT_DIR=$RUSSIAN_DATASET_PATH/processed_v2
+export EMO_DATASET_DIR=/media/diskB/ruslan_a/data/datasets/EMO/russian
+export NEUTRAL_DATASET_DIR=/media/diskB/ruslan_a/data/datasets/NEUTRAL/russian
+export EMO_OUTPUT_DIR=$EMO_DATASET_DIR/processed_v2
+export NEUTRAL_OUTPUT_DIR=$NEUTRAL_DATASET_DIR/processed_v2
export MFA_PREMADE=/media/diskB/ruslan_a/data/datasets/emo_rus_Olga_v2_processed/mfa_espeak_grids
# 16164it [03:36, 74.61it/s]
echo -e "\n1) Prep raw files"
-python src/preprocessing/prep_files_russian.py --dataset-dir $RUSSIAN_DATASET_PATH/original --text-output-dir $OUTPUT_DIR/text/raw --audio-output-dir $OUTPUT_DIR/audio/raw --meta-output-dir $OUTPUT_DIR/meta
+python src/preprocessing/prep_files_russian.py --dataset-dir $EMO_DATASET_DIR/original --text-output-dir $EMO_OUTPUT_DIR/text/raw --audio-output-dir $EMO_OUTPUT_DIR/audio/raw --meta-output-dir $EMO_OUTPUT_DIR/meta
+python src/preprocessing/prep_files_russian_neutral.py --dataset-dir $NEUTRAL_DATASET_DIR/original --text-output-dir $NEUTRAL_OUTPUT_DIR/text/raw --audio-output-dir $NEUTRAL_OUTPUT_DIR/audio/raw --meta-output-dir $NEUTRAL_OUTPUT_DIR/meta
# ~1.5-2.0 hours (Deprecated)
# echo -e "\n2) Pausation cutting with VAD"
-# python src/preprocessing/pausation_cutting.py --input-dir $OUTPUT_DIR/audio/raw --output-dir $OUTPUT_DIR/audio/no_pause --target-sr 96000 --audio-ext wav
+# python src/preprocessing/pausation_cutting.py --input-dir $EMO_OUTPUT_DIR/audio/raw --output-dir $EMO_OUTPUT_DIR/audio/no_pause --target-sr 96000 --audio-ext wav
# 16071/16071 [02:50<00:00, 94.26it/s]
echo -e "\n3) Resampling and Converting audio to 1-channel"
-# python src/preprocessing/resampling.py --input-dir $OUTPUT_DIR/audio/no_pause --output-dir $OUTPUT_DIR/audio/resampled --resample-rate 22050 --audio-ext wav
-python src/preprocessing/resampling.py --input-dir $OUTPUT_DIR/audio/raw --output-dir $OUTPUT_DIR/audio/resampled --resample-rate 22050 --audio-ext wav
+# python src/preprocessing/resampling.py --input-dir $EMO_OUTPUT_DIR/audio/no_pause --output-dir $EMO_OUTPUT_DIR/audio/resampled --resample-rate 22050 --audio-ext wav
+python src/preprocessing/resampling.py --input-dir $EMO_OUTPUT_DIR/audio/raw --output-dir $EMO_OUTPUT_DIR/audio/resampled --resample-rate 22050 --audio-ext wav
+python src/preprocessing/resampling.py --input-dir $NEUTRAL_OUTPUT_DIR/audio/raw --output-dir $NEUTRAL_OUTPUT_DIR/audio/resampled --resample-rate 22050 --audio-ext wav
conda env config vars set LD_LIBRARY_PATH=$CONDA_PREFIX/lib # link to libopenblas
conda deactivate
@@ -25,14 +29,16 @@ conda activate emotts
# 16071/16071 [13:09<00:00, 20.37it/s]
echo -e "\n4) Audio to Mel"
-python src/preprocessing/wav_to_mel.py --input-dir $OUTPUT_DIR/audio/resampled --output-dir $OUTPUT_DIR/mels --audio-ext wav
+python src/preprocessing/wav_to_mel.py --input-dir $EMO_OUTPUT_DIR/audio/resampled --output-dir $EMO_OUTPUT_DIR/mels --audio-ext wav
+python src/preprocessing/wav_to_mel.py --input-dir $NEUTRAL_OUTPUT_DIR/audio/resampled --output-dir $NEUTRAL_OUTPUT_DIR/mels --audio-ext wav
# 16069/16069 [31:38<00:00, 8.46it/s]
# 16962/16962 [12:22<00:00, 22.85it/s] mix
# Model is needed: https://github.com/snakers4/russian_stt_text_normalization/blob/master/jit_s2s.pt
# Put model to src/preprocessing/text/russian/
echo -e "\n5) Text normalization"
-python src/preprocessing/text_normalization_russian.py --input-dir $OUTPUT_DIR/text/raw --output-dir $OUTPUT_DIR/mfa_inputs
+python src/preprocessing/text_normalization_russian.py --input-dir $EMO_OUTPUT_DIR/text/raw --output-dir $EMO_OUTPUT_DIR/mfa_inputs
+python src/preprocessing/text_normalization_russian.py --input-dir $NEUTRAL_OUTPUT_DIR/text/raw --output-dir $NEUTRAL_OUTPUT_DIR/mfa_inputs
echo -e "\n6) MFA Alignment setup"
@@ -47,33 +53,33 @@ export RUS_ESPEAK_LEXICON=/media/diskB/ruslan_a/models/mfa/rus-espeak-mfa/rus-mf
# 16069/16069 [00:00<00:00, 21508.15it/s]
echo -e "\n6.1) Creating word list from dataset"
-python src/preprocessing/create_corpus.py --input-dir $OUTPUT_DIR/text/raw --output-path $OUTPUT_DIR/meta/words.txt
+python src/preprocessing/create_corpus.py --input-dir $EMO_OUTPUT_DIR/text/raw --output-path $EMO_OUTPUT_DIR/meta/words.txt
# 25849/25983 [01:19<00:00, 326.82it/s]
echo -e "\n6.2) Creating G2P lexicon from word list"
-mfa g2p -t mfa_tmp -j 32 --clean --overwrite models/g2p/russian_g2p.zip $OUTPUT_DIR/meta/words.txt models/mfa/russian_lexicon.txt
+mfa g2p -t mfa_tmp -j 32 --clean --overwrite models/g2p/russian_g2p.zip $EMO_OUTPUT_DIR/meta/words.txt models/mfa/russian_lexicon.txt
rm -rf mfa_tmp
# 42it [00:10, 4.01it/s]
# 58it [00:12, 4.54it/s] mix
echo -e "\n7) MFA Preprocessing"
-python src/preprocessing/mfa_preprocessing.py --input-dir $OUTPUT_DIR/audio/resampled --output-dir $OUTPUT_DIR/mfa_inputs
+python src/preprocessing/mfa_preprocessing.py --input-dir $EMO_OUTPUT_DIR/audio/resampled --output-dir $EMO_OUTPUT_DIR/mfa_inputs
# FINALLY, align phonemes and speech
# ~50 min
echo -e "\n8) MFA Alignment"
-echo $OUTPUT_DIR
-mfa align -t mfa_tmp --clean -j 32 $OUTPUT_DIR/mfa_inputs models/mfa/russian_lexicon.txt models/mfa/russian.zip $OUTPUT_DIR/mfa_outputs
+echo $EMO_OUTPUT_DIR
+mfa align -t mfa_tmp --clean -j 32 $EMO_OUTPUT_DIR/mfa_inputs models/mfa/russian_lexicon.txt models/mfa/russian.zip $EMO_OUTPUT_DIR/mfa_outputs
# for mix
-mfa align -t mfa_tmp --clean -j 32 $OUTPUT_DIR/mfa_inputs $RUS_ESPEAK_LEXICON $RUS_ESPEAK_ACOUSTIC_MODEL $OUTPUT_DIR/mfa_outputs
+mfa align -t mfa_tmp --clean -j 32 $EMO_OUTPUT_DIR/mfa_inputs $RUS_ESPEAK_LEXICON $RUS_ESPEAK_ACOUSTIC_MODEL $EMO_OUTPUT_DIR/mfa_outputs
rm -rf mfa_tmp
echo -e "\n9) MFA Postprocessing"
# Aggregate mels by speakers
# 16071it [00:00, 16767.84it/s]
# 25429it [00:01, 17870.70it/s] mix
-python src/preprocessing/mfa_postprocessing.py --input-dir $OUTPUT_DIR/mels
+python src/preprocessing/mfa_postprocessing.py --input-dir $EMO_OUTPUT_DIR/mels
# Only for MFA PREMADE case
echo -e "\n10) MFA Premade Preprocessing"
-python src/preprocessing/mfa_premade_preprocessing.py --input-dir $MFA_PREMADE --output-dir $OUTPUT_DIR/mfa_outputs
\ No newline at end of file
+python src/preprocessing/mfa_premade_preprocessing.py --input-dir $MFA_PREMADE --output-dir $EMO_OUTPUT_DIR/mfa_outputs
\ No newline at end of file
diff --git a/src/preprocessing/prep_files_russian_neutral.py b/src/preprocessing/prep_files_russian_neutral.py
new file mode 100644
index 0000000..0dab729
--- /dev/null
+++ b/src/preprocessing/prep_files_russian_neutral.py
@@ -0,0 +1,115 @@
+#!/usr/bin/env python
+import json
+import shutil
+from collections import defaultdict
+from pathlib import Path
+
+import click
+import pandas as pd
+from tqdm import tqdm
+
+
+def process_audio(audio_path: Path, audio_output_dir: Path, emo_speaker: defaultdict) -> None:
+ old_dir = audio_path.parent.name.replace("_", "-")
+ speaker = "olga"
+ emotion = "neutral"
+ new_dir = audio_output_dir / speaker
+ new_dir.mkdir(parents=True, exist_ok=True)
+ new_filename = f"{old_dir}-{emotion}_{audio_path.name}"
+ new_audio_path = new_dir / new_filename
+ emo_speaker[emotion][speaker].add(new_audio_path.stem)
+ shutil.copy(audio_path, new_audio_path)
+
+
+def process_metadata(metadata_path: Path, text_output_dir: Path, emo_speaker: defaultdict) -> None:
+ text_ext = "txt"
+ speaker = "olga"
+ emotion = "neutral"
+ df: pd.DataFrame = pd.read_csv(metadata_path, delimiter="|", header=None, names=["path", "original", "stressed"])
+ for (_, path, original, stressed) in df.itertuples():
+ old_dir, filename = path.split("/")
+ new_filename = f"{old_dir}-{emotion}_{filename}.{text_ext}"
+ new_dir = text_output_dir / speaker
+ new_dir.mkdir(parents=True, exist_ok=True)
+ new_filepath = new_dir / new_filename
+ emo_speaker[emotion][speaker].add(new_filepath.stem)
+ with open(new_filepath, "w", encoding="utf8") as text_output_file:
+ text_output_file.write(original)
+
+
+@click.command()
+@click.option(
+ "--dataset-dir", type=Path, help="Directory with original russian dataset"
+)
+@click.option(
+ "--text-output-dir",
+ type=Path,
+ default="texts",
+ help="Directory for text files extracted from annotations.",
+)
+@click.option(
+ "--audio-output-dir",
+ type=Path,
+ default="wavs",
+ help="Directory for rearranged audio files.",
+)
+@click.option(
+ "--meta-output-dir",
+ type=Path,
+ default="meta",
+ help="Directory for newly created metadata files.",
+)
+@click.option(
+ "--log-path",
+ type=Path,
+ default="logs/preprocessing/russian-skipped-paths.txt",
+ help="Path for logging list of skipped items.",
+)
+@click.option(
+ "--metadata-filename",
+ type=str,
+ default="metadata.csv",
+ help="Name of metadata file to search in dataset.",
+)
+@click.option("--audio-ext", type=str, default="wav", help="Extension of audio files.")
+def main(
+ dataset_dir: Path,
+ text_output_dir: Path,
+ audio_output_dir: Path,
+ meta_output_dir: Path,
+ log_path: Path,
+ audio_ext: str,
+ metadata_filename: str,
+) -> None:
+
+ text_output_dir.mkdir(exist_ok=True, parents=True)
+ audio_output_dir.mkdir(exist_ok=True, parents=True)
+ meta_output_dir.mkdir(exist_ok=True, parents=True)
+ log_path.parent.mkdir(exist_ok=True, parents=True)
+ log_path.unlink(missing_ok=True)
+
+ emo_speaker_json = defaultdict(lambda: defaultdict(set))
+
+ for path in tqdm(list(dataset_dir.rglob("*"))):
+ # If audio, get speaker, get emotion and copy it with new name
+ if path.suffix == f".{audio_ext}":
+ process_audio(path, audio_output_dir, emo_speaker_json)
+ # If metadata, parse it and rearrange texts
+ elif path.name == metadata_filename:
+ process_metadata(path, text_output_dir, emo_speaker_json)
+ # else do nothing, log skipped path
+ else:
+ with open(log_path, "a") as logfile:
+ logfile.write(f"{path}\n")
+ continue
+
+ emo_speaker_json = dict(emo_speaker_json)
+ for emotion in emo_speaker_json.keys():
+ for speaker in emo_speaker_json[emotion].keys():
+ emo_speaker_json[emotion][speaker] = list(emo_speaker_json[emotion][speaker])
+ with open(meta_output_dir / "neutral_speaker_file.json", "w", encoding="utf8") as f:
+ json.dump(emo_speaker_json, f)
+
+
+if __name__ == "__main__":
+ main()
From 01a9c49fcc04077f84a4e823c9053db553b1c773 Mon Sep 17 00:00:00 2001
From: ruk0sh <43880105+ruk0sh@users.noreply.github.com>
Date: Mon, 18 Apr 2022 05:42:26 -0700
Subject: [PATCH 05/17] Fix text file renaming pattern (hyphenate dir prefix)
---
src/preprocessing/prep_files_russian_neutral.py | 1 +
1 file changed, 1 insertion(+)
diff --git a/src/preprocessing/prep_files_russian_neutral.py b/src/preprocessing/prep_files_russian_neutral.py
index 0dab729..5a8a160 100644
--- a/src/preprocessing/prep_files_russian_neutral.py
+++ b/src/preprocessing/prep_files_russian_neutral.py
@@ -28,6 +28,7 @@ def process_metadata(metadata_path: Path, text_output_dir: Path, emo_speaker: de
df: pd.DataFrame = pd.read_csv(metadata_path, delimiter="|", header=None, names=["path", "original", "stressed"])
for (_, path, original, stressed) in df.itertuples():
old_dir, filename = path.split("/")
+ old_dir = old_dir.replace("_", "-")
new_filename = f"{old_dir}-{emotion}_{filename}.{text_ext}"
new_dir = text_output_dir / speaker
new_dir.mkdir(parents=True, exist_ok=True)
From 2c2369b23d5cd90e754189190a27345c133aae02 Mon Sep 17 00:00:00 2001
From: ruk0sh <43880105+ruk0sh@users.noreply.github.com>
Date: Tue, 19 Apr 2022 13:26:55 +0300
Subject: [PATCH 06/17] Implement espeak-based phonemizer prototype
---
environment.yml | 1 +
src/preprocessing/phonemizer.py | 80 +++++++++++++++++++++++++++++++++
2 files changed, 81 insertions(+)
create mode 100644 src/preprocessing/phonemizer.py
diff --git a/environment.yml b/environment.yml
index 0379f6c..aca4305 100644
--- a/environment.yml
+++ b/environment.yml
@@ -32,5 +32,6 @@ dependencies:
- uvicorn
- xlrd
- pip:
+ - phonemizer
- tgt
\ No newline at end of file
diff --git a/src/preprocessing/phonemizer.py b/src/preprocessing/phonemizer.py
new file mode 100644
index 0000000..445b9e5
--- /dev/null
+++ b/src/preprocessing/phonemizer.py
@@ -0,0 +1,80 @@
+from phonemizer.phonemize import phonemize
+import re, regex
+
+
+## from Tacotron (from SIWIS corpus)
+punkt_class = "“”„«»!,.:;–?\"'…\[\](){}—\-" ## NOTE: without the whitespace
+re_punkt_class = re.compile("([" + punkt_class + "])")
+
+
+def espeak_phon(
+ text,
+ lang="ru",
+ accent=None,
+ clean=True,
+ add_punkt=True,
+ mark_pausation=True,
+ pausation_symbol="%",
+ _spec_seq="@@@",
+ verbose=False,
+):
+ language = lang
+ if accent:
+ language += f"-{accent}"
+ if verbose:
+ print(f"Original input:\n{text}\n")
+
+ punkt = None
+ if add_punkt:
+ spec_phonseq = phonemize(_spec_seq, language=language, backend="espeak").strip()
+ assert len(spec_phonseq) > 0
+ assert not re.match("\s", spec_phonseq)
+ punkt = re_punkt_class.finditer(text)
+ # punkt = re_punkt_class.findall(text)
+ # punkt = regex.findall('([' + punkt_class + '])', text)
+ punkt = [x.group(0) for x in punkt]
+ if verbose:
+ print(f"Punctuation recognized:\n{punkt}\n")
+ if len(punkt) > 0:
+ punkt = iter(punkt)
+ else:
+ punkt = None
+ text = re.sub(re_punkt_class, _spec_seq + r"\1", text)
+ if verbose:
+ print(f"Input with marked punctuation:\n{text}\n")
+
+ phoneseq = phonemize(text, language=language, backend="espeak")
+ if mark_pausation:
+ phoneseq = re.sub("\n", pausation_symbol, phoneseq)
+ else:
+ phoneseq = re.sub("\n", " ", phoneseq)
+ if verbose:
+ print(f"Input with marked pausation:\n{phoneseq}\n")
+
+ if clean:
+ phoneseq = regex.sub(
+ "\(.+?\)", "", phoneseq
+ ) ## use regex for non-greedy matching
+ ## zz = liaison after z
+ phoneseq = re.sub("z+", "z", phoneseq)
+ if verbose:
+ print(f'Input after "cleaning":\n{phoneseq}\n')
+
+ out_phoneseq = ""
+ if add_punkt and (punkt is not None):
+ split_phoneseq = [x for x in re.split("(" + spec_phonseq + ")", phoneseq) if x]
+ for x in split_phoneseq:
+ if x == spec_phonseq:
+ out_phoneseq += next(punkt)
+ else:
+ out_phoneseq += x
+ else:
+ out_phoneseq = phoneseq
+ out_phoneseq = re.sub(r" %", r"%", out_phoneseq)
+ out_phoneseq = re.sub(r"([" + punkt_class + "]+)(%)", r"\2\1 ", out_phoneseq)
+ out_phoneseq = re.sub(r" %", r"%", out_phoneseq)
+ out_phoneseq = re.sub("\s+", " ", out_phoneseq)
+ if verbose:
+ print(f"Output:\n{out_phoneseq}")
+
+ return out_phoneseq
From be2dc5e7f7d81643c930a6332df9263ecd9d7181 Mon Sep 17 00:00:00 2001
From: ruk0sh <43880105+ruk0sh@users.noreply.github.com>
Date: Tue, 19 Apr 2022 20:39:20 +0300
Subject: [PATCH 07/17] Add script for creating phonematic lexicon from word
corpus with espeak backend
---
src/preprocessing/create_lexicon.py | 47 +++++++++++++++++++
.../{phonemizer.py => espeak_phon.py} | 3 ++
2 files changed, 50 insertions(+)
create mode 100644 src/preprocessing/create_lexicon.py
rename src/preprocessing/{phonemizer.py => espeak_phon.py} (96%)
diff --git a/src/preprocessing/create_lexicon.py b/src/preprocessing/create_lexicon.py
new file mode 100644
index 0000000..ceed1e4
--- /dev/null
+++ b/src/preprocessing/create_lexicon.py
@@ -0,0 +1,47 @@
+"""
+Util to create phonematic lexicon for given corpus.
+Espeak backend must be installed on the system.
+"""
+
+from pathlib import Path
+
+import click
+from phonemizer.phonemize import phonemize
+from phonemizer.separator import Separator
+from tqdm import tqdm
+
+ENCODING = "utf8"
+SEPARATOR = Separator(phone=" ", syllable="", word="")
+
+
+@click.command()
+@click.option(
+ "--input-path", type=Path, help="", required=True,
+)
+@click.option(
+ "--output-path",
+ type=Path,
+ default="russian-lexicon-espeak.txt",
+ help="Filepath to write lexicon.",
+ required=True,
+)
+def main(input_path: Path, output_path: Path) -> None:
+ with open(input_path, "r", encoding=ENCODING) as corpus_file:
+ with open(output_path, "w", encoding=ENCODING) as lexicon_file:
+ for word in tqdm(list(corpus_file.readlines())):
+ word = word.strip()
+ phones = phonemize(
+ word,
+ language="ru",
+ backend="espeak",
+ preserve_punctuation=True,
+ with_stress=True,
+ separator=SEPARATOR,
+ )
+ lexicon_line = f"{word}\t{phones}\n"
+ lexicon_file.write(lexicon_line)
+ print(f"Lexicon file saved at:\n{output_path}")
+
+
+if __name__ == "__main__":
+ main()
diff --git a/src/preprocessing/phonemizer.py b/src/preprocessing/espeak_phon.py
similarity index 96%
rename from src/preprocessing/phonemizer.py
rename to src/preprocessing/espeak_phon.py
index 445b9e5..82a9d1a 100644
--- a/src/preprocessing/phonemizer.py
+++ b/src/preprocessing/espeak_phon.py
@@ -1,4 +1,5 @@
from phonemizer.phonemize import phonemize
+from phonemizer.separator import Separator
import re, regex
@@ -24,6 +25,8 @@ def espeak_phon(
if verbose:
print(f"Original input:\n{text}\n")
+ separator = Separator(phone=" ", syllable="", word="\n")
+
punkt = None
if add_punkt:
spec_phonseq = phonemize(_spec_seq, language=language, backend="espeak").strip()
From e34a13afbb85629b03734bc7442f186b13cb5f22 Mon Sep 17 00:00:00 2001
From: ruk0sh <43880105+ruk0sh@users.noreply.github.com>
Date: Tue, 19 Apr 2022 22:51:07 +0300
Subject: [PATCH 08/17] Speed up create_lexicon: phonemize corpus in one call
---
src/preprocessing/create_lexicon.py | 59 ++++++++++++++++++++---------
1 file changed, 42 insertions(+), 17 deletions(-)
diff --git a/src/preprocessing/create_lexicon.py b/src/preprocessing/create_lexicon.py
index ceed1e4..02c1be6 100644
--- a/src/preprocessing/create_lexicon.py
+++ b/src/preprocessing/create_lexicon.py
@@ -8,38 +8,63 @@
import click
from phonemizer.phonemize import phonemize
from phonemizer.separator import Separator
-from tqdm import tqdm
ENCODING = "utf8"
-SEPARATOR = Separator(phone=" ", syllable="", word="")
+SEPARATOR = Separator(phone=" ", syllable="", word="\n")
+CORPUS_STRING_WORD_SEPARATOR = " "
@click.command()
@click.option(
- "--input-path", type=Path, help="", required=True,
+ "-i",
+ "--input-path",
+ type=Path,
+ help="Path to corpus file (1 word per line).",
+ required=True,
)
@click.option(
+ "-o",
"--output-path",
type=Path,
default="russian-lexicon-espeak.txt",
help="Filepath to write lexicon.",
- required=True,
+ required=False,
)
def main(input_path: Path, output_path: Path) -> None:
+
+ print("Reading corpus...", end=" ")
with open(input_path, "r", encoding=ENCODING) as corpus_file:
- with open(output_path, "w", encoding=ENCODING) as lexicon_file:
- for word in tqdm(list(corpus_file.readlines())):
- word = word.strip()
- phones = phonemize(
- word,
- language="ru",
- backend="espeak",
- preserve_punctuation=True,
- with_stress=True,
- separator=SEPARATOR,
- )
- lexicon_line = f"{word}\t{phones}\n"
- lexicon_file.write(lexicon_line)
+ corpus_string = CORPUS_STRING_WORD_SEPARATOR.join(
+ corpus_file.read().splitlines()
+ )
+ print("Done.")
+
+ print("Getting phonemizations...", end=" ")
+ phones_string = phonemize(
+ corpus_string,
+ language="ru",
+ backend="espeak",
+ preserve_punctuation=True,
+ with_stress=True,
+ strip=True,
+ separator=SEPARATOR,
+ )
+ print("Done.")
+
+ print("Creating lexicon...", end=" ")
+ corpus = corpus_string.split(CORPUS_STRING_WORD_SEPARATOR)
+ phones = phones_string.split(SEPARATOR.word)
+ assert len(corpus) == len(phones), (
+ f"# of words should match # of phones after phomenization"
+ f"but you have {len(corpus)} words and {len(phones)} phones"
+ )
+ lexicon = [f"{word}\t{phon}" for word, phon in zip(corpus, phones)]
+ lexicon_str = "\n".join(lexicon)
+ print("Done.")
+
+ output_path.parent.mkdir(exist_ok=True, parents=True)
+ with open(output_path, "w", encoding=ENCODING) as lexicon_file:
+ lexicon_file.write(lexicon_str)
print(f"Lexicon file saved at:\n{output_path}")
From 8263bb23fef714d4363954c564b38617f61162df Mon Sep 17 00:00:00 2001
From: ruk0sh <43880105+ruk0sh@users.noreply.github.com>
Date: Tue, 19 Apr 2022 23:16:08 +0300
Subject: [PATCH 09/17] Parametrize language
---
src/preprocessing/create_lexicon.py | 24 ++++++++++++++++++------
1 file changed, 18 insertions(+), 6 deletions(-)
diff --git a/src/preprocessing/create_lexicon.py b/src/preprocessing/create_lexicon.py
index 02c1be6..12fc223 100644
--- a/src/preprocessing/create_lexicon.py
+++ b/src/preprocessing/create_lexicon.py
@@ -30,7 +30,15 @@
help="Filepath to write lexicon.",
required=False,
)
-def main(input_path: Path, output_path: Path) -> None:
+@click.option(
+ "-l",
+ "--language",
+ type=str,
+ default="en-us",
+ help="Language in espeak format. See for more info: https://github.com/espeak-ng/espeak-ng/blob/master/docs/languages.md",
+ required=False,
+)
+def main(input_path: Path, output_path: Path, language: str) -> None:
print("Reading corpus...", end=" ")
with open(input_path, "r", encoding=ENCODING) as corpus_file:
@@ -38,11 +46,12 @@ def main(input_path: Path, output_path: Path) -> None:
corpus_file.read().splitlines()
)
print("Done.")
+ print(corpus_string[:80], end="\n\n")
print("Getting phonemizations...", end=" ")
phones_string = phonemize(
corpus_string,
- language="ru",
+ language=language,
backend="espeak",
preserve_punctuation=True,
with_stress=True,
@@ -50,22 +59,25 @@ def main(input_path: Path, output_path: Path) -> None:
separator=SEPARATOR,
)
print("Done.")
+ print(phones_string[:80], end="\n\n")
print("Creating lexicon...", end=" ")
corpus = corpus_string.split(CORPUS_STRING_WORD_SEPARATOR)
phones = phones_string.split(SEPARATOR.word)
assert len(corpus) == len(phones), (
- f"# of words should match # of phones after phomenization"
- f"but you have {len(corpus)} words and {len(phones)} phones"
+ f"# of words should match # of phones after phomenization\n"
+ f"but you have {len(corpus)} words and {len(phones)} phones\n"
+ f"First 5 words: {corpus[:5]}\n"
+ f"First 5 phones: {phones[:5]}\n"
)
lexicon = [f"{word}\t{phon}" for word, phon in zip(corpus, phones)]
lexicon_str = "\n".join(lexicon)
- print("Done.")
+ print("Done.", end="\n\n")
output_path.parent.mkdir(exist_ok=True, parents=True)
with open(output_path, "w", encoding=ENCODING) as lexicon_file:
lexicon_file.write(lexicon_str)
- print(f"Lexicon file saved at:\n{output_path}")
+ print(f"Lexicon file saved at:\n{output_path}", end="\n\n")
if __name__ == "__main__":
From aee0ea97c67f873aded65ea8be2f37da019db6e0 Mon Sep 17 00:00:00 2001
From: ruk0sh <43880105+ruk0sh@users.noreply.github.com>
Date: Wed, 20 Apr 2022 13:35:01 +0300
Subject: [PATCH 10/17] Add lexicon creation with espeak phonemizer step
---
russian_preprocessing/steps.sh | 9 +++++++--
1 file changed, 7 insertions(+), 2 deletions(-)
diff --git a/russian_preprocessing/steps.sh b/russian_preprocessing/steps.sh
index f10bf8c..c7a0595 100644
--- a/russian_preprocessing/steps.sh
+++ b/russian_preprocessing/steps.sh
@@ -53,13 +53,18 @@ export RUS_ESPEAK_LEXICON=/media/diskB/ruslan_a/models/mfa/rus-espeak-mfa/rus-mf
# 16069/16069 [00:00<00:00, 21508.15it/s]
echo -e "\n6.1) Creating word list from dataset"
-python src/preprocessing/create_corpus.py --input-dir $EMO_OUTPUT_DIR/text/raw --output-path $EMO_OUTPUT_DIR/meta/words.txt
+python src/preprocessing/create_corpus.py --input-dir $EMO_OUTPUT_DIR/mfa_inputs --output-path $EMO_OUTPUT_DIR/meta/words.txt
+python src/preprocessing/create_corpus.py --input-dir $NEUTRAL_OUTPUT_DIR/mfa_inputs --output-path $NEUTRAL_OUTPUT_DIR/meta/words.txt
# 25849/25983 [01:19<00:00, 326.82it/s]
-echo -e "\n6.2) Creating G2P lexicon from word list"
+echo -e "\n6.2.a) Creating G2P lexicon from word list with G2P"
mfa g2p -t mfa_tmp -j 32 --clean --overwrite models/g2p/russian_g2p.zip $EMO_OUTPUT_DIR/meta/words.txt models/mfa/russian_lexicon.txt
rm -rf mfa_tmp
+echo -e "\n6.2.b) Creating G2P lexicon from word list with espeak"
+python src/preprocessing/create_lexicon.py -i $EMO_OUTPUT_DIR/meta/words.txt -o $EMO_OUTPUT_DIR/meta/lexicon.txt -l ru
+python src/preprocessing/create_lexicon.py -i $NEUTRAL_OUTPUT_DIR/meta/words.txt -o $NEUTRAL_OUTPUT_DIR/meta/lexicon.txt -l ru
+
# 42it [00:10, 4.01it/s]
# 58it [00:12, 4.54it/s] mix
echo -e "\n7) MFA Preprocessing"
From de36f30b5185f08391e791b35417501a9234f8e0 Mon Sep 17 00:00:00 2001
From: ruk0sh <43880105+ruk0sh@users.noreply.github.com>
Date: Wed, 20 Apr 2022 15:42:43 +0300
Subject: [PATCH 11/17] fix g2p download links
---
models/download_g2p.sh | 4 ++--
1 file changed, 2 insertions(+), 2 deletions(-)
diff --git a/models/download_g2p.sh b/models/download_g2p.sh
index 2e1faf4..3124bf1 100644
--- a/models/download_g2p.sh
+++ b/models/download_g2p.sh
@@ -1,6 +1,6 @@
-G2P_ENGLISH_URL="https://github.com/MontrealCorpusTools/mfa-models/blob/main/g2p/english_g2p.zip"
+G2P_ENGLISH_URL="https://github.com/MontrealCorpusTools/mfa-models/raw/main/g2p/english_g2p.zip"
G2P_ENGLISH_PATH="models/en/g2p/english_g2p.zip"
-G2P_RUSSIAN_URL="https://github.com/MontrealCorpusTools/mfa-models/blob/main/g2p/russian_g2p.zip"
+G2P_RUSSIAN_URL="https://github.com/MontrealCorpusTools/mfa-models/raw/main/g2p/russian_g2p.zip"
G2P_RUSSIAN_PATH="models/ru/g2p/russian_g2p.zip"
echo Downloading English G2P model...
From c766102c9eafe6893f774916dfe718a4fca06507 Mon Sep 17 00:00:00 2001
From: ruk0sh <43880105+ruk0sh@users.noreply.github.com>
Date: Wed, 4 May 2022 19:48:39 +0300
Subject: [PATCH 12/17] Add notebook for HTML-with-wavs generation.
---
generate_listener_html.ipynb | 1596 ++++++++++++++++++++++++++++++++++
1 file changed, 1596 insertions(+)
create mode 100644 generate_listener_html.ipynb
diff --git a/generate_listener_html.ipynb b/generate_listener_html.ipynb
new file mode 100644
index 0000000..36192f4
--- /dev/null
+++ b/generate_listener_html.ipynb
@@ -0,0 +1,1596 @@
+{
+ "cells": [
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "id": "60f2a2f5-75b6-4f29-bfa3-687283fc3edd",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "import csv\n",
+ "from itertools import combinations\n",
+ "from pathlib import Path\n",
+ "\n",
+ "import numpy as np\n",
+ "import pandas as pd\n",
+ "from IPython.display import HTML, Audio, display\n",
+ "\n",
+ "\n",
+ "pd.set_option('display.max_colwidth', None)\n",
+ "pd.set_option('display.colheader_justify', 'center')"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "id": "f0d165ce-a7bb-4e83-b37e-dc0692ed1089",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "texts = [\n",
+ " 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'The journey was continued at dawn .',\n",
+ " 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'A dead man is of no use on a plantation .',\n",
+ " 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'Earthquakes damage all structures, including bridges.',\n",
+ " 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'Was it using language that caused their brains to develop?',\n",
+ " 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'\n",
+ "]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 3,
+ "id": "f0871808-7396-4a82-b529-404babb6be8d",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "huawei_phones = [\n",
+ " ' W IY1 G AA1 T F Y UW1 V EH1 JH T AH0 B AH0 L Z AH0 N D F R UW1 T S AH0 N D B IH0 K EY1 M F IH1 SH IY1 T ER0 Z ',\n",
+ " ' F IH1 F T IY0 Y AA1 R D Z AH0 HH EH1 D AH1 V HH ER1 W ER1 DH AH0 F ER1 S T AH1 V DH AH0 R AA1 K S ',\n",
+ " ' IH1 T S IY1 M D DH IY0 AO0 R D EY1 N D AO1 R D ER0 AH1 V TH IH1 NG Z DH AE1 T D AA1 G Z SH UH1 D W ER1 K ',\n",
+ " ' DH AH0 JH ER1 N IY0 W AA1 Z K AH0 N T IH1 N Y UW0 D AE1 T D AO1 N ',\n",
+ " ' W AA1 Z IH1 T DH AH0 R AA1 N D IH0 V UW2 AH1 V DH OW1 Z HH UW1 W ER1 S T R AY1 V IH0 NG T UW1 W ER1 K HH IH1 Z R UW1 AH0 N ',\n",
+ " ' AH0 D EH1 D M AE1 N IH1 Z AH1 V N OW1 Y UW1 S AA1 N AH0 P L AE2 N T EY1 SH AH0 N ',\n",
+ " ' DH AH0 K L AO0 D IY1 N W AA1 Z L IY1 V IH0 NG N EH1 K S T M AO1 R N IH0 NG F AO1 R HH AA2 N AH0 L UW1 L UW0 ',\n",
+ " ' P R AA1 S IH0 K Y UW2 T ER0 Z HH AE1 V OW1 P AH0 N D AH0 M AE1 S IH0 V IH2 N V EH2 S T AH0 G EY1 SH AH0 N IH1 N T UW0 AE2 L AH0 G EY1 SH AH0 N Z AH1 V F IH1 K S IH0 NG G EY1 M Z AH0 N D IH2 L IY1 G AH0 L B EH1 T IH0 NG ',\n",
+ " ' D IH1 F ER0 AH0 N T T EH1 L AH0 S K OW2 P D IH0 Z AY1 N Z P ER0 F AO1 R M D IH1 F R AH0 N T L IY0 AH0 N D HH AE1 V D IH1 F ER0 AH0 N T S T R EH1 NG K TH S AH0 N D W IY1 K N AH0 S AH0 Z ',\n",
+ " ' HH Y UW1 M AH0 N Z AO1 L S OW0 JH AH1 JH D IH1 S T AH0 N S B AY1 Y UW1 Z IH0 NG DH AH0 R EH1 L AH0 T IH0 V S AY1 Z AH0 Z AH1 V AA1 B JH EH0 K T S ',\n",
+ " ' IH1 F DH IH1 S IH1 Z T R UW1 DH EH1 N DH OW1 Z HH UW1 T EH1 N D T UW1 TH IH1 NG K K R IY0 EY1 T IH0 V L IY0 R IH1 L IY0 AA1 R S AH1 M HH AW2 D IH1 F ER0 AH0 N T ',\n",
+ " ' B AH1 T R IH1 L IY0 IH0 N DH AH0 G R AE1 N D S K IY1 M AH1 V TH IH1 NG Z DH IH1 S IH2 N F ER0 M EY1 SH AH0 N IH1 Z IH2 N S IH0 G N Y IH1 F IH0 K AH0 N T ',\n",
+ " ' HH IY1 HH AE1 D AH0 P R AY1 V AH0 T JH EH1 T W IH1 DH TH R IY1 K IH1 NG S AY1 Z B EH1 D Z IH0 K S P EH1 N S IH0 V R AH1 G Z P AO1 R S AH0 L AH0 N V EY1 S AH0 Z AH0 N D AH0 D AY1 N IH0 NG EH1 R IY0 AH0 ',\n",
+ " ' W EH1 N AY1 R IY1 CH T AE0 T L AE1 N T AH0 M AY1 S T EH1 D AH0 L IY0 IH2 N K R IY1 S IH0 NG D IH2 S AH0 P OY1 N T M AH0 N T W AA1 Z N AA1 T L EH1 S AH0 N D AY1 F AW1 N D IH1 T AH0 B IH1 G D AH1 L R EH1 D T AW1 N ',\n",
+ " ' SH IY1 W OW1 K M EH1 G W IH1 DH AH0 M EH1 R IY0 K R IH1 S M AH0 S AH0 N D B EY1 D HH ER1 S IY1 W AH1 T W AA1 Z AH1 N D ER0 HH ER1 P IH1 L OW0 AH0 G R IY1 N K AH1 V ER0 D B UH1 K AH0 P IH1 R D W IH1 DH DH AH0 S EY1 M P IH1 K CH ER0 IH2 N S AY1 D AH0 N D AH0 F Y UW1 W ER1 D Z R IH1 T AH0 N B AY1 DH EH1 R M AH1 DH ER0 W IH1 CH M EY1 D DH EH1 R W AH1 N P R EH1 Z AH0 N T V EH1 R IY0 P R EH1 SH AH0 S IH0 N DH EH1 R AY1 Z ',\n",
+ " ' D AH1 Z JH EY1 N N OW1 AH0 B AW1 T Y AO1 R N UW1 JH AA1 B N OW1 AH0 N D D OW1 N T Y UW1 D EH1 R T EH1 L HH ER1 SH IY1 W IH1 L B IY1 F Y UH1 R IY0 AH0 S ',\n",
+ " ' D AH1 Z SH IY1 L AY1 K AY1 S K R IY1 M AO1 R S W IY1 T S SH IY1 L AY1 K S EH1 N IY0 K AY1 N D AH1 V AY1 S K R IY1 M CH AO1 K L AH0 T V AH0 N IH1 L AH0 S T R AO1 B EH2 R IY0 B AH0 N AE1 N AH0 DH AH0 W AH1 N W IH1 DH K EH1 R AH0 M AH0 L K OW1 K AH0 N AH2 T EH1 N IY0 Y UW1 K AE1 N TH IH1 NG K AH1 V ',\n",
+ " ' ER1 TH K W EY2 K S D AE1 M AH0 JH AO1 L S T R AH1 K CH ER0 Z IH2 N K L UW1 D IH0 NG B R IH1 JH AH0 Z ',\n",
+ " ' L AH1 K AH0 L IY0 DH IH1 S K AY1 N D AH1 V K AH0 L AE1 P S IH1 Z R EH1 L AH0 T IH0 V L IY0 IH2 N F R IY1 K W AH0 N T ',\n",
+ " ' W AA1 Z IH1 T Y UW1 Z IH0 NG L AE1 NG G W AH0 JH DH AE1 T K AA1 Z D DH EH1 R B R EY1 N Z T UW1 D IH0 V EH1 L AH0 P ',\n",
+ " ' IH1 F EH1 V R IY0 W AH2 N F AA1 L OW0 D AH0 S IH1 M AH0 L ER0 P L AE1 N DH AH0 R IH0 Z AH1 L T S W UH1 D B IY1 IH2 M P R EH1 S IH0 V ',\n",
+ " ' N EH1 K S T DH AH0 HH IH1 R OW0 OW1 V ER0 K AH2 M Z AA1 B S T AH0 K AH0 L Z AA1 N DH AH0 W EY1 T UW1 F EY1 S IH0 NG DH EH1 R G R EY1 T AH0 S T CH AE1 L AH0 N JH ',\n",
+ " ' F AO1 R M AO1 R DH AE1 N T UW1 HH AH1 N D R AH0 D Y IH1 R Z DH AH0 P EH1 S AH0 M IH0 S T S HH AE1 V B IH1 N W IH1 N IH0 NG DH AH0 P AH1 B L IH0 K D AH0 B EY1 T ',\n",
+ " ' IH1 T S W EH1 R IH0 NG M IY1 AW1 T T R AY1 IH0 NG T UW1 JH AH1 G AH0 L W ER1 K W IH1 DH L UH1 K IH0 NG AE1 F T ER0 M AY1 CH IH1 L D R AH0 N AH0 N D M AY1 F AE1 M AH0 L IY0 ',\n",
+ " ' Y AH1 NG P IY1 P AH0 L W AA1 N T T UW1 F IY1 L S AH0 P AO1 R T IH0 D AH0 N D AH0 P R IY1 SH IY0 EY2 T IH0 D B AY1 DH EH1 R K AH1 M P AH0 N IY2 AH0 N D DH EH1 R S UW0 P IH1 R IY0 ER0 Z ',\n",
+ " ' W IY1 S T AA1 R T T UW1 S IY1 DH IY0 EH1 V AH0 D AH0 N S AH1 V ER1 L IY0 HH Y UW1 M AH0 N S IH1 V AH0 L IH0 S EY1 SH AH0 N TH R UW1 K EY1 V P EY1 N T IH0 NG Z F AO1 R IH0 G Z AE1 M P AH0 L ',\n",
+ " ' IH0 N DH IH1 S K AH1 L CH ER0 AH0 S OW1 K AO1 L D S M AY1 L AH1 V R IH0 S P EH1 K T IH1 Z S IY1 N AE1 Z IH2 N S IH0 N S IH1 R AH0 N D AO1 F AH0 N R IH0 G AA1 R D IH0 D W IH1 DH S AH0 S P IH1 SH AH0 N ',\n",
+ " ' W IY1 K AE1 N IH0 K S P R EH1 S K AA1 M P L EH0 K S TH AO1 T S K AH0 N V EY1 S AH1 T AH0 L IH0 M OW1 SH AH0 N Z AH0 N D K AH0 M Y UW1 N AH0 K EY2 T AH0 B AW1 T S AH1 M AE1 B S T R AE0 K T K AA1 N S EH0 P T S ',\n",
+ " ' DH IY0 AE1 K T AH0 V AH0 S T S S EH1 N D AH0 K L IH1 R M EH1 S AH0 JH T UW1 K AH1 M P AH0 N IY2 Z DH AE1 T P IY1 P AH0 L AA1 R N OW1 L AO1 NG G ER0 W IH1 L IH0 NG T UW1 AE0 K S EH1 P T DH IY0 IH0 N V AY2 R AH0 N M EH1 N T AH0 L AH0 N D HH Y UW1 M AH0 N K AA1 S T AH1 V OW1 V ER0 K AH0 N S AH2 M P SH AH0 N ',\n",
+ " ' AO1 L DH IH1 S IH1 Z TH AE1 NG K S T UW1 HH IH1 Z CH AY1 L D HH UH2 D IH0 N DH AH0 M AW1 N T AH0 N Z AH0 N D T UW1 JH AH0 N EH1 T IH0 K S B AH1 T IH1 T IH1 Z HH IH1 Z M EH1 N T AH0 L S T R EH1 NG K TH DH AE1 T S EH1 T S HH IH1 M AH0 P AA1 R T '\n",
+ "]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "id": "d7942da8-a539-4a50-98ef-d93cbdcec403",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "## NOTE: every model key must be the letter 'm' followed by its 1-based index (m1, m2, ...), because the dataframe columns and wav ids are derived from it\n",
+ "model2folder = {\n",
+ " \"m1\": 'generated_hifi/esd_tune/g_3164999',\n",
+ " \"m2\": 'generated_hifi/esd_tune_reversal/g_3164999',\n",
+ " \"m3\": 'generated_hifi/esd_tune_advloss0/g_3164999',\n",
+ "}"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 5,
+ "id": "d4d44f9e-525a-4e3d-bb5c-679b64bd7861",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "total_K_models = len(model2folder)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 6,
+ "id": "51e4eae6-ea64-4d69-947c-2a0c7b15678b",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "m1: 1350 wav files total\n",
+ "m2: 1350 wav files total\n",
+ "m3: 1350 wav files total\n"
+ ]
+ }
+ ],
+ "source": [
+ "wav_files = {}\n",
+ "total_wavs_per_model = 0\n",
+ "for ip in model2folder.keys():\n",
+ " wav_files[ip] = list(Path(model2folder[ip]).rglob(\"*.wav\"))\n",
+ " total_wavs_per_model = len(wav_files[ip])\n",
+ " print(f\"{ip}: {total_wavs_per_model} wav files total\")"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 7,
+ "id": "e2031149-e1e8-421f-983c-83833c1b67ad",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "x_range = np.array(list(range(total_wavs_per_model)))\n",
+ "x_indices = x_range * 2\n",
+ "y_indices = x_range * 2 + 1"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 8,
+ "id": "f60b3404-269a-407e-bedd-898b754c5651",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "
\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " m1 | \n",
+ " m2 | \n",
+ " m3 | \n",
+ " m1_wavbasename | \n",
+ " m1_accent_speaker | \n",
+ " m1_text | \n",
+ " m2_wavbasename | \n",
+ " m2_accent_speaker | \n",
+ " m2_text | \n",
+ " m3_wavbasename | \n",
+ " m3_accent_speaker | \n",
+ " m3_text | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " | 0 | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | 1 | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | 2 | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | 3 | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | 4 | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " | 2695 | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | 2696 | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | 2697 | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | 2698 | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | 2699 | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
2700 rows × 12 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " m1 m2 m3 m1_wavbasename m1_accent_speaker m1_text \\\n",
+ "0 None None None None None None \n",
+ "1 None None None None None None \n",
+ "2 None None None None None None \n",
+ "3 None None None None None None \n",
+ "4 None None None None None None \n",
+ "... ... ... ... ... ... ... \n",
+ "2695 None None None None None None \n",
+ "2696 None None None None None None \n",
+ "2697 None None None None None None \n",
+ "2698 None None None None None None \n",
+ "2699 None None None None None None \n",
+ "\n",
+ " m2_wavbasename m2_accent_speaker m2_text m3_wavbasename \\\n",
+ "0 None None None None \n",
+ "1 None None None None \n",
+ "2 None None None None \n",
+ "3 None None None None \n",
+ "4 None None None None \n",
+ "... ... ... ... ... \n",
+ "2695 None None None None \n",
+ "2696 None None None None \n",
+ "2697 None None None None \n",
+ "2698 None None None None \n",
+ "2699 None None None None \n",
+ "\n",
+ " m3_accent_speaker m3_text \n",
+ "0 None None \n",
+ "1 None None \n",
+ "2 None None \n",
+ "3 None None \n",
+ "4 None None \n",
+ "... ... ... \n",
+ "2695 None None \n",
+ "2696 None None \n",
+ "2697 None None \n",
+ "2698 None None \n",
+ "2699 None None \n",
+ "\n",
+ "[2700 rows x 12 columns]"
+ ]
+ },
+ "execution_count": 8,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "def allocate_empty_array(alength):\n",
+ " return [None]*alength\n",
+ "\n",
+ "\n",
+ "def create_empty_dataframe(total_wavs_per_model: int, total_K_models: int):\n",
+ "\n",
+ " df = pd.DataFrame({\n",
+ " 'm' + str(i): allocate_empty_array(2 * total_wavs_per_model)\n",
+ " for i in range(1, total_K_models + 1, 1)\n",
+ " })\n",
+ "\n",
+ " for i in range(1, total_K_models + 1, 1):\n",
+ " df['m' + str(i) + '_wavbasename'] = None\n",
+ " df['m' + str(i) + '_accent_speaker'] = None\n",
+ " df['m' + str(i) + '_text'] = None\n",
+ " \n",
+ " return df\n",
+ "\n",
+ "\n",
+ "df_empty = create_empty_dataframe(total_wavs_per_model, total_K_models)\n",
+ "df_empty"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 9,
+ "id": "2b88d46e-c3af-43eb-8af7-282492147a1f",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " m1 | \n",
+ " m2 | \n",
+ " m3 | \n",
+ " m1_wavbasename | \n",
+ " m1_accent_speaker | \n",
+ " m1_text | \n",
+ " m2_wavbasename | \n",
+ " m2_accent_speaker | \n",
+ " m2_text | \n",
+ " m3_wavbasename | \n",
+ " m3_accent_speaker | \n",
+ " m3_text | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " | 0 | \n",
+ " id_1 | \n",
+ " id_2 | \n",
+ " id_3 | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | 1 | \n",
+ " generated_hifi/esd_tune/g_3164999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/1.wav | \n",
+ " 1.wav | \n",
+ " 0011 | \n",
+ " We got few vegetables and fruits , and became fish eaters . | \n",
+ " 1.wav | \n",
+ " 0011 | \n",
+ " We got few vegetables and fruits , and became fish eaters . | \n",
+ " 1.wav | \n",
+ " 0011 | \n",
+ " We got few vegetables and fruits , and became fish eaters . | \n",
+ "
\n",
+ " \n",
+ " | 2 | \n",
+ " id_4 | \n",
+ " id_5 | \n",
+ " id_6 | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | 3 | \n",
+ " generated_hifi/esd_tune/g_3164999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/10.wav | \n",
+ " 10.wav | \n",
+ " 0011 | \n",
+ " Humans also judge distance by using the relative sizes of objects. | \n",
+ " 10.wav | \n",
+ " 0011 | \n",
+ " Humans also judge distance by using the relative sizes of objects. | \n",
+ " 10.wav | \n",
+ " 0011 | \n",
+ " Humans also judge distance by using the relative sizes of objects. | \n",
+ "
\n",
+ " \n",
+ " | 4 | \n",
+ " id_7 | \n",
+ " id_8 | \n",
+ " id_9 | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " | 2695 | \n",
+ " generated_hifi/esd_tune/g_3164999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/7.wav | \n",
+ " 7.wav | \n",
+ " 0020 | \n",
+ " The Claudine was leaving next morning for Honolulu . | \n",
+ " 7.wav | \n",
+ " 0020 | \n",
+ " The Claudine was leaving next morning for Honolulu . | \n",
+ " 7.wav | \n",
+ " 0020 | \n",
+ " The Claudine was leaving next morning for Honolulu . | \n",
+ "
\n",
+ " \n",
+ " | 2696 | \n",
+ " id_4045 | \n",
+ " id_4046 | \n",
+ " id_4047 | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | 2697 | \n",
+ " generated_hifi/esd_tune/g_3164999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/8.wav | \n",
+ " 8.wav | \n",
+ " 0020 | \n",
+ " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ " 8.wav | \n",
+ " 0020 | \n",
+ " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ " 8.wav | \n",
+ " 0020 | \n",
+ " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ "
\n",
+ " \n",
+ " | 2698 | \n",
+ " id_4048 | \n",
+ " id_4049 | \n",
+ " id_4050 | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | 2699 | \n",
+ " generated_hifi/esd_tune/g_3164999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wav | \n",
+ " 9.wav | \n",
+ " 0020 | \n",
+ " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ " 9.wav | \n",
+ " 0020 | \n",
+ " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ " 9.wav | \n",
+ " 0020 | \n",
+ " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
2700 rows × 12 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " m1 \\\n",
+ "0 id_1 \n",
+ "1 generated_hifi/esd_tune/g_3164999/0011/angry/1.wav \n",
+ "2 id_4 \n",
+ "3 generated_hifi/esd_tune/g_3164999/0011/angry/10.wav \n",
+ "4 id_7 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune/g_3164999/0020/surprise/7.wav \n",
+ "2696 id_4045 \n",
+ "2697 generated_hifi/esd_tune/g_3164999/0020/surprise/8.wav \n",
+ "2698 id_4048 \n",
+ "2699 generated_hifi/esd_tune/g_3164999/0020/surprise/9.wav \n",
+ "\n",
+ " m2 \\\n",
+ "0 id_2 \n",
+ "1 generated_hifi/esd_tune_reversal/g_3164999/0011/angry/1.wav \n",
+ "2 id_5 \n",
+ "3 generated_hifi/esd_tune_reversal/g_3164999/0011/angry/10.wav \n",
+ "4 id_8 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/7.wav \n",
+ "2696 id_4046 \n",
+ "2697 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/8.wav \n",
+ "2698 id_4049 \n",
+ "2699 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/9.wav \n",
+ "\n",
+ " m3 \\\n",
+ "0 id_3 \n",
+ "1 generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/1.wav \n",
+ "2 id_6 \n",
+ "3 generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/10.wav \n",
+ "4 id_9 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/7.wav \n",
+ "2696 id_4047 \n",
+ "2697 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/8.wav \n",
+ "2698 id_4050 \n",
+ "2699 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wav \n",
+ "\n",
+ " m1_wavbasename m1_accent_speaker \\\n",
+ "0 None None \n",
+ "1 1.wav 0011 \n",
+ "2 None None \n",
+ "3 10.wav 0011 \n",
+ "4 None None \n",
+ "... ... ... \n",
+ "2695 7.wav 0020 \n",
+ "2696 None None \n",
+ "2697 8.wav 0020 \n",
+ "2698 None None \n",
+ "2699 9.wav 0020 \n",
+ "\n",
+ " m1_text \\\n",
+ "0 None \n",
+ "1 We got few vegetables and fruits , and became fish eaters . \n",
+ "2 None \n",
+ "3 Humans also judge distance by using the relative sizes of objects. \n",
+ "4 None \n",
+ "... ... \n",
+ "2695 The Claudine was leaving next morning for Honolulu . \n",
+ "2696 None \n",
+ "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
+ "2698 None \n",
+ "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ "\n",
+ " m2_wavbasename m2_accent_speaker \\\n",
+ "0 None None \n",
+ "1 1.wav 0011 \n",
+ "2 None None \n",
+ "3 10.wav 0011 \n",
+ "4 None None \n",
+ "... ... ... \n",
+ "2695 7.wav 0020 \n",
+ "2696 None None \n",
+ "2697 8.wav 0020 \n",
+ "2698 None None \n",
+ "2699 9.wav 0020 \n",
+ "\n",
+ " m2_text \\\n",
+ "0 None \n",
+ "1 We got few vegetables and fruits , and became fish eaters . \n",
+ "2 None \n",
+ "3 Humans also judge distance by using the relative sizes of objects. \n",
+ "4 None \n",
+ "... ... \n",
+ "2695 The Claudine was leaving next morning for Honolulu . \n",
+ "2696 None \n",
+ "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
+ "2698 None \n",
+ "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ "\n",
+ " m3_wavbasename m3_accent_speaker \\\n",
+ "0 None None \n",
+ "1 1.wav 0011 \n",
+ "2 None None \n",
+ "3 10.wav 0011 \n",
+ "4 None None \n",
+ "... ... ... \n",
+ "2695 7.wav 0020 \n",
+ "2696 None None \n",
+ "2697 8.wav 0020 \n",
+ "2698 None None \n",
+ "2699 9.wav 0020 \n",
+ "\n",
+ " m3_text \n",
+ "0 None \n",
+ "1 We got few vegetables and fruits , and became fish eaters . \n",
+ "2 None \n",
+ "3 Humans also judge distance by using the relative sizes of objects. \n",
+ "4 None \n",
+ "... ... \n",
+ "2695 The Claudine was leaving next morning for Honolulu . \n",
+ "2696 None \n",
+ "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
+ "2698 None \n",
+ "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ "\n",
+ "[2700 rows x 12 columns]"
+ ]
+ },
+ "execution_count": 9,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "def populate_dataframe(df, model2folder, wav_files, total_K_models, total_wavs_per_model):\n",
+ "\n",
+ " for model_key in model2folder.keys():\n",
+ "\n",
+ " column_name = model_key\n",
+ " model_index = int(model_key[1:])\n",
+ " paths_orig_wavs = sorted(wav_files[model_key])\n",
+ " assert(total_wavs_per_model == len(paths_orig_wavs))\n",
+ "\n",
+ " wavids = np.array(list(range(len(paths_orig_wavs)))) * total_K_models + model_index\n",
+ " wavids = ['id_' + str(x) for x in wavids]\n",
+ " df[column_name].iloc[x_indices] = wavids\n",
+ " df[column_name].iloc[y_indices] = paths_orig_wavs\n",
+ "\n",
+ " df[column_name + '_wavbasename'].iloc[y_indices] = (\n",
+ " df[column_name]\n",
+ " .iloc[y_indices]\n",
+ " .apply(lambda x: x.name)\n",
+ " )\n",
+ " \n",
+ " df[column_name + '_text'].iloc[y_indices] = (\n",
+ " df[column_name]\n",
+ " .iloc[y_indices]\n",
+ " .apply(lambda x: texts[int(x.stem) - 1])\n",
+ " )\n",
+ " \n",
+ " df[column_name + '_accent_speaker'].iloc[y_indices] = (\n",
+ " df[column_name]\n",
+ " .iloc[y_indices]\n",
+ " .apply(lambda x: x.parent.parent.stem)\n",
+ " )\n",
+ " \n",
+ " return df\n",
+ "\n",
+ "\n",
+ "df_populated = populate_dataframe(df_empty, model2folder, wav_files, total_K_models, total_wavs_per_model)\n",
+ "df_populated"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 10,
+ "id": "efc3b273-7b7d-4165-aef8-38da88cfc154",
+ "metadata": {
+ "tags": []
+ },
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "m1 m2\n",
+ "m1 m3\n",
+ "m2 m3\n"
+ ]
+ }
+ ],
+ "source": [
+ "def validate_pairs(df):\n",
+ " all_possible_pairs = list(combinations(model2folder.keys(), 2))\n",
+ " for k, v in all_possible_pairs:\n",
+ " print(k, v)\n",
+ " assert((df[k + '_text'].iloc[y_indices] == df[v + '_text'].iloc[y_indices]).all())\n",
+ " assert((df[k + '_accent_speaker'].iloc[y_indices] == df[v + '_accent_speaker'].iloc[y_indices]).all())\n",
+ " \n",
+ " \n",
+ "validate_pairs(df_populated)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 11,
+ "id": "e3f303a2-0923-4b6a-802c-11c497fe5e58",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "['m1', 'm2', 'm3']"
+ ]
+ },
+ "execution_count": 11,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "model_columns = ['m' + str(i) for i in range(1, total_K_models + 1, 1)]\n",
+ "model_columns"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 12,
+ "id": "d1b37dd4-39c3-4956-adf0-22cf45b49f85",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " m1_text | \n",
+ " m1_accent_speaker | \n",
+ " m1 | \n",
+ " m2 | \n",
+ " m3 | \n",
+ " m2_text | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " | 0 | \n",
+ " None | \n",
+ " None | \n",
+ " id_1 | \n",
+ " id_2 | \n",
+ " id_3 | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | 1 | \n",
+ " We got few vegetables and fruits , and became fish eaters . | \n",
+ " 0011 | \n",
+ " generated_hifi/esd_tune/g_3164999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/1.wav | \n",
+ " We got few vegetables and fruits , and became fish eaters . | \n",
+ "
\n",
+ " \n",
+ " | 2 | \n",
+ " None | \n",
+ " None | \n",
+ " id_4 | \n",
+ " id_5 | \n",
+ " id_6 | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | 3 | \n",
+ " Humans also judge distance by using the relative sizes of objects. | \n",
+ " 0011 | \n",
+ " generated_hifi/esd_tune/g_3164999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/10.wav | \n",
+ " Humans also judge distance by using the relative sizes of objects. | \n",
+ "
\n",
+ " \n",
+ " | 4 | \n",
+ " None | \n",
+ " None | \n",
+ " id_7 | \n",
+ " id_8 | \n",
+ " id_9 | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " | 2695 | \n",
+ " The Claudine was leaving next morning for Honolulu . | \n",
+ " 0020 | \n",
+ " generated_hifi/esd_tune/g_3164999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/7.wav | \n",
+ " The Claudine was leaving next morning for Honolulu . | \n",
+ "
\n",
+ " \n",
+ " | 2696 | \n",
+ " None | \n",
+ " None | \n",
+ " id_4045 | \n",
+ " id_4046 | \n",
+ " id_4047 | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | 2697 | \n",
+ " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ " 0020 | \n",
+ " generated_hifi/esd_tune/g_3164999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/8.wav | \n",
+ " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ "
\n",
+ " \n",
+ " | 2698 | \n",
+ " None | \n",
+ " None | \n",
+ " id_4048 | \n",
+ " id_4049 | \n",
+ " id_4050 | \n",
+ " None | \n",
+ "
\n",
+ " \n",
+ " | 2699 | \n",
+ " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ " 0020 | \n",
+ " generated_hifi/esd_tune/g_3164999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wav | \n",
+ " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
2700 rows × 6 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " m1_text \\\n",
+ "0 None \n",
+ "1 We got few vegetables and fruits , and became fish eaters . \n",
+ "2 None \n",
+ "3 Humans also judge distance by using the relative sizes of objects. \n",
+ "4 None \n",
+ "... ... \n",
+ "2695 The Claudine was leaving next morning for Honolulu . \n",
+ "2696 None \n",
+ "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
+ "2698 None \n",
+ "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ "\n",
+ " m1_accent_speaker m1 \\\n",
+ "0 None id_1 \n",
+ "1 0011 generated_hifi/esd_tune/g_3164999/0011/angry/1.wav \n",
+ "2 None id_4 \n",
+ "3 0011 generated_hifi/esd_tune/g_3164999/0011/angry/10.wav \n",
+ "4 None id_7 \n",
+ "... ... ... \n",
+ "2695 0020 generated_hifi/esd_tune/g_3164999/0020/surprise/7.wav \n",
+ "2696 None id_4045 \n",
+ "2697 0020 generated_hifi/esd_tune/g_3164999/0020/surprise/8.wav \n",
+ "2698 None id_4048 \n",
+ "2699 0020 generated_hifi/esd_tune/g_3164999/0020/surprise/9.wav \n",
+ "\n",
+ " m2 \\\n",
+ "0 id_2 \n",
+ "1 generated_hifi/esd_tune_reversal/g_3164999/0011/angry/1.wav \n",
+ "2 id_5 \n",
+ "3 generated_hifi/esd_tune_reversal/g_3164999/0011/angry/10.wav \n",
+ "4 id_8 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/7.wav \n",
+ "2696 id_4046 \n",
+ "2697 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/8.wav \n",
+ "2698 id_4049 \n",
+ "2699 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/9.wav \n",
+ "\n",
+ " m3 \\\n",
+ "0 id_3 \n",
+ "1 generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/1.wav \n",
+ "2 id_6 \n",
+ "3 generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/10.wav \n",
+ "4 id_9 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/7.wav \n",
+ "2696 id_4047 \n",
+ "2697 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/8.wav \n",
+ "2698 id_4050 \n",
+ "2699 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wav \n",
+ "\n",
+ " m2_text \n",
+ "0 None \n",
+ "1 We got few vegetables and fruits , and became fish eaters . \n",
+ "2 None \n",
+ "3 Humans also judge distance by using the relative sizes of objects. \n",
+ "4 None \n",
+ "... ... \n",
+ "2695 The Claudine was leaving next morning for Honolulu . \n",
+ "2696 None \n",
+ "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
+ "2698 None \n",
+ "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ "\n",
+ "[2700 rows x 6 columns]"
+ ]
+ },
+ "execution_count": 12,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "def choose_columns_to_render(df):\n",
+ "    \"\"\"Keep only the report columns: m1 text and speaker, every model column, then m2 text.\"\"\"\n",
+ "    report_columns = ['m1_text', 'm1_accent_speaker', *model_columns, 'm2_text']\n",
+ "    return df.loc[:, report_columns]\n",
+ "\n",
+ "\n",
+ "df_filtered = choose_columns_to_render(df_populated)\n",
+ "df_filtered"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 13,
+ "id": "a9915d2e-01e5-40c0-923b-4bf6bf7389cf",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " m1_text | \n",
+ " m1_accent_speaker | \n",
+ " m1 | \n",
+ " m2 | \n",
+ " m3 | \n",
+ " m2_text | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " | 0 | \n",
+ " - | \n",
+ " - | \n",
+ " id_1 | \n",
+ " id_2 | \n",
+ " id_3 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | 1 | \n",
+ " We got few vegetables and fruits , and became fish eaters . | \n",
+ " 0011 | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune/g_3164999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/1.wav | \n",
+ " We got few vegetables and fruits , and became fish eaters . | \n",
+ "
\n",
+ " \n",
+ " | 2 | \n",
+ " - | \n",
+ " - | \n",
+ " id_4 | \n",
+ " id_5 | \n",
+ " id_6 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | 3 | \n",
+ " Humans also judge distance by using the relative sizes of objects. | \n",
+ " 0011 | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune/g_3164999/0011/angry/10.wav | \n",
+ " Humans also judge distance by using the relative sizes of objects. | \n",
+ "
\n",
+ " \n",
+ " | 4 | \n",
+ " - | \n",
+ " - | \n",
+ " id_7 | \n",
+ " id_8 | \n",
+ " id_9 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " | 2695 | \n",
+ " The Claudine was leaving next morning for Honolulu . | \n",
+ " 0020 | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune/g_3164999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/7.wav | \n",
+ " The Claudine was leaving next morning for Honolulu . | \n",
+ "
\n",
+ " \n",
+ " | 2696 | \n",
+ " - | \n",
+ " - | \n",
+ " id_4045 | \n",
+ " id_4046 | \n",
+ " id_4047 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | 2697 | \n",
+ " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ " 0020 | \n",
+ " generated_hifi/esd_tune/g_3164999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/8.wav | \n",
+ " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ "
\n",
+ " \n",
+ " | 2698 | \n",
+ " - | \n",
+ " - | \n",
+ " id_4048 | \n",
+ " id_4049 | \n",
+ " id_4050 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | 2699 | \n",
+ " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ " 0020 | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune/g_3164999/0020/surprise/9.wav | \n",
+ " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
2700 rows × 6 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " m1_text \\\n",
+ "0 - \n",
+ "1 We got few vegetables and fruits , and became fish eaters . \n",
+ "2 - \n",
+ "3 Humans also judge distance by using the relative sizes of objects. \n",
+ "4 - \n",
+ "... ... \n",
+ "2695 The Claudine was leaving next morning for Honolulu . \n",
+ "2696 - \n",
+ "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
+ "2698 - \n",
+ "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ "\n",
+ " m1_accent_speaker \\\n",
+ "0 - \n",
+ "1 0011 \n",
+ "2 - \n",
+ "3 0011 \n",
+ "4 - \n",
+ "... ... \n",
+ "2695 0020 \n",
+ "2696 - \n",
+ "2697 0020 \n",
+ "2698 - \n",
+ "2699 0020 \n",
+ "\n",
+ " m1 \\\n",
+ "0 id_1 \n",
+ "1 generated_hifi/esd_tune_reversal/g_3164999/0011/angry/1.wav \n",
+ "2 id_4 \n",
+ "3 generated_hifi/esd_tune_reversal/g_3164999/0011/angry/10.wav \n",
+ "4 id_7 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/7.wav \n",
+ "2696 id_4045 \n",
+ "2697 generated_hifi/esd_tune/g_3164999/0020/surprise/8.wav \n",
+ "2698 id_4048 \n",
+ "2699 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wav \n",
+ "\n",
+ " m2 \\\n",
+ "0 id_2 \n",
+ "1 generated_hifi/esd_tune/g_3164999/0011/angry/1.wav \n",
+ "2 id_5 \n",
+ "3 generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/10.wav \n",
+ "4 id_8 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune/g_3164999/0020/surprise/7.wav \n",
+ "2696 id_4046 \n",
+ "2697 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/8.wav \n",
+ "2698 id_4049 \n",
+ "2699 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/9.wav \n",
+ "\n",
+ " m3 \\\n",
+ "0 id_3 \n",
+ "1 generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/1.wav \n",
+ "2 id_6 \n",
+ "3 generated_hifi/esd_tune/g_3164999/0011/angry/10.wav \n",
+ "4 id_9 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/7.wav \n",
+ "2696 id_4047 \n",
+ "2697 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/8.wav \n",
+ "2698 id_4050 \n",
+ "2699 generated_hifi/esd_tune/g_3164999/0020/surprise/9.wav \n",
+ "\n",
+ " m2_text \n",
+ "0 - \n",
+ "1 We got few vegetables and fruits , and became fish eaters . \n",
+ "2 - \n",
+ "3 Humans also judge distance by using the relative sizes of objects. \n",
+ "4 - \n",
+ "... ... \n",
+ "2695 The Claudine was leaving next morning for Honolulu . \n",
+ "2696 - \n",
+ "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
+ "2698 - \n",
+ "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ "\n",
+ "[2700 rows x 6 columns]"
+ ]
+ },
+ "execution_count": 13,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "def permute_wavs_and_fillna(df):\n",
+ "    \"\"\"Shuffle the model columns within each y_indices row of df, then return df with missing values as '-'.\"\"\"\n",
+ "    shuffled = df.loc[:, model_columns]\n",
+ "    # every row draws its own independent random order\n",
+ "    for row_pos in y_indices:\n",
+ "        shuffled.iloc[row_pos, :] = np.random.permutation(shuffled.iloc[row_pos, :])\n",
+ "    df.loc[:, model_columns] = shuffled\n",
+ "    return df.fillna('-')\n",
+ "\n",
+ "\n",
+ "df_permuted = permute_wavs_and_fillna(df_filtered)\n",
+ "df_permuted"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 14,
+ "id": "eef3b325-c26e-457a-b575-eb6b210aff7f",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "df_permuted.to_csv(\n",
+ " 'reports/eval_map.csv',\n",
+ " sep = \"\\t\",\n",
+ " header = False,\n",
+ " index = False,\n",
+ " quoting = csv.QUOTE_NONE\n",
+ ")"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 15,
+ "id": "d32630c2-aca7-4ee9-b44c-a949d0fd17c4",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "def columns_from_filenames(df, column_names):\n",
+ "    \"\"\"Return one list per column: Audio HTML for cells naming an existing path, the raw cell otherwise.\"\"\"\n",
+ "    def render(cell):\n",
+ "        return Audio(cell)._repr_html_() if Path(cell).exists() else cell\n",
+ "\n",
+ "    columns = [[render(cell) for cell in df[name]] for name in column_names]\n",
+ "    # column_names is passed through unchanged alongside the rendered columns\n",
+ "    return columns, column_names"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 16,
+ "id": "2c11c3ca-abe4-4bbd-930f-8a4f62c9dc8f",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "def make_table(columns, column_names):\n",
+ "    \"\"\"Render columns as an HTML table with a header row of column_names; return it wrapped in HTML().\"\"\"\n",
+ "    header_cells = \"\\n\".join([f\"<th>{name}</th>\" for name in column_names])\n",
+ "    table_rows = [f\"<tr>{header_cells}</tr>\"]\n",
+ "    # zip(*columns) turns the per-column lists into per-row tuples\n",
+ "    for row in zip(*columns):\n",
+ "        cells = \"\\n\".join([f\"<td>{elem}</td>\" for elem in row])\n",
+ "        table_rows.append(f'<tr>{cells}</tr>')\n",
+ "\n",
+ "    content = \"\\n\".join(table_rows)\n",
+ "    # cell values are inserted verbatim (no escaping), so HTML inside a cell is rendered\n",
+ "    table_html = f'<table>{content}</table>'\n",
+ "\n",
+ "    html = HTML(table_html)\n",
+ "    # display(html)\n",
+ "    return html"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 17,
+ "id": "11d84c76-841a-4215-a45f-268076e4ae21",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "def make_table_from_df(df, column_names):\n",
+ "    \"\"\"Render the named columns of df (via columns_from_filenames) as one HTML table.\"\"\"\n",
+ "    return make_table(*columns_from_filenames(df, column_names))"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 18,
+ "id": "26b577fe-3957-4902-8758-e5501f5d81a0",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "column_names = df_permuted.columns\n",
+ "chunk_size = 100"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 19,
+ "id": "f37b7fb3-93eb-448c-a8a3-a23cb0d165ae",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "output_folder = Path('reports/html')\n",
+ "output_folder.mkdir(parents=True, exist_ok=True)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 20,
+ "id": "24aef771-215a-4fe6-82cb-1ff375681189",
+ "metadata": {
+ "scrolled": true,
+ "tags": []
+ },
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "0 100\n",
+ "reports/html/nat_vctk_esd_tune_test_1.html\n",
+ "100 200\n",
+ "reports/html/nat_vctk_esd_tune_test_2.html\n",
+ "200 300\n",
+ "reports/html/nat_vctk_esd_tune_test_3.html\n",
+ "300 400\n",
+ "reports/html/nat_vctk_esd_tune_test_4.html\n",
+ "400 500\n",
+ "reports/html/nat_vctk_esd_tune_test_5.html\n",
+ "500 600\n",
+ "reports/html/nat_vctk_esd_tune_test_6.html\n",
+ "600 700\n",
+ "reports/html/nat_vctk_esd_tune_test_7.html\n",
+ "700 800\n",
+ "reports/html/nat_vctk_esd_tune_test_8.html\n",
+ "800 900\n",
+ "reports/html/nat_vctk_esd_tune_test_9.html\n",
+ "900 1000\n",
+ "reports/html/nat_vctk_esd_tune_test_10.html\n",
+ "1000 1100\n",
+ "reports/html/nat_vctk_esd_tune_test_11.html\n",
+ "1100 1200\n",
+ "reports/html/nat_vctk_esd_tune_test_12.html\n",
+ "1200 1300\n",
+ "reports/html/nat_vctk_esd_tune_test_13.html\n",
+ "1300 1400\n",
+ "reports/html/nat_vctk_esd_tune_test_14.html\n",
+ "1400 1500\n",
+ "reports/html/nat_vctk_esd_tune_test_15.html\n",
+ "1500 1600\n",
+ "reports/html/nat_vctk_esd_tune_test_16.html\n",
+ "1600 1700\n",
+ "reports/html/nat_vctk_esd_tune_test_17.html\n",
+ "1700 1800\n",
+ "reports/html/nat_vctk_esd_tune_test_18.html\n",
+ "1800 1900\n",
+ "reports/html/nat_vctk_esd_tune_test_19.html\n",
+ "1900 2000\n",
+ "reports/html/nat_vctk_esd_tune_test_20.html\n",
+ "2000 2100\n",
+ "reports/html/nat_vctk_esd_tune_test_21.html\n",
+ "2100 2200\n",
+ "reports/html/nat_vctk_esd_tune_test_22.html\n",
+ "2200 2300\n",
+ "reports/html/nat_vctk_esd_tune_test_23.html\n",
+ "2300 2400\n",
+ "reports/html/nat_vctk_esd_tune_test_24.html\n",
+ "2400 2500\n",
+ "reports/html/nat_vctk_esd_tune_test_25.html\n",
+ "2500 2600\n",
+ "reports/html/nat_vctk_esd_tune_test_26.html\n",
+ "2600 2700\n",
+ "reports/html/nat_vctk_esd_tune_test_27.html\n"
+ ]
+ }
+ ],
+ "source": [
+ "def create_htmls(df, column_names, chunk_size):\n",
+ "    \"\"\"Write df as numbered HTML report files in output_folder, chunk_size rows per file.\"\"\"\n",
+ "    # a non-positive size could never advance through df, so reject it up front\n",
+ "    if chunk_size <= 0:\n",
+ "        raise ValueError(f\"chunk_size must be positive, got {chunk_size}\")\n",
+ "    experiment_prefix = \"nat_vctk_esd_tune_test_\"\n",
+ "    # files are numbered from 1; the last one may hold fewer than chunk_size rows\n",
+ "    for chunk_number, start in enumerate(range(0, len(df), chunk_size), start=1):\n",
+ "        end = min(start + chunk_size, len(df))\n",
+ "        print(start, end)\n",
+ "        df_chunk = df.iloc[start:end, :]\n",
+ "        final_html = make_table_from_df(df_chunk, column_names)\n",
+ "        f_html = output_folder / f\"{experiment_prefix}{chunk_number}.html\"\n",
+ "        print(f_html)\n",
+ "        # explicit encoding keeps the written files independent of the platform default\n",
+ "        with open(f_html, 'w', encoding='utf-8') as f:\n",
+ "            f.write(final_html.data)\n",
+ "\n",
+ "\n",
+ "create_htmls(df_permuted, column_names, chunk_size)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 21,
+ "id": "49a60285-31bf-4263-9162-c3d928aa9068",
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "reports/scores/scores.csv\n",
+ "reports/scores/scores.xlsx\n"
+ ]
+ }
+ ],
+ "source": [
+ "def create_scores_file(df, output_dir):\n",
+ "    \"\"\"Blank the model cells of the y_indices rows in df (in place), then save df as scores.csv and scores.xlsx.\"\"\"\n",
+ "    output_dir = Path(output_dir)\n",
+ "    output_dir.mkdir(exist_ok=True, parents=True)\n",
+ "\n",
+ "    for k in model2folder:\n",
+ "        # single positional write; chained df[k].iloc[...] = ... may assign to a temporary copy\n",
+ "        df.iloc[y_indices, df.columns.get_loc(k)] = ''\n",
+ "\n",
+ "    csv_path = output_dir / \"scores.csv\"\n",
+ "    df.to_csv(\n",
+ "        csv_path,\n",
+ "        sep=\"\\t\",\n",
+ "        header=True,\n",
+ "        index=False,\n",
+ "        quoting=csv.QUOTE_NONE,\n",
+ "    )\n",
+ "\n",
+ "    excel_path = output_dir / \"scores.xlsx\"\n",
+ "    df.to_excel(excel_path)\n",
+ "    print(csv_path)\n",
+ "    print(excel_path)\n",
+ "\n",
+ "\n",
+ "create_scores_file(df_permuted, \"reports/scores\")"
+ ]
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "Python 3 (ipykernel)",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.8.12"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
From f1996df97f4dd40fa46f84cd207e9de1a8e423ef Mon Sep 17 00:00:00 2001
From: ruk0sh <43880105+ruk0sh@users.noreply.github.com>
Date: Thu, 5 May 2022 13:07:27 +0300
Subject: [PATCH 13/17] Add notebook for analyzing gathered MOS/pref scores.
---
analyze_scores.ipynb | 13171 +++++++++++++++++++++++++++++++++++++++++
1 file changed, 13171 insertions(+)
create mode 100644 analyze_scores.ipynb
diff --git a/analyze_scores.ipynb b/analyze_scores.ipynb
new file mode 100644
index 0000000..e62b14a
--- /dev/null
+++ b/analyze_scores.ipynb
@@ -0,0 +1,13171 @@
+{
+ "cells": [
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "id": "9169e316-80c7-460e-86d1-bca78ce044d3",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "import csv\n",
+ "from pathlib import Path\n",
+ "\n",
+ "import numpy as np\n",
+ "import pandas as pd"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "id": "9573a7f9-058c-47af-9af1-50fb4d454abb",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "pd.set_option('display.max_colwidth', None)\n",
+ "pd.set_option('display.colheader_justify', 'center')"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 3,
+ "id": "a199810d-893f-494d-b560-a1a82612bd13",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "SAMPLE_AUDIO_PATH = \"generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wav\"\n",
+ "EVAL_MAP_PATH = \"reports/eval_map.csv\"\n",
+ "SCORES_PATH = \"data/scores_results.xlsx\""
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "id": "ac502266-1c5e-4dce-add2-a57d107571ed",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "## NOTE: all model keys need to be composed of a single letter followed by a number\n",
+ "model2folder = {\n",
+ " \"m1\": 'generated_hifi/esd_tune/g_3164999',\n",
+ " \"m2\": 'generated_hifi/esd_tune_reversal/g_3164999',\n",
+ " \"m3\": 'generated_hifi/esd_tune_advloss0/g_3164999',\n",
+ "}"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 5,
+ "id": "b79125a1-4e4a-483a-a498-ea95ed0eb61d",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'generated_hifi/esd_tune/g_3164999': 'm1',\n",
+ " 'generated_hifi/esd_tune_reversal/g_3164999': 'm2',\n",
+ " 'generated_hifi/esd_tune_advloss0/g_3164999': 'm3'}"
+ ]
+ },
+ "execution_count": 5,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "folder2model = {v: k for k, v in model2folder.items()}\n",
+ "folder2model"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 6,
+ "id": "8a2711f2-14ea-48f8-b8a4-bd6e5d845a0d",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " 0 | \n",
+ " 1 | \n",
+ " 2 | \n",
+ " 3 | \n",
+ " 4 | \n",
+ " 5 | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " | 0 | \n",
+ " - | \n",
+ " - | \n",
+ " id_1 | \n",
+ " id_2 | \n",
+ " id_3 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | 1 | \n",
+ " We got few vegetables and fruits , and became fish eaters . | \n",
+ " 0011 | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune/g_3164999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/1.wav | \n",
+ " We got few vegetables and fruits , and became fish eaters . | \n",
+ "
\n",
+ " \n",
+ " | 2 | \n",
+ " - | \n",
+ " - | \n",
+ " id_4 | \n",
+ " id_5 | \n",
+ " id_6 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | 3 | \n",
+ " Humans also judge distance by using the relative sizes of objects. | \n",
+ " 0011 | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune/g_3164999/0011/angry/10.wav | \n",
+ " Humans also judge distance by using the relative sizes of objects. | \n",
+ "
\n",
+ " \n",
+ " | 4 | \n",
+ " - | \n",
+ " - | \n",
+ " id_7 | \n",
+ " id_8 | \n",
+ " id_9 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " | 2695 | \n",
+ " The Claudine was leaving next morning for Honolulu . | \n",
+ " 0020 | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune/g_3164999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/7.wav | \n",
+ " The Claudine was leaving next morning for Honolulu . | \n",
+ "
\n",
+ " \n",
+ " | 2696 | \n",
+ " - | \n",
+ " - | \n",
+ " id_4045 | \n",
+ " id_4046 | \n",
+ " id_4047 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | 2697 | \n",
+ " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ " 0020 | \n",
+ " generated_hifi/esd_tune/g_3164999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/8.wav | \n",
+ " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ "
\n",
+ " \n",
+ " | 2698 | \n",
+ " - | \n",
+ " - | \n",
+ " id_4048 | \n",
+ " id_4049 | \n",
+ " id_4050 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | 2699 | \n",
+ " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ " 0020 | \n",
+ " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune/g_3164999/0020/surprise/9.wav | \n",
+ " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
2700 rows × 6 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " 0 \\\n",
+ "0 - \n",
+ "1 We got few vegetables and fruits , and became fish eaters . \n",
+ "2 - \n",
+ "3 Humans also judge distance by using the relative sizes of objects. \n",
+ "4 - \n",
+ "... ... \n",
+ "2695 The Claudine was leaving next morning for Honolulu . \n",
+ "2696 - \n",
+ "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
+ "2698 - \n",
+ "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ "\n",
+ " 1 2 \\\n",
+ "0 - id_1 \n",
+ "1 0011 generated_hifi/esd_tune_reversal/g_3164999/0011/angry/1.wav \n",
+ "2 - id_4 \n",
+ "3 0011 generated_hifi/esd_tune_reversal/g_3164999/0011/angry/10.wav \n",
+ "4 - id_7 \n",
+ "... ... ... \n",
+ "2695 0020 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/7.wav \n",
+ "2696 - id_4045 \n",
+ "2697 0020 generated_hifi/esd_tune/g_3164999/0020/surprise/8.wav \n",
+ "2698 - id_4048 \n",
+ "2699 0020 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wav \n",
+ "\n",
+ " 3 \\\n",
+ "0 id_2 \n",
+ "1 generated_hifi/esd_tune/g_3164999/0011/angry/1.wav \n",
+ "2 id_5 \n",
+ "3 generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/10.wav \n",
+ "4 id_8 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune/g_3164999/0020/surprise/7.wav \n",
+ "2696 id_4046 \n",
+ "2697 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/8.wav \n",
+ "2698 id_4049 \n",
+ "2699 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/9.wav \n",
+ "\n",
+ " 4 \\\n",
+ "0 id_3 \n",
+ "1 generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/1.wav \n",
+ "2 id_6 \n",
+ "3 generated_hifi/esd_tune/g_3164999/0011/angry/10.wav \n",
+ "4 id_9 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/7.wav \n",
+ "2696 id_4047 \n",
+ "2697 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/8.wav \n",
+ "2698 id_4050 \n",
+ "2699 generated_hifi/esd_tune/g_3164999/0020/surprise/9.wav \n",
+ "\n",
+ " 5 \n",
+ "0 - \n",
+ "1 We got few vegetables and fruits , and became fish eaters . \n",
+ "2 - \n",
+ "3 Humans also judge distance by using the relative sizes of objects. \n",
+ "4 - \n",
+ "... ... \n",
+ "2695 The Claudine was leaving next morning for Honolulu . \n",
+ "2696 - \n",
+ "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
+ "2698 - \n",
+ "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ "\n",
+ "[2700 rows x 6 columns]"
+ ]
+ },
+ "execution_count": 6,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "df_map = pd.read_csv(\n",
+ " EVAL_MAP_PATH,\n",
+ " sep = \"\\t\",\n",
+ " header = None,\n",
+ " quoting = csv.QUOTE_NONE,\n",
+ ")\n",
+ "\n",
+ "df_map"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 7,
+ "id": "cb751630-b2aa-41e4-a8ad-333c4c514c4e",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'model': 'm3', 'sent_id': 9, 'speaker': '0020', 'accent': None}"
+ ]
+ },
+ "execution_count": 7,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "def get_audio_details(f):\n",
+ "    \"\"\"Parse <model folder>/<speaker>/<subfolder>/<sentence id>.wav into a details dict.\"\"\"\n",
+ "    f_path = Path(f)\n",
+ "    # two levels above the file is the speaker directory; its parent is the model folder\n",
+ "    speaker_dir = f_path.parent.parent\n",
+ "    return {\n",
+ "        # a KeyError here means the path is not under a folder listed in folder2model\n",
+ "        'model': folder2model[str(speaker_dir.parent)],\n",
+ "        'sent_id': int(f_path.stem),\n",
+ "        'speaker': speaker_dir.name,\n",
+ "        # no accent information is derived from the path\n",
+ "        'accent': None\n",
+ "    }\n",
+ "\n",
+ "\n",
+ "get_audio_details(SAMPLE_AUDIO_PATH)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 8,
+ "id": "0e1d24c8-b8a8-4dfe-a5b1-e390dbf939bd",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "def process_cell(f):\n",
+ "    \"\"\"Return the parsed audio details when f names an existing path, otherwise f itself.\"\"\"\n",
+ "    # cells that are not existing paths (ids, text, '-') are returned untouched\n",
+ "    return get_audio_details(f) if Path(f).exists() else f"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 9,
+ "id": "b016e6c7-a310-443b-83ca-6b477d5efb3d",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " text_left | \n",
+ " speaker | \n",
+ " m1 | \n",
+ " m2 | \n",
+ " m3 | \n",
+ " text_right | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " | 0 | \n",
+ " - | \n",
+ " - | \n",
+ " id_1 | \n",
+ " id_2 | \n",
+ " id_3 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | 1 | \n",
+ " We got few vegetables and fruits , and became fish eaters . | \n",
+ " 0011 | \n",
+ " {'model': 'm2', 'sent_id': 1, 'speaker': '0011', 'accent': None} | \n",
+ " {'model': 'm1', 'sent_id': 1, 'speaker': '0011', 'accent': None} | \n",
+ " {'model': 'm3', 'sent_id': 1, 'speaker': '0011', 'accent': None} | \n",
+ " We got few vegetables and fruits , and became fish eaters . | \n",
+ "
\n",
+ " \n",
+ " | 2 | \n",
+ " - | \n",
+ " - | \n",
+ " id_4 | \n",
+ " id_5 | \n",
+ " id_6 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | 3 | \n",
+ " Humans also judge distance by using the relative sizes of objects. | \n",
+ " 0011 | \n",
+ " {'model': 'm2', 'sent_id': 10, 'speaker': '0011', 'accent': None} | \n",
+ " {'model': 'm3', 'sent_id': 10, 'speaker': '0011', 'accent': None} | \n",
+ " {'model': 'm1', 'sent_id': 10, 'speaker': '0011', 'accent': None} | \n",
+ " Humans also judge distance by using the relative sizes of objects. | \n",
+ "
\n",
+ " \n",
+ " | 4 | \n",
+ " - | \n",
+ " - | \n",
+ " id_7 | \n",
+ " id_8 | \n",
+ " id_9 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " | 2695 | \n",
+ " The Claudine was leaving next morning for Honolulu . | \n",
+ " 0020 | \n",
+ " {'model': 'm2', 'sent_id': 7, 'speaker': '0020', 'accent': None} | \n",
+ " {'model': 'm1', 'sent_id': 7, 'speaker': '0020', 'accent': None} | \n",
+ " {'model': 'm3', 'sent_id': 7, 'speaker': '0020', 'accent': None} | \n",
+ " The Claudine was leaving next morning for Honolulu . | \n",
+ "
\n",
+ " \n",
+ " | 2696 | \n",
+ " - | \n",
+ " - | \n",
+ " id_4045 | \n",
+ " id_4046 | \n",
+ " id_4047 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | 2697 | \n",
+ " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ " 0020 | \n",
+ " {'model': 'm1', 'sent_id': 8, 'speaker': '0020', 'accent': None} | \n",
+ " {'model': 'm2', 'sent_id': 8, 'speaker': '0020', 'accent': None} | \n",
+ " {'model': 'm3', 'sent_id': 8, 'speaker': '0020', 'accent': None} | \n",
+ " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ "
\n",
+ " \n",
+ " | 2698 | \n",
+ " - | \n",
+ " - | \n",
+ " id_4048 | \n",
+ " id_4049 | \n",
+ " id_4050 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | 2699 | \n",
+ " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ " 0020 | \n",
+ " {'model': 'm3', 'sent_id': 9, 'speaker': '0020', 'accent': None} | \n",
+ " {'model': 'm2', 'sent_id': 9, 'speaker': '0020', 'accent': None} | \n",
+ " {'model': 'm1', 'sent_id': 9, 'speaker': '0020', 'accent': None} | \n",
+ " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
2700 rows × 6 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " text_left \\\n",
+ "0 - \n",
+ "1 We got few vegetables and fruits , and became fish eaters . \n",
+ "2 - \n",
+ "3 Humans also judge distance by using the relative sizes of objects. \n",
+ "4 - \n",
+ "... ... \n",
+ "2695 The Claudine was leaving next morning for Honolulu . \n",
+ "2696 - \n",
+ "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
+ "2698 - \n",
+ "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ "\n",
+ " speaker \\\n",
+ "0 - \n",
+ "1 0011 \n",
+ "2 - \n",
+ "3 0011 \n",
+ "4 - \n",
+ "... ... \n",
+ "2695 0020 \n",
+ "2696 - \n",
+ "2697 0020 \n",
+ "2698 - \n",
+ "2699 0020 \n",
+ "\n",
+ " m1 \\\n",
+ "0 id_1 \n",
+ "1 {'model': 'm2', 'sent_id': 1, 'speaker': '0011', 'accent': None} \n",
+ "2 id_4 \n",
+ "3 {'model': 'm2', 'sent_id': 10, 'speaker': '0011', 'accent': None} \n",
+ "4 id_7 \n",
+ "... ... \n",
+ "2695 {'model': 'm2', 'sent_id': 7, 'speaker': '0020', 'accent': None} \n",
+ "2696 id_4045 \n",
+ "2697 {'model': 'm1', 'sent_id': 8, 'speaker': '0020', 'accent': None} \n",
+ "2698 id_4048 \n",
+ "2699 {'model': 'm3', 'sent_id': 9, 'speaker': '0020', 'accent': None} \n",
+ "\n",
+ " m2 \\\n",
+ "0 id_2 \n",
+ "1 {'model': 'm1', 'sent_id': 1, 'speaker': '0011', 'accent': None} \n",
+ "2 id_5 \n",
+ "3 {'model': 'm3', 'sent_id': 10, 'speaker': '0011', 'accent': None} \n",
+ "4 id_8 \n",
+ "... ... \n",
+ "2695 {'model': 'm1', 'sent_id': 7, 'speaker': '0020', 'accent': None} \n",
+ "2696 id_4046 \n",
+ "2697 {'model': 'm2', 'sent_id': 8, 'speaker': '0020', 'accent': None} \n",
+ "2698 id_4049 \n",
+ "2699 {'model': 'm2', 'sent_id': 9, 'speaker': '0020', 'accent': None} \n",
+ "\n",
+ " m3 \\\n",
+ "0 id_3 \n",
+ "1 {'model': 'm3', 'sent_id': 1, 'speaker': '0011', 'accent': None} \n",
+ "2 id_6 \n",
+ "3 {'model': 'm1', 'sent_id': 10, 'speaker': '0011', 'accent': None} \n",
+ "4 id_9 \n",
+ "... ... \n",
+ "2695 {'model': 'm3', 'sent_id': 7, 'speaker': '0020', 'accent': None} \n",
+ "2696 id_4047 \n",
+ "2697 {'model': 'm3', 'sent_id': 8, 'speaker': '0020', 'accent': None} \n",
+ "2698 id_4050 \n",
+ "2699 {'model': 'm1', 'sent_id': 9, 'speaker': '0020', 'accent': None} \n",
+ "\n",
+ " text_right \n",
+ "0 - \n",
+ "1 We got few vegetables and fruits , and became fish eaters . \n",
+ "2 - \n",
+ "3 Humans also judge distance by using the relative sizes of objects. \n",
+ "4 - \n",
+ "... ... \n",
+ "2695 The Claudine was leaving next morning for Honolulu . \n",
+ "2696 - \n",
+ "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
+ "2698 - \n",
+ "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ "\n",
+ "[2700 rows x 6 columns]"
+ ]
+ },
+ "execution_count": 9,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "df_detailed = df_map.applymap(lambda f: process_cell(f))\n",
+ "df_detailed.columns = ['text_left', 'speaker', 'm1', 'm2', 'm3', 'text_right']\n",
+ "df_detailed"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 10,
+ "id": "16a4bd24-b5e8-4762-98b5-62c38ca5f72e",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "3"
+ ]
+ },
+ "execution_count": 10,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "total_K_models = len(model2folder)\n",
+ "total_K_models"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 11,
+ "id": "b1184636-00f8-4ab7-a9d3-629095c56876",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "1350"
+ ]
+ },
+ "execution_count": 11,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "total_wavs_per_model = int(len(df_map) / 2)\n",
+ "total_wavs_per_model"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 12,
+ "id": "85b862ab-fd48-45cf-af1e-78e26c9183e4",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "x_range = np.array(list(range(total_wavs_per_model)))\n",
+ "x_indices = x_range * 2\n",
+ "y_indices = x_range * 2 + 1"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 13,
+ "id": "9bd825c9-5b4e-4e62-a1b3-63c1208a78ae",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "0 id_1\n",
+ "2 id_4\n",
+ "4 id_7\n",
+ "6 id_10\n",
+ "8 id_13\n",
+ " ... \n",
+ "2690 id_4036\n",
+ "2692 id_4039\n",
+ "2694 id_4042\n",
+ "2696 id_4045\n",
+ "2698 id_4048\n",
+ "Name: m1, Length: 1350, dtype: object"
+ ]
+ },
+ "execution_count": 13,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "m1_indices = df_detailed['m1'].iloc[x_indices]\n",
+ "m2_indices = df_detailed['m2'].iloc[x_indices]\n",
+ "m3_indices = df_detailed['m3'].iloc[x_indices]\n",
+ "m1_indices"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 14,
+ "id": "bbac06d5-fcb6-457c-ac87-557c9634bd1e",
+ "metadata": {
+ "scrolled": true,
+ "tags": []
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'id_1': {'model': 'm2', 'sent_id': 1, 'speaker': '0011', 'accent': None},\n",
+ " 'id_4': {'model': 'm2', 'sent_id': 10, 'speaker': '0011', 'accent': None},\n",
+ " 'id_7': {'model': 'm1', 'sent_id': 11, 'speaker': '0011', 'accent': None},\n",
+ " 'id_10': {'model': 'm1', 'sent_id': 12, 'speaker': '0011', 'accent': None},\n",
+ " 'id_13': {'model': 'm3', 'sent_id': 13, 'speaker': '0011', 'accent': None},\n",
+ " 'id_16': {'model': 'm3', 'sent_id': 14, 'speaker': '0011', 'accent': None},\n",
+ " 'id_19': {'model': 'm1', 'sent_id': 15, 'speaker': '0011', 'accent': None},\n",
+ " 'id_22': {'model': 'm3', 'sent_id': 16, 'speaker': '0011', 'accent': None},\n",
+ " 'id_25': {'model': 'm1', 'sent_id': 17, 'speaker': '0011', 'accent': None},\n",
+ " 'id_28': {'model': 'm3', 'sent_id': 18, 'speaker': '0011', 'accent': None},\n",
+ " 'id_31': {'model': 'm1', 'sent_id': 19, 'speaker': '0011', 'accent': None},\n",
+ " 'id_34': {'model': 'm3', 'sent_id': 2, 'speaker': '0011', 'accent': None},\n",
+ " 'id_37': {'model': 'm3', 'sent_id': 20, 'speaker': '0011', 'accent': None},\n",
+ " 'id_40': {'model': 'm3', 'sent_id': 21, 'speaker': '0011', 'accent': None},\n",
+ " 'id_43': {'model': 'm3', 'sent_id': 22, 'speaker': '0011', 'accent': None},\n",
+ " 'id_46': {'model': 'm2', 'sent_id': 23, 'speaker': '0011', 'accent': None},\n",
+ " 'id_49': {'model': 'm3', 'sent_id': 24, 'speaker': '0011', 'accent': None},\n",
+ " 'id_52': {'model': 'm2', 'sent_id': 25, 'speaker': '0011', 'accent': None},\n",
+ " 'id_55': {'model': 'm3', 'sent_id': 26, 'speaker': '0011', 'accent': None},\n",
+ " 'id_58': {'model': 'm1', 'sent_id': 27, 'speaker': '0011', 'accent': None},\n",
+ " 'id_61': {'model': 'm1', 'sent_id': 28, 'speaker': '0011', 'accent': None},\n",
+ " 'id_64': {'model': 'm2', 'sent_id': 29, 'speaker': '0011', 'accent': None},\n",
+ " 'id_67': {'model': 'm3', 'sent_id': 3, 'speaker': '0011', 'accent': None},\n",
+ " 'id_70': {'model': 'm2', 'sent_id': 30, 'speaker': '0011', 'accent': None},\n",
+ " 'id_73': {'model': 'm3', 'sent_id': 4, 'speaker': '0011', 'accent': None},\n",
+ " 'id_76': {'model': 'm3', 'sent_id': 5, 'speaker': '0011', 'accent': None},\n",
+ " 'id_79': {'model': 'm1', 'sent_id': 6, 'speaker': '0011', 'accent': None},\n",
+ " 'id_82': {'model': 'm1', 'sent_id': 7, 'speaker': '0011', 'accent': None},\n",
+ " 'id_85': {'model': 'm3', 'sent_id': 8, 'speaker': '0011', 'accent': None},\n",
+ " 'id_88': {'model': 'm1', 'sent_id': 9, 'speaker': '0011', 'accent': None},\n",
+ " 'id_91': {'model': 'm2', 'sent_id': 1, 'speaker': '0011', 'accent': None},\n",
+ " 'id_94': {'model': 'm1', 'sent_id': 10, 'speaker': '0011', 'accent': None},\n",
+ " 'id_97': {'model': 'm3', 'sent_id': 11, 'speaker': '0011', 'accent': None},\n",
+ " 'id_100': {'model': 'm3', 'sent_id': 12, 'speaker': '0011', 'accent': None},\n",
+ " 'id_103': {'model': 'm3', 'sent_id': 13, 'speaker': '0011', 'accent': None},\n",
+ " 'id_106': {'model': 'm1', 'sent_id': 14, 'speaker': '0011', 'accent': None},\n",
+ " 'id_109': {'model': 'm2', 'sent_id': 15, 'speaker': '0011', 'accent': None},\n",
+ " 'id_112': {'model': 'm1', 'sent_id': 16, 'speaker': '0011', 'accent': None},\n",
+ " 'id_115': {'model': 'm3', 'sent_id': 17, 'speaker': '0011', 'accent': None},\n",
+ " 'id_118': {'model': 'm2', 'sent_id': 18, 'speaker': '0011', 'accent': None},\n",
+ " 'id_121': {'model': 'm2', 'sent_id': 19, 'speaker': '0011', 'accent': None},\n",
+ " 'id_124': {'model': 'm3', 'sent_id': 2, 'speaker': '0011', 'accent': None},\n",
+ " 'id_127': {'model': 'm1', 'sent_id': 20, 'speaker': '0011', 'accent': None},\n",
+ " 'id_130': {'model': 'm3', 'sent_id': 21, 'speaker': '0011', 'accent': None},\n",
+ " 'id_133': {'model': 'm3', 'sent_id': 22, 'speaker': '0011', 'accent': None},\n",
+ " 'id_136': {'model': 'm2', 'sent_id': 23, 'speaker': '0011', 'accent': None},\n",
+ " 'id_139': {'model': 'm1', 'sent_id': 24, 'speaker': '0011', 'accent': None},\n",
+ " 'id_142': {'model': 'm1', 'sent_id': 25, 'speaker': '0011', 'accent': None},\n",
+ " 'id_145': {'model': 'm2', 'sent_id': 26, 'speaker': '0011', 'accent': None},\n",
+ " 'id_148': {'model': 'm2', 'sent_id': 27, 'speaker': '0011', 'accent': None},\n",
+ " 'id_151': {'model': 'm2', 'sent_id': 28, 'speaker': '0011', 'accent': None},\n",
+ " 'id_154': {'model': 'm1', 'sent_id': 29, 'speaker': '0011', 'accent': None},\n",
+ " 'id_157': {'model': 'm2', 'sent_id': 3, 'speaker': '0011', 'accent': None},\n",
+ " 'id_160': {'model': 'm3', 'sent_id': 30, 'speaker': '0011', 'accent': None},\n",
+ " 'id_163': {'model': 'm3', 'sent_id': 4, 'speaker': '0011', 'accent': None},\n",
+ " 'id_166': {'model': 'm1', 'sent_id': 5, 'speaker': '0011', 'accent': None},\n",
+ " 'id_169': {'model': 'm2', 'sent_id': 6, 'speaker': '0011', 'accent': None},\n",
+ " 'id_172': {'model': 'm1', 'sent_id': 7, 'speaker': '0011', 'accent': None},\n",
+ " 'id_175': {'model': 'm3', 'sent_id': 8, 'speaker': '0011', 'accent': None},\n",
+ " 'id_178': {'model': 'm3', 'sent_id': 9, 'speaker': '0011', 'accent': None},\n",
+ " 'id_181': {'model': 'm3', 'sent_id': 1, 'speaker': '0011', 'accent': None},\n",
+ " 'id_184': {'model': 'm2', 'sent_id': 10, 'speaker': '0011', 'accent': None},\n",
+ " 'id_187': {'model': 'm2', 'sent_id': 11, 'speaker': '0011', 'accent': None},\n",
+ " 'id_190': {'model': 'm2', 'sent_id': 12, 'speaker': '0011', 'accent': None},\n",
+ " 'id_193': {'model': 'm3', 'sent_id': 13, 'speaker': '0011', 'accent': None},\n",
+ " 'id_196': {'model': 'm2', 'sent_id': 14, 'speaker': '0011', 'accent': None},\n",
+ " 'id_199': {'model': 'm1', 'sent_id': 15, 'speaker': '0011', 'accent': None},\n",
+ " 'id_202': {'model': 'm1', 'sent_id': 16, 'speaker': '0011', 'accent': None},\n",
+ " 'id_205': {'model': 'm2', 'sent_id': 17, 'speaker': '0011', 'accent': None},\n",
+ " 'id_208': {'model': 'm3', 'sent_id': 18, 'speaker': '0011', 'accent': None},\n",
+ " 'id_211': {'model': 'm2', 'sent_id': 19, 'speaker': '0011', 'accent': None},\n",
+ " 'id_214': {'model': 'm3', 'sent_id': 2, 'speaker': '0011', 'accent': None},\n",
+ " 'id_217': {'model': 'm3', 'sent_id': 20, 'speaker': '0011', 'accent': None},\n",
+ " 'id_220': {'model': 'm2', 'sent_id': 21, 'speaker': '0011', 'accent': None},\n",
+ " 'id_223': {'model': 'm3', 'sent_id': 22, 'speaker': '0011', 'accent': None},\n",
+ " 'id_226': {'model': 'm3', 'sent_id': 23, 'speaker': '0011', 'accent': None},\n",
+ " 'id_229': {'model': 'm1', 'sent_id': 24, 'speaker': '0011', 'accent': None},\n",
+ " 'id_232': {'model': 'm1', 'sent_id': 25, 'speaker': '0011', 'accent': None},\n",
+ " 'id_235': {'model': 'm1', 'sent_id': 26, 'speaker': '0011', 'accent': None},\n",
+ " 'id_238': {'model': 'm1', 'sent_id': 27, 'speaker': '0011', 'accent': None},\n",
+ " 'id_241': {'model': 'm3', 'sent_id': 28, 'speaker': '0011', 'accent': None},\n",
+ " 'id_244': {'model': 'm2', 'sent_id': 29, 'speaker': '0011', 'accent': None},\n",
+ " 'id_247': {'model': 'm1', 'sent_id': 3, 'speaker': '0011', 'accent': None},\n",
+ " 'id_250': {'model': 'm2', 'sent_id': 30, 'speaker': '0011', 'accent': None},\n",
+ " 'id_253': {'model': 'm3', 'sent_id': 4, 'speaker': '0011', 'accent': None},\n",
+ " 'id_256': {'model': 'm3', 'sent_id': 5, 'speaker': '0011', 'accent': None},\n",
+ " 'id_259': {'model': 'm3', 'sent_id': 6, 'speaker': '0011', 'accent': None},\n",
+ " 'id_262': {'model': 'm1', 'sent_id': 7, 'speaker': '0011', 'accent': None},\n",
+ " 'id_265': {'model': 'm1', 'sent_id': 8, 'speaker': '0011', 'accent': None},\n",
+ " 'id_268': {'model': 'm2', 'sent_id': 9, 'speaker': '0011', 'accent': None},\n",
+ " 'id_271': {'model': 'm2', 'sent_id': 1, 'speaker': '0011', 'accent': None},\n",
+ " 'id_274': {'model': 'm3', 'sent_id': 10, 'speaker': '0011', 'accent': None},\n",
+ " 'id_277': {'model': 'm3', 'sent_id': 11, 'speaker': '0011', 'accent': None},\n",
+ " 'id_280': {'model': 'm1', 'sent_id': 12, 'speaker': '0011', 'accent': None},\n",
+ " 'id_283': {'model': 'm1', 'sent_id': 13, 'speaker': '0011', 'accent': None},\n",
+ " 'id_286': {'model': 'm1', 'sent_id': 14, 'speaker': '0011', 'accent': None},\n",
+ " 'id_289': {'model': 'm1', 'sent_id': 15, 'speaker': '0011', 'accent': None},\n",
+ " 'id_292': {'model': 'm3', 'sent_id': 16, 'speaker': '0011', 'accent': None},\n",
+ " 'id_295': {'model': 'm3', 'sent_id': 17, 'speaker': '0011', 'accent': None},\n",
+ " 'id_298': {'model': 'm1', 'sent_id': 18, 'speaker': '0011', 'accent': None},\n",
+ " 'id_301': {'model': 'm2', 'sent_id': 19, 'speaker': '0011', 'accent': None},\n",
+ " 'id_304': {'model': 'm2', 'sent_id': 2, 'speaker': '0011', 'accent': None},\n",
+ " 'id_307': {'model': 'm2', 'sent_id': 20, 'speaker': '0011', 'accent': None},\n",
+ " 'id_310': {'model': 'm3', 'sent_id': 21, 'speaker': '0011', 'accent': None},\n",
+ " 'id_313': {'model': 'm3', 'sent_id': 22, 'speaker': '0011', 'accent': None},\n",
+ " 'id_316': {'model': 'm3', 'sent_id': 23, 'speaker': '0011', 'accent': None},\n",
+ " 'id_319': {'model': 'm1', 'sent_id': 24, 'speaker': '0011', 'accent': None},\n",
+ " 'id_322': {'model': 'm2', 'sent_id': 25, 'speaker': '0011', 'accent': None},\n",
+ " 'id_325': {'model': 'm2', 'sent_id': 26, 'speaker': '0011', 'accent': None},\n",
+ " 'id_328': {'model': 'm2', 'sent_id': 27, 'speaker': '0011', 'accent': None},\n",
+ " 'id_331': {'model': 'm2', 'sent_id': 28, 'speaker': '0011', 'accent': None},\n",
+ " 'id_334': {'model': 'm1', 'sent_id': 29, 'speaker': '0011', 'accent': None},\n",
+ " 'id_337': {'model': 'm3', 'sent_id': 3, 'speaker': '0011', 'accent': None},\n",
+ " 'id_340': {'model': 'm3', 'sent_id': 30, 'speaker': '0011', 'accent': None},\n",
+ " 'id_343': {'model': 'm3', 'sent_id': 4, 'speaker': '0011', 'accent': None},\n",
+ " 'id_346': {'model': 'm1', 'sent_id': 5, 'speaker': '0011', 'accent': None},\n",
+ " 'id_349': {'model': 'm3', 'sent_id': 6, 'speaker': '0011', 'accent': None},\n",
+ " 'id_352': {'model': 'm2', 'sent_id': 7, 'speaker': '0011', 'accent': None},\n",
+ " 'id_355': {'model': 'm1', 'sent_id': 8, 'speaker': '0011', 'accent': None},\n",
+ " 'id_358': {'model': 'm2', 'sent_id': 9, 'speaker': '0011', 'accent': None},\n",
+ " 'id_361': {'model': 'm2', 'sent_id': 1, 'speaker': '0011', 'accent': None},\n",
+ " 'id_364': {'model': 'm3', 'sent_id': 10, 'speaker': '0011', 'accent': None},\n",
+ " 'id_367': {'model': 'm3', 'sent_id': 11, 'speaker': '0011', 'accent': None},\n",
+ " 'id_370': {'model': 'm2', 'sent_id': 12, 'speaker': '0011', 'accent': None},\n",
+ " 'id_373': {'model': 'm1', 'sent_id': 13, 'speaker': '0011', 'accent': None},\n",
+ " 'id_376': {'model': 'm3', 'sent_id': 14, 'speaker': '0011', 'accent': None},\n",
+ " 'id_379': {'model': 'm1', 'sent_id': 15, 'speaker': '0011', 'accent': None},\n",
+ " 'id_382': {'model': 'm2', 'sent_id': 16, 'speaker': '0011', 'accent': None},\n",
+ " 'id_385': {'model': 'm2', 'sent_id': 17, 'speaker': '0011', 'accent': None},\n",
+ " 'id_388': {'model': 'm3', 'sent_id': 18, 'speaker': '0011', 'accent': None},\n",
+ " 'id_391': {'model': 'm2', 'sent_id': 19, 'speaker': '0011', 'accent': None},\n",
+ " 'id_394': {'model': 'm3', 'sent_id': 2, 'speaker': '0011', 'accent': None},\n",
+ " 'id_397': {'model': 'm3', 'sent_id': 20, 'speaker': '0011', 'accent': None},\n",
+ " 'id_400': {'model': 'm2', 'sent_id': 21, 'speaker': '0011', 'accent': None},\n",
+ " 'id_403': {'model': 'm2', 'sent_id': 22, 'speaker': '0011', 'accent': None},\n",
+ " 'id_406': {'model': 'm2', 'sent_id': 23, 'speaker': '0011', 'accent': None},\n",
+ " 'id_409': {'model': 'm3', 'sent_id': 24, 'speaker': '0011', 'accent': None},\n",
+ " 'id_412': {'model': 'm1', 'sent_id': 25, 'speaker': '0011', 'accent': None},\n",
+ " 'id_415': {'model': 'm2', 'sent_id': 26, 'speaker': '0011', 'accent': None},\n",
+ " 'id_418': {'model': 'm1', 'sent_id': 27, 'speaker': '0011', 'accent': None},\n",
+ " 'id_421': {'model': 'm2', 'sent_id': 28, 'speaker': '0011', 'accent': None},\n",
+ " 'id_424': {'model': 'm2', 'sent_id': 29, 'speaker': '0011', 'accent': None},\n",
+ " 'id_427': {'model': 'm2', 'sent_id': 3, 'speaker': '0011', 'accent': None},\n",
+ " 'id_430': {'model': 'm3', 'sent_id': 30, 'speaker': '0011', 'accent': None},\n",
+ " 'id_433': {'model': 'm2', 'sent_id': 4, 'speaker': '0011', 'accent': None},\n",
+ " 'id_436': {'model': 'm3', 'sent_id': 5, 'speaker': '0011', 'accent': None},\n",
+ " 'id_439': {'model': 'm1', 'sent_id': 6, 'speaker': '0011', 'accent': None},\n",
+ " 'id_442': {'model': 'm3', 'sent_id': 7, 'speaker': '0011', 'accent': None},\n",
+ " 'id_445': {'model': 'm1', 'sent_id': 8, 'speaker': '0011', 'accent': None},\n",
+ " 'id_448': {'model': 'm3', 'sent_id': 9, 'speaker': '0011', 'accent': None},\n",
+ " 'id_451': {'model': 'm3', 'sent_id': 1, 'speaker': '0012', 'accent': None},\n",
+ " 'id_454': {'model': 'm3', 'sent_id': 10, 'speaker': '0012', 'accent': None},\n",
+ " 'id_457': {'model': 'm3', 'sent_id': 11, 'speaker': '0012', 'accent': None},\n",
+ " 'id_460': {'model': 'm2', 'sent_id': 12, 'speaker': '0012', 'accent': None},\n",
+ " 'id_463': {'model': 'm3', 'sent_id': 13, 'speaker': '0012', 'accent': None},\n",
+ " 'id_466': {'model': 'm2', 'sent_id': 14, 'speaker': '0012', 'accent': None},\n",
+ " 'id_469': {'model': 'm3', 'sent_id': 15, 'speaker': '0012', 'accent': None},\n",
+ " 'id_472': {'model': 'm2', 'sent_id': 16, 'speaker': '0012', 'accent': None},\n",
+ " 'id_475': {'model': 'm2', 'sent_id': 17, 'speaker': '0012', 'accent': None},\n",
+ " 'id_478': {'model': 'm2', 'sent_id': 18, 'speaker': '0012', 'accent': None},\n",
+ " 'id_481': {'model': 'm1', 'sent_id': 19, 'speaker': '0012', 'accent': None},\n",
+ " 'id_484': {'model': 'm2', 'sent_id': 2, 'speaker': '0012', 'accent': None},\n",
+ " 'id_487': {'model': 'm1', 'sent_id': 20, 'speaker': '0012', 'accent': None},\n",
+ " 'id_490': {'model': 'm2', 'sent_id': 21, 'speaker': '0012', 'accent': None},\n",
+ " 'id_493': {'model': 'm2', 'sent_id': 22, 'speaker': '0012', 'accent': None},\n",
+ " 'id_496': {'model': 'm3', 'sent_id': 23, 'speaker': '0012', 'accent': None},\n",
+ " 'id_499': {'model': 'm1', 'sent_id': 24, 'speaker': '0012', 'accent': None},\n",
+ " 'id_502': {'model': 'm2', 'sent_id': 25, 'speaker': '0012', 'accent': None},\n",
+ " 'id_505': {'model': 'm3', 'sent_id': 26, 'speaker': '0012', 'accent': None},\n",
+ " 'id_508': {'model': 'm2', 'sent_id': 27, 'speaker': '0012', 'accent': None},\n",
+ " 'id_511': {'model': 'm2', 'sent_id': 28, 'speaker': '0012', 'accent': None},\n",
+ " 'id_514': {'model': 'm2', 'sent_id': 29, 'speaker': '0012', 'accent': None},\n",
+ " 'id_517': {'model': 'm3', 'sent_id': 3, 'speaker': '0012', 'accent': None},\n",
+ " 'id_520': {'model': 'm3', 'sent_id': 30, 'speaker': '0012', 'accent': None},\n",
+ " 'id_523': {'model': 'm3', 'sent_id': 4, 'speaker': '0012', 'accent': None},\n",
+ " 'id_526': {'model': 'm1', 'sent_id': 5, 'speaker': '0012', 'accent': None},\n",
+ " 'id_529': {'model': 'm2', 'sent_id': 6, 'speaker': '0012', 'accent': None},\n",
+ " 'id_532': {'model': 'm3', 'sent_id': 7, 'speaker': '0012', 'accent': None},\n",
+ " 'id_535': {'model': 'm3', 'sent_id': 8, 'speaker': '0012', 'accent': None},\n",
+ " 'id_538': {'model': 'm3', 'sent_id': 9, 'speaker': '0012', 'accent': None},\n",
+ " 'id_541': {'model': 'm3', 'sent_id': 1, 'speaker': '0012', 'accent': None},\n",
+ " 'id_544': {'model': 'm3', 'sent_id': 10, 'speaker': '0012', 'accent': None},\n",
+ " 'id_547': {'model': 'm2', 'sent_id': 11, 'speaker': '0012', 'accent': None},\n",
+ " 'id_550': {'model': 'm3', 'sent_id': 12, 'speaker': '0012', 'accent': None},\n",
+ " 'id_553': {'model': 'm2', 'sent_id': 13, 'speaker': '0012', 'accent': None},\n",
+ " 'id_556': {'model': 'm1', 'sent_id': 14, 'speaker': '0012', 'accent': None},\n",
+ " 'id_559': {'model': 'm3', 'sent_id': 15, 'speaker': '0012', 'accent': None},\n",
+ " 'id_562': {'model': 'm3', 'sent_id': 16, 'speaker': '0012', 'accent': None},\n",
+ " 'id_565': {'model': 'm1', 'sent_id': 17, 'speaker': '0012', 'accent': None},\n",
+ " 'id_568': {'model': 'm2', 'sent_id': 18, 'speaker': '0012', 'accent': None},\n",
+ " 'id_571': {'model': 'm3', 'sent_id': 19, 'speaker': '0012', 'accent': None},\n",
+ " 'id_574': {'model': 'm1', 'sent_id': 2, 'speaker': '0012', 'accent': None},\n",
+ " 'id_577': {'model': 'm1', 'sent_id': 20, 'speaker': '0012', 'accent': None},\n",
+ " 'id_580': {'model': 'm2', 'sent_id': 21, 'speaker': '0012', 'accent': None},\n",
+ " 'id_583': {'model': 'm3', 'sent_id': 22, 'speaker': '0012', 'accent': None},\n",
+ " 'id_586': {'model': 'm2', 'sent_id': 23, 'speaker': '0012', 'accent': None},\n",
+ " 'id_589': {'model': 'm3', 'sent_id': 24, 'speaker': '0012', 'accent': None},\n",
+ " 'id_592': {'model': 'm2', 'sent_id': 25, 'speaker': '0012', 'accent': None},\n",
+ " 'id_595': {'model': 'm3', 'sent_id': 26, 'speaker': '0012', 'accent': None},\n",
+ " 'id_598': {'model': 'm3', 'sent_id': 27, 'speaker': '0012', 'accent': None},\n",
+ " 'id_601': {'model': 'm2', 'sent_id': 28, 'speaker': '0012', 'accent': None},\n",
+ " 'id_604': {'model': 'm2', 'sent_id': 29, 'speaker': '0012', 'accent': None},\n",
+ " 'id_607': {'model': 'm2', 'sent_id': 3, 'speaker': '0012', 'accent': None},\n",
+ " 'id_610': {'model': 'm2', 'sent_id': 30, 'speaker': '0012', 'accent': None},\n",
+ " 'id_613': {'model': 'm2', 'sent_id': 4, 'speaker': '0012', 'accent': None},\n",
+ " 'id_616': {'model': 'm3', 'sent_id': 5, 'speaker': '0012', 'accent': None},\n",
+ " 'id_619': {'model': 'm2', 'sent_id': 6, 'speaker': '0012', 'accent': None},\n",
+ " 'id_622': {'model': 'm2', 'sent_id': 7, 'speaker': '0012', 'accent': None},\n",
+ " 'id_625': {'model': 'm2', 'sent_id': 8, 'speaker': '0012', 'accent': None},\n",
+ " 'id_628': {'model': 'm2', 'sent_id': 9, 'speaker': '0012', 'accent': None},\n",
+ " 'id_631': {'model': 'm1', 'sent_id': 1, 'speaker': '0012', 'accent': None},\n",
+ " 'id_634': {'model': 'm1', 'sent_id': 10, 'speaker': '0012', 'accent': None},\n",
+ " 'id_637': {'model': 'm2', 'sent_id': 11, 'speaker': '0012', 'accent': None},\n",
+ " 'id_640': {'model': 'm3', 'sent_id': 12, 'speaker': '0012', 'accent': None},\n",
+ " 'id_643': {'model': 'm2', 'sent_id': 13, 'speaker': '0012', 'accent': None},\n",
+ " 'id_646': {'model': 'm2', 'sent_id': 14, 'speaker': '0012', 'accent': None},\n",
+ " 'id_649': {'model': 'm2', 'sent_id': 15, 'speaker': '0012', 'accent': None},\n",
+ " 'id_652': {'model': 'm1', 'sent_id': 16, 'speaker': '0012', 'accent': None},\n",
+ " 'id_655': {'model': 'm1', 'sent_id': 17, 'speaker': '0012', 'accent': None},\n",
+ " 'id_658': {'model': 'm2', 'sent_id': 18, 'speaker': '0012', 'accent': None},\n",
+ " 'id_661': {'model': 'm2', 'sent_id': 19, 'speaker': '0012', 'accent': None},\n",
+ " 'id_664': {'model': 'm3', 'sent_id': 2, 'speaker': '0012', 'accent': None},\n",
+ " 'id_667': {'model': 'm3', 'sent_id': 20, 'speaker': '0012', 'accent': None},\n",
+ " 'id_670': {'model': 'm3', 'sent_id': 21, 'speaker': '0012', 'accent': None},\n",
+ " 'id_673': {'model': 'm3', 'sent_id': 22, 'speaker': '0012', 'accent': None},\n",
+ " 'id_676': {'model': 'm2', 'sent_id': 23, 'speaker': '0012', 'accent': None},\n",
+ " 'id_679': {'model': 'm1', 'sent_id': 24, 'speaker': '0012', 'accent': None},\n",
+ " 'id_682': {'model': 'm2', 'sent_id': 25, 'speaker': '0012', 'accent': None},\n",
+ " 'id_685': {'model': 'm3', 'sent_id': 26, 'speaker': '0012', 'accent': None},\n",
+ " 'id_688': {'model': 'm1', 'sent_id': 27, 'speaker': '0012', 'accent': None},\n",
+ " 'id_691': {'model': 'm3', 'sent_id': 28, 'speaker': '0012', 'accent': None},\n",
+ " 'id_694': {'model': 'm2', 'sent_id': 29, 'speaker': '0012', 'accent': None},\n",
+ " 'id_697': {'model': 'm3', 'sent_id': 3, 'speaker': '0012', 'accent': None},\n",
+ " 'id_700': {'model': 'm3', 'sent_id': 30, 'speaker': '0012', 'accent': None},\n",
+ " 'id_703': {'model': 'm1', 'sent_id': 4, 'speaker': '0012', 'accent': None},\n",
+ " 'id_706': {'model': 'm1', 'sent_id': 5, 'speaker': '0012', 'accent': None},\n",
+ " 'id_709': {'model': 'm2', 'sent_id': 6, 'speaker': '0012', 'accent': None},\n",
+ " 'id_712': {'model': 'm2', 'sent_id': 7, 'speaker': '0012', 'accent': None},\n",
+ " 'id_715': {'model': 'm3', 'sent_id': 8, 'speaker': '0012', 'accent': None},\n",
+ " 'id_718': {'model': 'm3', 'sent_id': 9, 'speaker': '0012', 'accent': None},\n",
+ " 'id_721': {'model': 'm3', 'sent_id': 1, 'speaker': '0012', 'accent': None},\n",
+ " 'id_724': {'model': 'm1', 'sent_id': 10, 'speaker': '0012', 'accent': None},\n",
+ " 'id_727': {'model': 'm2', 'sent_id': 11, 'speaker': '0012', 'accent': None},\n",
+ " 'id_730': {'model': 'm2', 'sent_id': 12, 'speaker': '0012', 'accent': None},\n",
+ " 'id_733': {'model': 'm1', 'sent_id': 13, 'speaker': '0012', 'accent': None},\n",
+ " 'id_736': {'model': 'm1', 'sent_id': 14, 'speaker': '0012', 'accent': None},\n",
+ " 'id_739': {'model': 'm1', 'sent_id': 15, 'speaker': '0012', 'accent': None},\n",
+ " 'id_742': {'model': 'm3', 'sent_id': 16, 'speaker': '0012', 'accent': None},\n",
+ " 'id_745': {'model': 'm2', 'sent_id': 17, 'speaker': '0012', 'accent': None},\n",
+ " 'id_748': {'model': 'm3', 'sent_id': 18, 'speaker': '0012', 'accent': None},\n",
+ " 'id_751': {'model': 'm1', 'sent_id': 19, 'speaker': '0012', 'accent': None},\n",
+ " 'id_754': {'model': 'm1', 'sent_id': 2, 'speaker': '0012', 'accent': None},\n",
+ " 'id_757': {'model': 'm1', 'sent_id': 20, 'speaker': '0012', 'accent': None},\n",
+ " 'id_760': {'model': 'm1', 'sent_id': 21, 'speaker': '0012', 'accent': None},\n",
+ " 'id_763': {'model': 'm2', 'sent_id': 22, 'speaker': '0012', 'accent': None},\n",
+ " 'id_766': {'model': 'm1', 'sent_id': 23, 'speaker': '0012', 'accent': None},\n",
+ " 'id_769': {'model': 'm2', 'sent_id': 24, 'speaker': '0012', 'accent': None},\n",
+ " 'id_772': {'model': 'm1', 'sent_id': 25, 'speaker': '0012', 'accent': None},\n",
+ " 'id_775': {'model': 'm2', 'sent_id': 26, 'speaker': '0012', 'accent': None},\n",
+ " 'id_778': {'model': 'm1', 'sent_id': 27, 'speaker': '0012', 'accent': None},\n",
+ " 'id_781': {'model': 'm3', 'sent_id': 28, 'speaker': '0012', 'accent': None},\n",
+ " 'id_784': {'model': 'm3', 'sent_id': 29, 'speaker': '0012', 'accent': None},\n",
+ " 'id_787': {'model': 'm2', 'sent_id': 3, 'speaker': '0012', 'accent': None},\n",
+ " 'id_790': {'model': 'm2', 'sent_id': 30, 'speaker': '0012', 'accent': None},\n",
+ " 'id_793': {'model': 'm1', 'sent_id': 4, 'speaker': '0012', 'accent': None},\n",
+ " 'id_796': {'model': 'm3', 'sent_id': 5, 'speaker': '0012', 'accent': None},\n",
+ " 'id_799': {'model': 'm3', 'sent_id': 6, 'speaker': '0012', 'accent': None},\n",
+ " 'id_802': {'model': 'm2', 'sent_id': 7, 'speaker': '0012', 'accent': None},\n",
+ " 'id_805': {'model': 'm2', 'sent_id': 8, 'speaker': '0012', 'accent': None},\n",
+ " 'id_808': {'model': 'm1', 'sent_id': 9, 'speaker': '0012', 'accent': None},\n",
+ " 'id_811': {'model': 'm1', 'sent_id': 1, 'speaker': '0012', 'accent': None},\n",
+ " 'id_814': {'model': 'm3', 'sent_id': 10, 'speaker': '0012', 'accent': None},\n",
+ " 'id_817': {'model': 'm2', 'sent_id': 11, 'speaker': '0012', 'accent': None},\n",
+ " 'id_820': {'model': 'm1', 'sent_id': 12, 'speaker': '0012', 'accent': None},\n",
+ " 'id_823': {'model': 'm1', 'sent_id': 13, 'speaker': '0012', 'accent': None},\n",
+ " 'id_826': {'model': 'm2', 'sent_id': 14, 'speaker': '0012', 'accent': None},\n",
+ " 'id_829': {'model': 'm1', 'sent_id': 15, 'speaker': '0012', 'accent': None},\n",
+ " 'id_832': {'model': 'm2', 'sent_id': 16, 'speaker': '0012', 'accent': None},\n",
+ " 'id_835': {'model': 'm3', 'sent_id': 17, 'speaker': '0012', 'accent': None},\n",
+ " 'id_838': {'model': 'm3', 'sent_id': 18, 'speaker': '0012', 'accent': None},\n",
+ " 'id_841': {'model': 'm1', 'sent_id': 19, 'speaker': '0012', 'accent': None},\n",
+ " 'id_844': {'model': 'm2', 'sent_id': 2, 'speaker': '0012', 'accent': None},\n",
+ " 'id_847': {'model': 'm1', 'sent_id': 20, 'speaker': '0012', 'accent': None},\n",
+ " 'id_850': {'model': 'm3', 'sent_id': 21, 'speaker': '0012', 'accent': None},\n",
+ " 'id_853': {'model': 'm2', 'sent_id': 22, 'speaker': '0012', 'accent': None},\n",
+ " 'id_856': {'model': 'm1', 'sent_id': 23, 'speaker': '0012', 'accent': None},\n",
+ " 'id_859': {'model': 'm1', 'sent_id': 24, 'speaker': '0012', 'accent': None},\n",
+ " 'id_862': {'model': 'm3', 'sent_id': 25, 'speaker': '0012', 'accent': None},\n",
+ " 'id_865': {'model': 'm1', 'sent_id': 26, 'speaker': '0012', 'accent': None},\n",
+ " 'id_868': {'model': 'm3', 'sent_id': 27, 'speaker': '0012', 'accent': None},\n",
+ " 'id_871': {'model': 'm3', 'sent_id': 28, 'speaker': '0012', 'accent': None},\n",
+ " 'id_874': {'model': 'm2', 'sent_id': 29, 'speaker': '0012', 'accent': None},\n",
+ " 'id_877': {'model': 'm1', 'sent_id': 3, 'speaker': '0012', 'accent': None},\n",
+ " 'id_880': {'model': 'm1', 'sent_id': 30, 'speaker': '0012', 'accent': None},\n",
+ " 'id_883': {'model': 'm1', 'sent_id': 4, 'speaker': '0012', 'accent': None},\n",
+ " 'id_886': {'model': 'm3', 'sent_id': 5, 'speaker': '0012', 'accent': None},\n",
+ " 'id_889': {'model': 'm1', 'sent_id': 6, 'speaker': '0012', 'accent': None},\n",
+ " 'id_892': {'model': 'm2', 'sent_id': 7, 'speaker': '0012', 'accent': None},\n",
+ " 'id_895': {'model': 'm2', 'sent_id': 8, 'speaker': '0012', 'accent': None},\n",
+ " 'id_898': {'model': 'm3', 'sent_id': 9, 'speaker': '0012', 'accent': None},\n",
+ " 'id_901': {'model': 'm2', 'sent_id': 1, 'speaker': '0013', 'accent': None},\n",
+ " 'id_904': {'model': 'm2', 'sent_id': 10, 'speaker': '0013', 'accent': None},\n",
+ " 'id_907': {'model': 'm2', 'sent_id': 11, 'speaker': '0013', 'accent': None},\n",
+ " 'id_910': {'model': 'm1', 'sent_id': 12, 'speaker': '0013', 'accent': None},\n",
+ " 'id_913': {'model': 'm3', 'sent_id': 13, 'speaker': '0013', 'accent': None},\n",
+ " 'id_916': {'model': 'm3', 'sent_id': 14, 'speaker': '0013', 'accent': None},\n",
+ " 'id_919': {'model': 'm2', 'sent_id': 15, 'speaker': '0013', 'accent': None},\n",
+ " 'id_922': {'model': 'm2', 'sent_id': 16, 'speaker': '0013', 'accent': None},\n",
+ " 'id_925': {'model': 'm1', 'sent_id': 17, 'speaker': '0013', 'accent': None},\n",
+ " 'id_928': {'model': 'm3', 'sent_id': 18, 'speaker': '0013', 'accent': None},\n",
+ " 'id_931': {'model': 'm2', 'sent_id': 19, 'speaker': '0013', 'accent': None},\n",
+ " 'id_934': {'model': 'm3', 'sent_id': 2, 'speaker': '0013', 'accent': None},\n",
+ " 'id_937': {'model': 'm3', 'sent_id': 20, 'speaker': '0013', 'accent': None},\n",
+ " 'id_940': {'model': 'm3', 'sent_id': 21, 'speaker': '0013', 'accent': None},\n",
+ " 'id_943': {'model': 'm3', 'sent_id': 22, 'speaker': '0013', 'accent': None},\n",
+ " 'id_946': {'model': 'm3', 'sent_id': 23, 'speaker': '0013', 'accent': None},\n",
+ " 'id_949': {'model': 'm1', 'sent_id': 24, 'speaker': '0013', 'accent': None},\n",
+ " 'id_952': {'model': 'm2', 'sent_id': 25, 'speaker': '0013', 'accent': None},\n",
+ " 'id_955': {'model': 'm3', 'sent_id': 26, 'speaker': '0013', 'accent': None},\n",
+ " 'id_958': {'model': 'm1', 'sent_id': 27, 'speaker': '0013', 'accent': None},\n",
+ " 'id_961': {'model': 'm1', 'sent_id': 28, 'speaker': '0013', 'accent': None},\n",
+ " 'id_964': {'model': 'm1', 'sent_id': 29, 'speaker': '0013', 'accent': None},\n",
+ " 'id_967': {'model': 'm1', 'sent_id': 3, 'speaker': '0013', 'accent': None},\n",
+ " 'id_970': {'model': 'm3', 'sent_id': 30, 'speaker': '0013', 'accent': None},\n",
+ " 'id_973': {'model': 'm3', 'sent_id': 4, 'speaker': '0013', 'accent': None},\n",
+ " 'id_976': {'model': 'm1', 'sent_id': 5, 'speaker': '0013', 'accent': None},\n",
+ " 'id_979': {'model': 'm3', 'sent_id': 6, 'speaker': '0013', 'accent': None},\n",
+ " 'id_982': {'model': 'm1', 'sent_id': 7, 'speaker': '0013', 'accent': None},\n",
+ " 'id_985': {'model': 'm2', 'sent_id': 8, 'speaker': '0013', 'accent': None},\n",
+ " 'id_988': {'model': 'm2', 'sent_id': 9, 'speaker': '0013', 'accent': None},\n",
+ " 'id_991': {'model': 'm3', 'sent_id': 1, 'speaker': '0013', 'accent': None},\n",
+ " 'id_994': {'model': 'm1', 'sent_id': 10, 'speaker': '0013', 'accent': None},\n",
+ " 'id_997': {'model': 'm3', 'sent_id': 11, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1000': {'model': 'm3', 'sent_id': 12, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1003': {'model': 'm2', 'sent_id': 13, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1006': {'model': 'm2', 'sent_id': 14, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1009': {'model': 'm3', 'sent_id': 15, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1012': {'model': 'm2', 'sent_id': 16, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1015': {'model': 'm3', 'sent_id': 17, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1018': {'model': 'm3', 'sent_id': 18, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1021': {'model': 'm3', 'sent_id': 19, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1024': {'model': 'm1', 'sent_id': 2, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1027': {'model': 'm2', 'sent_id': 20, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1030': {'model': 'm2', 'sent_id': 21, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1033': {'model': 'm1', 'sent_id': 22, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1036': {'model': 'm3', 'sent_id': 23, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1039': {'model': 'm2', 'sent_id': 24, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1042': {'model': 'm1', 'sent_id': 25, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1045': {'model': 'm3', 'sent_id': 26, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1048': {'model': 'm3', 'sent_id': 27, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1051': {'model': 'm2', 'sent_id': 28, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1054': {'model': 'm1', 'sent_id': 29, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1057': {'model': 'm3', 'sent_id': 3, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1060': {'model': 'm3', 'sent_id': 30, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1063': {'model': 'm2', 'sent_id': 4, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1066': {'model': 'm3', 'sent_id': 5, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1069': {'model': 'm1', 'sent_id': 6, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1072': {'model': 'm3', 'sent_id': 7, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1075': {'model': 'm2', 'sent_id': 8, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1078': {'model': 'm2', 'sent_id': 9, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1081': {'model': 'm3', 'sent_id': 1, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1084': {'model': 'm3', 'sent_id': 10, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1087': {'model': 'm1', 'sent_id': 11, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1090': {'model': 'm2', 'sent_id': 12, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1093': {'model': 'm3', 'sent_id': 13, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1096': {'model': 'm2', 'sent_id': 14, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1099': {'model': 'm3', 'sent_id': 15, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1102': {'model': 'm1', 'sent_id': 16, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1105': {'model': 'm3', 'sent_id': 17, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1108': {'model': 'm3', 'sent_id': 18, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1111': {'model': 'm2', 'sent_id': 19, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1114': {'model': 'm3', 'sent_id': 2, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1117': {'model': 'm2', 'sent_id': 20, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1120': {'model': 'm1', 'sent_id': 21, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1123': {'model': 'm2', 'sent_id': 22, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1126': {'model': 'm1', 'sent_id': 23, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1129': {'model': 'm1', 'sent_id': 24, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1132': {'model': 'm2', 'sent_id': 25, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1135': {'model': 'm1', 'sent_id': 26, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1138': {'model': 'm3', 'sent_id': 27, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1141': {'model': 'm3', 'sent_id': 28, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1144': {'model': 'm3', 'sent_id': 29, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1147': {'model': 'm3', 'sent_id': 3, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1150': {'model': 'm1', 'sent_id': 30, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1153': {'model': 'm2', 'sent_id': 4, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1156': {'model': 'm3', 'sent_id': 5, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1159': {'model': 'm1', 'sent_id': 6, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1162': {'model': 'm1', 'sent_id': 7, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1165': {'model': 'm2', 'sent_id': 8, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1168': {'model': 'm3', 'sent_id': 9, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1171': {'model': 'm2', 'sent_id': 1, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1174': {'model': 'm3', 'sent_id': 10, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1177': {'model': 'm2', 'sent_id': 11, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1180': {'model': 'm3', 'sent_id': 12, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1183': {'model': 'm3', 'sent_id': 13, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1186': {'model': 'm2', 'sent_id': 14, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1189': {'model': 'm1', 'sent_id': 15, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1192': {'model': 'm2', 'sent_id': 16, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1195': {'model': 'm2', 'sent_id': 17, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1198': {'model': 'm2', 'sent_id': 18, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1201': {'model': 'm3', 'sent_id': 19, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1204': {'model': 'm1', 'sent_id': 2, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1207': {'model': 'm2', 'sent_id': 20, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1210': {'model': 'm1', 'sent_id': 21, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1213': {'model': 'm1', 'sent_id': 22, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1216': {'model': 'm2', 'sent_id': 23, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1219': {'model': 'm1', 'sent_id': 24, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1222': {'model': 'm3', 'sent_id': 25, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1225': {'model': 'm3', 'sent_id': 26, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1228': {'model': 'm3', 'sent_id': 27, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1231': {'model': 'm1', 'sent_id': 28, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1234': {'model': 'm1', 'sent_id': 29, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1237': {'model': 'm2', 'sent_id': 3, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1240': {'model': 'm2', 'sent_id': 30, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1243': {'model': 'm2', 'sent_id': 4, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1246': {'model': 'm2', 'sent_id': 5, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1249': {'model': 'm2', 'sent_id': 6, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1252': {'model': 'm3', 'sent_id': 7, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1255': {'model': 'm1', 'sent_id': 8, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1258': {'model': 'm3', 'sent_id': 9, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1261': {'model': 'm2', 'sent_id': 1, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1264': {'model': 'm3', 'sent_id': 10, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1267': {'model': 'm3', 'sent_id': 11, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1270': {'model': 'm3', 'sent_id': 12, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1273': {'model': 'm3', 'sent_id': 13, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1276': {'model': 'm2', 'sent_id': 14, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1279': {'model': 'm1', 'sent_id': 15, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1282': {'model': 'm3', 'sent_id': 16, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1285': {'model': 'm1', 'sent_id': 17, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1288': {'model': 'm1', 'sent_id': 18, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1291': {'model': 'm1', 'sent_id': 19, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1294': {'model': 'm3', 'sent_id': 2, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1297': {'model': 'm1', 'sent_id': 20, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1300': {'model': 'm2', 'sent_id': 21, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1303': {'model': 'm3', 'sent_id': 22, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1306': {'model': 'm1', 'sent_id': 23, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1309': {'model': 'm3', 'sent_id': 24, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1312': {'model': 'm2', 'sent_id': 25, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1315': {'model': 'm2', 'sent_id': 26, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1318': {'model': 'm1', 'sent_id': 27, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1321': {'model': 'm1', 'sent_id': 28, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1324': {'model': 'm1', 'sent_id': 29, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1327': {'model': 'm2', 'sent_id': 3, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1330': {'model': 'm3', 'sent_id': 30, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1333': {'model': 'm1', 'sent_id': 4, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1336': {'model': 'm1', 'sent_id': 5, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1339': {'model': 'm2', 'sent_id': 6, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1342': {'model': 'm1', 'sent_id': 7, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1345': {'model': 'm2', 'sent_id': 8, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1348': {'model': 'm3', 'sent_id': 9, 'speaker': '0013', 'accent': None},\n",
+ " 'id_1351': {'model': 'm2', 'sent_id': 1, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1354': {'model': 'm1', 'sent_id': 10, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1357': {'model': 'm1', 'sent_id': 11, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1360': {'model': 'm2', 'sent_id': 12, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1363': {'model': 'm1', 'sent_id': 13, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1366': {'model': 'm1', 'sent_id': 14, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1369': {'model': 'm2', 'sent_id': 15, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1372': {'model': 'm3', 'sent_id': 16, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1375': {'model': 'm3', 'sent_id': 17, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1378': {'model': 'm3', 'sent_id': 18, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1381': {'model': 'm3', 'sent_id': 19, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1384': {'model': 'm2', 'sent_id': 2, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1387': {'model': 'm2', 'sent_id': 20, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1390': {'model': 'm1', 'sent_id': 21, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1393': {'model': 'm3', 'sent_id': 22, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1396': {'model': 'm1', 'sent_id': 23, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1399': {'model': 'm1', 'sent_id': 24, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1402': {'model': 'm1', 'sent_id': 25, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1405': {'model': 'm2', 'sent_id': 26, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1408': {'model': 'm2', 'sent_id': 27, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1411': {'model': 'm1', 'sent_id': 28, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1414': {'model': 'm1', 'sent_id': 29, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1417': {'model': 'm2', 'sent_id': 3, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1420': {'model': 'm3', 'sent_id': 30, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1423': {'model': 'm2', 'sent_id': 4, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1426': {'model': 'm3', 'sent_id': 5, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1429': {'model': 'm3', 'sent_id': 6, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1432': {'model': 'm1', 'sent_id': 7, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1435': {'model': 'm1', 'sent_id': 8, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1438': {'model': 'm1', 'sent_id': 9, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1441': {'model': 'm1', 'sent_id': 1, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1444': {'model': 'm2', 'sent_id': 10, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1447': {'model': 'm2', 'sent_id': 11, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1450': {'model': 'm2', 'sent_id': 12, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1453': {'model': 'm1', 'sent_id': 13, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1456': {'model': 'm1', 'sent_id': 14, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1459': {'model': 'm1', 'sent_id': 15, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1462': {'model': 'm2', 'sent_id': 16, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1465': {'model': 'm2', 'sent_id': 17, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1468': {'model': 'm2', 'sent_id': 18, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1471': {'model': 'm1', 'sent_id': 19, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1474': {'model': 'm3', 'sent_id': 2, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1477': {'model': 'm1', 'sent_id': 20, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1480': {'model': 'm1', 'sent_id': 21, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1483': {'model': 'm2', 'sent_id': 22, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1486': {'model': 'm3', 'sent_id': 23, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1489': {'model': 'm1', 'sent_id': 24, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1492': {'model': 'm2', 'sent_id': 25, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1495': {'model': 'm2', 'sent_id': 26, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1498': {'model': 'm2', 'sent_id': 27, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1501': {'model': 'm1', 'sent_id': 28, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1504': {'model': 'm1', 'sent_id': 29, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1507': {'model': 'm3', 'sent_id': 3, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1510': {'model': 'm1', 'sent_id': 30, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1513': {'model': 'm2', 'sent_id': 4, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1516': {'model': 'm2', 'sent_id': 5, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1519': {'model': 'm2', 'sent_id': 6, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1522': {'model': 'm3', 'sent_id': 7, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1525': {'model': 'm1', 'sent_id': 8, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1528': {'model': 'm2', 'sent_id': 9, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1531': {'model': 'm1', 'sent_id': 1, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1534': {'model': 'm1', 'sent_id': 10, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1537': {'model': 'm1', 'sent_id': 11, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1540': {'model': 'm3', 'sent_id': 12, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1543': {'model': 'm3', 'sent_id': 13, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1546': {'model': 'm1', 'sent_id': 14, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1549': {'model': 'm1', 'sent_id': 15, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1552': {'model': 'm3', 'sent_id': 16, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1555': {'model': 'm2', 'sent_id': 17, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1558': {'model': 'm2', 'sent_id': 18, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1561': {'model': 'm1', 'sent_id': 19, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1564': {'model': 'm3', 'sent_id': 2, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1567': {'model': 'm3', 'sent_id': 20, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1570': {'model': 'm3', 'sent_id': 21, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1573': {'model': 'm2', 'sent_id': 22, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1576': {'model': 'm1', 'sent_id': 23, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1579': {'model': 'm3', 'sent_id': 24, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1582': {'model': 'm3', 'sent_id': 25, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1585': {'model': 'm1', 'sent_id': 26, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1588': {'model': 'm2', 'sent_id': 27, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1591': {'model': 'm1', 'sent_id': 28, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1594': {'model': 'm1', 'sent_id': 29, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1597': {'model': 'm1', 'sent_id': 3, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1600': {'model': 'm2', 'sent_id': 30, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1603': {'model': 'm3', 'sent_id': 4, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1606': {'model': 'm3', 'sent_id': 5, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1609': {'model': 'm1', 'sent_id': 6, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1612': {'model': 'm1', 'sent_id': 7, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1615': {'model': 'm3', 'sent_id': 8, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1618': {'model': 'm2', 'sent_id': 9, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1621': {'model': 'm2', 'sent_id': 1, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1624': {'model': 'm1', 'sent_id': 10, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1627': {'model': 'm1', 'sent_id': 11, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1630': {'model': 'm2', 'sent_id': 12, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1633': {'model': 'm1', 'sent_id': 13, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1636': {'model': 'm1', 'sent_id': 14, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1639': {'model': 'm2', 'sent_id': 15, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1642': {'model': 'm2', 'sent_id': 16, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1645': {'model': 'm1', 'sent_id': 17, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1648': {'model': 'm2', 'sent_id': 18, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1651': {'model': 'm3', 'sent_id': 19, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1654': {'model': 'm1', 'sent_id': 2, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1657': {'model': 'm2', 'sent_id': 20, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1660': {'model': 'm2', 'sent_id': 21, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1663': {'model': 'm2', 'sent_id': 22, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1666': {'model': 'm1', 'sent_id': 23, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1669': {'model': 'm3', 'sent_id': 24, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1672': {'model': 'm3', 'sent_id': 25, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1675': {'model': 'm1', 'sent_id': 26, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1678': {'model': 'm1', 'sent_id': 27, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1681': {'model': 'm2', 'sent_id': 28, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1684': {'model': 'm1', 'sent_id': 29, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1687': {'model': 'm2', 'sent_id': 3, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1690': {'model': 'm2', 'sent_id': 30, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1693': {'model': 'm2', 'sent_id': 4, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1696': {'model': 'm1', 'sent_id': 5, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1699': {'model': 'm2', 'sent_id': 6, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1702': {'model': 'm1', 'sent_id': 7, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1705': {'model': 'm3', 'sent_id': 8, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1708': {'model': 'm3', 'sent_id': 9, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1711': {'model': 'm1', 'sent_id': 1, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1714': {'model': 'm3', 'sent_id': 10, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1717': {'model': 'm1', 'sent_id': 11, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1720': {'model': 'm1', 'sent_id': 12, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1723': {'model': 'm2', 'sent_id': 13, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1726': {'model': 'm3', 'sent_id': 14, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1729': {'model': 'm2', 'sent_id': 15, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1732': {'model': 'm1', 'sent_id': 16, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1735': {'model': 'm3', 'sent_id': 17, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1738': {'model': 'm2', 'sent_id': 18, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1741': {'model': 'm1', 'sent_id': 19, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1744': {'model': 'm3', 'sent_id': 2, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1747': {'model': 'm2', 'sent_id': 20, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1750': {'model': 'm2', 'sent_id': 21, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1753': {'model': 'm1', 'sent_id': 22, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1756': {'model': 'm2', 'sent_id': 23, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1759': {'model': 'm3', 'sent_id': 24, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1762': {'model': 'm1', 'sent_id': 25, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1765': {'model': 'm3', 'sent_id': 26, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1768': {'model': 'm2', 'sent_id': 27, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1771': {'model': 'm2', 'sent_id': 28, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1774': {'model': 'm3', 'sent_id': 29, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1777': {'model': 'm2', 'sent_id': 3, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1780': {'model': 'm3', 'sent_id': 30, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1783': {'model': 'm2', 'sent_id': 4, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1786': {'model': 'm2', 'sent_id': 5, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1789': {'model': 'm2', 'sent_id': 6, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1792': {'model': 'm3', 'sent_id': 7, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1795': {'model': 'm1', 'sent_id': 8, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1798': {'model': 'm2', 'sent_id': 9, 'speaker': '0014', 'accent': None},\n",
+ " 'id_1801': {'model': 'm2', 'sent_id': 1, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1804': {'model': 'm1', 'sent_id': 10, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1807': {'model': 'm2', 'sent_id': 11, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1810': {'model': 'm1', 'sent_id': 12, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1813': {'model': 'm3', 'sent_id': 13, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1816': {'model': 'm3', 'sent_id': 14, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1819': {'model': 'm3', 'sent_id': 15, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1822': {'model': 'm1', 'sent_id': 16, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1825': {'model': 'm2', 'sent_id': 17, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1828': {'model': 'm1', 'sent_id': 18, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1831': {'model': 'm3', 'sent_id': 19, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1834': {'model': 'm3', 'sent_id': 2, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1837': {'model': 'm1', 'sent_id': 20, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1840': {'model': 'm2', 'sent_id': 21, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1843': {'model': 'm1', 'sent_id': 22, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1846': {'model': 'm1', 'sent_id': 23, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1849': {'model': 'm1', 'sent_id': 24, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1852': {'model': 'm2', 'sent_id': 25, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1855': {'model': 'm3', 'sent_id': 26, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1858': {'model': 'm3', 'sent_id': 27, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1861': {'model': 'm2', 'sent_id': 28, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1864': {'model': 'm1', 'sent_id': 29, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1867': {'model': 'm1', 'sent_id': 3, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1870': {'model': 'm1', 'sent_id': 30, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1873': {'model': 'm3', 'sent_id': 4, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1876': {'model': 'm1', 'sent_id': 5, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1879': {'model': 'm3', 'sent_id': 6, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1882': {'model': 'm1', 'sent_id': 7, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1885': {'model': 'm3', 'sent_id': 8, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1888': {'model': 'm2', 'sent_id': 9, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1891': {'model': 'm1', 'sent_id': 1, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1894': {'model': 'm1', 'sent_id': 10, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1897': {'model': 'm1', 'sent_id': 11, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1900': {'model': 'm2', 'sent_id': 12, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1903': {'model': 'm3', 'sent_id': 13, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1906': {'model': 'm2', 'sent_id': 14, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1909': {'model': 'm3', 'sent_id': 15, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1912': {'model': 'm1', 'sent_id': 16, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1915': {'model': 'm3', 'sent_id': 17, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1918': {'model': 'm1', 'sent_id': 18, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1921': {'model': 'm2', 'sent_id': 19, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1924': {'model': 'm1', 'sent_id': 2, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1927': {'model': 'm3', 'sent_id': 20, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1930': {'model': 'm3', 'sent_id': 21, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1933': {'model': 'm1', 'sent_id': 22, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1936': {'model': 'm3', 'sent_id': 23, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1939': {'model': 'm2', 'sent_id': 24, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1942': {'model': 'm3', 'sent_id': 25, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1945': {'model': 'm3', 'sent_id': 26, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1948': {'model': 'm2', 'sent_id': 27, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1951': {'model': 'm3', 'sent_id': 28, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1954': {'model': 'm2', 'sent_id': 29, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1957': {'model': 'm3', 'sent_id': 3, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1960': {'model': 'm2', 'sent_id': 30, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1963': {'model': 'm2', 'sent_id': 4, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1966': {'model': 'm3', 'sent_id': 5, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1969': {'model': 'm1', 'sent_id': 6, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1972': {'model': 'm1', 'sent_id': 7, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1975': {'model': 'm3', 'sent_id': 8, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1978': {'model': 'm1', 'sent_id': 9, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1981': {'model': 'm1', 'sent_id': 1, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1984': {'model': 'm2', 'sent_id': 10, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1987': {'model': 'm1', 'sent_id': 11, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1990': {'model': 'm1', 'sent_id': 12, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1993': {'model': 'm1', 'sent_id': 13, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1996': {'model': 'm2', 'sent_id': 14, 'speaker': '0015', 'accent': None},\n",
+ " 'id_1999': {'model': 'm3', 'sent_id': 15, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2002': {'model': 'm1', 'sent_id': 16, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2005': {'model': 'm2', 'sent_id': 17, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2008': {'model': 'm2', 'sent_id': 18, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2011': {'model': 'm1', 'sent_id': 19, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2014': {'model': 'm1', 'sent_id': 2, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2017': {'model': 'm1', 'sent_id': 20, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2020': {'model': 'm1', 'sent_id': 21, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2023': {'model': 'm1', 'sent_id': 22, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2026': {'model': 'm2', 'sent_id': 23, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2029': {'model': 'm1', 'sent_id': 24, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2032': {'model': 'm2', 'sent_id': 25, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2035': {'model': 'm3', 'sent_id': 26, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2038': {'model': 'm3', 'sent_id': 27, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2041': {'model': 'm3', 'sent_id': 28, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2044': {'model': 'm1', 'sent_id': 29, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2047': {'model': 'm2', 'sent_id': 3, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2050': {'model': 'm1', 'sent_id': 30, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2053': {'model': 'm2', 'sent_id': 4, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2056': {'model': 'm2', 'sent_id': 5, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2059': {'model': 'm3', 'sent_id': 6, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2062': {'model': 'm2', 'sent_id': 7, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2065': {'model': 'm1', 'sent_id': 8, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2068': {'model': 'm2', 'sent_id': 9, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2071': {'model': 'm2', 'sent_id': 1, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2074': {'model': 'm1', 'sent_id': 10, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2077': {'model': 'm3', 'sent_id': 11, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2080': {'model': 'm3', 'sent_id': 12, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2083': {'model': 'm2', 'sent_id': 13, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2086': {'model': 'm1', 'sent_id': 14, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2089': {'model': 'm1', 'sent_id': 15, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2092': {'model': 'm2', 'sent_id': 16, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2095': {'model': 'm2', 'sent_id': 17, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2098': {'model': 'm2', 'sent_id': 18, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2101': {'model': 'm3', 'sent_id': 19, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2104': {'model': 'm1', 'sent_id': 2, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2107': {'model': 'm3', 'sent_id': 20, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2110': {'model': 'm2', 'sent_id': 21, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2113': {'model': 'm2', 'sent_id': 22, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2116': {'model': 'm1', 'sent_id': 23, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2119': {'model': 'm3', 'sent_id': 24, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2122': {'model': 'm1', 'sent_id': 25, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2125': {'model': 'm1', 'sent_id': 26, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2128': {'model': 'm2', 'sent_id': 27, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2131': {'model': 'm2', 'sent_id': 28, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2134': {'model': 'm1', 'sent_id': 29, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2137': {'model': 'm2', 'sent_id': 3, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2140': {'model': 'm3', 'sent_id': 30, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2143': {'model': 'm1', 'sent_id': 4, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2146': {'model': 'm1', 'sent_id': 5, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2149': {'model': 'm2', 'sent_id': 6, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2152': {'model': 'm2', 'sent_id': 7, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2155': {'model': 'm1', 'sent_id': 8, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2158': {'model': 'm2', 'sent_id': 9, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2161': {'model': 'm1', 'sent_id': 1, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2164': {'model': 'm2', 'sent_id': 10, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2167': {'model': 'm3', 'sent_id': 11, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2170': {'model': 'm2', 'sent_id': 12, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2173': {'model': 'm1', 'sent_id': 13, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2176': {'model': 'm3', 'sent_id': 14, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2179': {'model': 'm1', 'sent_id': 15, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2182': {'model': 'm3', 'sent_id': 16, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2185': {'model': 'm1', 'sent_id': 17, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2188': {'model': 'm1', 'sent_id': 18, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2191': {'model': 'm2', 'sent_id': 19, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2194': {'model': 'm2', 'sent_id': 2, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2197': {'model': 'm2', 'sent_id': 20, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2200': {'model': 'm1', 'sent_id': 21, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2203': {'model': 'm3', 'sent_id': 22, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2206': {'model': 'm2', 'sent_id': 23, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2209': {'model': 'm2', 'sent_id': 24, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2212': {'model': 'm3', 'sent_id': 25, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2215': {'model': 'm3', 'sent_id': 26, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2218': {'model': 'm2', 'sent_id': 27, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2221': {'model': 'm2', 'sent_id': 28, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2224': {'model': 'm3', 'sent_id': 29, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2227': {'model': 'm2', 'sent_id': 3, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2230': {'model': 'm3', 'sent_id': 30, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2233': {'model': 'm2', 'sent_id': 4, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2236': {'model': 'm2', 'sent_id': 5, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2239': {'model': 'm3', 'sent_id': 6, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2242': {'model': 'm1', 'sent_id': 7, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2245': {'model': 'm1', 'sent_id': 8, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2248': {'model': 'm2', 'sent_id': 9, 'speaker': '0015', 'accent': None},\n",
+ " 'id_2251': {'model': 'm2', 'sent_id': 1, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2254': {'model': 'm3', 'sent_id': 10, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2257': {'model': 'm1', 'sent_id': 11, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2260': {'model': 'm1', 'sent_id': 12, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2263': {'model': 'm1', 'sent_id': 13, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2266': {'model': 'm3', 'sent_id': 14, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2269': {'model': 'm1', 'sent_id': 15, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2272': {'model': 'm3', 'sent_id': 16, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2275': {'model': 'm1', 'sent_id': 17, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2278': {'model': 'm1', 'sent_id': 18, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2281': {'model': 'm2', 'sent_id': 19, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2284': {'model': 'm2', 'sent_id': 2, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2287': {'model': 'm3', 'sent_id': 20, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2290': {'model': 'm2', 'sent_id': 21, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2293': {'model': 'm2', 'sent_id': 22, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2296': {'model': 'm2', 'sent_id': 23, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2299': {'model': 'm2', 'sent_id': 24, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2302': {'model': 'm1', 'sent_id': 25, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2305': {'model': 'm1', 'sent_id': 26, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2308': {'model': 'm3', 'sent_id': 27, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2311': {'model': 'm2', 'sent_id': 28, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2314': {'model': 'm2', 'sent_id': 29, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2317': {'model': 'm2', 'sent_id': 3, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2320': {'model': 'm1', 'sent_id': 30, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2323': {'model': 'm1', 'sent_id': 4, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2326': {'model': 'm2', 'sent_id': 5, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2329': {'model': 'm1', 'sent_id': 6, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2332': {'model': 'm2', 'sent_id': 7, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2335': {'model': 'm1', 'sent_id': 8, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2338': {'model': 'm2', 'sent_id': 9, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2341': {'model': 'm3', 'sent_id': 1, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2344': {'model': 'm2', 'sent_id': 10, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2347': {'model': 'm3', 'sent_id': 11, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2350': {'model': 'm2', 'sent_id': 12, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2353': {'model': 'm1', 'sent_id': 13, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2356': {'model': 'm3', 'sent_id': 14, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2359': {'model': 'm1', 'sent_id': 15, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2362': {'model': 'm2', 'sent_id': 16, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2365': {'model': 'm1', 'sent_id': 17, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2368': {'model': 'm3', 'sent_id': 18, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2371': {'model': 'm2', 'sent_id': 19, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2374': {'model': 'm3', 'sent_id': 2, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2377': {'model': 'm3', 'sent_id': 20, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2380': {'model': 'm3', 'sent_id': 21, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2383': {'model': 'm1', 'sent_id': 22, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2386': {'model': 'm1', 'sent_id': 23, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2389': {'model': 'm2', 'sent_id': 24, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2392': {'model': 'm3', 'sent_id': 25, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2395': {'model': 'm2', 'sent_id': 26, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2398': {'model': 'm2', 'sent_id': 27, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2401': {'model': 'm3', 'sent_id': 28, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2404': {'model': 'm3', 'sent_id': 29, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2407': {'model': 'm2', 'sent_id': 3, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2410': {'model': 'm3', 'sent_id': 30, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2413': {'model': 'm2', 'sent_id': 4, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2416': {'model': 'm2', 'sent_id': 5, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2419': {'model': 'm3', 'sent_id': 6, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2422': {'model': 'm2', 'sent_id': 7, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2425': {'model': 'm3', 'sent_id': 8, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2428': {'model': 'm2', 'sent_id': 9, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2431': {'model': 'm3', 'sent_id': 1, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2434': {'model': 'm3', 'sent_id': 10, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2437': {'model': 'm3', 'sent_id': 11, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2440': {'model': 'm1', 'sent_id': 12, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2443': {'model': 'm1', 'sent_id': 13, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2446': {'model': 'm3', 'sent_id': 14, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2449': {'model': 'm3', 'sent_id': 15, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2452': {'model': 'm3', 'sent_id': 16, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2455': {'model': 'm2', 'sent_id': 17, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2458': {'model': 'm3', 'sent_id': 18, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2461': {'model': 'm1', 'sent_id': 19, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2464': {'model': 'm1', 'sent_id': 2, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2467': {'model': 'm3', 'sent_id': 20, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2470': {'model': 'm1', 'sent_id': 21, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2473': {'model': 'm1', 'sent_id': 22, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2476': {'model': 'm2', 'sent_id': 23, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2479': {'model': 'm2', 'sent_id': 24, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2482': {'model': 'm3', 'sent_id': 25, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2485': {'model': 'm2', 'sent_id': 26, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2488': {'model': 'm3', 'sent_id': 27, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2491': {'model': 'm1', 'sent_id': 28, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2494': {'model': 'm1', 'sent_id': 29, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2497': {'model': 'm2', 'sent_id': 3, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2500': {'model': 'm3', 'sent_id': 30, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2503': {'model': 'm1', 'sent_id': 4, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2506': {'model': 'm1', 'sent_id': 5, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2509': {'model': 'm1', 'sent_id': 6, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2512': {'model': 'm2', 'sent_id': 7, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2515': {'model': 'm2', 'sent_id': 8, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2518': {'model': 'm3', 'sent_id': 9, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2521': {'model': 'm1', 'sent_id': 1, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2524': {'model': 'm1', 'sent_id': 10, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2527': {'model': 'm2', 'sent_id': 11, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2530': {'model': 'm2', 'sent_id': 12, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2533': {'model': 'm1', 'sent_id': 13, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2536': {'model': 'm1', 'sent_id': 14, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2539': {'model': 'm3', 'sent_id': 15, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2542': {'model': 'm3', 'sent_id': 16, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2545': {'model': 'm1', 'sent_id': 17, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2548': {'model': 'm2', 'sent_id': 18, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2551': {'model': 'm3', 'sent_id': 19, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2554': {'model': 'm3', 'sent_id': 2, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2557': {'model': 'm3', 'sent_id': 20, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2560': {'model': 'm3', 'sent_id': 21, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2563': {'model': 'm3', 'sent_id': 22, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2566': {'model': 'm2', 'sent_id': 23, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2569': {'model': 'm2', 'sent_id': 24, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2572': {'model': 'm3', 'sent_id': 25, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2575': {'model': 'm2', 'sent_id': 26, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2578': {'model': 'm1', 'sent_id': 27, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2581': {'model': 'm1', 'sent_id': 28, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2584': {'model': 'm3', 'sent_id': 29, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2587': {'model': 'm2', 'sent_id': 3, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2590': {'model': 'm2', 'sent_id': 30, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2593': {'model': 'm3', 'sent_id': 4, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2596': {'model': 'm3', 'sent_id': 5, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2599': {'model': 'm1', 'sent_id': 6, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2602': {'model': 'm2', 'sent_id': 7, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2605': {'model': 'm2', 'sent_id': 8, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2608': {'model': 'm3', 'sent_id': 9, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2611': {'model': 'm1', 'sent_id': 1, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2614': {'model': 'm2', 'sent_id': 10, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2617': {'model': 'm2', 'sent_id': 11, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2620': {'model': 'm2', 'sent_id': 12, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2623': {'model': 'm1', 'sent_id': 13, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2626': {'model': 'm2', 'sent_id': 14, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2629': {'model': 'm3', 'sent_id': 15, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2632': {'model': 'm2', 'sent_id': 16, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2635': {'model': 'm2', 'sent_id': 17, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2638': {'model': 'm1', 'sent_id': 18, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2641': {'model': 'm2', 'sent_id': 19, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2644': {'model': 'm1', 'sent_id': 2, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2647': {'model': 'm2', 'sent_id': 20, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2650': {'model': 'm3', 'sent_id': 21, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2653': {'model': 'm1', 'sent_id': 22, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2656': {'model': 'm2', 'sent_id': 23, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2659': {'model': 'm3', 'sent_id': 24, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2662': {'model': 'm3', 'sent_id': 25, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2665': {'model': 'm1', 'sent_id': 26, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2668': {'model': 'm2', 'sent_id': 27, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2671': {'model': 'm2', 'sent_id': 28, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2674': {'model': 'm3', 'sent_id': 29, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2677': {'model': 'm1', 'sent_id': 3, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2680': {'model': 'm3', 'sent_id': 30, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2683': {'model': 'm2', 'sent_id': 4, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2686': {'model': 'm1', 'sent_id': 5, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2689': {'model': 'm1', 'sent_id': 6, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2692': {'model': 'm2', 'sent_id': 7, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2695': {'model': 'm2', 'sent_id': 8, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2698': {'model': 'm1', 'sent_id': 9, 'speaker': '0016', 'accent': None},\n",
+ " 'id_2701': {'model': 'm1', 'sent_id': 1, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2704': {'model': 'm2', 'sent_id': 10, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2707': {'model': 'm3', 'sent_id': 11, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2710': {'model': 'm1', 'sent_id': 12, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2713': {'model': 'm1', 'sent_id': 13, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2716': {'model': 'm3', 'sent_id': 14, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2719': {'model': 'm3', 'sent_id': 15, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2722': {'model': 'm3', 'sent_id': 16, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2725': {'model': 'm2', 'sent_id': 17, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2728': {'model': 'm3', 'sent_id': 18, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2731': {'model': 'm2', 'sent_id': 19, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2734': {'model': 'm1', 'sent_id': 2, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2737': {'model': 'm3', 'sent_id': 20, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2740': {'model': 'm3', 'sent_id': 21, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2743': {'model': 'm1', 'sent_id': 22, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2746': {'model': 'm3', 'sent_id': 23, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2749': {'model': 'm2', 'sent_id': 24, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2752': {'model': 'm3', 'sent_id': 25, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2755': {'model': 'm3', 'sent_id': 26, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2758': {'model': 'm3', 'sent_id': 27, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2761': {'model': 'm2', 'sent_id': 28, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2764': {'model': 'm1', 'sent_id': 29, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2767': {'model': 'm3', 'sent_id': 3, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2770': {'model': 'm3', 'sent_id': 30, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2773': {'model': 'm2', 'sent_id': 4, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2776': {'model': 'm1', 'sent_id': 5, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2779': {'model': 'm3', 'sent_id': 6, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2782': {'model': 'm2', 'sent_id': 7, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2785': {'model': 'm1', 'sent_id': 8, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2788': {'model': 'm2', 'sent_id': 9, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2791': {'model': 'm1', 'sent_id': 1, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2794': {'model': 'm3', 'sent_id': 10, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2797': {'model': 'm1', 'sent_id': 11, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2800': {'model': 'm2', 'sent_id': 12, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2803': {'model': 'm1', 'sent_id': 13, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2806': {'model': 'm3', 'sent_id': 14, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2809': {'model': 'm3', 'sent_id': 15, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2812': {'model': 'm1', 'sent_id': 16, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2815': {'model': 'm1', 'sent_id': 17, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2818': {'model': 'm1', 'sent_id': 18, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2821': {'model': 'm1', 'sent_id': 19, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2824': {'model': 'm3', 'sent_id': 2, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2827': {'model': 'm2', 'sent_id': 20, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2830': {'model': 'm2', 'sent_id': 21, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2833': {'model': 'm3', 'sent_id': 22, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2836': {'model': 'm2', 'sent_id': 23, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2839': {'model': 'm2', 'sent_id': 24, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2842': {'model': 'm3', 'sent_id': 25, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2845': {'model': 'm2', 'sent_id': 26, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2848': {'model': 'm2', 'sent_id': 27, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2851': {'model': 'm1', 'sent_id': 28, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2854': {'model': 'm3', 'sent_id': 29, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2857': {'model': 'm1', 'sent_id': 3, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2860': {'model': 'm3', 'sent_id': 30, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2863': {'model': 'm1', 'sent_id': 4, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2866': {'model': 'm2', 'sent_id': 5, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2869': {'model': 'm3', 'sent_id': 6, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2872': {'model': 'm2', 'sent_id': 7, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2875': {'model': 'm1', 'sent_id': 8, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2878': {'model': 'm2', 'sent_id': 9, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2881': {'model': 'm1', 'sent_id': 1, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2884': {'model': 'm2', 'sent_id': 10, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2887': {'model': 'm1', 'sent_id': 11, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2890': {'model': 'm3', 'sent_id': 12, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2893': {'model': 'm3', 'sent_id': 13, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2896': {'model': 'm3', 'sent_id': 14, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2899': {'model': 'm3', 'sent_id': 15, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2902': {'model': 'm1', 'sent_id': 16, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2905': {'model': 'm2', 'sent_id': 17, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2908': {'model': 'm3', 'sent_id': 18, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2911': {'model': 'm2', 'sent_id': 19, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2914': {'model': 'm3', 'sent_id': 2, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2917': {'model': 'm2', 'sent_id': 20, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2920': {'model': 'm2', 'sent_id': 21, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2923': {'model': 'm1', 'sent_id': 22, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2926': {'model': 'm2', 'sent_id': 23, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2929': {'model': 'm2', 'sent_id': 24, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2932': {'model': 'm3', 'sent_id': 25, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2935': {'model': 'm3', 'sent_id': 26, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2938': {'model': 'm2', 'sent_id': 27, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2941': {'model': 'm3', 'sent_id': 28, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2944': {'model': 'm1', 'sent_id': 29, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2947': {'model': 'm1', 'sent_id': 3, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2950': {'model': 'm2', 'sent_id': 30, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2953': {'model': 'm1', 'sent_id': 4, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2956': {'model': 'm3', 'sent_id': 5, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2959': {'model': 'm3', 'sent_id': 6, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2962': {'model': 'm3', 'sent_id': 7, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2965': {'model': 'm2', 'sent_id': 8, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2968': {'model': 'm2', 'sent_id': 9, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2971': {'model': 'm1', 'sent_id': 1, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2974': {'model': 'm3', 'sent_id': 10, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2977': {'model': 'm3', 'sent_id': 11, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2980': {'model': 'm2', 'sent_id': 12, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2983': {'model': 'm3', 'sent_id': 13, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2986': {'model': 'm3', 'sent_id': 14, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2989': {'model': 'm1', 'sent_id': 15, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2992': {'model': 'm1', 'sent_id': 16, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2995': {'model': 'm1', 'sent_id': 17, 'speaker': '0017', 'accent': None},\n",
+ " 'id_2998': {'model': 'm1', 'sent_id': 18, 'speaker': '0017', 'accent': None},\n",
+ " ...}"
+ ]
+ },
+ "execution_count": 14,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "meta = {}\n",
+ "\n",
+ "for model_ in folder2model.values():\n",
+ " meta.update(\n",
+ " dict(zip(df_detailed[model_].iloc[x_indices], df_detailed[model_].iloc[y_indices]))\n",
+ " )\n",
+ "\n",
+ "meta"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 15,
+ "id": "cd459e48-9aa1-4f8d-bad3-17e55340344a",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "assert(len(meta) == total_K_models*total_wavs_per_model)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 16,
+ "id": "bef6f710-8aa1-4422-b5c4-711497388ec9",
+ "metadata": {
+ "scrolled": true,
+ "tags": []
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'id_1': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_4': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_7': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_10': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_13': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_16': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_19': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_22': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_25': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_28': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_31': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_34': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_37': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_40': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_43': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_46': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_49': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_52': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_55': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_58': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_61': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_64': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_67': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_70': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_73': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_76': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_79': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_82': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_85': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_88': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_91': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_94': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_97': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_100': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_103': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_106': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_109': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_112': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_115': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_118': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_121': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_124': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_127': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_130': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_133': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_136': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_139': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_142': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_145': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_148': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_151': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_154': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_157': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_160': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_163': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_166': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_169': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_172': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_175': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_178': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_181': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_184': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_187': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_190': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_193': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_196': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_199': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_202': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_205': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_208': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_211': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_214': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_217': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_220': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_223': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_226': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_229': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_232': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_235': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_238': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_241': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_244': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_247': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_250': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_253': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_256': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_259': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_262': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_265': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_268': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_271': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_274': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_277': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_280': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_283': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_286': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_289': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_292': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_295': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_298': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_301': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_304': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_307': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_310': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_313': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_316': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_319': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_322': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_325': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_328': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_331': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_334': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_337': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_340': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_343': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_346': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_349': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_352': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_355': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_358': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_361': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_364': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_367': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_370': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_373': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_376': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_379': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_382': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_385': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_388': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_391': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_394': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_397': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_400': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_403': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_406': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_409': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_412': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_415': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_418': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_421': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_424': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_427': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_430': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_433': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_436': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_439': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_442': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_445': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_448': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_451': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_454': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_457': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_460': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_463': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_466': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_469': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_472': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_475': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_478': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_481': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_484': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_487': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_490': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_493': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_496': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_499': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_502': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_505': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_508': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_511': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_514': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_517': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_520': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_523': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_526': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_529': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_532': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_535': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_538': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_541': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_544': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_547': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_550': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_553': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_556': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_559': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_562': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_565': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_568': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_571': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_574': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_577': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_580': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_583': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_586': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_589': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_592': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_595': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_598': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_601': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_604': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_607': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_610': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_613': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_616': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_619': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_622': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_625': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_628': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_631': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_634': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_637': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_640': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_643': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_646': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_649': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_652': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_655': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_658': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_661': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_664': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_667': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_670': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_673': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_676': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_679': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_682': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_685': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_688': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_691': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_694': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_697': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_700': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_703': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_706': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_709': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_712': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_715': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_718': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_721': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_724': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_727': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_730': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_733': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_736': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_739': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_742': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_745': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_748': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_751': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_754': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_757': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_760': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_763': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_766': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_769': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_772': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_775': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_778': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_781': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_784': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_787': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_790': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_793': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_796': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_799': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_802': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_805': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_808': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_811': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_814': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_817': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_820': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_823': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_826': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_829': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_832': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_835': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_838': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_841': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_844': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_847': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_850': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_853': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_856': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_859': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_862': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_865': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_868': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_871': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_874': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_877': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_880': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_883': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_886': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_889': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_892': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_895': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_898': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_901': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_904': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_907': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_910': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_913': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_916': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_919': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_922': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_925': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_928': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_931': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_934': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_937': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_940': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_943': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_946': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_949': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_952': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_955': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_958': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_961': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_964': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_967': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_970': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_973': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_976': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_979': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_982': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_985': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_988': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_991': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_994': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_997': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_1000': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_1003': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_1006': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_1009': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_1012': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_1015': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_1018': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_1021': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_1024': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_1027': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_1030': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_1033': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_1036': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_1039': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_1042': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_1045': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_1048': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_1051': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_1054': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_1057': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_1060': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_1063': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_1066': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_1069': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_1072': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_1075': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_1078': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_1081': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_1084': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_1087': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_1090': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_1093': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_1096': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_1099': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_1102': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_1105': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_1108': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_1111': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_1114': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_1117': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_1120': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_1123': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_1126': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_1129': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_1132': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_1135': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_1138': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_1141': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_1144': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_1147': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_1150': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_1153': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_1156': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_1159': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_1162': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_1165': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_1168': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_1171': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_1174': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_1177': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_1180': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_1183': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_1186': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_1189': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_1192': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_1195': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_1198': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_1201': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_1204': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_1207': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_1210': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_1213': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_1216': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_1219': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_1222': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_1225': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_1228': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_1231': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_1234': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_1237': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_1240': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_1243': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_1246': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_1249': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_1252': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_1255': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_1258': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_1261': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_1264': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_1267': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_1270': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_1273': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_1276': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_1279': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_1282': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_1285': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_1288': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_1291': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_1294': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_1297': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_1300': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_1303': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_1306': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_1309': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_1312': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_1315': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_1318': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_1321': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_1324': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_1327': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_1330': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_1333': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_1336': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_1339': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_1342': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_1345': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_1348': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_1351': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_1354': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_1357': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_1360': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_1363': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_1366': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_1369': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_1372': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_1375': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_1378': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_1381': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_1384': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_1387': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_1390': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_1393': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_1396': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_1399': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_1402': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_1405': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_1408': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_1411': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_1414': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_1417': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_1420': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_1423': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_1426': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_1429': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_1432': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_1435': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_1438': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_1441': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_1444': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_1447': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_1450': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_1453': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_1456': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_1459': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_1462': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_1465': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_1468': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_1471': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_1474': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_1477': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_1480': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_1483': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_1486': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_1489': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_1492': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_1495': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_1498': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_1501': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_1504': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_1507': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_1510': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_1513': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_1516': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_1519': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_1522': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_1525': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_1528': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_1531': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_1534': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_1537': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_1540': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_1543': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_1546': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_1549': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_1552': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_1555': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_1558': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_1561': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_1564': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_1567': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_1570': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_1573': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_1576': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_1579': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_1582': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_1585': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_1588': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_1591': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_1594': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_1597': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_1600': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_1603': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_1606': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_1609': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_1612': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_1615': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_1618': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_1621': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_1624': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_1627': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_1630': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_1633': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_1636': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_1639': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_1642': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_1645': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_1648': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_1651': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_1654': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_1657': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_1660': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_1663': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_1666': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_1669': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_1672': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_1675': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_1678': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_1681': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_1684': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_1687': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_1690': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_1693': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_1696': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_1699': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_1702': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_1705': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_1708': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_1711': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_1714': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_1717': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_1720': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_1723': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_1726': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_1729': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_1732': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_1735': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_1738': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_1741': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_1744': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_1747': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_1750': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_1753': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_1756': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_1759': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_1762': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_1765': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_1768': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_1771': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_1774': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_1777': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_1780': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_1783': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_1786': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_1789': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_1792': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_1795': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_1798': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_1801': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_1804': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_1807': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_1810': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_1813': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_1816': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_1819': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_1822': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_1825': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_1828': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_1831': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_1834': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_1837': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_1840': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_1843': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_1846': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_1849': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_1852': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_1855': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_1858': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_1861': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_1864': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_1867': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_1870': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_1873': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_1876': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_1879': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_1882': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_1885': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_1888': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_1891': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_1894': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_1897': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_1900': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_1903': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_1906': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_1909': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_1912': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_1915': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_1918': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_1921': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_1924': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_1927': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_1930': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_1933': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_1936': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_1939': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_1942': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_1945': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_1948': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_1951': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_1954': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_1957': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_1960': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_1963': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_1966': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_1969': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_1972': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_1975': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_1978': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_1981': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_1984': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_1987': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_1990': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_1993': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_1996': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_1999': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_2002': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_2005': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_2008': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_2011': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_2014': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_2017': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_2020': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_2023': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_2026': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_2029': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_2032': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_2035': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_2038': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_2041': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_2044': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_2047': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_2050': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_2053': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_2056': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_2059': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_2062': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_2065': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_2068': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_2071': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_2074': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_2077': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_2080': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_2083': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_2086': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_2089': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_2092': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_2095': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_2098': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_2101': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_2104': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_2107': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_2110': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_2113': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_2116': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_2119': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_2122': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_2125': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_2128': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_2131': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_2134': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_2137': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_2140': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_2143': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_2146': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_2149': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_2152': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_2155': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_2158': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_2161': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_2164': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_2167': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_2170': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_2173': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_2176': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_2179': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_2182': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_2185': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_2188': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_2191': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_2194': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_2197': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_2200': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_2203': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_2206': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_2209': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_2212': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_2215': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_2218': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_2221': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_2224': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_2227': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_2230': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_2233': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_2236': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_2239': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_2242': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_2245': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_2248': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_2251': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_2254': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_2257': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_2260': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_2263': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_2266': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_2269': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_2272': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_2275': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_2278': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_2281': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_2284': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_2287': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_2290': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_2293': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_2296': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_2299': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_2302': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_2305': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_2308': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_2311': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_2314': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_2317': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_2320': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_2323': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_2326': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_2329': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_2332': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_2335': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_2338': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_2341': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_2344': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_2347': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_2350': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_2353': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_2356': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_2359': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_2362': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_2365': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_2368': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_2371': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_2374': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_2377': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_2380': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_2383': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_2386': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_2389': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_2392': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_2395': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_2398': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_2401': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_2404': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_2407': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_2410': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_2413': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_2416': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_2419': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_2422': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_2425': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_2428': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_2431': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_2434': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_2437': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_2440': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_2443': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_2446': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_2449': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_2452': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_2455': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_2458': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_2461': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_2464': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_2467': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_2470': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_2473': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_2476': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_2479': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_2482': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_2485': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_2488': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_2491': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_2494': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_2497': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_2500': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_2503': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_2506': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_2509': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_2512': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_2515': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_2518': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_2521': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_2524': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_2527': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_2530': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_2533': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_2536': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_2539': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_2542': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_2545': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_2548': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_2551': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_2554': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_2557': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_2560': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_2563': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_2566': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_2569': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_2572': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_2575': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_2578': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_2581': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_2584': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_2587': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_2590': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_2593': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_2596': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_2599': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_2602': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_2605': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_2608': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_2611': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_2614': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_2617': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_2620': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_2623': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_2626': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_2629': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_2632': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_2635': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_2638': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_2641': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_2644': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_2647': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_2650': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_2653': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_2656': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_2659': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_2662': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_2665': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_2668': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_2671': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_2674': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_2677': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_2680': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_2683': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_2686': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_2689': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_2692': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_2695': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_2698': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_2701': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_2704': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_2707': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_2710': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_2713': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_2716': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_2719': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_2722': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_2725': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_2728': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_2731': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_2734': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_2737': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_2740': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_2743': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_2746': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_2749': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_2752': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_2755': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_2758': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_2761': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_2764': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_2767': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_2770': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_2773': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_2776': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_2779': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_2782': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_2785': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_2788': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_2791': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_2794': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_2797': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_2800': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_2803': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_2806': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_2809': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_2812': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_2815': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_2818': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_2821': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_2824': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_2827': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_2830': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_2833': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_2836': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_2839': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_2842': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_2845': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_2848': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_2851': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_2854': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_2857': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_2860': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_2863': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_2866': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_2869': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_2872': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_2875': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_2878': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_2881': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_2884': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_2887': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_2890': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_2893': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_2896': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_2899': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_2902': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_2905': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_2908': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " 'id_2911': {'text': 'Luckily, this kind of collapse is relatively infrequent.'},\n",
+ " 'id_2914': {'text': 'Fifty yards ahead of her were the first of the rocks .'},\n",
+ " 'id_2917': {'text': 'Was it using language that caused their brains to develop?'},\n",
+ " 'id_2920': {'text': 'If everyone followed a similar plan, the results would be impressive.'},\n",
+ " 'id_2923': {'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.'},\n",
+ " 'id_2926': {'text': 'For more than two hundred years the pessimists have been winning the public debate.'},\n",
+ " 'id_2929': {'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\"},\n",
+ " 'id_2932': {'text': 'Young people want to feel supported and appreciated by their company and their superiors.'},\n",
+ " 'id_2935': {'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.'},\n",
+ " 'id_2938': {'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.'},\n",
+ " 'id_2941': {'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.'},\n",
+ " 'id_2944': {'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.'},\n",
+ " 'id_2947': {'text': 'It seemed the ordained order of things that dogs should work .'},\n",
+ " 'id_2950': {'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'},\n",
+ " 'id_2953': {'text': 'The journey was continued at dawn .'},\n",
+ " 'id_2956': {'text': 'Was it the rendezvous of those who were striving to work his ruin .'},\n",
+ " 'id_2959': {'text': 'A dead man is of no use on a plantation .'},\n",
+ " 'id_2962': {'text': 'The Claudine was leaving next morning for Honolulu .'},\n",
+ " 'id_2965': {'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.'},\n",
+ " 'id_2968': {'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.'},\n",
+ " 'id_2971': {'text': 'We got few vegetables and fruits , and became fish eaters .'},\n",
+ " 'id_2974': {'text': 'Humans also judge distance by using the relative sizes of objects.'},\n",
+ " 'id_2977': {'text': 'If this is true then those who tend to think creatively, really are somehow different.'},\n",
+ " 'id_2980': {'text': 'But really in the grand scheme of things, this information is insignificant.'},\n",
+ " 'id_2983': {'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.'},\n",
+ " 'id_2986': {'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.'},\n",
+ " 'id_2989': {'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.'},\n",
+ " 'id_2992': {'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\"},\n",
+ " 'id_2995': {'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!'},\n",
+ " 'id_2998': {'text': 'Earthquakes damage all structures, including bridges.'},\n",
+ " ...}"
+ ]
+ },
+ "execution_count": 16,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "sentences = {}\n",
+ "\n",
+ "for model_ in folder2model.values():\n",
+ " sentences.update(\n",
+ " dict(zip(df_detailed[model_].iloc[x_indices], df_detailed['text_left'].iloc[y_indices]))\n",
+ " )\n",
+ "\n",
+ "for k, v in sentences.items():\n",
+ " sentences[k] = {'text': v}\n",
+ "\n",
+ "sentences"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 17,
+ "id": "d6d927dd-c249-47e1-836c-fc6951d1dffd",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " Unnamed: 0 | \n",
+ " m1_text | \n",
+ " m1_accent_speaker | \n",
+ " m1 | \n",
+ " m2 | \n",
+ " m3 | \n",
+ " m2_text | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " | 0 | \n",
+ " 0 | \n",
+ " - | \n",
+ " - | \n",
+ " id_1 | \n",
+ " id_2 | \n",
+ " id_3 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | 1 | \n",
+ " 1 | \n",
+ " We got few vegetables and fruits , and became fish eaters . | \n",
+ " 0011 | \n",
+ " 2 | \n",
+ " 2 | \n",
+ " 1 | \n",
+ " We got few vegetables and fruits , and became fish eaters . | \n",
+ "
\n",
+ " \n",
+ " | 2 | \n",
+ " 2 | \n",
+ " - | \n",
+ " - | \n",
+ " id_4 | \n",
+ " id_5 | \n",
+ " id_6 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | 3 | \n",
+ " 3 | \n",
+ " Humans also judge distance by using the relative sizes of objects. | \n",
+ " 0011 | \n",
+ " 3 | \n",
+ " 3 | \n",
+ " 3 | \n",
+ " Humans also judge distance by using the relative sizes of objects. | \n",
+ "
\n",
+ " \n",
+ " | 4 | \n",
+ " 4 | \n",
+ " - | \n",
+ " - | \n",
+ " id_7 | \n",
+ " id_8 | \n",
+ " id_9 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ " ... | \n",
+ "
\n",
+ " \n",
+ " | 2695 | \n",
+ " 2695 | \n",
+ " The Claudine was leaving next morning for Honolulu . | \n",
+ " 0020 | \n",
+ " 2 | \n",
+ " 2 | \n",
+ " 3 | \n",
+ " The Claudine was leaving next morning for Honolulu . | \n",
+ "
\n",
+ " \n",
+ " | 2696 | \n",
+ " 2696 | \n",
+ " - | \n",
+ " - | \n",
+ " id_4045 | \n",
+ " id_4046 | \n",
+ " id_4047 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | 2697 | \n",
+ " 2697 | \n",
+ " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ " 0020 | \n",
+ " 1 | \n",
+ " 2 | \n",
+ " 3 | \n",
+ " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ "
\n",
+ " \n",
+ " | 2698 | \n",
+ " 2698 | \n",
+ " - | \n",
+ " - | \n",
+ " id_4048 | \n",
+ " id_4049 | \n",
+ " id_4050 | \n",
+ " - | \n",
+ "
\n",
+ " \n",
+ " | 2699 | \n",
+ " 2699 | \n",
+ " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ " 0020 | \n",
+ " 1 | \n",
+ " 1 | \n",
+ " 2 | \n",
+ " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
2700 rows × 7 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " Unnamed: 0 \\\n",
+ "0 0 \n",
+ "1 1 \n",
+ "2 2 \n",
+ "3 3 \n",
+ "4 4 \n",
+ "... ... \n",
+ "2695 2695 \n",
+ "2696 2696 \n",
+ "2697 2697 \n",
+ "2698 2698 \n",
+ "2699 2699 \n",
+ "\n",
+ " m1_text \\\n",
+ "0 - \n",
+ "1 We got few vegetables and fruits , and became fish eaters . \n",
+ "2 - \n",
+ "3 Humans also judge distance by using the relative sizes of objects. \n",
+ "4 - \n",
+ "... ... \n",
+ "2695 The Claudine was leaving next morning for Honolulu . \n",
+ "2696 - \n",
+ "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
+ "2698 - \n",
+ "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ "\n",
+ " m1_accent_speaker m1 m2 m3 \\\n",
+ "0 - id_1 id_2 id_3 \n",
+ "1 0011 2 2 1 \n",
+ "2 - id_4 id_5 id_6 \n",
+ "3 0011 3 3 3 \n",
+ "4 - id_7 id_8 id_9 \n",
+ "... ... ... ... ... \n",
+ "2695 0020 2 2 3 \n",
+ "2696 - id_4045 id_4046 id_4047 \n",
+ "2697 0020 1 2 3 \n",
+ "2698 - id_4048 id_4049 id_4050 \n",
+ "2699 0020 1 1 2 \n",
+ "\n",
+ " m2_text \n",
+ "0 - \n",
+ "1 We got few vegetables and fruits , and became fish eaters . \n",
+ "2 - \n",
+ "3 Humans also judge distance by using the relative sizes of objects. \n",
+ "4 - \n",
+ "... ... \n",
+ "2695 The Claudine was leaving next morning for Honolulu . \n",
+ "2696 - \n",
+ "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
+ "2698 - \n",
+ "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ "\n",
+ "[2700 rows x 7 columns]"
+ ]
+ },
+ "execution_count": 17,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "def fillna_with_random_scores(df):\n",
+ " val_range = [1, 2, 3]\n",
+ " ranval_array = np.random.choice(val_range, size=(df.shape[0], df.shape[1]))\n",
+ " ranval_df = pd.DataFrame(ranval_array, columns=df.columns, index=df.index)\n",
+ " return df.fillna(ranval_df)\n",
+ "\n",
+ "\n",
+ "df_scores = pd.read_excel(SCORES_PATH)\n",
+ "df_scores = fillna_with_random_scores(df_scores) # If scores are unfilled\n",
+ "df_scores"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 18,
+ "id": "31e816a7-214b-479a-bdb7-d2d6652f135e",
+ "metadata": {
+ "scrolled": true,
+ "tags": []
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'id_1': {'nmistakes': 2},\n",
+ " 'id_4': {'nmistakes': 3},\n",
+ " 'id_7': {'nmistakes': 3},\n",
+ " 'id_10': {'nmistakes': 3},\n",
+ " 'id_13': {'nmistakes': 2},\n",
+ " 'id_16': {'nmistakes': 3},\n",
+ " 'id_19': {'nmistakes': 1},\n",
+ " 'id_22': {'nmistakes': 2},\n",
+ " 'id_25': {'nmistakes': 3},\n",
+ " 'id_28': {'nmistakes': 2},\n",
+ " 'id_31': {'nmistakes': 3},\n",
+ " 'id_34': {'nmistakes': 1},\n",
+ " 'id_37': {'nmistakes': 2},\n",
+ " 'id_40': {'nmistakes': 2},\n",
+ " 'id_43': {'nmistakes': 3},\n",
+ " 'id_46': {'nmistakes': 3},\n",
+ " 'id_49': {'nmistakes': 1},\n",
+ " 'id_52': {'nmistakes': 1},\n",
+ " 'id_55': {'nmistakes': 2},\n",
+ " 'id_58': {'nmistakes': 2},\n",
+ " 'id_61': {'nmistakes': 2},\n",
+ " 'id_64': {'nmistakes': 1},\n",
+ " 'id_67': {'nmistakes': 3},\n",
+ " 'id_70': {'nmistakes': 3},\n",
+ " 'id_73': {'nmistakes': 3},\n",
+ " 'id_76': {'nmistakes': 1},\n",
+ " 'id_79': {'nmistakes': 2},\n",
+ " 'id_82': {'nmistakes': 1},\n",
+ " 'id_85': {'nmistakes': 2},\n",
+ " 'id_88': {'nmistakes': 2},\n",
+ " 'id_91': {'nmistakes': 2},\n",
+ " 'id_94': {'nmistakes': 1},\n",
+ " 'id_97': {'nmistakes': 1},\n",
+ " 'id_100': {'nmistakes': 2},\n",
+ " 'id_103': {'nmistakes': 2},\n",
+ " 'id_106': {'nmistakes': 3},\n",
+ " 'id_109': {'nmistakes': 2},\n",
+ " 'id_112': {'nmistakes': 2},\n",
+ " 'id_115': {'nmistakes': 1},\n",
+ " 'id_118': {'nmistakes': 1},\n",
+ " 'id_121': {'nmistakes': 1},\n",
+ " 'id_124': {'nmistakes': 1},\n",
+ " 'id_127': {'nmistakes': 2},\n",
+ " 'id_130': {'nmistakes': 3},\n",
+ " 'id_133': {'nmistakes': 1},\n",
+ " 'id_136': {'nmistakes': 1},\n",
+ " 'id_139': {'nmistakes': 1},\n",
+ " 'id_142': {'nmistakes': 1},\n",
+ " 'id_145': {'nmistakes': 3},\n",
+ " 'id_148': {'nmistakes': 3},\n",
+ " 'id_151': {'nmistakes': 3},\n",
+ " 'id_154': {'nmistakes': 2},\n",
+ " 'id_157': {'nmistakes': 1},\n",
+ " 'id_160': {'nmistakes': 2},\n",
+ " 'id_163': {'nmistakes': 3},\n",
+ " 'id_166': {'nmistakes': 3},\n",
+ " 'id_169': {'nmistakes': 1},\n",
+ " 'id_172': {'nmistakes': 1},\n",
+ " 'id_175': {'nmistakes': 1},\n",
+ " 'id_178': {'nmistakes': 2},\n",
+ " 'id_181': {'nmistakes': 3},\n",
+ " 'id_184': {'nmistakes': 2},\n",
+ " 'id_187': {'nmistakes': 1},\n",
+ " 'id_190': {'nmistakes': 2},\n",
+ " 'id_193': {'nmistakes': 1},\n",
+ " 'id_196': {'nmistakes': 1},\n",
+ " 'id_199': {'nmistakes': 3},\n",
+ " 'id_202': {'nmistakes': 1},\n",
+ " 'id_205': {'nmistakes': 2},\n",
+ " 'id_208': {'nmistakes': 3},\n",
+ " 'id_211': {'nmistakes': 2},\n",
+ " 'id_214': {'nmistakes': 1},\n",
+ " 'id_217': {'nmistakes': 3},\n",
+ " 'id_220': {'nmistakes': 1},\n",
+ " 'id_223': {'nmistakes': 2},\n",
+ " 'id_226': {'nmistakes': 1},\n",
+ " 'id_229': {'nmistakes': 3},\n",
+ " 'id_232': {'nmistakes': 1},\n",
+ " 'id_235': {'nmistakes': 1},\n",
+ " 'id_238': {'nmistakes': 3},\n",
+ " 'id_241': {'nmistakes': 3},\n",
+ " 'id_244': {'nmistakes': 2},\n",
+ " 'id_247': {'nmistakes': 1},\n",
+ " 'id_250': {'nmistakes': 2},\n",
+ " 'id_253': {'nmistakes': 1},\n",
+ " 'id_256': {'nmistakes': 1},\n",
+ " 'id_259': {'nmistakes': 1},\n",
+ " 'id_262': {'nmistakes': 1},\n",
+ " 'id_265': {'nmistakes': 2},\n",
+ " 'id_268': {'nmistakes': 1},\n",
+ " 'id_271': {'nmistakes': 2},\n",
+ " 'id_274': {'nmistakes': 1},\n",
+ " 'id_277': {'nmistakes': 1},\n",
+ " 'id_280': {'nmistakes': 3},\n",
+ " 'id_283': {'nmistakes': 3},\n",
+ " 'id_286': {'nmistakes': 2},\n",
+ " 'id_289': {'nmistakes': 1},\n",
+ " 'id_292': {'nmistakes': 2},\n",
+ " 'id_295': {'nmistakes': 2},\n",
+ " 'id_298': {'nmistakes': 1},\n",
+ " 'id_301': {'nmistakes': 2},\n",
+ " 'id_304': {'nmistakes': 3},\n",
+ " 'id_307': {'nmistakes': 1},\n",
+ " 'id_310': {'nmistakes': 3},\n",
+ " 'id_313': {'nmistakes': 3},\n",
+ " 'id_316': {'nmistakes': 1},\n",
+ " 'id_319': {'nmistakes': 3},\n",
+ " 'id_322': {'nmistakes': 3},\n",
+ " 'id_325': {'nmistakes': 3},\n",
+ " 'id_328': {'nmistakes': 1},\n",
+ " 'id_331': {'nmistakes': 1},\n",
+ " 'id_334': {'nmistakes': 3},\n",
+ " 'id_337': {'nmistakes': 2},\n",
+ " 'id_340': {'nmistakes': 1},\n",
+ " 'id_343': {'nmistakes': 1},\n",
+ " 'id_346': {'nmistakes': 3},\n",
+ " 'id_349': {'nmistakes': 2},\n",
+ " 'id_352': {'nmistakes': 1},\n",
+ " 'id_355': {'nmistakes': 2},\n",
+ " 'id_358': {'nmistakes': 3},\n",
+ " 'id_361': {'nmistakes': 3},\n",
+ " 'id_364': {'nmistakes': 3},\n",
+ " 'id_367': {'nmistakes': 2},\n",
+ " 'id_370': {'nmistakes': 3},\n",
+ " 'id_373': {'nmistakes': 3},\n",
+ " 'id_376': {'nmistakes': 3},\n",
+ " 'id_379': {'nmistakes': 3},\n",
+ " 'id_382': {'nmistakes': 1},\n",
+ " 'id_385': {'nmistakes': 1},\n",
+ " 'id_388': {'nmistakes': 1},\n",
+ " 'id_391': {'nmistakes': 2},\n",
+ " 'id_394': {'nmistakes': 2},\n",
+ " 'id_397': {'nmistakes': 1},\n",
+ " 'id_400': {'nmistakes': 1},\n",
+ " 'id_403': {'nmistakes': 2},\n",
+ " 'id_406': {'nmistakes': 1},\n",
+ " 'id_409': {'nmistakes': 3},\n",
+ " 'id_412': {'nmistakes': 2},\n",
+ " 'id_415': {'nmistakes': 2},\n",
+ " 'id_418': {'nmistakes': 3},\n",
+ " 'id_421': {'nmistakes': 3},\n",
+ " 'id_424': {'nmistakes': 1},\n",
+ " 'id_427': {'nmistakes': 2},\n",
+ " 'id_430': {'nmistakes': 2},\n",
+ " 'id_433': {'nmistakes': 3},\n",
+ " 'id_436': {'nmistakes': 3},\n",
+ " 'id_439': {'nmistakes': 2},\n",
+ " 'id_442': {'nmistakes': 1},\n",
+ " 'id_445': {'nmistakes': 3},\n",
+ " 'id_448': {'nmistakes': 2},\n",
+ " 'id_451': {'nmistakes': 1},\n",
+ " 'id_454': {'nmistakes': 3},\n",
+ " 'id_457': {'nmistakes': 3},\n",
+ " 'id_460': {'nmistakes': 3},\n",
+ " 'id_463': {'nmistakes': 1},\n",
+ " 'id_466': {'nmistakes': 1},\n",
+ " 'id_469': {'nmistakes': 2},\n",
+ " 'id_472': {'nmistakes': 2},\n",
+ " 'id_475': {'nmistakes': 3},\n",
+ " 'id_478': {'nmistakes': 3},\n",
+ " 'id_481': {'nmistakes': 2},\n",
+ " 'id_484': {'nmistakes': 3},\n",
+ " 'id_487': {'nmistakes': 1},\n",
+ " 'id_490': {'nmistakes': 2},\n",
+ " 'id_493': {'nmistakes': 3},\n",
+ " 'id_496': {'nmistakes': 1},\n",
+ " 'id_499': {'nmistakes': 1},\n",
+ " 'id_502': {'nmistakes': 2},\n",
+ " 'id_505': {'nmistakes': 3},\n",
+ " 'id_508': {'nmistakes': 3},\n",
+ " 'id_511': {'nmistakes': 1},\n",
+ " 'id_514': {'nmistakes': 1},\n",
+ " 'id_517': {'nmistakes': 3},\n",
+ " 'id_520': {'nmistakes': 3},\n",
+ " 'id_523': {'nmistakes': 3},\n",
+ " 'id_526': {'nmistakes': 1},\n",
+ " 'id_529': {'nmistakes': 3},\n",
+ " 'id_532': {'nmistakes': 2},\n",
+ " 'id_535': {'nmistakes': 1},\n",
+ " 'id_538': {'nmistakes': 2},\n",
+ " 'id_541': {'nmistakes': 3},\n",
+ " 'id_544': {'nmistakes': 3},\n",
+ " 'id_547': {'nmistakes': 3},\n",
+ " 'id_550': {'nmistakes': 1},\n",
+ " 'id_553': {'nmistakes': 3},\n",
+ " 'id_556': {'nmistakes': 2},\n",
+ " 'id_559': {'nmistakes': 1},\n",
+ " 'id_562': {'nmistakes': 2},\n",
+ " 'id_565': {'nmistakes': 3},\n",
+ " 'id_568': {'nmistakes': 1},\n",
+ " 'id_571': {'nmistakes': 2},\n",
+ " 'id_574': {'nmistakes': 2},\n",
+ " 'id_577': {'nmistakes': 3},\n",
+ " 'id_580': {'nmistakes': 2},\n",
+ " 'id_583': {'nmistakes': 3},\n",
+ " 'id_586': {'nmistakes': 3},\n",
+ " 'id_589': {'nmistakes': 3},\n",
+ " 'id_592': {'nmistakes': 3},\n",
+ " 'id_595': {'nmistakes': 3},\n",
+ " 'id_598': {'nmistakes': 2},\n",
+ " 'id_601': {'nmistakes': 1},\n",
+ " 'id_604': {'nmistakes': 1},\n",
+ " 'id_607': {'nmistakes': 2},\n",
+ " 'id_610': {'nmistakes': 1},\n",
+ " 'id_613': {'nmistakes': 3},\n",
+ " 'id_616': {'nmistakes': 3},\n",
+ " 'id_619': {'nmistakes': 1},\n",
+ " 'id_622': {'nmistakes': 1},\n",
+ " 'id_625': {'nmistakes': 1},\n",
+ " 'id_628': {'nmistakes': 1},\n",
+ " 'id_631': {'nmistakes': 2},\n",
+ " 'id_634': {'nmistakes': 1},\n",
+ " 'id_637': {'nmistakes': 3},\n",
+ " 'id_640': {'nmistakes': 1},\n",
+ " 'id_643': {'nmistakes': 3},\n",
+ " 'id_646': {'nmistakes': 2},\n",
+ " 'id_649': {'nmistakes': 3},\n",
+ " 'id_652': {'nmistakes': 3},\n",
+ " 'id_655': {'nmistakes': 3},\n",
+ " 'id_658': {'nmistakes': 3},\n",
+ " 'id_661': {'nmistakes': 3},\n",
+ " 'id_664': {'nmistakes': 1},\n",
+ " 'id_667': {'nmistakes': 1},\n",
+ " 'id_670': {'nmistakes': 1},\n",
+ " 'id_673': {'nmistakes': 2},\n",
+ " 'id_676': {'nmistakes': 2},\n",
+ " 'id_679': {'nmistakes': 1},\n",
+ " 'id_682': {'nmistakes': 1},\n",
+ " 'id_685': {'nmistakes': 3},\n",
+ " 'id_688': {'nmistakes': 3},\n",
+ " 'id_691': {'nmistakes': 1},\n",
+ " 'id_694': {'nmistakes': 3},\n",
+ " 'id_697': {'nmistakes': 2},\n",
+ " 'id_700': {'nmistakes': 1},\n",
+ " 'id_703': {'nmistakes': 1},\n",
+ " 'id_706': {'nmistakes': 2},\n",
+ " 'id_709': {'nmistakes': 1},\n",
+ " 'id_712': {'nmistakes': 1},\n",
+ " 'id_715': {'nmistakes': 2},\n",
+ " 'id_718': {'nmistakes': 1},\n",
+ " 'id_721': {'nmistakes': 3},\n",
+ " 'id_724': {'nmistakes': 3},\n",
+ " 'id_727': {'nmistakes': 2},\n",
+ " 'id_730': {'nmistakes': 3},\n",
+ " 'id_733': {'nmistakes': 2},\n",
+ " 'id_736': {'nmistakes': 1},\n",
+ " 'id_739': {'nmistakes': 3},\n",
+ " 'id_742': {'nmistakes': 2},\n",
+ " 'id_745': {'nmistakes': 1},\n",
+ " 'id_748': {'nmistakes': 2},\n",
+ " 'id_751': {'nmistakes': 1},\n",
+ " 'id_754': {'nmistakes': 3},\n",
+ " 'id_757': {'nmistakes': 2},\n",
+ " 'id_760': {'nmistakes': 3},\n",
+ " 'id_763': {'nmistakes': 3},\n",
+ " 'id_766': {'nmistakes': 2},\n",
+ " 'id_769': {'nmistakes': 3},\n",
+ " 'id_772': {'nmistakes': 3},\n",
+ " 'id_775': {'nmistakes': 3},\n",
+ " 'id_778': {'nmistakes': 3},\n",
+ " 'id_781': {'nmistakes': 3},\n",
+ " 'id_784': {'nmistakes': 3},\n",
+ " 'id_787': {'nmistakes': 1},\n",
+ " 'id_790': {'nmistakes': 1},\n",
+ " 'id_793': {'nmistakes': 2},\n",
+ " 'id_796': {'nmistakes': 1},\n",
+ " 'id_799': {'nmistakes': 3},\n",
+ " 'id_802': {'nmistakes': 3},\n",
+ " 'id_805': {'nmistakes': 1},\n",
+ " 'id_808': {'nmistakes': 3},\n",
+ " 'id_811': {'nmistakes': 1},\n",
+ " 'id_814': {'nmistakes': 1},\n",
+ " 'id_817': {'nmistakes': 1},\n",
+ " 'id_820': {'nmistakes': 1},\n",
+ " 'id_823': {'nmistakes': 2},\n",
+ " 'id_826': {'nmistakes': 3},\n",
+ " 'id_829': {'nmistakes': 2},\n",
+ " 'id_832': {'nmistakes': 3},\n",
+ " 'id_835': {'nmistakes': 2},\n",
+ " 'id_838': {'nmistakes': 1},\n",
+ " 'id_841': {'nmistakes': 2},\n",
+ " 'id_844': {'nmistakes': 1},\n",
+ " 'id_847': {'nmistakes': 1},\n",
+ " 'id_850': {'nmistakes': 2},\n",
+ " 'id_853': {'nmistakes': 3},\n",
+ " 'id_856': {'nmistakes': 3},\n",
+ " 'id_859': {'nmistakes': 2},\n",
+ " 'id_862': {'nmistakes': 3},\n",
+ " 'id_865': {'nmistakes': 3},\n",
+ " 'id_868': {'nmistakes': 3},\n",
+ " 'id_871': {'nmistakes': 3},\n",
+ " 'id_874': {'nmistakes': 3},\n",
+ " 'id_877': {'nmistakes': 1},\n",
+ " 'id_880': {'nmistakes': 2},\n",
+ " 'id_883': {'nmistakes': 1},\n",
+ " 'id_886': {'nmistakes': 1},\n",
+ " 'id_889': {'nmistakes': 3},\n",
+ " 'id_892': {'nmistakes': 3},\n",
+ " 'id_895': {'nmistakes': 1},\n",
+ " 'id_898': {'nmistakes': 3},\n",
+ " 'id_901': {'nmistakes': 1},\n",
+ " 'id_904': {'nmistakes': 2},\n",
+ " 'id_907': {'nmistakes': 2},\n",
+ " 'id_910': {'nmistakes': 2},\n",
+ " 'id_913': {'nmistakes': 1},\n",
+ " 'id_916': {'nmistakes': 2},\n",
+ " 'id_919': {'nmistakes': 2},\n",
+ " 'id_922': {'nmistakes': 1},\n",
+ " 'id_925': {'nmistakes': 3},\n",
+ " 'id_928': {'nmistakes': 2},\n",
+ " 'id_931': {'nmistakes': 2},\n",
+ " 'id_934': {'nmistakes': 3},\n",
+ " 'id_937': {'nmistakes': 1},\n",
+ " 'id_940': {'nmistakes': 2},\n",
+ " 'id_943': {'nmistakes': 1},\n",
+ " 'id_946': {'nmistakes': 2},\n",
+ " 'id_949': {'nmistakes': 3},\n",
+ " 'id_952': {'nmistakes': 2},\n",
+ " 'id_955': {'nmistakes': 1},\n",
+ " 'id_958': {'nmistakes': 3},\n",
+ " 'id_961': {'nmistakes': 3},\n",
+ " 'id_964': {'nmistakes': 2},\n",
+ " 'id_967': {'nmistakes': 3},\n",
+ " 'id_970': {'nmistakes': 1},\n",
+ " 'id_973': {'nmistakes': 2},\n",
+ " 'id_976': {'nmistakes': 1},\n",
+ " 'id_979': {'nmistakes': 2},\n",
+ " 'id_982': {'nmistakes': 3},\n",
+ " 'id_985': {'nmistakes': 2},\n",
+ " 'id_988': {'nmistakes': 3},\n",
+ " 'id_991': {'nmistakes': 3},\n",
+ " 'id_994': {'nmistakes': 2},\n",
+ " 'id_997': {'nmistakes': 1},\n",
+ " 'id_1000': {'nmistakes': 1},\n",
+ " 'id_1003': {'nmistakes': 3},\n",
+ " 'id_1006': {'nmistakes': 2},\n",
+ " 'id_1009': {'nmistakes': 3},\n",
+ " 'id_1012': {'nmistakes': 1},\n",
+ " 'id_1015': {'nmistakes': 2},\n",
+ " 'id_1018': {'nmistakes': 1},\n",
+ " 'id_1021': {'nmistakes': 3},\n",
+ " 'id_1024': {'nmistakes': 2},\n",
+ " 'id_1027': {'nmistakes': 2},\n",
+ " 'id_1030': {'nmistakes': 3},\n",
+ " 'id_1033': {'nmistakes': 1},\n",
+ " 'id_1036': {'nmistakes': 1},\n",
+ " 'id_1039': {'nmistakes': 2},\n",
+ " 'id_1042': {'nmistakes': 2},\n",
+ " 'id_1045': {'nmistakes': 1},\n",
+ " 'id_1048': {'nmistakes': 1},\n",
+ " 'id_1051': {'nmistakes': 2},\n",
+ " 'id_1054': {'nmistakes': 3},\n",
+ " 'id_1057': {'nmistakes': 3},\n",
+ " 'id_1060': {'nmistakes': 3},\n",
+ " 'id_1063': {'nmistakes': 3},\n",
+ " 'id_1066': {'nmistakes': 2},\n",
+ " 'id_1069': {'nmistakes': 2},\n",
+ " 'id_1072': {'nmistakes': 1},\n",
+ " 'id_1075': {'nmistakes': 3},\n",
+ " 'id_1078': {'nmistakes': 2},\n",
+ " 'id_1081': {'nmistakes': 2},\n",
+ " 'id_1084': {'nmistakes': 2},\n",
+ " 'id_1087': {'nmistakes': 2},\n",
+ " 'id_1090': {'nmistakes': 2},\n",
+ " 'id_1093': {'nmistakes': 3},\n",
+ " 'id_1096': {'nmistakes': 2},\n",
+ " 'id_1099': {'nmistakes': 2},\n",
+ " 'id_1102': {'nmistakes': 1},\n",
+ " 'id_1105': {'nmistakes': 1},\n",
+ " 'id_1108': {'nmistakes': 3},\n",
+ " 'id_1111': {'nmistakes': 2},\n",
+ " 'id_1114': {'nmistakes': 2},\n",
+ " 'id_1117': {'nmistakes': 1},\n",
+ " 'id_1120': {'nmistakes': 2},\n",
+ " 'id_1123': {'nmistakes': 2},\n",
+ " 'id_1126': {'nmistakes': 3},\n",
+ " 'id_1129': {'nmistakes': 2},\n",
+ " 'id_1132': {'nmistakes': 1},\n",
+ " 'id_1135': {'nmistakes': 2},\n",
+ " 'id_1138': {'nmistakes': 2},\n",
+ " 'id_1141': {'nmistakes': 1},\n",
+ " 'id_1144': {'nmistakes': 1},\n",
+ " 'id_1147': {'nmistakes': 3},\n",
+ " 'id_1150': {'nmistakes': 1},\n",
+ " 'id_1153': {'nmistakes': 1},\n",
+ " 'id_1156': {'nmistakes': 3},\n",
+ " 'id_1159': {'nmistakes': 1},\n",
+ " 'id_1162': {'nmistakes': 1},\n",
+ " 'id_1165': {'nmistakes': 3},\n",
+ " 'id_1168': {'nmistakes': 1},\n",
+ " 'id_1171': {'nmistakes': 2},\n",
+ " 'id_1174': {'nmistakes': 3},\n",
+ " 'id_1177': {'nmistakes': 2},\n",
+ " 'id_1180': {'nmistakes': 2},\n",
+ " 'id_1183': {'nmistakes': 1},\n",
+ " 'id_1186': {'nmistakes': 2},\n",
+ " 'id_1189': {'nmistakes': 1},\n",
+ " 'id_1192': {'nmistakes': 1},\n",
+ " 'id_1195': {'nmistakes': 2},\n",
+ " 'id_1198': {'nmistakes': 1},\n",
+ " 'id_1201': {'nmistakes': 3},\n",
+ " 'id_1204': {'nmistakes': 1},\n",
+ " 'id_1207': {'nmistakes': 1},\n",
+ " 'id_1210': {'nmistakes': 1},\n",
+ " 'id_1213': {'nmistakes': 1},\n",
+ " 'id_1216': {'nmistakes': 3},\n",
+ " 'id_1219': {'nmistakes': 1},\n",
+ " 'id_1222': {'nmistakes': 3},\n",
+ " 'id_1225': {'nmistakes': 3},\n",
+ " 'id_1228': {'nmistakes': 2},\n",
+ " 'id_1231': {'nmistakes': 2},\n",
+ " 'id_1234': {'nmistakes': 3},\n",
+ " 'id_1237': {'nmistakes': 1},\n",
+ " 'id_1240': {'nmistakes': 2},\n",
+ " 'id_1243': {'nmistakes': 2},\n",
+ " 'id_1246': {'nmistakes': 2},\n",
+ " 'id_1249': {'nmistakes': 3},\n",
+ " 'id_1252': {'nmistakes': 2},\n",
+ " 'id_1255': {'nmistakes': 2},\n",
+ " 'id_1258': {'nmistakes': 1},\n",
+ " 'id_1261': {'nmistakes': 2},\n",
+ " 'id_1264': {'nmistakes': 3},\n",
+ " 'id_1267': {'nmistakes': 3},\n",
+ " 'id_1270': {'nmistakes': 1},\n",
+ " 'id_1273': {'nmistakes': 2},\n",
+ " 'id_1276': {'nmistakes': 3},\n",
+ " 'id_1279': {'nmistakes': 3},\n",
+ " 'id_1282': {'nmistakes': 2},\n",
+ " 'id_1285': {'nmistakes': 3},\n",
+ " 'id_1288': {'nmistakes': 2},\n",
+ " 'id_1291': {'nmistakes': 3},\n",
+ " 'id_1294': {'nmistakes': 2},\n",
+ " 'id_1297': {'nmistakes': 2},\n",
+ " 'id_1300': {'nmistakes': 2},\n",
+ " 'id_1303': {'nmistakes': 3},\n",
+ " 'id_1306': {'nmistakes': 1},\n",
+ " 'id_1309': {'nmistakes': 1},\n",
+ " 'id_1312': {'nmistakes': 2},\n",
+ " 'id_1315': {'nmistakes': 3},\n",
+ " 'id_1318': {'nmistakes': 2},\n",
+ " 'id_1321': {'nmistakes': 3},\n",
+ " 'id_1324': {'nmistakes': 3},\n",
+ " 'id_1327': {'nmistakes': 2},\n",
+ " 'id_1330': {'nmistakes': 2},\n",
+ " 'id_1333': {'nmistakes': 1},\n",
+ " 'id_1336': {'nmistakes': 2},\n",
+ " 'id_1339': {'nmistakes': 3},\n",
+ " 'id_1342': {'nmistakes': 3},\n",
+ " 'id_1345': {'nmistakes': 2},\n",
+ " 'id_1348': {'nmistakes': 3},\n",
+ " 'id_1351': {'nmistakes': 3},\n",
+ " 'id_1354': {'nmistakes': 1},\n",
+ " 'id_1357': {'nmistakes': 2},\n",
+ " 'id_1360': {'nmistakes': 1},\n",
+ " 'id_1363': {'nmistakes': 3},\n",
+ " 'id_1366': {'nmistakes': 2},\n",
+ " 'id_1369': {'nmistakes': 3},\n",
+ " 'id_1372': {'nmistakes': 3},\n",
+ " 'id_1375': {'nmistakes': 2},\n",
+ " 'id_1378': {'nmistakes': 2},\n",
+ " 'id_1381': {'nmistakes': 3},\n",
+ " 'id_1384': {'nmistakes': 3},\n",
+ " 'id_1387': {'nmistakes': 2},\n",
+ " 'id_1390': {'nmistakes': 1},\n",
+ " 'id_1393': {'nmistakes': 1},\n",
+ " 'id_1396': {'nmistakes': 2},\n",
+ " 'id_1399': {'nmistakes': 2},\n",
+ " 'id_1402': {'nmistakes': 3},\n",
+ " 'id_1405': {'nmistakes': 1},\n",
+ " 'id_1408': {'nmistakes': 3},\n",
+ " 'id_1411': {'nmistakes': 3},\n",
+ " 'id_1414': {'nmistakes': 3},\n",
+ " 'id_1417': {'nmistakes': 1},\n",
+ " 'id_1420': {'nmistakes': 1},\n",
+ " 'id_1423': {'nmistakes': 1},\n",
+ " 'id_1426': {'nmistakes': 2},\n",
+ " 'id_1429': {'nmistakes': 2},\n",
+ " 'id_1432': {'nmistakes': 1},\n",
+ " 'id_1435': {'nmistakes': 2},\n",
+ " 'id_1438': {'nmistakes': 3},\n",
+ " 'id_1441': {'nmistakes': 3},\n",
+ " 'id_1444': {'nmistakes': 3},\n",
+ " 'id_1447': {'nmistakes': 3},\n",
+ " 'id_1450': {'nmistakes': 1},\n",
+ " 'id_1453': {'nmistakes': 2},\n",
+ " 'id_1456': {'nmistakes': 2},\n",
+ " 'id_1459': {'nmistakes': 1},\n",
+ " 'id_1462': {'nmistakes': 1},\n",
+ " 'id_1465': {'nmistakes': 2},\n",
+ " 'id_1468': {'nmistakes': 1},\n",
+ " 'id_1471': {'nmistakes': 1},\n",
+ " 'id_1474': {'nmistakes': 2},\n",
+ " 'id_1477': {'nmistakes': 3},\n",
+ " 'id_1480': {'nmistakes': 2},\n",
+ " 'id_1483': {'nmistakes': 3},\n",
+ " 'id_1486': {'nmistakes': 1},\n",
+ " 'id_1489': {'nmistakes': 3},\n",
+ " 'id_1492': {'nmistakes': 3},\n",
+ " 'id_1495': {'nmistakes': 1},\n",
+ " 'id_1498': {'nmistakes': 1},\n",
+ " 'id_1501': {'nmistakes': 2},\n",
+ " 'id_1504': {'nmistakes': 1},\n",
+ " 'id_1507': {'nmistakes': 3},\n",
+ " 'id_1510': {'nmistakes': 2},\n",
+ " 'id_1513': {'nmistakes': 3},\n",
+ " 'id_1516': {'nmistakes': 2},\n",
+ " 'id_1519': {'nmistakes': 3},\n",
+ " 'id_1522': {'nmistakes': 2},\n",
+ " 'id_1525': {'nmistakes': 3},\n",
+ " 'id_1528': {'nmistakes': 1},\n",
+ " 'id_1531': {'nmistakes': 2},\n",
+ " 'id_1534': {'nmistakes': 2},\n",
+ " 'id_1537': {'nmistakes': 3},\n",
+ " 'id_1540': {'nmistakes': 1},\n",
+ " 'id_1543': {'nmistakes': 2},\n",
+ " 'id_1546': {'nmistakes': 3},\n",
+ " 'id_1549': {'nmistakes': 1},\n",
+ " 'id_1552': {'nmistakes': 2},\n",
+ " 'id_1555': {'nmistakes': 1},\n",
+ " 'id_1558': {'nmistakes': 2},\n",
+ " 'id_1561': {'nmistakes': 1},\n",
+ " 'id_1564': {'nmistakes': 2},\n",
+ " 'id_1567': {'nmistakes': 2},\n",
+ " 'id_1570': {'nmistakes': 3},\n",
+ " 'id_1573': {'nmistakes': 2},\n",
+ " 'id_1576': {'nmistakes': 1},\n",
+ " 'id_1579': {'nmistakes': 1},\n",
+ " 'id_1582': {'nmistakes': 1},\n",
+ " 'id_1585': {'nmistakes': 1},\n",
+ " 'id_1588': {'nmistakes': 2},\n",
+ " 'id_1591': {'nmistakes': 3},\n",
+ " 'id_1594': {'nmistakes': 1},\n",
+ " 'id_1597': {'nmistakes': 3},\n",
+ " 'id_1600': {'nmistakes': 2},\n",
+ " 'id_1603': {'nmistakes': 1},\n",
+ " 'id_1606': {'nmistakes': 3},\n",
+ " 'id_1609': {'nmistakes': 1},\n",
+ " 'id_1612': {'nmistakes': 3},\n",
+ " 'id_1615': {'nmistakes': 2},\n",
+ " 'id_1618': {'nmistakes': 1},\n",
+ " 'id_1621': {'nmistakes': 2},\n",
+ " 'id_1624': {'nmistakes': 1},\n",
+ " 'id_1627': {'nmistakes': 1},\n",
+ " 'id_1630': {'nmistakes': 3},\n",
+ " 'id_1633': {'nmistakes': 3},\n",
+ " 'id_1636': {'nmistakes': 2},\n",
+ " 'id_1639': {'nmistakes': 2},\n",
+ " 'id_1642': {'nmistakes': 2},\n",
+ " 'id_1645': {'nmistakes': 2},\n",
+ " 'id_1648': {'nmistakes': 1},\n",
+ " 'id_1651': {'nmistakes': 3},\n",
+ " 'id_1654': {'nmistakes': 3},\n",
+ " 'id_1657': {'nmistakes': 2},\n",
+ " 'id_1660': {'nmistakes': 1},\n",
+ " 'id_1663': {'nmistakes': 3},\n",
+ " 'id_1666': {'nmistakes': 3},\n",
+ " 'id_1669': {'nmistakes': 2},\n",
+ " 'id_1672': {'nmistakes': 2},\n",
+ " 'id_1675': {'nmistakes': 2},\n",
+ " 'id_1678': {'nmistakes': 2},\n",
+ " 'id_1681': {'nmistakes': 2},\n",
+ " 'id_1684': {'nmistakes': 1},\n",
+ " 'id_1687': {'nmistakes': 2},\n",
+ " 'id_1690': {'nmistakes': 2},\n",
+ " 'id_1693': {'nmistakes': 1},\n",
+ " 'id_1696': {'nmistakes': 3},\n",
+ " 'id_1699': {'nmistakes': 3},\n",
+ " 'id_1702': {'nmistakes': 3},\n",
+ " 'id_1705': {'nmistakes': 1},\n",
+ " 'id_1708': {'nmistakes': 2},\n",
+ " 'id_1711': {'nmistakes': 1},\n",
+ " 'id_1714': {'nmistakes': 1},\n",
+ " 'id_1717': {'nmistakes': 3},\n",
+ " 'id_1720': {'nmistakes': 1},\n",
+ " 'id_1723': {'nmistakes': 2},\n",
+ " 'id_1726': {'nmistakes': 1},\n",
+ " 'id_1729': {'nmistakes': 3},\n",
+ " 'id_1732': {'nmistakes': 1},\n",
+ " 'id_1735': {'nmistakes': 2},\n",
+ " 'id_1738': {'nmistakes': 1},\n",
+ " 'id_1741': {'nmistakes': 1},\n",
+ " 'id_1744': {'nmistakes': 3},\n",
+ " 'id_1747': {'nmistakes': 1},\n",
+ " 'id_1750': {'nmistakes': 2},\n",
+ " 'id_1753': {'nmistakes': 1},\n",
+ " 'id_1756': {'nmistakes': 2},\n",
+ " 'id_1759': {'nmistakes': 2},\n",
+ " 'id_1762': {'nmistakes': 3},\n",
+ " 'id_1765': {'nmistakes': 2},\n",
+ " 'id_1768': {'nmistakes': 3},\n",
+ " 'id_1771': {'nmistakes': 1},\n",
+ " 'id_1774': {'nmistakes': 3},\n",
+ " 'id_1777': {'nmistakes': 3},\n",
+ " 'id_1780': {'nmistakes': 3},\n",
+ " 'id_1783': {'nmistakes': 2},\n",
+ " 'id_1786': {'nmistakes': 1},\n",
+ " 'id_1789': {'nmistakes': 1},\n",
+ " 'id_1792': {'nmistakes': 2},\n",
+ " 'id_1795': {'nmistakes': 3},\n",
+ " 'id_1798': {'nmistakes': 2},\n",
+ " 'id_1801': {'nmistakes': 1},\n",
+ " 'id_1804': {'nmistakes': 3},\n",
+ " 'id_1807': {'nmistakes': 3},\n",
+ " 'id_1810': {'nmistakes': 3},\n",
+ " 'id_1813': {'nmistakes': 2},\n",
+ " 'id_1816': {'nmistakes': 1},\n",
+ " 'id_1819': {'nmistakes': 2},\n",
+ " 'id_1822': {'nmistakes': 1},\n",
+ " 'id_1825': {'nmistakes': 1},\n",
+ " 'id_1828': {'nmistakes': 1},\n",
+ " 'id_1831': {'nmistakes': 3},\n",
+ " 'id_1834': {'nmistakes': 2},\n",
+ " 'id_1837': {'nmistakes': 3},\n",
+ " 'id_1840': {'nmistakes': 1},\n",
+ " 'id_1843': {'nmistakes': 1},\n",
+ " 'id_1846': {'nmistakes': 3},\n",
+ " 'id_1849': {'nmistakes': 2},\n",
+ " 'id_1852': {'nmistakes': 2},\n",
+ " 'id_1855': {'nmistakes': 1},\n",
+ " 'id_1858': {'nmistakes': 1},\n",
+ " 'id_1861': {'nmistakes': 3},\n",
+ " 'id_1864': {'nmistakes': 3},\n",
+ " 'id_1867': {'nmistakes': 2},\n",
+ " 'id_1870': {'nmistakes': 3},\n",
+ " 'id_1873': {'nmistakes': 2},\n",
+ " 'id_1876': {'nmistakes': 2},\n",
+ " 'id_1879': {'nmistakes': 3},\n",
+ " 'id_1882': {'nmistakes': 2},\n",
+ " 'id_1885': {'nmistakes': 3},\n",
+ " 'id_1888': {'nmistakes': 3},\n",
+ " 'id_1891': {'nmistakes': 1},\n",
+ " 'id_1894': {'nmistakes': 2},\n",
+ " 'id_1897': {'nmistakes': 1},\n",
+ " 'id_1900': {'nmistakes': 1},\n",
+ " 'id_1903': {'nmistakes': 1},\n",
+ " 'id_1906': {'nmistakes': 3},\n",
+ " 'id_1909': {'nmistakes': 3},\n",
+ " 'id_1912': {'nmistakes': 1},\n",
+ " 'id_1915': {'nmistakes': 3},\n",
+ " 'id_1918': {'nmistakes': 2},\n",
+ " 'id_1921': {'nmistakes': 3},\n",
+ " 'id_1924': {'nmistakes': 3},\n",
+ " 'id_1927': {'nmistakes': 2},\n",
+ " 'id_1930': {'nmistakes': 3},\n",
+ " 'id_1933': {'nmistakes': 1},\n",
+ " 'id_1936': {'nmistakes': 3},\n",
+ " 'id_1939': {'nmistakes': 1},\n",
+ " 'id_1942': {'nmistakes': 2},\n",
+ " 'id_1945': {'nmistakes': 2},\n",
+ " 'id_1948': {'nmistakes': 3},\n",
+ " 'id_1951': {'nmistakes': 2},\n",
+ " 'id_1954': {'nmistakes': 1},\n",
+ " 'id_1957': {'nmistakes': 2},\n",
+ " 'id_1960': {'nmistakes': 1},\n",
+ " 'id_1963': {'nmistakes': 1},\n",
+ " 'id_1966': {'nmistakes': 1},\n",
+ " 'id_1969': {'nmistakes': 3},\n",
+ " 'id_1972': {'nmistakes': 3},\n",
+ " 'id_1975': {'nmistakes': 1},\n",
+ " 'id_1978': {'nmistakes': 3},\n",
+ " 'id_1981': {'nmistakes': 1},\n",
+ " 'id_1984': {'nmistakes': 1},\n",
+ " 'id_1987': {'nmistakes': 3},\n",
+ " 'id_1990': {'nmistakes': 3},\n",
+ " 'id_1993': {'nmistakes': 1},\n",
+ " 'id_1996': {'nmistakes': 1},\n",
+ " 'id_1999': {'nmistakes': 2},\n",
+ " 'id_2002': {'nmistakes': 1},\n",
+ " 'id_2005': {'nmistakes': 2},\n",
+ " 'id_2008': {'nmistakes': 1},\n",
+ " 'id_2011': {'nmistakes': 2},\n",
+ " 'id_2014': {'nmistakes': 1},\n",
+ " 'id_2017': {'nmistakes': 1},\n",
+ " 'id_2020': {'nmistakes': 1},\n",
+ " 'id_2023': {'nmistakes': 2},\n",
+ " 'id_2026': {'nmistakes': 1},\n",
+ " 'id_2029': {'nmistakes': 2},\n",
+ " 'id_2032': {'nmistakes': 1},\n",
+ " 'id_2035': {'nmistakes': 1},\n",
+ " 'id_2038': {'nmistakes': 3},\n",
+ " 'id_2041': {'nmistakes': 1},\n",
+ " 'id_2044': {'nmistakes': 2},\n",
+ " 'id_2047': {'nmistakes': 3},\n",
+ " 'id_2050': {'nmistakes': 2},\n",
+ " 'id_2053': {'nmistakes': 1},\n",
+ " 'id_2056': {'nmistakes': 1},\n",
+ " 'id_2059': {'nmistakes': 3},\n",
+ " 'id_2062': {'nmistakes': 1},\n",
+ " 'id_2065': {'nmistakes': 2},\n",
+ " 'id_2068': {'nmistakes': 3},\n",
+ " 'id_2071': {'nmistakes': 2},\n",
+ " 'id_2074': {'nmistakes': 1},\n",
+ " 'id_2077': {'nmistakes': 1},\n",
+ " 'id_2080': {'nmistakes': 1},\n",
+ " 'id_2083': {'nmistakes': 3},\n",
+ " 'id_2086': {'nmistakes': 1},\n",
+ " 'id_2089': {'nmistakes': 1},\n",
+ " 'id_2092': {'nmistakes': 2},\n",
+ " 'id_2095': {'nmistakes': 3},\n",
+ " 'id_2098': {'nmistakes': 2},\n",
+ " 'id_2101': {'nmistakes': 1},\n",
+ " 'id_2104': {'nmistakes': 1},\n",
+ " 'id_2107': {'nmistakes': 2},\n",
+ " 'id_2110': {'nmistakes': 2},\n",
+ " 'id_2113': {'nmistakes': 2},\n",
+ " 'id_2116': {'nmistakes': 3},\n",
+ " 'id_2119': {'nmistakes': 1},\n",
+ " 'id_2122': {'nmistakes': 1},\n",
+ " 'id_2125': {'nmistakes': 2},\n",
+ " 'id_2128': {'nmistakes': 3},\n",
+ " 'id_2131': {'nmistakes': 1},\n",
+ " 'id_2134': {'nmistakes': 3},\n",
+ " 'id_2137': {'nmistakes': 2},\n",
+ " 'id_2140': {'nmistakes': 2},\n",
+ " 'id_2143': {'nmistakes': 3},\n",
+ " 'id_2146': {'nmistakes': 1},\n",
+ " 'id_2149': {'nmistakes': 1},\n",
+ " 'id_2152': {'nmistakes': 3},\n",
+ " 'id_2155': {'nmistakes': 3},\n",
+ " 'id_2158': {'nmistakes': 2},\n",
+ " 'id_2161': {'nmistakes': 2},\n",
+ " 'id_2164': {'nmistakes': 1},\n",
+ " 'id_2167': {'nmistakes': 2},\n",
+ " 'id_2170': {'nmistakes': 2},\n",
+ " 'id_2173': {'nmistakes': 3},\n",
+ " 'id_2176': {'nmistakes': 3},\n",
+ " 'id_2179': {'nmistakes': 2},\n",
+ " 'id_2182': {'nmistakes': 1},\n",
+ " 'id_2185': {'nmistakes': 3},\n",
+ " 'id_2188': {'nmistakes': 2},\n",
+ " 'id_2191': {'nmistakes': 3},\n",
+ " 'id_2194': {'nmistakes': 2},\n",
+ " 'id_2197': {'nmistakes': 2},\n",
+ " 'id_2200': {'nmistakes': 2},\n",
+ " 'id_2203': {'nmistakes': 2},\n",
+ " 'id_2206': {'nmistakes': 2},\n",
+ " 'id_2209': {'nmistakes': 3},\n",
+ " 'id_2212': {'nmistakes': 1},\n",
+ " 'id_2215': {'nmistakes': 2},\n",
+ " 'id_2218': {'nmistakes': 1},\n",
+ " 'id_2221': {'nmistakes': 1},\n",
+ " 'id_2224': {'nmistakes': 2},\n",
+ " 'id_2227': {'nmistakes': 2},\n",
+ " 'id_2230': {'nmistakes': 2},\n",
+ " 'id_2233': {'nmistakes': 2},\n",
+ " 'id_2236': {'nmistakes': 3},\n",
+ " 'id_2239': {'nmistakes': 2},\n",
+ " 'id_2242': {'nmistakes': 2},\n",
+ " 'id_2245': {'nmistakes': 3},\n",
+ " 'id_2248': {'nmistakes': 2},\n",
+ " 'id_2251': {'nmistakes': 3},\n",
+ " 'id_2254': {'nmistakes': 1},\n",
+ " 'id_2257': {'nmistakes': 2},\n",
+ " 'id_2260': {'nmistakes': 1},\n",
+ " 'id_2263': {'nmistakes': 2},\n",
+ " 'id_2266': {'nmistakes': 3},\n",
+ " 'id_2269': {'nmistakes': 3},\n",
+ " 'id_2272': {'nmistakes': 3},\n",
+ " 'id_2275': {'nmistakes': 1},\n",
+ " 'id_2278': {'nmistakes': 3},\n",
+ " 'id_2281': {'nmistakes': 2},\n",
+ " 'id_2284': {'nmistakes': 1},\n",
+ " 'id_2287': {'nmistakes': 2},\n",
+ " 'id_2290': {'nmistakes': 1},\n",
+ " 'id_2293': {'nmistakes': 3},\n",
+ " 'id_2296': {'nmistakes': 3},\n",
+ " 'id_2299': {'nmistakes': 2},\n",
+ " 'id_2302': {'nmistakes': 2},\n",
+ " 'id_2305': {'nmistakes': 1},\n",
+ " 'id_2308': {'nmistakes': 3},\n",
+ " 'id_2311': {'nmistakes': 2},\n",
+ " 'id_2314': {'nmistakes': 2},\n",
+ " 'id_2317': {'nmistakes': 1},\n",
+ " 'id_2320': {'nmistakes': 1},\n",
+ " 'id_2323': {'nmistakes': 3},\n",
+ " 'id_2326': {'nmistakes': 1},\n",
+ " 'id_2329': {'nmistakes': 1},\n",
+ " 'id_2332': {'nmistakes': 3},\n",
+ " 'id_2335': {'nmistakes': 2},\n",
+ " 'id_2338': {'nmistakes': 1},\n",
+ " 'id_2341': {'nmistakes': 3},\n",
+ " 'id_2344': {'nmistakes': 1},\n",
+ " 'id_2347': {'nmistakes': 1},\n",
+ " 'id_2350': {'nmistakes': 1},\n",
+ " 'id_2353': {'nmistakes': 1},\n",
+ " 'id_2356': {'nmistakes': 1},\n",
+ " 'id_2359': {'nmistakes': 1},\n",
+ " 'id_2362': {'nmistakes': 3},\n",
+ " 'id_2365': {'nmistakes': 3},\n",
+ " 'id_2368': {'nmistakes': 3},\n",
+ " 'id_2371': {'nmistakes': 2},\n",
+ " 'id_2374': {'nmistakes': 3},\n",
+ " 'id_2377': {'nmistakes': 1},\n",
+ " 'id_2380': {'nmistakes': 3},\n",
+ " 'id_2383': {'nmistakes': 2},\n",
+ " 'id_2386': {'nmistakes': 2},\n",
+ " 'id_2389': {'nmistakes': 3},\n",
+ " 'id_2392': {'nmistakes': 3},\n",
+ " 'id_2395': {'nmistakes': 2},\n",
+ " 'id_2398': {'nmistakes': 3},\n",
+ " 'id_2401': {'nmistakes': 2},\n",
+ " 'id_2404': {'nmistakes': 1},\n",
+ " 'id_2407': {'nmistakes': 1},\n",
+ " 'id_2410': {'nmistakes': 1},\n",
+ " 'id_2413': {'nmistakes': 2},\n",
+ " 'id_2416': {'nmistakes': 3},\n",
+ " 'id_2419': {'nmistakes': 3},\n",
+ " 'id_2422': {'nmistakes': 1},\n",
+ " 'id_2425': {'nmistakes': 1},\n",
+ " 'id_2428': {'nmistakes': 2},\n",
+ " 'id_2431': {'nmistakes': 2},\n",
+ " 'id_2434': {'nmistakes': 2},\n",
+ " 'id_2437': {'nmistakes': 2},\n",
+ " 'id_2440': {'nmistakes': 1},\n",
+ " 'id_2443': {'nmistakes': 3},\n",
+ " 'id_2446': {'nmistakes': 2},\n",
+ " 'id_2449': {'nmistakes': 1},\n",
+ " 'id_2452': {'nmistakes': 3},\n",
+ " 'id_2455': {'nmistakes': 2},\n",
+ " 'id_2458': {'nmistakes': 3},\n",
+ " 'id_2461': {'nmistakes': 1},\n",
+ " 'id_2464': {'nmistakes': 1},\n",
+ " 'id_2467': {'nmistakes': 2},\n",
+ " 'id_2470': {'nmistakes': 1},\n",
+ " 'id_2473': {'nmistakes': 3},\n",
+ " 'id_2476': {'nmistakes': 2},\n",
+ " 'id_2479': {'nmistakes': 3},\n",
+ " 'id_2482': {'nmistakes': 3},\n",
+ " 'id_2485': {'nmistakes': 3},\n",
+ " 'id_2488': {'nmistakes': 3},\n",
+ " 'id_2491': {'nmistakes': 1},\n",
+ " 'id_2494': {'nmistakes': 2},\n",
+ " 'id_2497': {'nmistakes': 2},\n",
+ " 'id_2500': {'nmistakes': 2},\n",
+ " 'id_2503': {'nmistakes': 1},\n",
+ " 'id_2506': {'nmistakes': 3},\n",
+ " 'id_2509': {'nmistakes': 2},\n",
+ " 'id_2512': {'nmistakes': 1},\n",
+ " 'id_2515': {'nmistakes': 1},\n",
+ " 'id_2518': {'nmistakes': 3},\n",
+ " 'id_2521': {'nmistakes': 3},\n",
+ " 'id_2524': {'nmistakes': 2},\n",
+ " 'id_2527': {'nmistakes': 2},\n",
+ " 'id_2530': {'nmistakes': 3},\n",
+ " 'id_2533': {'nmistakes': 3},\n",
+ " 'id_2536': {'nmistakes': 2},\n",
+ " 'id_2539': {'nmistakes': 3},\n",
+ " 'id_2542': {'nmistakes': 3},\n",
+ " 'id_2545': {'nmistakes': 3},\n",
+ " 'id_2548': {'nmistakes': 1},\n",
+ " 'id_2551': {'nmistakes': 1},\n",
+ " 'id_2554': {'nmistakes': 1},\n",
+ " 'id_2557': {'nmistakes': 2},\n",
+ " 'id_2560': {'nmistakes': 1},\n",
+ " 'id_2563': {'nmistakes': 1},\n",
+ " 'id_2566': {'nmistakes': 2},\n",
+ " 'id_2569': {'nmistakes': 1},\n",
+ " 'id_2572': {'nmistakes': 2},\n",
+ " 'id_2575': {'nmistakes': 2},\n",
+ " 'id_2578': {'nmistakes': 3},\n",
+ " 'id_2581': {'nmistakes': 2},\n",
+ " 'id_2584': {'nmistakes': 1},\n",
+ " 'id_2587': {'nmistakes': 2},\n",
+ " 'id_2590': {'nmistakes': 2},\n",
+ " 'id_2593': {'nmistakes': 3},\n",
+ " 'id_2596': {'nmistakes': 3},\n",
+ " 'id_2599': {'nmistakes': 3},\n",
+ " 'id_2602': {'nmistakes': 2},\n",
+ " 'id_2605': {'nmistakes': 3},\n",
+ " 'id_2608': {'nmistakes': 2},\n",
+ " 'id_2611': {'nmistakes': 1},\n",
+ " 'id_2614': {'nmistakes': 2},\n",
+ " 'id_2617': {'nmistakes': 2},\n",
+ " 'id_2620': {'nmistakes': 2},\n",
+ " 'id_2623': {'nmistakes': 3},\n",
+ " 'id_2626': {'nmistakes': 2},\n",
+ " 'id_2629': {'nmistakes': 3},\n",
+ " 'id_2632': {'nmistakes': 3},\n",
+ " 'id_2635': {'nmistakes': 2},\n",
+ " 'id_2638': {'nmistakes': 1},\n",
+ " 'id_2641': {'nmistakes': 3},\n",
+ " 'id_2644': {'nmistakes': 2},\n",
+ " 'id_2647': {'nmistakes': 3},\n",
+ " 'id_2650': {'nmistakes': 1},\n",
+ " 'id_2653': {'nmistakes': 3},\n",
+ " 'id_2656': {'nmistakes': 1},\n",
+ " 'id_2659': {'nmistakes': 1},\n",
+ " 'id_2662': {'nmistakes': 3},\n",
+ " 'id_2665': {'nmistakes': 1},\n",
+ " 'id_2668': {'nmistakes': 2},\n",
+ " 'id_2671': {'nmistakes': 2},\n",
+ " 'id_2674': {'nmistakes': 2},\n",
+ " 'id_2677': {'nmistakes': 1},\n",
+ " 'id_2680': {'nmistakes': 2},\n",
+ " 'id_2683': {'nmistakes': 2},\n",
+ " 'id_2686': {'nmistakes': 1},\n",
+ " 'id_2689': {'nmistakes': 1},\n",
+ " 'id_2692': {'nmistakes': 3},\n",
+ " 'id_2695': {'nmistakes': 3},\n",
+ " 'id_2698': {'nmistakes': 2},\n",
+ " 'id_2701': {'nmistakes': 3},\n",
+ " 'id_2704': {'nmistakes': 1},\n",
+ " 'id_2707': {'nmistakes': 3},\n",
+ " 'id_2710': {'nmistakes': 2},\n",
+ " 'id_2713': {'nmistakes': 3},\n",
+ " 'id_2716': {'nmistakes': 1},\n",
+ " 'id_2719': {'nmistakes': 2},\n",
+ " 'id_2722': {'nmistakes': 2},\n",
+ " 'id_2725': {'nmistakes': 3},\n",
+ " 'id_2728': {'nmistakes': 1},\n",
+ " 'id_2731': {'nmistakes': 3},\n",
+ " 'id_2734': {'nmistakes': 1},\n",
+ " 'id_2737': {'nmistakes': 1},\n",
+ " 'id_2740': {'nmistakes': 3},\n",
+ " 'id_2743': {'nmistakes': 1},\n",
+ " 'id_2746': {'nmistakes': 2},\n",
+ " 'id_2749': {'nmistakes': 2},\n",
+ " 'id_2752': {'nmistakes': 2},\n",
+ " 'id_2755': {'nmistakes': 2},\n",
+ " 'id_2758': {'nmistakes': 1},\n",
+ " 'id_2761': {'nmistakes': 3},\n",
+ " 'id_2764': {'nmistakes': 1},\n",
+ " 'id_2767': {'nmistakes': 1},\n",
+ " 'id_2770': {'nmistakes': 2},\n",
+ " 'id_2773': {'nmistakes': 2},\n",
+ " 'id_2776': {'nmistakes': 1},\n",
+ " 'id_2779': {'nmistakes': 1},\n",
+ " 'id_2782': {'nmistakes': 2},\n",
+ " 'id_2785': {'nmistakes': 3},\n",
+ " 'id_2788': {'nmistakes': 3},\n",
+ " 'id_2791': {'nmistakes': 1},\n",
+ " 'id_2794': {'nmistakes': 1},\n",
+ " 'id_2797': {'nmistakes': 2},\n",
+ " 'id_2800': {'nmistakes': 1},\n",
+ " 'id_2803': {'nmistakes': 3},\n",
+ " 'id_2806': {'nmistakes': 1},\n",
+ " 'id_2809': {'nmistakes': 3},\n",
+ " 'id_2812': {'nmistakes': 1},\n",
+ " 'id_2815': {'nmistakes': 1},\n",
+ " 'id_2818': {'nmistakes': 2},\n",
+ " 'id_2821': {'nmistakes': 1},\n",
+ " 'id_2824': {'nmistakes': 1},\n",
+ " 'id_2827': {'nmistakes': 1},\n",
+ " 'id_2830': {'nmistakes': 1},\n",
+ " 'id_2833': {'nmistakes': 2},\n",
+ " 'id_2836': {'nmistakes': 2},\n",
+ " 'id_2839': {'nmistakes': 2},\n",
+ " 'id_2842': {'nmistakes': 3},\n",
+ " 'id_2845': {'nmistakes': 2},\n",
+ " 'id_2848': {'nmistakes': 1},\n",
+ " 'id_2851': {'nmistakes': 3},\n",
+ " 'id_2854': {'nmistakes': 3},\n",
+ " 'id_2857': {'nmistakes': 3},\n",
+ " 'id_2860': {'nmistakes': 2},\n",
+ " 'id_2863': {'nmistakes': 3},\n",
+ " 'id_2866': {'nmistakes': 3},\n",
+ " 'id_2869': {'nmistakes': 3},\n",
+ " 'id_2872': {'nmistakes': 1},\n",
+ " 'id_2875': {'nmistakes': 3},\n",
+ " 'id_2878': {'nmistakes': 1},\n",
+ " 'id_2881': {'nmistakes': 3},\n",
+ " 'id_2884': {'nmistakes': 3},\n",
+ " 'id_2887': {'nmistakes': 3},\n",
+ " 'id_2890': {'nmistakes': 2},\n",
+ " 'id_2893': {'nmistakes': 2},\n",
+ " 'id_2896': {'nmistakes': 1},\n",
+ " 'id_2899': {'nmistakes': 2},\n",
+ " 'id_2902': {'nmistakes': 2},\n",
+ " 'id_2905': {'nmistakes': 1},\n",
+ " 'id_2908': {'nmistakes': 1},\n",
+ " 'id_2911': {'nmistakes': 3},\n",
+ " 'id_2914': {'nmistakes': 2},\n",
+ " 'id_2917': {'nmistakes': 1},\n",
+ " 'id_2920': {'nmistakes': 2},\n",
+ " 'id_2923': {'nmistakes': 3},\n",
+ " 'id_2926': {'nmistakes': 2},\n",
+ " 'id_2929': {'nmistakes': 3},\n",
+ " 'id_2932': {'nmistakes': 2},\n",
+ " 'id_2935': {'nmistakes': 3},\n",
+ " 'id_2938': {'nmistakes': 3},\n",
+ " 'id_2941': {'nmistakes': 1},\n",
+ " 'id_2944': {'nmistakes': 1},\n",
+ " 'id_2947': {'nmistakes': 1},\n",
+ " 'id_2950': {'nmistakes': 2},\n",
+ " 'id_2953': {'nmistakes': 1},\n",
+ " 'id_2956': {'nmistakes': 2},\n",
+ " 'id_2959': {'nmistakes': 1},\n",
+ " 'id_2962': {'nmistakes': 3},\n",
+ " 'id_2965': {'nmistakes': 1},\n",
+ " 'id_2968': {'nmistakes': 2},\n",
+ " 'id_2971': {'nmistakes': 1},\n",
+ " 'id_2974': {'nmistakes': 3},\n",
+ " 'id_2977': {'nmistakes': 2},\n",
+ " 'id_2980': {'nmistakes': 3},\n",
+ " 'id_2983': {'nmistakes': 2},\n",
+ " 'id_2986': {'nmistakes': 3},\n",
+ " 'id_2989': {'nmistakes': 2},\n",
+ " 'id_2992': {'nmistakes': 1},\n",
+ " 'id_2995': {'nmistakes': 1},\n",
+ " 'id_2998': {'nmistakes': 2},\n",
+ " ...}"
+ ]
+ },
+ "execution_count": 18,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "scores = {}\n",
+ "\n",
+ "for model_ in folder2model.values():\n",
+ " scores.update(\n",
+ " dict(zip(df_scores[model_].iloc[x_indices], df_scores[model_].iloc[y_indices]))\n",
+ " )\n",
+ "\n",
+ "for k,v in scores.items():\n",
+ " scores[k] = {'nmistakes': v}\n",
+ "\n",
+ "scores"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 19,
+ "id": "48e415a6-8a43-47d9-95e3-c4deb7dfe604",
+ "metadata": {
+ "scrolled": true,
+ "tags": []
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'id_1': {'pref_rank': 2},\n",
+ " 'id_4': {'pref_rank': 3},\n",
+ " 'id_7': {'pref_rank': 3},\n",
+ " 'id_10': {'pref_rank': 3},\n",
+ " 'id_13': {'pref_rank': 2},\n",
+ " 'id_16': {'pref_rank': 3},\n",
+ " 'id_19': {'pref_rank': 1},\n",
+ " 'id_22': {'pref_rank': 2},\n",
+ " 'id_25': {'pref_rank': 3},\n",
+ " 'id_28': {'pref_rank': 2},\n",
+ " 'id_31': {'pref_rank': 3},\n",
+ " 'id_34': {'pref_rank': 1},\n",
+ " 'id_37': {'pref_rank': 2},\n",
+ " 'id_40': {'pref_rank': 2},\n",
+ " 'id_43': {'pref_rank': 3},\n",
+ " 'id_46': {'pref_rank': 3},\n",
+ " 'id_49': {'pref_rank': 1},\n",
+ " 'id_52': {'pref_rank': 1},\n",
+ " 'id_55': {'pref_rank': 2},\n",
+ " 'id_58': {'pref_rank': 2},\n",
+ " 'id_61': {'pref_rank': 2},\n",
+ " 'id_64': {'pref_rank': 1},\n",
+ " 'id_67': {'pref_rank': 3},\n",
+ " 'id_70': {'pref_rank': 3},\n",
+ " 'id_73': {'pref_rank': 3},\n",
+ " 'id_76': {'pref_rank': 1},\n",
+ " 'id_79': {'pref_rank': 2},\n",
+ " 'id_82': {'pref_rank': 1},\n",
+ " 'id_85': {'pref_rank': 2},\n",
+ " 'id_88': {'pref_rank': 2},\n",
+ " 'id_91': {'pref_rank': 2},\n",
+ " 'id_94': {'pref_rank': 1},\n",
+ " 'id_97': {'pref_rank': 1},\n",
+ " 'id_100': {'pref_rank': 2},\n",
+ " 'id_103': {'pref_rank': 2},\n",
+ " 'id_106': {'pref_rank': 3},\n",
+ " 'id_109': {'pref_rank': 2},\n",
+ " 'id_112': {'pref_rank': 2},\n",
+ " 'id_115': {'pref_rank': 1},\n",
+ " 'id_118': {'pref_rank': 1},\n",
+ " 'id_121': {'pref_rank': 1},\n",
+ " 'id_124': {'pref_rank': 1},\n",
+ " 'id_127': {'pref_rank': 2},\n",
+ " 'id_130': {'pref_rank': 3},\n",
+ " 'id_133': {'pref_rank': 1},\n",
+ " 'id_136': {'pref_rank': 1},\n",
+ " 'id_139': {'pref_rank': 1},\n",
+ " 'id_142': {'pref_rank': 1},\n",
+ " 'id_145': {'pref_rank': 3},\n",
+ " 'id_148': {'pref_rank': 3},\n",
+ " 'id_151': {'pref_rank': 3},\n",
+ " 'id_154': {'pref_rank': 2},\n",
+ " 'id_157': {'pref_rank': 1},\n",
+ " 'id_160': {'pref_rank': 2},\n",
+ " 'id_163': {'pref_rank': 3},\n",
+ " 'id_166': {'pref_rank': 3},\n",
+ " 'id_169': {'pref_rank': 1},\n",
+ " 'id_172': {'pref_rank': 1},\n",
+ " 'id_175': {'pref_rank': 1},\n",
+ " 'id_178': {'pref_rank': 2},\n",
+ " 'id_181': {'pref_rank': 3},\n",
+ " 'id_184': {'pref_rank': 2},\n",
+ " 'id_187': {'pref_rank': 1},\n",
+ " 'id_190': {'pref_rank': 2},\n",
+ " 'id_193': {'pref_rank': 1},\n",
+ " 'id_196': {'pref_rank': 1},\n",
+ " 'id_199': {'pref_rank': 3},\n",
+ " 'id_202': {'pref_rank': 1},\n",
+ " 'id_205': {'pref_rank': 2},\n",
+ " 'id_208': {'pref_rank': 3},\n",
+ " 'id_211': {'pref_rank': 2},\n",
+ " 'id_214': {'pref_rank': 1},\n",
+ " 'id_217': {'pref_rank': 3},\n",
+ " 'id_220': {'pref_rank': 1},\n",
+ " 'id_223': {'pref_rank': 2},\n",
+ " 'id_226': {'pref_rank': 1},\n",
+ " 'id_229': {'pref_rank': 3},\n",
+ " 'id_232': {'pref_rank': 1},\n",
+ " 'id_235': {'pref_rank': 1},\n",
+ " 'id_238': {'pref_rank': 3},\n",
+ " 'id_241': {'pref_rank': 3},\n",
+ " 'id_244': {'pref_rank': 2},\n",
+ " 'id_247': {'pref_rank': 1},\n",
+ " 'id_250': {'pref_rank': 2},\n",
+ " 'id_253': {'pref_rank': 1},\n",
+ " 'id_256': {'pref_rank': 1},\n",
+ " 'id_259': {'pref_rank': 1},\n",
+ " 'id_262': {'pref_rank': 1},\n",
+ " 'id_265': {'pref_rank': 2},\n",
+ " 'id_268': {'pref_rank': 1},\n",
+ " 'id_271': {'pref_rank': 2},\n",
+ " 'id_274': {'pref_rank': 1},\n",
+ " 'id_277': {'pref_rank': 1},\n",
+ " 'id_280': {'pref_rank': 3},\n",
+ " 'id_283': {'pref_rank': 3},\n",
+ " 'id_286': {'pref_rank': 2},\n",
+ " 'id_289': {'pref_rank': 1},\n",
+ " 'id_292': {'pref_rank': 2},\n",
+ " 'id_295': {'pref_rank': 2},\n",
+ " 'id_298': {'pref_rank': 1},\n",
+ " 'id_301': {'pref_rank': 2},\n",
+ " 'id_304': {'pref_rank': 3},\n",
+ " 'id_307': {'pref_rank': 1},\n",
+ " 'id_310': {'pref_rank': 3},\n",
+ " 'id_313': {'pref_rank': 3},\n",
+ " 'id_316': {'pref_rank': 1},\n",
+ " 'id_319': {'pref_rank': 3},\n",
+ " 'id_322': {'pref_rank': 3},\n",
+ " 'id_325': {'pref_rank': 3},\n",
+ " 'id_328': {'pref_rank': 1},\n",
+ " 'id_331': {'pref_rank': 1},\n",
+ " 'id_334': {'pref_rank': 3},\n",
+ " 'id_337': {'pref_rank': 2},\n",
+ " 'id_340': {'pref_rank': 1},\n",
+ " 'id_343': {'pref_rank': 1},\n",
+ " 'id_346': {'pref_rank': 3},\n",
+ " 'id_349': {'pref_rank': 2},\n",
+ " 'id_352': {'pref_rank': 1},\n",
+ " 'id_355': {'pref_rank': 2},\n",
+ " 'id_358': {'pref_rank': 3},\n",
+ " 'id_361': {'pref_rank': 3},\n",
+ " 'id_364': {'pref_rank': 3},\n",
+ " 'id_367': {'pref_rank': 2},\n",
+ " 'id_370': {'pref_rank': 3},\n",
+ " 'id_373': {'pref_rank': 3},\n",
+ " 'id_376': {'pref_rank': 3},\n",
+ " 'id_379': {'pref_rank': 3},\n",
+ " 'id_382': {'pref_rank': 1},\n",
+ " 'id_385': {'pref_rank': 1},\n",
+ " 'id_388': {'pref_rank': 1},\n",
+ " 'id_391': {'pref_rank': 2},\n",
+ " 'id_394': {'pref_rank': 2},\n",
+ " 'id_397': {'pref_rank': 1},\n",
+ " 'id_400': {'pref_rank': 1},\n",
+ " 'id_403': {'pref_rank': 2},\n",
+ " 'id_406': {'pref_rank': 1},\n",
+ " 'id_409': {'pref_rank': 3},\n",
+ " 'id_412': {'pref_rank': 2},\n",
+ " 'id_415': {'pref_rank': 2},\n",
+ " 'id_418': {'pref_rank': 3},\n",
+ " 'id_421': {'pref_rank': 3},\n",
+ " 'id_424': {'pref_rank': 1},\n",
+ " 'id_427': {'pref_rank': 2},\n",
+ " 'id_430': {'pref_rank': 2},\n",
+ " 'id_433': {'pref_rank': 3},\n",
+ " 'id_436': {'pref_rank': 3},\n",
+ " 'id_439': {'pref_rank': 2},\n",
+ " 'id_442': {'pref_rank': 1},\n",
+ " 'id_445': {'pref_rank': 3},\n",
+ " 'id_448': {'pref_rank': 2},\n",
+ " 'id_451': {'pref_rank': 1},\n",
+ " 'id_454': {'pref_rank': 3},\n",
+ " 'id_457': {'pref_rank': 3},\n",
+ " 'id_460': {'pref_rank': 3},\n",
+ " 'id_463': {'pref_rank': 1},\n",
+ " 'id_466': {'pref_rank': 1},\n",
+ " 'id_469': {'pref_rank': 2},\n",
+ " 'id_472': {'pref_rank': 2},\n",
+ " 'id_475': {'pref_rank': 3},\n",
+ " 'id_478': {'pref_rank': 3},\n",
+ " 'id_481': {'pref_rank': 2},\n",
+ " 'id_484': {'pref_rank': 3},\n",
+ " 'id_487': {'pref_rank': 1},\n",
+ " 'id_490': {'pref_rank': 2},\n",
+ " 'id_493': {'pref_rank': 3},\n",
+ " 'id_496': {'pref_rank': 1},\n",
+ " 'id_499': {'pref_rank': 1},\n",
+ " 'id_502': {'pref_rank': 2},\n",
+ " 'id_505': {'pref_rank': 3},\n",
+ " 'id_508': {'pref_rank': 3},\n",
+ " 'id_511': {'pref_rank': 1},\n",
+ " 'id_514': {'pref_rank': 1},\n",
+ " 'id_517': {'pref_rank': 3},\n",
+ " 'id_520': {'pref_rank': 3},\n",
+ " 'id_523': {'pref_rank': 3},\n",
+ " 'id_526': {'pref_rank': 1},\n",
+ " 'id_529': {'pref_rank': 3},\n",
+ " 'id_532': {'pref_rank': 2},\n",
+ " 'id_535': {'pref_rank': 1},\n",
+ " 'id_538': {'pref_rank': 2},\n",
+ " 'id_541': {'pref_rank': 3},\n",
+ " 'id_544': {'pref_rank': 3},\n",
+ " 'id_547': {'pref_rank': 3},\n",
+ " 'id_550': {'pref_rank': 1},\n",
+ " 'id_553': {'pref_rank': 3},\n",
+ " 'id_556': {'pref_rank': 2},\n",
+ " 'id_559': {'pref_rank': 1},\n",
+ " 'id_562': {'pref_rank': 2},\n",
+ " 'id_565': {'pref_rank': 3},\n",
+ " 'id_568': {'pref_rank': 1},\n",
+ " 'id_571': {'pref_rank': 2},\n",
+ " 'id_574': {'pref_rank': 2},\n",
+ " 'id_577': {'pref_rank': 3},\n",
+ " 'id_580': {'pref_rank': 2},\n",
+ " 'id_583': {'pref_rank': 3},\n",
+ " 'id_586': {'pref_rank': 3},\n",
+ " 'id_589': {'pref_rank': 3},\n",
+ " 'id_592': {'pref_rank': 3},\n",
+ " 'id_595': {'pref_rank': 3},\n",
+ " 'id_598': {'pref_rank': 2},\n",
+ " 'id_601': {'pref_rank': 1},\n",
+ " 'id_604': {'pref_rank': 1},\n",
+ " 'id_607': {'pref_rank': 2},\n",
+ " 'id_610': {'pref_rank': 1},\n",
+ " 'id_613': {'pref_rank': 3},\n",
+ " 'id_616': {'pref_rank': 3},\n",
+ " 'id_619': {'pref_rank': 1},\n",
+ " 'id_622': {'pref_rank': 1},\n",
+ " 'id_625': {'pref_rank': 1},\n",
+ " 'id_628': {'pref_rank': 1},\n",
+ " 'id_631': {'pref_rank': 2},\n",
+ " 'id_634': {'pref_rank': 1},\n",
+ " 'id_637': {'pref_rank': 3},\n",
+ " 'id_640': {'pref_rank': 1},\n",
+ " 'id_643': {'pref_rank': 3},\n",
+ " 'id_646': {'pref_rank': 2},\n",
+ " 'id_649': {'pref_rank': 3},\n",
+ " 'id_652': {'pref_rank': 3},\n",
+ " 'id_655': {'pref_rank': 3},\n",
+ " 'id_658': {'pref_rank': 3},\n",
+ " 'id_661': {'pref_rank': 3},\n",
+ " 'id_664': {'pref_rank': 1},\n",
+ " 'id_667': {'pref_rank': 1},\n",
+ " 'id_670': {'pref_rank': 1},\n",
+ " 'id_673': {'pref_rank': 2},\n",
+ " 'id_676': {'pref_rank': 2},\n",
+ " 'id_679': {'pref_rank': 1},\n",
+ " 'id_682': {'pref_rank': 1},\n",
+ " 'id_685': {'pref_rank': 3},\n",
+ " 'id_688': {'pref_rank': 3},\n",
+ " 'id_691': {'pref_rank': 1},\n",
+ " 'id_694': {'pref_rank': 3},\n",
+ " 'id_697': {'pref_rank': 2},\n",
+ " 'id_700': {'pref_rank': 1},\n",
+ " 'id_703': {'pref_rank': 1},\n",
+ " 'id_706': {'pref_rank': 2},\n",
+ " 'id_709': {'pref_rank': 1},\n",
+ " 'id_712': {'pref_rank': 1},\n",
+ " 'id_715': {'pref_rank': 2},\n",
+ " 'id_718': {'pref_rank': 1},\n",
+ " 'id_721': {'pref_rank': 3},\n",
+ " 'id_724': {'pref_rank': 3},\n",
+ " 'id_727': {'pref_rank': 2},\n",
+ " 'id_730': {'pref_rank': 3},\n",
+ " 'id_733': {'pref_rank': 2},\n",
+ " 'id_736': {'pref_rank': 1},\n",
+ " 'id_739': {'pref_rank': 3},\n",
+ " 'id_742': {'pref_rank': 2},\n",
+ " 'id_745': {'pref_rank': 1},\n",
+ " 'id_748': {'pref_rank': 2},\n",
+ " 'id_751': {'pref_rank': 1},\n",
+ " 'id_754': {'pref_rank': 3},\n",
+ " 'id_757': {'pref_rank': 2},\n",
+ " 'id_760': {'pref_rank': 3},\n",
+ " 'id_763': {'pref_rank': 3},\n",
+ " 'id_766': {'pref_rank': 2},\n",
+ " 'id_769': {'pref_rank': 3},\n",
+ " 'id_772': {'pref_rank': 3},\n",
+ " 'id_775': {'pref_rank': 3},\n",
+ " 'id_778': {'pref_rank': 3},\n",
+ " 'id_781': {'pref_rank': 3},\n",
+ " 'id_784': {'pref_rank': 3},\n",
+ " 'id_787': {'pref_rank': 1},\n",
+ " 'id_790': {'pref_rank': 1},\n",
+ " 'id_793': {'pref_rank': 2},\n",
+ " 'id_796': {'pref_rank': 1},\n",
+ " 'id_799': {'pref_rank': 3},\n",
+ " 'id_802': {'pref_rank': 3},\n",
+ " 'id_805': {'pref_rank': 1},\n",
+ " 'id_808': {'pref_rank': 3},\n",
+ " 'id_811': {'pref_rank': 1},\n",
+ " 'id_814': {'pref_rank': 1},\n",
+ " 'id_817': {'pref_rank': 1},\n",
+ " 'id_820': {'pref_rank': 1},\n",
+ " 'id_823': {'pref_rank': 2},\n",
+ " 'id_826': {'pref_rank': 3},\n",
+ " 'id_829': {'pref_rank': 2},\n",
+ " 'id_832': {'pref_rank': 3},\n",
+ " 'id_835': {'pref_rank': 2},\n",
+ " 'id_838': {'pref_rank': 1},\n",
+ " 'id_841': {'pref_rank': 2},\n",
+ " 'id_844': {'pref_rank': 1},\n",
+ " 'id_847': {'pref_rank': 1},\n",
+ " 'id_850': {'pref_rank': 2},\n",
+ " 'id_853': {'pref_rank': 3},\n",
+ " 'id_856': {'pref_rank': 3},\n",
+ " 'id_859': {'pref_rank': 2},\n",
+ " 'id_862': {'pref_rank': 3},\n",
+ " 'id_865': {'pref_rank': 3},\n",
+ " 'id_868': {'pref_rank': 3},\n",
+ " 'id_871': {'pref_rank': 3},\n",
+ " 'id_874': {'pref_rank': 3},\n",
+ " 'id_877': {'pref_rank': 1},\n",
+ " 'id_880': {'pref_rank': 2},\n",
+ " 'id_883': {'pref_rank': 1},\n",
+ " 'id_886': {'pref_rank': 1},\n",
+ " 'id_889': {'pref_rank': 3},\n",
+ " 'id_892': {'pref_rank': 3},\n",
+ " 'id_895': {'pref_rank': 1},\n",
+ " 'id_898': {'pref_rank': 3},\n",
+ " 'id_901': {'pref_rank': 1},\n",
+ " 'id_904': {'pref_rank': 2},\n",
+ " 'id_907': {'pref_rank': 2},\n",
+ " 'id_910': {'pref_rank': 2},\n",
+ " 'id_913': {'pref_rank': 1},\n",
+ " 'id_916': {'pref_rank': 2},\n",
+ " 'id_919': {'pref_rank': 2},\n",
+ " 'id_922': {'pref_rank': 1},\n",
+ " 'id_925': {'pref_rank': 3},\n",
+ " 'id_928': {'pref_rank': 2},\n",
+ " 'id_931': {'pref_rank': 2},\n",
+ " 'id_934': {'pref_rank': 3},\n",
+ " 'id_937': {'pref_rank': 1},\n",
+ " 'id_940': {'pref_rank': 2},\n",
+ " 'id_943': {'pref_rank': 1},\n",
+ " 'id_946': {'pref_rank': 2},\n",
+ " 'id_949': {'pref_rank': 3},\n",
+ " 'id_952': {'pref_rank': 2},\n",
+ " 'id_955': {'pref_rank': 1},\n",
+ " 'id_958': {'pref_rank': 3},\n",
+ " 'id_961': {'pref_rank': 3},\n",
+ " 'id_964': {'pref_rank': 2},\n",
+ " 'id_967': {'pref_rank': 3},\n",
+ " 'id_970': {'pref_rank': 1},\n",
+ " 'id_973': {'pref_rank': 2},\n",
+ " 'id_976': {'pref_rank': 1},\n",
+ " 'id_979': {'pref_rank': 2},\n",
+ " 'id_982': {'pref_rank': 3},\n",
+ " 'id_985': {'pref_rank': 2},\n",
+ " 'id_988': {'pref_rank': 3},\n",
+ " 'id_991': {'pref_rank': 3},\n",
+ " 'id_994': {'pref_rank': 2},\n",
+ " 'id_997': {'pref_rank': 1},\n",
+ " 'id_1000': {'pref_rank': 1},\n",
+ " 'id_1003': {'pref_rank': 3},\n",
+ " 'id_1006': {'pref_rank': 2},\n",
+ " 'id_1009': {'pref_rank': 3},\n",
+ " 'id_1012': {'pref_rank': 1},\n",
+ " 'id_1015': {'pref_rank': 2},\n",
+ " 'id_1018': {'pref_rank': 1},\n",
+ " 'id_1021': {'pref_rank': 3},\n",
+ " 'id_1024': {'pref_rank': 2},\n",
+ " 'id_1027': {'pref_rank': 2},\n",
+ " 'id_1030': {'pref_rank': 3},\n",
+ " 'id_1033': {'pref_rank': 1},\n",
+ " 'id_1036': {'pref_rank': 1},\n",
+ " 'id_1039': {'pref_rank': 2},\n",
+ " 'id_1042': {'pref_rank': 2},\n",
+ " 'id_1045': {'pref_rank': 1},\n",
+ " 'id_1048': {'pref_rank': 1},\n",
+ " 'id_1051': {'pref_rank': 2},\n",
+ " 'id_1054': {'pref_rank': 3},\n",
+ " 'id_1057': {'pref_rank': 3},\n",
+ " 'id_1060': {'pref_rank': 3},\n",
+ " 'id_1063': {'pref_rank': 3},\n",
+ " 'id_1066': {'pref_rank': 2},\n",
+ " 'id_1069': {'pref_rank': 2},\n",
+ " 'id_1072': {'pref_rank': 1},\n",
+ " 'id_1075': {'pref_rank': 3},\n",
+ " 'id_1078': {'pref_rank': 2},\n",
+ " 'id_1081': {'pref_rank': 2},\n",
+ " 'id_1084': {'pref_rank': 2},\n",
+ " 'id_1087': {'pref_rank': 2},\n",
+ " 'id_1090': {'pref_rank': 2},\n",
+ " 'id_1093': {'pref_rank': 3},\n",
+ " 'id_1096': {'pref_rank': 2},\n",
+ " 'id_1099': {'pref_rank': 2},\n",
+ " 'id_1102': {'pref_rank': 1},\n",
+ " 'id_1105': {'pref_rank': 1},\n",
+ " 'id_1108': {'pref_rank': 3},\n",
+ " 'id_1111': {'pref_rank': 2},\n",
+ " 'id_1114': {'pref_rank': 2},\n",
+ " 'id_1117': {'pref_rank': 1},\n",
+ " 'id_1120': {'pref_rank': 2},\n",
+ " 'id_1123': {'pref_rank': 2},\n",
+ " 'id_1126': {'pref_rank': 3},\n",
+ " 'id_1129': {'pref_rank': 2},\n",
+ " 'id_1132': {'pref_rank': 1},\n",
+ " 'id_1135': {'pref_rank': 2},\n",
+ " 'id_1138': {'pref_rank': 2},\n",
+ " 'id_1141': {'pref_rank': 1},\n",
+ " 'id_1144': {'pref_rank': 1},\n",
+ " 'id_1147': {'pref_rank': 3},\n",
+ " 'id_1150': {'pref_rank': 1},\n",
+ " 'id_1153': {'pref_rank': 1},\n",
+ " 'id_1156': {'pref_rank': 3},\n",
+ " 'id_1159': {'pref_rank': 1},\n",
+ " 'id_1162': {'pref_rank': 1},\n",
+ " 'id_1165': {'pref_rank': 3},\n",
+ " 'id_1168': {'pref_rank': 1},\n",
+ " 'id_1171': {'pref_rank': 2},\n",
+ " 'id_1174': {'pref_rank': 3},\n",
+ " 'id_1177': {'pref_rank': 2},\n",
+ " 'id_1180': {'pref_rank': 2},\n",
+ " 'id_1183': {'pref_rank': 1},\n",
+ " 'id_1186': {'pref_rank': 2},\n",
+ " 'id_1189': {'pref_rank': 1},\n",
+ " 'id_1192': {'pref_rank': 1},\n",
+ " 'id_1195': {'pref_rank': 2},\n",
+ " 'id_1198': {'pref_rank': 1},\n",
+ " 'id_1201': {'pref_rank': 3},\n",
+ " 'id_1204': {'pref_rank': 1},\n",
+ " 'id_1207': {'pref_rank': 1},\n",
+ " 'id_1210': {'pref_rank': 1},\n",
+ " 'id_1213': {'pref_rank': 1},\n",
+ " 'id_1216': {'pref_rank': 3},\n",
+ " 'id_1219': {'pref_rank': 1},\n",
+ " 'id_1222': {'pref_rank': 3},\n",
+ " 'id_1225': {'pref_rank': 3},\n",
+ " 'id_1228': {'pref_rank': 2},\n",
+ " 'id_1231': {'pref_rank': 2},\n",
+ " 'id_1234': {'pref_rank': 3},\n",
+ " 'id_1237': {'pref_rank': 1},\n",
+ " 'id_1240': {'pref_rank': 2},\n",
+ " 'id_1243': {'pref_rank': 2},\n",
+ " 'id_1246': {'pref_rank': 2},\n",
+ " 'id_1249': {'pref_rank': 3},\n",
+ " 'id_1252': {'pref_rank': 2},\n",
+ " 'id_1255': {'pref_rank': 2},\n",
+ " 'id_1258': {'pref_rank': 1},\n",
+ " 'id_1261': {'pref_rank': 2},\n",
+ " 'id_1264': {'pref_rank': 3},\n",
+ " 'id_1267': {'pref_rank': 3},\n",
+ " 'id_1270': {'pref_rank': 1},\n",
+ " 'id_1273': {'pref_rank': 2},\n",
+ " 'id_1276': {'pref_rank': 3},\n",
+ " 'id_1279': {'pref_rank': 3},\n",
+ " 'id_1282': {'pref_rank': 2},\n",
+ " 'id_1285': {'pref_rank': 3},\n",
+ " 'id_1288': {'pref_rank': 2},\n",
+ " 'id_1291': {'pref_rank': 3},\n",
+ " 'id_1294': {'pref_rank': 2},\n",
+ " 'id_1297': {'pref_rank': 2},\n",
+ " 'id_1300': {'pref_rank': 2},\n",
+ " 'id_1303': {'pref_rank': 3},\n",
+ " 'id_1306': {'pref_rank': 1},\n",
+ " 'id_1309': {'pref_rank': 1},\n",
+ " 'id_1312': {'pref_rank': 2},\n",
+ " 'id_1315': {'pref_rank': 3},\n",
+ " 'id_1318': {'pref_rank': 2},\n",
+ " 'id_1321': {'pref_rank': 3},\n",
+ " 'id_1324': {'pref_rank': 3},\n",
+ " 'id_1327': {'pref_rank': 2},\n",
+ " 'id_1330': {'pref_rank': 2},\n",
+ " 'id_1333': {'pref_rank': 1},\n",
+ " 'id_1336': {'pref_rank': 2},\n",
+ " 'id_1339': {'pref_rank': 3},\n",
+ " 'id_1342': {'pref_rank': 3},\n",
+ " 'id_1345': {'pref_rank': 2},\n",
+ " 'id_1348': {'pref_rank': 3},\n",
+ " 'id_1351': {'pref_rank': 3},\n",
+ " 'id_1354': {'pref_rank': 1},\n",
+ " 'id_1357': {'pref_rank': 2},\n",
+ " 'id_1360': {'pref_rank': 1},\n",
+ " 'id_1363': {'pref_rank': 3},\n",
+ " 'id_1366': {'pref_rank': 2},\n",
+ " 'id_1369': {'pref_rank': 3},\n",
+ " 'id_1372': {'pref_rank': 3},\n",
+ " 'id_1375': {'pref_rank': 2},\n",
+ " 'id_1378': {'pref_rank': 2},\n",
+ " 'id_1381': {'pref_rank': 3},\n",
+ " 'id_1384': {'pref_rank': 3},\n",
+ " 'id_1387': {'pref_rank': 2},\n",
+ " 'id_1390': {'pref_rank': 1},\n",
+ " 'id_1393': {'pref_rank': 1},\n",
+ " 'id_1396': {'pref_rank': 2},\n",
+ " 'id_1399': {'pref_rank': 2},\n",
+ " 'id_1402': {'pref_rank': 3},\n",
+ " 'id_1405': {'pref_rank': 1},\n",
+ " 'id_1408': {'pref_rank': 3},\n",
+ " 'id_1411': {'pref_rank': 3},\n",
+ " 'id_1414': {'pref_rank': 3},\n",
+ " 'id_1417': {'pref_rank': 1},\n",
+ " 'id_1420': {'pref_rank': 1},\n",
+ " 'id_1423': {'pref_rank': 1},\n",
+ " 'id_1426': {'pref_rank': 2},\n",
+ " 'id_1429': {'pref_rank': 2},\n",
+ " 'id_1432': {'pref_rank': 1},\n",
+ " 'id_1435': {'pref_rank': 2},\n",
+ " 'id_1438': {'pref_rank': 3},\n",
+ " 'id_1441': {'pref_rank': 3},\n",
+ " 'id_1444': {'pref_rank': 3},\n",
+ " 'id_1447': {'pref_rank': 3},\n",
+ " 'id_1450': {'pref_rank': 1},\n",
+ " 'id_1453': {'pref_rank': 2},\n",
+ " 'id_1456': {'pref_rank': 2},\n",
+ " 'id_1459': {'pref_rank': 1},\n",
+ " 'id_1462': {'pref_rank': 1},\n",
+ " 'id_1465': {'pref_rank': 2},\n",
+ " 'id_1468': {'pref_rank': 1},\n",
+ " 'id_1471': {'pref_rank': 1},\n",
+ " 'id_1474': {'pref_rank': 2},\n",
+ " 'id_1477': {'pref_rank': 3},\n",
+ " 'id_1480': {'pref_rank': 2},\n",
+ " 'id_1483': {'pref_rank': 3},\n",
+ " 'id_1486': {'pref_rank': 1},\n",
+ " 'id_1489': {'pref_rank': 3},\n",
+ " 'id_1492': {'pref_rank': 3},\n",
+ " 'id_1495': {'pref_rank': 1},\n",
+ " 'id_1498': {'pref_rank': 1},\n",
+ " 'id_1501': {'pref_rank': 2},\n",
+ " 'id_1504': {'pref_rank': 1},\n",
+ " 'id_1507': {'pref_rank': 3},\n",
+ " 'id_1510': {'pref_rank': 2},\n",
+ " 'id_1513': {'pref_rank': 3},\n",
+ " 'id_1516': {'pref_rank': 2},\n",
+ " 'id_1519': {'pref_rank': 3},\n",
+ " 'id_1522': {'pref_rank': 2},\n",
+ " 'id_1525': {'pref_rank': 3},\n",
+ " 'id_1528': {'pref_rank': 1},\n",
+ " 'id_1531': {'pref_rank': 2},\n",
+ " 'id_1534': {'pref_rank': 2},\n",
+ " 'id_1537': {'pref_rank': 3},\n",
+ " 'id_1540': {'pref_rank': 1},\n",
+ " 'id_1543': {'pref_rank': 2},\n",
+ " 'id_1546': {'pref_rank': 3},\n",
+ " 'id_1549': {'pref_rank': 1},\n",
+ " 'id_1552': {'pref_rank': 2},\n",
+ " 'id_1555': {'pref_rank': 1},\n",
+ " 'id_1558': {'pref_rank': 2},\n",
+ " 'id_1561': {'pref_rank': 1},\n",
+ " 'id_1564': {'pref_rank': 2},\n",
+ " 'id_1567': {'pref_rank': 2},\n",
+ " 'id_1570': {'pref_rank': 3},\n",
+ " 'id_1573': {'pref_rank': 2},\n",
+ " 'id_1576': {'pref_rank': 1},\n",
+ " 'id_1579': {'pref_rank': 1},\n",
+ " 'id_1582': {'pref_rank': 1},\n",
+ " 'id_1585': {'pref_rank': 1},\n",
+ " 'id_1588': {'pref_rank': 2},\n",
+ " 'id_1591': {'pref_rank': 3},\n",
+ " 'id_1594': {'pref_rank': 1},\n",
+ " 'id_1597': {'pref_rank': 3},\n",
+ " 'id_1600': {'pref_rank': 2},\n",
+ " 'id_1603': {'pref_rank': 1},\n",
+ " 'id_1606': {'pref_rank': 3},\n",
+ " 'id_1609': {'pref_rank': 1},\n",
+ " 'id_1612': {'pref_rank': 3},\n",
+ " 'id_1615': {'pref_rank': 2},\n",
+ " 'id_1618': {'pref_rank': 1},\n",
+ " 'id_1621': {'pref_rank': 2},\n",
+ " 'id_1624': {'pref_rank': 1},\n",
+ " 'id_1627': {'pref_rank': 1},\n",
+ " 'id_1630': {'pref_rank': 3},\n",
+ " 'id_1633': {'pref_rank': 3},\n",
+ " 'id_1636': {'pref_rank': 2},\n",
+ " 'id_1639': {'pref_rank': 2},\n",
+ " 'id_1642': {'pref_rank': 2},\n",
+ " 'id_1645': {'pref_rank': 2},\n",
+ " 'id_1648': {'pref_rank': 1},\n",
+ " 'id_1651': {'pref_rank': 3},\n",
+ " 'id_1654': {'pref_rank': 3},\n",
+ " 'id_1657': {'pref_rank': 2},\n",
+ " 'id_1660': {'pref_rank': 1},\n",
+ " 'id_1663': {'pref_rank': 3},\n",
+ " 'id_1666': {'pref_rank': 3},\n",
+ " 'id_1669': {'pref_rank': 2},\n",
+ " 'id_1672': {'pref_rank': 2},\n",
+ " 'id_1675': {'pref_rank': 2},\n",
+ " 'id_1678': {'pref_rank': 2},\n",
+ " 'id_1681': {'pref_rank': 2},\n",
+ " 'id_1684': {'pref_rank': 1},\n",
+ " 'id_1687': {'pref_rank': 2},\n",
+ " 'id_1690': {'pref_rank': 2},\n",
+ " 'id_1693': {'pref_rank': 1},\n",
+ " 'id_1696': {'pref_rank': 3},\n",
+ " 'id_1699': {'pref_rank': 3},\n",
+ " 'id_1702': {'pref_rank': 3},\n",
+ " 'id_1705': {'pref_rank': 1},\n",
+ " 'id_1708': {'pref_rank': 2},\n",
+ " 'id_1711': {'pref_rank': 1},\n",
+ " 'id_1714': {'pref_rank': 1},\n",
+ " 'id_1717': {'pref_rank': 3},\n",
+ " 'id_1720': {'pref_rank': 1},\n",
+ " 'id_1723': {'pref_rank': 2},\n",
+ " 'id_1726': {'pref_rank': 1},\n",
+ " 'id_1729': {'pref_rank': 3},\n",
+ " 'id_1732': {'pref_rank': 1},\n",
+ " 'id_1735': {'pref_rank': 2},\n",
+ " 'id_1738': {'pref_rank': 1},\n",
+ " 'id_1741': {'pref_rank': 1},\n",
+ " 'id_1744': {'pref_rank': 3},\n",
+ " 'id_1747': {'pref_rank': 1},\n",
+ " 'id_1750': {'pref_rank': 2},\n",
+ " 'id_1753': {'pref_rank': 1},\n",
+ " 'id_1756': {'pref_rank': 2},\n",
+ " 'id_1759': {'pref_rank': 2},\n",
+ " 'id_1762': {'pref_rank': 3},\n",
+ " 'id_1765': {'pref_rank': 2},\n",
+ " 'id_1768': {'pref_rank': 3},\n",
+ " 'id_1771': {'pref_rank': 1},\n",
+ " 'id_1774': {'pref_rank': 3},\n",
+ " 'id_1777': {'pref_rank': 3},\n",
+ " 'id_1780': {'pref_rank': 3},\n",
+ " 'id_1783': {'pref_rank': 2},\n",
+ " 'id_1786': {'pref_rank': 1},\n",
+ " 'id_1789': {'pref_rank': 1},\n",
+ " 'id_1792': {'pref_rank': 2},\n",
+ " 'id_1795': {'pref_rank': 3},\n",
+ " 'id_1798': {'pref_rank': 2},\n",
+ " 'id_1801': {'pref_rank': 1},\n",
+ " 'id_1804': {'pref_rank': 3},\n",
+ " 'id_1807': {'pref_rank': 3},\n",
+ " 'id_1810': {'pref_rank': 3},\n",
+ " 'id_1813': {'pref_rank': 2},\n",
+ " 'id_1816': {'pref_rank': 1},\n",
+ " 'id_1819': {'pref_rank': 2},\n",
+ " 'id_1822': {'pref_rank': 1},\n",
+ " 'id_1825': {'pref_rank': 1},\n",
+ " 'id_1828': {'pref_rank': 1},\n",
+ " 'id_1831': {'pref_rank': 3},\n",
+ " 'id_1834': {'pref_rank': 2},\n",
+ " 'id_1837': {'pref_rank': 3},\n",
+ " 'id_1840': {'pref_rank': 1},\n",
+ " 'id_1843': {'pref_rank': 1},\n",
+ " 'id_1846': {'pref_rank': 3},\n",
+ " 'id_1849': {'pref_rank': 2},\n",
+ " 'id_1852': {'pref_rank': 2},\n",
+ " 'id_1855': {'pref_rank': 1},\n",
+ " 'id_1858': {'pref_rank': 1},\n",
+ " 'id_1861': {'pref_rank': 3},\n",
+ " 'id_1864': {'pref_rank': 3},\n",
+ " 'id_1867': {'pref_rank': 2},\n",
+ " 'id_1870': {'pref_rank': 3},\n",
+ " 'id_1873': {'pref_rank': 2},\n",
+ " 'id_1876': {'pref_rank': 2},\n",
+ " 'id_1879': {'pref_rank': 3},\n",
+ " 'id_1882': {'pref_rank': 2},\n",
+ " 'id_1885': {'pref_rank': 3},\n",
+ " 'id_1888': {'pref_rank': 3},\n",
+ " 'id_1891': {'pref_rank': 1},\n",
+ " 'id_1894': {'pref_rank': 2},\n",
+ " 'id_1897': {'pref_rank': 1},\n",
+ " 'id_1900': {'pref_rank': 1},\n",
+ " 'id_1903': {'pref_rank': 1},\n",
+ " 'id_1906': {'pref_rank': 3},\n",
+ " 'id_1909': {'pref_rank': 3},\n",
+ " 'id_1912': {'pref_rank': 1},\n",
+ " 'id_1915': {'pref_rank': 3},\n",
+ " 'id_1918': {'pref_rank': 2},\n",
+ " 'id_1921': {'pref_rank': 3},\n",
+ " 'id_1924': {'pref_rank': 3},\n",
+ " 'id_1927': {'pref_rank': 2},\n",
+ " 'id_1930': {'pref_rank': 3},\n",
+ " 'id_1933': {'pref_rank': 1},\n",
+ " 'id_1936': {'pref_rank': 3},\n",
+ " 'id_1939': {'pref_rank': 1},\n",
+ " 'id_1942': {'pref_rank': 2},\n",
+ " 'id_1945': {'pref_rank': 2},\n",
+ " 'id_1948': {'pref_rank': 3},\n",
+ " 'id_1951': {'pref_rank': 2},\n",
+ " 'id_1954': {'pref_rank': 1},\n",
+ " 'id_1957': {'pref_rank': 2},\n",
+ " 'id_1960': {'pref_rank': 1},\n",
+ " 'id_1963': {'pref_rank': 1},\n",
+ " 'id_1966': {'pref_rank': 1},\n",
+ " 'id_1969': {'pref_rank': 3},\n",
+ " 'id_1972': {'pref_rank': 3},\n",
+ " 'id_1975': {'pref_rank': 1},\n",
+ " 'id_1978': {'pref_rank': 3},\n",
+ " 'id_1981': {'pref_rank': 1},\n",
+ " 'id_1984': {'pref_rank': 1},\n",
+ " 'id_1987': {'pref_rank': 3},\n",
+ " 'id_1990': {'pref_rank': 3},\n",
+ " 'id_1993': {'pref_rank': 1},\n",
+ " 'id_1996': {'pref_rank': 1},\n",
+ " 'id_1999': {'pref_rank': 2},\n",
+ " 'id_2002': {'pref_rank': 1},\n",
+ " 'id_2005': {'pref_rank': 2},\n",
+ " 'id_2008': {'pref_rank': 1},\n",
+ " 'id_2011': {'pref_rank': 2},\n",
+ " 'id_2014': {'pref_rank': 1},\n",
+ " 'id_2017': {'pref_rank': 1},\n",
+ " 'id_2020': {'pref_rank': 1},\n",
+ " 'id_2023': {'pref_rank': 2},\n",
+ " 'id_2026': {'pref_rank': 1},\n",
+ " 'id_2029': {'pref_rank': 2},\n",
+ " 'id_2032': {'pref_rank': 1},\n",
+ " 'id_2035': {'pref_rank': 1},\n",
+ " 'id_2038': {'pref_rank': 3},\n",
+ " 'id_2041': {'pref_rank': 1},\n",
+ " 'id_2044': {'pref_rank': 2},\n",
+ " 'id_2047': {'pref_rank': 3},\n",
+ " 'id_2050': {'pref_rank': 2},\n",
+ " 'id_2053': {'pref_rank': 1},\n",
+ " 'id_2056': {'pref_rank': 1},\n",
+ " 'id_2059': {'pref_rank': 3},\n",
+ " 'id_2062': {'pref_rank': 1},\n",
+ " 'id_2065': {'pref_rank': 2},\n",
+ " 'id_2068': {'pref_rank': 3},\n",
+ " 'id_2071': {'pref_rank': 2},\n",
+ " 'id_2074': {'pref_rank': 1},\n",
+ " 'id_2077': {'pref_rank': 1},\n",
+ " 'id_2080': {'pref_rank': 1},\n",
+ " 'id_2083': {'pref_rank': 3},\n",
+ " 'id_2086': {'pref_rank': 1},\n",
+ " 'id_2089': {'pref_rank': 1},\n",
+ " 'id_2092': {'pref_rank': 2},\n",
+ " 'id_2095': {'pref_rank': 3},\n",
+ " 'id_2098': {'pref_rank': 2},\n",
+ " 'id_2101': {'pref_rank': 1},\n",
+ " 'id_2104': {'pref_rank': 1},\n",
+ " 'id_2107': {'pref_rank': 2},\n",
+ " 'id_2110': {'pref_rank': 2},\n",
+ " 'id_2113': {'pref_rank': 2},\n",
+ " 'id_2116': {'pref_rank': 3},\n",
+ " 'id_2119': {'pref_rank': 1},\n",
+ " 'id_2122': {'pref_rank': 1},\n",
+ " 'id_2125': {'pref_rank': 2},\n",
+ " 'id_2128': {'pref_rank': 3},\n",
+ " 'id_2131': {'pref_rank': 1},\n",
+ " 'id_2134': {'pref_rank': 3},\n",
+ " 'id_2137': {'pref_rank': 2},\n",
+ " 'id_2140': {'pref_rank': 2},\n",
+ " 'id_2143': {'pref_rank': 3},\n",
+ " 'id_2146': {'pref_rank': 1},\n",
+ " 'id_2149': {'pref_rank': 1},\n",
+ " 'id_2152': {'pref_rank': 3},\n",
+ " 'id_2155': {'pref_rank': 3},\n",
+ " 'id_2158': {'pref_rank': 2},\n",
+ " 'id_2161': {'pref_rank': 2},\n",
+ " 'id_2164': {'pref_rank': 1},\n",
+ " 'id_2167': {'pref_rank': 2},\n",
+ " 'id_2170': {'pref_rank': 2},\n",
+ " 'id_2173': {'pref_rank': 3},\n",
+ " 'id_2176': {'pref_rank': 3},\n",
+ " 'id_2179': {'pref_rank': 2},\n",
+ " 'id_2182': {'pref_rank': 1},\n",
+ " 'id_2185': {'pref_rank': 3},\n",
+ " 'id_2188': {'pref_rank': 2},\n",
+ " 'id_2191': {'pref_rank': 3},\n",
+ " 'id_2194': {'pref_rank': 2},\n",
+ " 'id_2197': {'pref_rank': 2},\n",
+ " 'id_2200': {'pref_rank': 2},\n",
+ " 'id_2203': {'pref_rank': 2},\n",
+ " 'id_2206': {'pref_rank': 2},\n",
+ " 'id_2209': {'pref_rank': 3},\n",
+ " 'id_2212': {'pref_rank': 1},\n",
+ " 'id_2215': {'pref_rank': 2},\n",
+ " 'id_2218': {'pref_rank': 1},\n",
+ " 'id_2221': {'pref_rank': 1},\n",
+ " 'id_2224': {'pref_rank': 2},\n",
+ " 'id_2227': {'pref_rank': 2},\n",
+ " 'id_2230': {'pref_rank': 2},\n",
+ " 'id_2233': {'pref_rank': 2},\n",
+ " 'id_2236': {'pref_rank': 3},\n",
+ " 'id_2239': {'pref_rank': 2},\n",
+ " 'id_2242': {'pref_rank': 2},\n",
+ " 'id_2245': {'pref_rank': 3},\n",
+ " 'id_2248': {'pref_rank': 2},\n",
+ " 'id_2251': {'pref_rank': 3},\n",
+ " 'id_2254': {'pref_rank': 1},\n",
+ " 'id_2257': {'pref_rank': 2},\n",
+ " 'id_2260': {'pref_rank': 1},\n",
+ " 'id_2263': {'pref_rank': 2},\n",
+ " 'id_2266': {'pref_rank': 3},\n",
+ " 'id_2269': {'pref_rank': 3},\n",
+ " 'id_2272': {'pref_rank': 3},\n",
+ " 'id_2275': {'pref_rank': 1},\n",
+ " 'id_2278': {'pref_rank': 3},\n",
+ " 'id_2281': {'pref_rank': 2},\n",
+ " 'id_2284': {'pref_rank': 1},\n",
+ " 'id_2287': {'pref_rank': 2},\n",
+ " 'id_2290': {'pref_rank': 1},\n",
+ " 'id_2293': {'pref_rank': 3},\n",
+ " 'id_2296': {'pref_rank': 3},\n",
+ " 'id_2299': {'pref_rank': 2},\n",
+ " 'id_2302': {'pref_rank': 2},\n",
+ " 'id_2305': {'pref_rank': 1},\n",
+ " 'id_2308': {'pref_rank': 3},\n",
+ " 'id_2311': {'pref_rank': 2},\n",
+ " 'id_2314': {'pref_rank': 2},\n",
+ " 'id_2317': {'pref_rank': 1},\n",
+ " 'id_2320': {'pref_rank': 1},\n",
+ " 'id_2323': {'pref_rank': 3},\n",
+ " 'id_2326': {'pref_rank': 1},\n",
+ " 'id_2329': {'pref_rank': 1},\n",
+ " 'id_2332': {'pref_rank': 3},\n",
+ " 'id_2335': {'pref_rank': 2},\n",
+ " 'id_2338': {'pref_rank': 1},\n",
+ " 'id_2341': {'pref_rank': 3},\n",
+ " 'id_2344': {'pref_rank': 1},\n",
+ " 'id_2347': {'pref_rank': 1},\n",
+ " 'id_2350': {'pref_rank': 1},\n",
+ " 'id_2353': {'pref_rank': 1},\n",
+ " 'id_2356': {'pref_rank': 1},\n",
+ " 'id_2359': {'pref_rank': 1},\n",
+ " 'id_2362': {'pref_rank': 3},\n",
+ " 'id_2365': {'pref_rank': 3},\n",
+ " 'id_2368': {'pref_rank': 3},\n",
+ " 'id_2371': {'pref_rank': 2},\n",
+ " 'id_2374': {'pref_rank': 3},\n",
+ " 'id_2377': {'pref_rank': 1},\n",
+ " 'id_2380': {'pref_rank': 3},\n",
+ " 'id_2383': {'pref_rank': 2},\n",
+ " 'id_2386': {'pref_rank': 2},\n",
+ " 'id_2389': {'pref_rank': 3},\n",
+ " 'id_2392': {'pref_rank': 3},\n",
+ " 'id_2395': {'pref_rank': 2},\n",
+ " 'id_2398': {'pref_rank': 3},\n",
+ " 'id_2401': {'pref_rank': 2},\n",
+ " 'id_2404': {'pref_rank': 1},\n",
+ " 'id_2407': {'pref_rank': 1},\n",
+ " 'id_2410': {'pref_rank': 1},\n",
+ " 'id_2413': {'pref_rank': 2},\n",
+ " 'id_2416': {'pref_rank': 3},\n",
+ " 'id_2419': {'pref_rank': 3},\n",
+ " 'id_2422': {'pref_rank': 1},\n",
+ " 'id_2425': {'pref_rank': 1},\n",
+ " 'id_2428': {'pref_rank': 2},\n",
+ " 'id_2431': {'pref_rank': 2},\n",
+ " 'id_2434': {'pref_rank': 2},\n",
+ " 'id_2437': {'pref_rank': 2},\n",
+ " 'id_2440': {'pref_rank': 1},\n",
+ " 'id_2443': {'pref_rank': 3},\n",
+ " 'id_2446': {'pref_rank': 2},\n",
+ " 'id_2449': {'pref_rank': 1},\n",
+ " 'id_2452': {'pref_rank': 3},\n",
+ " 'id_2455': {'pref_rank': 2},\n",
+ " 'id_2458': {'pref_rank': 3},\n",
+ " 'id_2461': {'pref_rank': 1},\n",
+ " 'id_2464': {'pref_rank': 1},\n",
+ " 'id_2467': {'pref_rank': 2},\n",
+ " 'id_2470': {'pref_rank': 1},\n",
+ " 'id_2473': {'pref_rank': 3},\n",
+ " 'id_2476': {'pref_rank': 2},\n",
+ " 'id_2479': {'pref_rank': 3},\n",
+ " 'id_2482': {'pref_rank': 3},\n",
+ " 'id_2485': {'pref_rank': 3},\n",
+ " 'id_2488': {'pref_rank': 3},\n",
+ " 'id_2491': {'pref_rank': 1},\n",
+ " 'id_2494': {'pref_rank': 2},\n",
+ " 'id_2497': {'pref_rank': 2},\n",
+ " 'id_2500': {'pref_rank': 2},\n",
+ " 'id_2503': {'pref_rank': 1},\n",
+ " 'id_2506': {'pref_rank': 3},\n",
+ " 'id_2509': {'pref_rank': 2},\n",
+ " 'id_2512': {'pref_rank': 1},\n",
+ " 'id_2515': {'pref_rank': 1},\n",
+ " 'id_2518': {'pref_rank': 3},\n",
+ " 'id_2521': {'pref_rank': 3},\n",
+ " 'id_2524': {'pref_rank': 2},\n",
+ " 'id_2527': {'pref_rank': 2},\n",
+ " 'id_2530': {'pref_rank': 3},\n",
+ " 'id_2533': {'pref_rank': 3},\n",
+ " 'id_2536': {'pref_rank': 2},\n",
+ " 'id_2539': {'pref_rank': 3},\n",
+ " 'id_2542': {'pref_rank': 3},\n",
+ " 'id_2545': {'pref_rank': 3},\n",
+ " 'id_2548': {'pref_rank': 1},\n",
+ " 'id_2551': {'pref_rank': 1},\n",
+ " 'id_2554': {'pref_rank': 1},\n",
+ " 'id_2557': {'pref_rank': 2},\n",
+ " 'id_2560': {'pref_rank': 1},\n",
+ " 'id_2563': {'pref_rank': 1},\n",
+ " 'id_2566': {'pref_rank': 2},\n",
+ " 'id_2569': {'pref_rank': 1},\n",
+ " 'id_2572': {'pref_rank': 2},\n",
+ " 'id_2575': {'pref_rank': 2},\n",
+ " 'id_2578': {'pref_rank': 3},\n",
+ " 'id_2581': {'pref_rank': 2},\n",
+ " 'id_2584': {'pref_rank': 1},\n",
+ " 'id_2587': {'pref_rank': 2},\n",
+ " 'id_2590': {'pref_rank': 2},\n",
+ " 'id_2593': {'pref_rank': 3},\n",
+ " 'id_2596': {'pref_rank': 3},\n",
+ " 'id_2599': {'pref_rank': 3},\n",
+ " 'id_2602': {'pref_rank': 2},\n",
+ " 'id_2605': {'pref_rank': 3},\n",
+ " 'id_2608': {'pref_rank': 2},\n",
+ " 'id_2611': {'pref_rank': 1},\n",
+ " 'id_2614': {'pref_rank': 2},\n",
+ " 'id_2617': {'pref_rank': 2},\n",
+ " 'id_2620': {'pref_rank': 2},\n",
+ " 'id_2623': {'pref_rank': 3},\n",
+ " 'id_2626': {'pref_rank': 2},\n",
+ " 'id_2629': {'pref_rank': 3},\n",
+ " 'id_2632': {'pref_rank': 3},\n",
+ " 'id_2635': {'pref_rank': 2},\n",
+ " 'id_2638': {'pref_rank': 1},\n",
+ " 'id_2641': {'pref_rank': 3},\n",
+ " 'id_2644': {'pref_rank': 2},\n",
+ " 'id_2647': {'pref_rank': 3},\n",
+ " 'id_2650': {'pref_rank': 1},\n",
+ " 'id_2653': {'pref_rank': 3},\n",
+ " 'id_2656': {'pref_rank': 1},\n",
+ " 'id_2659': {'pref_rank': 1},\n",
+ " 'id_2662': {'pref_rank': 3},\n",
+ " 'id_2665': {'pref_rank': 1},\n",
+ " 'id_2668': {'pref_rank': 2},\n",
+ " 'id_2671': {'pref_rank': 2},\n",
+ " 'id_2674': {'pref_rank': 2},\n",
+ " 'id_2677': {'pref_rank': 1},\n",
+ " 'id_2680': {'pref_rank': 2},\n",
+ " 'id_2683': {'pref_rank': 2},\n",
+ " 'id_2686': {'pref_rank': 1},\n",
+ " 'id_2689': {'pref_rank': 1},\n",
+ " 'id_2692': {'pref_rank': 3},\n",
+ " 'id_2695': {'pref_rank': 3},\n",
+ " 'id_2698': {'pref_rank': 2},\n",
+ " 'id_2701': {'pref_rank': 3},\n",
+ " 'id_2704': {'pref_rank': 1},\n",
+ " 'id_2707': {'pref_rank': 3},\n",
+ " 'id_2710': {'pref_rank': 2},\n",
+ " 'id_2713': {'pref_rank': 3},\n",
+ " 'id_2716': {'pref_rank': 1},\n",
+ " 'id_2719': {'pref_rank': 2},\n",
+ " 'id_2722': {'pref_rank': 2},\n",
+ " 'id_2725': {'pref_rank': 3},\n",
+ " 'id_2728': {'pref_rank': 1},\n",
+ " 'id_2731': {'pref_rank': 3},\n",
+ " 'id_2734': {'pref_rank': 1},\n",
+ " 'id_2737': {'pref_rank': 1},\n",
+ " 'id_2740': {'pref_rank': 3},\n",
+ " 'id_2743': {'pref_rank': 1},\n",
+ " 'id_2746': {'pref_rank': 2},\n",
+ " 'id_2749': {'pref_rank': 2},\n",
+ " 'id_2752': {'pref_rank': 2},\n",
+ " 'id_2755': {'pref_rank': 2},\n",
+ " 'id_2758': {'pref_rank': 1},\n",
+ " 'id_2761': {'pref_rank': 3},\n",
+ " 'id_2764': {'pref_rank': 1},\n",
+ " 'id_2767': {'pref_rank': 1},\n",
+ " 'id_2770': {'pref_rank': 2},\n",
+ " 'id_2773': {'pref_rank': 2},\n",
+ " 'id_2776': {'pref_rank': 1},\n",
+ " 'id_2779': {'pref_rank': 1},\n",
+ " 'id_2782': {'pref_rank': 2},\n",
+ " 'id_2785': {'pref_rank': 3},\n",
+ " 'id_2788': {'pref_rank': 3},\n",
+ " 'id_2791': {'pref_rank': 1},\n",
+ " 'id_2794': {'pref_rank': 1},\n",
+ " 'id_2797': {'pref_rank': 2},\n",
+ " 'id_2800': {'pref_rank': 1},\n",
+ " 'id_2803': {'pref_rank': 3},\n",
+ " 'id_2806': {'pref_rank': 1},\n",
+ " 'id_2809': {'pref_rank': 3},\n",
+ " 'id_2812': {'pref_rank': 1},\n",
+ " 'id_2815': {'pref_rank': 1},\n",
+ " 'id_2818': {'pref_rank': 2},\n",
+ " 'id_2821': {'pref_rank': 1},\n",
+ " 'id_2824': {'pref_rank': 1},\n",
+ " 'id_2827': {'pref_rank': 1},\n",
+ " 'id_2830': {'pref_rank': 1},\n",
+ " 'id_2833': {'pref_rank': 2},\n",
+ " 'id_2836': {'pref_rank': 2},\n",
+ " 'id_2839': {'pref_rank': 2},\n",
+ " 'id_2842': {'pref_rank': 3},\n",
+ " 'id_2845': {'pref_rank': 2},\n",
+ " 'id_2848': {'pref_rank': 1},\n",
+ " 'id_2851': {'pref_rank': 3},\n",
+ " 'id_2854': {'pref_rank': 3},\n",
+ " 'id_2857': {'pref_rank': 3},\n",
+ " 'id_2860': {'pref_rank': 2},\n",
+ " 'id_2863': {'pref_rank': 3},\n",
+ " 'id_2866': {'pref_rank': 3},\n",
+ " 'id_2869': {'pref_rank': 3},\n",
+ " 'id_2872': {'pref_rank': 1},\n",
+ " 'id_2875': {'pref_rank': 3},\n",
+ " 'id_2878': {'pref_rank': 1},\n",
+ " 'id_2881': {'pref_rank': 3},\n",
+ " 'id_2884': {'pref_rank': 3},\n",
+ " 'id_2887': {'pref_rank': 3},\n",
+ " 'id_2890': {'pref_rank': 2},\n",
+ " 'id_2893': {'pref_rank': 2},\n",
+ " 'id_2896': {'pref_rank': 1},\n",
+ " 'id_2899': {'pref_rank': 2},\n",
+ " 'id_2902': {'pref_rank': 2},\n",
+ " 'id_2905': {'pref_rank': 1},\n",
+ " 'id_2908': {'pref_rank': 1},\n",
+ " 'id_2911': {'pref_rank': 3},\n",
+ " 'id_2914': {'pref_rank': 2},\n",
+ " 'id_2917': {'pref_rank': 1},\n",
+ " 'id_2920': {'pref_rank': 2},\n",
+ " 'id_2923': {'pref_rank': 3},\n",
+ " 'id_2926': {'pref_rank': 2},\n",
+ " 'id_2929': {'pref_rank': 3},\n",
+ " 'id_2932': {'pref_rank': 2},\n",
+ " 'id_2935': {'pref_rank': 3},\n",
+ " 'id_2938': {'pref_rank': 3},\n",
+ " 'id_2941': {'pref_rank': 1},\n",
+ " 'id_2944': {'pref_rank': 1},\n",
+ " 'id_2947': {'pref_rank': 1},\n",
+ " 'id_2950': {'pref_rank': 2},\n",
+ " 'id_2953': {'pref_rank': 1},\n",
+ " 'id_2956': {'pref_rank': 2},\n",
+ " 'id_2959': {'pref_rank': 1},\n",
+ " 'id_2962': {'pref_rank': 3},\n",
+ " 'id_2965': {'pref_rank': 1},\n",
+ " 'id_2968': {'pref_rank': 2},\n",
+ " 'id_2971': {'pref_rank': 1},\n",
+ " 'id_2974': {'pref_rank': 3},\n",
+ " 'id_2977': {'pref_rank': 2},\n",
+ " 'id_2980': {'pref_rank': 3},\n",
+ " 'id_2983': {'pref_rank': 2},\n",
+ " 'id_2986': {'pref_rank': 3},\n",
+ " 'id_2989': {'pref_rank': 2},\n",
+ " 'id_2992': {'pref_rank': 1},\n",
+ " 'id_2995': {'pref_rank': 1},\n",
+ " 'id_2998': {'pref_rank': 2},\n",
+ " ...}"
+ ]
+ },
+ "execution_count": 19,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "pref = {}\n",
+ "\n",
+ "for model_ in folder2model.values():\n",
+ " pref.update(\n",
+ " dict(zip(df_scores[model_].iloc[x_indices], df_scores[model_].iloc[y_indices]))\n",
+ " )\n",
+ "\n",
+ "for k,v in pref.items():\n",
+ " pref[k] = {'pref_rank': v}\n",
+ "\n",
+ "pref"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 20,
+ "id": "4f73823c-a3d2-4cb8-bbe3-317acbf2e4c7",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "['id_1', 'id_4', 'id_7', 'id_10', 'id_13']"
+ ]
+ },
+ "execution_count": 20,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "list(df_scores['m1'].iloc[x_indices])[:5]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 21,
+ "id": "871152a6-5809-4815-91d3-285123b5a80b",
+ "metadata": {
+ "scrolled": true,
+ "tags": []
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'id_1': {'model': 'm2',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_4': {'model': 'm2',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_7': {'model': 'm1',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_10': {'model': 'm1',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_13': {'model': 'm3',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_16': {'model': 'm3',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_19': {'model': 'm1',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_22': {'model': 'm3',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_25': {'model': 'm1',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_28': {'model': 'm3',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_31': {'model': 'm1',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_34': {'model': 'm3',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_37': {'model': 'm3',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_40': {'model': 'm3',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_43': {'model': 'm3',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_46': {'model': 'm2',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_49': {'model': 'm3',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_52': {'model': 'm2',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_55': {'model': 'm3',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_58': {'model': 'm1',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_61': {'model': 'm1',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_64': {'model': 'm2',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_67': {'model': 'm3',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_70': {'model': 'm2',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_73': {'model': 'm3',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_76': {'model': 'm3',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_79': {'model': 'm1',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_82': {'model': 'm1',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_85': {'model': 'm3',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_88': {'model': 'm1',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_91': {'model': 'm2',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_94': {'model': 'm1',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_97': {'model': 'm3',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_100': {'model': 'm3',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_103': {'model': 'm3',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_106': {'model': 'm1',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_109': {'model': 'm2',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_112': {'model': 'm1',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_115': {'model': 'm3',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_118': {'model': 'm2',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_121': {'model': 'm2',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_124': {'model': 'm3',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_127': {'model': 'm1',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_130': {'model': 'm3',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_133': {'model': 'm3',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_136': {'model': 'm2',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_139': {'model': 'm1',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_142': {'model': 'm1',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_145': {'model': 'm2',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_148': {'model': 'm2',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_151': {'model': 'm2',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_154': {'model': 'm1',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_157': {'model': 'm2',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_160': {'model': 'm3',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_163': {'model': 'm3',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_166': {'model': 'm1',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_169': {'model': 'm2',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_172': {'model': 'm1',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_175': {'model': 'm3',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_178': {'model': 'm3',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_181': {'model': 'm3',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_184': {'model': 'm2',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_187': {'model': 'm2',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_190': {'model': 'm2',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_193': {'model': 'm3',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_196': {'model': 'm2',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_199': {'model': 'm1',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_202': {'model': 'm1',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_205': {'model': 'm2',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_208': {'model': 'm3',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_211': {'model': 'm2',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_214': {'model': 'm3',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_217': {'model': 'm3',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_220': {'model': 'm2',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_223': {'model': 'm3',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_226': {'model': 'm3',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_229': {'model': 'm1',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_232': {'model': 'm1',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_235': {'model': 'm1',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_238': {'model': 'm1',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_241': {'model': 'm3',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_244': {'model': 'm2',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_247': {'model': 'm1',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_250': {'model': 'm2',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_253': {'model': 'm3',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_256': {'model': 'm3',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_259': {'model': 'm3',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_262': {'model': 'm1',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_265': {'model': 'm1',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_268': {'model': 'm2',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_271': {'model': 'm2',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_274': {'model': 'm3',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_277': {'model': 'm3',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_280': {'model': 'm1',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_283': {'model': 'm1',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_286': {'model': 'm1',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_289': {'model': 'm1',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_292': {'model': 'm3',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_295': {'model': 'm3',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_298': {'model': 'm1',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_301': {'model': 'm2',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_304': {'model': 'm2',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_307': {'model': 'm2',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_310': {'model': 'm3',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_313': {'model': 'm3',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_316': {'model': 'm3',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_319': {'model': 'm1',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_322': {'model': 'm2',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_325': {'model': 'm2',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_328': {'model': 'm2',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_331': {'model': 'm2',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_334': {'model': 'm1',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_337': {'model': 'm3',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_340': {'model': 'm3',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_343': {'model': 'm3',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_346': {'model': 'm1',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_349': {'model': 'm3',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_352': {'model': 'm2',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_355': {'model': 'm1',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_358': {'model': 'm2',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_361': {'model': 'm2',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_364': {'model': 'm3',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_367': {'model': 'm3',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_370': {'model': 'm2',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_373': {'model': 'm1',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_376': {'model': 'm3',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_379': {'model': 'm1',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_382': {'model': 'm2',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_385': {'model': 'm2',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_388': {'model': 'm3',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_391': {'model': 'm2',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_394': {'model': 'm3',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_397': {'model': 'm3',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_400': {'model': 'm2',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_403': {'model': 'm2',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_406': {'model': 'm2',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_409': {'model': 'm3',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_412': {'model': 'm1',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_415': {'model': 'm2',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_418': {'model': 'm1',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_421': {'model': 'm2',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_424': {'model': 'm2',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_427': {'model': 'm2',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_430': {'model': 'm3',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_433': {'model': 'm2',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_436': {'model': 'm3',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_439': {'model': 'm1',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_442': {'model': 'm3',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_445': {'model': 'm1',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_448': {'model': 'm3',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0011',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_451': {'model': 'm3',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_454': {'model': 'm3',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_457': {'model': 'm3',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_460': {'model': 'm2',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_463': {'model': 'm3',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_466': {'model': 'm2',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_469': {'model': 'm3',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_472': {'model': 'm2',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_475': {'model': 'm2',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_478': {'model': 'm2',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_481': {'model': 'm1',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_484': {'model': 'm2',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_487': {'model': 'm1',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_490': {'model': 'm2',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_493': {'model': 'm2',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_496': {'model': 'm3',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_499': {'model': 'm1',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_502': {'model': 'm2',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_505': {'model': 'm3',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_508': {'model': 'm2',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_511': {'model': 'm2',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_514': {'model': 'm2',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_517': {'model': 'm3',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_520': {'model': 'm3',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_523': {'model': 'm3',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_526': {'model': 'm1',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_529': {'model': 'm2',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_532': {'model': 'm3',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_535': {'model': 'm3',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_538': {'model': 'm3',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_541': {'model': 'm3',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_544': {'model': 'm3',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_547': {'model': 'm2',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_550': {'model': 'm3',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_553': {'model': 'm2',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_556': {'model': 'm1',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_559': {'model': 'm3',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_562': {'model': 'm3',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_565': {'model': 'm1',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_568': {'model': 'm2',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_571': {'model': 'm3',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_574': {'model': 'm1',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_577': {'model': 'm1',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_580': {'model': 'm2',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_583': {'model': 'm3',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_586': {'model': 'm2',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_589': {'model': 'm3',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_592': {'model': 'm2',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_595': {'model': 'm3',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_598': {'model': 'm3',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_601': {'model': 'm2',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_604': {'model': 'm2',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_607': {'model': 'm2',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_610': {'model': 'm2',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_613': {'model': 'm2',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_616': {'model': 'm3',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_619': {'model': 'm2',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_622': {'model': 'm2',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_625': {'model': 'm2',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_628': {'model': 'm2',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_631': {'model': 'm1',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_634': {'model': 'm1',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_637': {'model': 'm2',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_640': {'model': 'm3',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_643': {'model': 'm2',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_646': {'model': 'm2',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_649': {'model': 'm2',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_652': {'model': 'm1',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_655': {'model': 'm1',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_658': {'model': 'm2',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_661': {'model': 'm2',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_664': {'model': 'm3',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_667': {'model': 'm3',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_670': {'model': 'm3',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_673': {'model': 'm3',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_676': {'model': 'm2',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_679': {'model': 'm1',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_682': {'model': 'm2',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_685': {'model': 'm3',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_688': {'model': 'm1',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_691': {'model': 'm3',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_694': {'model': 'm2',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_697': {'model': 'm3',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_700': {'model': 'm3',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_703': {'model': 'm1',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_706': {'model': 'm1',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_709': {'model': 'm2',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_712': {'model': 'm2',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_715': {'model': 'm3',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_718': {'model': 'm3',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_721': {'model': 'm3',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_724': {'model': 'm1',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_727': {'model': 'm2',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_730': {'model': 'm2',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_733': {'model': 'm1',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_736': {'model': 'm1',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_739': {'model': 'm1',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_742': {'model': 'm3',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_745': {'model': 'm2',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_748': {'model': 'm3',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_751': {'model': 'm1',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_754': {'model': 'm1',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_757': {'model': 'm1',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_760': {'model': 'm1',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_763': {'model': 'm2',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_766': {'model': 'm1',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_769': {'model': 'm2',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_772': {'model': 'm1',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_775': {'model': 'm2',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_778': {'model': 'm1',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_781': {'model': 'm3',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_784': {'model': 'm3',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_787': {'model': 'm2',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_790': {'model': 'm2',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_793': {'model': 'm1',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_796': {'model': 'm3',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_799': {'model': 'm3',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_802': {'model': 'm2',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_805': {'model': 'm2',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_808': {'model': 'm1',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_811': {'model': 'm1',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_814': {'model': 'm3',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_817': {'model': 'm2',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_820': {'model': 'm1',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_823': {'model': 'm1',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_826': {'model': 'm2',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_829': {'model': 'm1',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_832': {'model': 'm2',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_835': {'model': 'm3',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_838': {'model': 'm3',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_841': {'model': 'm1',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_844': {'model': 'm2',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_847': {'model': 'm1',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_850': {'model': 'm3',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_853': {'model': 'm2',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_856': {'model': 'm1',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_859': {'model': 'm1',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_862': {'model': 'm3',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_865': {'model': 'm1',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_868': {'model': 'm3',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_871': {'model': 'm3',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_874': {'model': 'm2',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_877': {'model': 'm1',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_880': {'model': 'm1',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_883': {'model': 'm1',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_886': {'model': 'm3',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_889': {'model': 'm1',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_892': {'model': 'm2',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_895': {'model': 'm2',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_898': {'model': 'm3',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0012',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_901': {'model': 'm2',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_904': {'model': 'm2',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_907': {'model': 'm2',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_910': {'model': 'm1',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_913': {'model': 'm3',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_916': {'model': 'm3',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_919': {'model': 'm2',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_922': {'model': 'm2',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_925': {'model': 'm1',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_928': {'model': 'm3',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_931': {'model': 'm2',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_934': {'model': 'm3',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_937': {'model': 'm3',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_940': {'model': 'm3',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_943': {'model': 'm3',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_946': {'model': 'm3',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_949': {'model': 'm1',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_952': {'model': 'm2',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_955': {'model': 'm3',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_958': {'model': 'm1',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_961': {'model': 'm1',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_964': {'model': 'm1',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_967': {'model': 'm1',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_970': {'model': 'm3',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_973': {'model': 'm3',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_976': {'model': 'm1',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_979': {'model': 'm3',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_982': {'model': 'm1',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_985': {'model': 'm2',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_988': {'model': 'm2',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_991': {'model': 'm3',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_994': {'model': 'm1',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_997': {'model': 'm3',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1000': {'model': 'm3',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1003': {'model': 'm2',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1006': {'model': 'm2',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1009': {'model': 'm3',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1012': {'model': 'm2',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1015': {'model': 'm3',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1018': {'model': 'm3',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1021': {'model': 'm3',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1024': {'model': 'm1',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1027': {'model': 'm2',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1030': {'model': 'm2',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1033': {'model': 'm1',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1036': {'model': 'm3',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1039': {'model': 'm2',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1042': {'model': 'm1',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1045': {'model': 'm3',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1048': {'model': 'm3',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1051': {'model': 'm2',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1054': {'model': 'm1',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1057': {'model': 'm3',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1060': {'model': 'm3',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1063': {'model': 'm2',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1066': {'model': 'm3',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1069': {'model': 'm1',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1072': {'model': 'm3',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1075': {'model': 'm2',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1078': {'model': 'm2',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1081': {'model': 'm3',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1084': {'model': 'm3',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1087': {'model': 'm1',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1090': {'model': 'm2',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1093': {'model': 'm3',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1096': {'model': 'm2',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1099': {'model': 'm3',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1102': {'model': 'm1',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1105': {'model': 'm3',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1108': {'model': 'm3',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1111': {'model': 'm2',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1114': {'model': 'm3',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1117': {'model': 'm2',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1120': {'model': 'm1',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1123': {'model': 'm2',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1126': {'model': 'm1',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1129': {'model': 'm1',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1132': {'model': 'm2',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1135': {'model': 'm1',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1138': {'model': 'm3',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1141': {'model': 'm3',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1144': {'model': 'm3',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1147': {'model': 'm3',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1150': {'model': 'm1',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1153': {'model': 'm2',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1156': {'model': 'm3',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1159': {'model': 'm1',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1162': {'model': 'm1',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1165': {'model': 'm2',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1168': {'model': 'm3',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1171': {'model': 'm2',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1174': {'model': 'm3',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1177': {'model': 'm2',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1180': {'model': 'm3',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1183': {'model': 'm3',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1186': {'model': 'm2',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1189': {'model': 'm1',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1192': {'model': 'm2',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1195': {'model': 'm2',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1198': {'model': 'm2',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1201': {'model': 'm3',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1204': {'model': 'm1',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1207': {'model': 'm2',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1210': {'model': 'm1',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1213': {'model': 'm1',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1216': {'model': 'm2',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1219': {'model': 'm1',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1222': {'model': 'm3',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1225': {'model': 'm3',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1228': {'model': 'm3',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1231': {'model': 'm1',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1234': {'model': 'm1',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1237': {'model': 'm2',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1240': {'model': 'm2',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1243': {'model': 'm2',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1246': {'model': 'm2',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1249': {'model': 'm2',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1252': {'model': 'm3',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1255': {'model': 'm1',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1258': {'model': 'm3',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1261': {'model': 'm2',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1264': {'model': 'm3',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1267': {'model': 'm3',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1270': {'model': 'm3',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1273': {'model': 'm3',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1276': {'model': 'm2',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1279': {'model': 'm1',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1282': {'model': 'm3',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1285': {'model': 'm1',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1288': {'model': 'm1',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1291': {'model': 'm1',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1294': {'model': 'm3',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1297': {'model': 'm1',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1300': {'model': 'm2',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1303': {'model': 'm3',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1306': {'model': 'm1',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1309': {'model': 'm3',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1312': {'model': 'm2',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1315': {'model': 'm2',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1318': {'model': 'm1',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1321': {'model': 'm1',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1324': {'model': 'm1',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1327': {'model': 'm2',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1330': {'model': 'm3',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1333': {'model': 'm1',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1336': {'model': 'm1',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1339': {'model': 'm2',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1342': {'model': 'm1',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1345': {'model': 'm2',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1348': {'model': 'm3',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0013',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1351': {'model': 'm2',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1354': {'model': 'm1',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1357': {'model': 'm1',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1360': {'model': 'm2',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1363': {'model': 'm1',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1366': {'model': 'm1',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1369': {'model': 'm2',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1372': {'model': 'm3',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1375': {'model': 'm3',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1378': {'model': 'm3',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1381': {'model': 'm3',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1384': {'model': 'm2',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1387': {'model': 'm2',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1390': {'model': 'm1',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1393': {'model': 'm3',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1396': {'model': 'm1',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1399': {'model': 'm1',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1402': {'model': 'm1',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1405': {'model': 'm2',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1408': {'model': 'm2',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1411': {'model': 'm1',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1414': {'model': 'm1',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1417': {'model': 'm2',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1420': {'model': 'm3',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1423': {'model': 'm2',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1426': {'model': 'm3',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1429': {'model': 'm3',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1432': {'model': 'm1',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1435': {'model': 'm1',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1438': {'model': 'm1',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1441': {'model': 'm1',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1444': {'model': 'm2',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1447': {'model': 'm2',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1450': {'model': 'm2',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1453': {'model': 'm1',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1456': {'model': 'm1',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1459': {'model': 'm1',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1462': {'model': 'm2',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1465': {'model': 'm2',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1468': {'model': 'm2',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1471': {'model': 'm1',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1474': {'model': 'm3',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1477': {'model': 'm1',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1480': {'model': 'm1',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1483': {'model': 'm2',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1486': {'model': 'm3',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1489': {'model': 'm1',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1492': {'model': 'm2',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1495': {'model': 'm2',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1498': {'model': 'm2',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1501': {'model': 'm1',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1504': {'model': 'm1',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1507': {'model': 'm3',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1510': {'model': 'm1',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1513': {'model': 'm2',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1516': {'model': 'm2',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1519': {'model': 'm2',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1522': {'model': 'm3',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1525': {'model': 'm1',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1528': {'model': 'm2',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1531': {'model': 'm1',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1534': {'model': 'm1',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1537': {'model': 'm1',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1540': {'model': 'm3',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1543': {'model': 'm3',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1546': {'model': 'm1',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1549': {'model': 'm1',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1552': {'model': 'm3',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1555': {'model': 'm2',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1558': {'model': 'm2',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1561': {'model': 'm1',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1564': {'model': 'm3',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1567': {'model': 'm3',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1570': {'model': 'm3',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1573': {'model': 'm2',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1576': {'model': 'm1',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1579': {'model': 'm3',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1582': {'model': 'm3',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1585': {'model': 'm1',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1588': {'model': 'm2',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1591': {'model': 'm1',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1594': {'model': 'm1',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1597': {'model': 'm1',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1600': {'model': 'm2',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1603': {'model': 'm3',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1606': {'model': 'm3',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1609': {'model': 'm1',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1612': {'model': 'm1',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1615': {'model': 'm3',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1618': {'model': 'm2',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1621': {'model': 'm2',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1624': {'model': 'm1',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1627': {'model': 'm1',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1630': {'model': 'm2',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1633': {'model': 'm1',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1636': {'model': 'm1',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1639': {'model': 'm2',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1642': {'model': 'm2',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1645': {'model': 'm1',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1648': {'model': 'm2',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1651': {'model': 'm3',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1654': {'model': 'm1',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1657': {'model': 'm2',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1660': {'model': 'm2',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1663': {'model': 'm2',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1666': {'model': 'm1',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1669': {'model': 'm3',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1672': {'model': 'm3',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1675': {'model': 'm1',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1678': {'model': 'm1',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1681': {'model': 'm2',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1684': {'model': 'm1',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1687': {'model': 'm2',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1690': {'model': 'm2',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1693': {'model': 'm2',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1696': {'model': 'm1',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1699': {'model': 'm2',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1702': {'model': 'm1',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1705': {'model': 'm3',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1708': {'model': 'm3',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1711': {'model': 'm1',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1714': {'model': 'm3',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1717': {'model': 'm1',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1720': {'model': 'm1',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1723': {'model': 'm2',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1726': {'model': 'm3',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1729': {'model': 'm2',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1732': {'model': 'm1',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1735': {'model': 'm3',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1738': {'model': 'm2',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1741': {'model': 'm1',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1744': {'model': 'm3',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1747': {'model': 'm2',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1750': {'model': 'm2',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1753': {'model': 'm1',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1756': {'model': 'm2',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1759': {'model': 'm3',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1762': {'model': 'm1',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1765': {'model': 'm3',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1768': {'model': 'm2',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1771': {'model': 'm2',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1774': {'model': 'm3',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1777': {'model': 'm2',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1780': {'model': 'm3',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1783': {'model': 'm2',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1786': {'model': 'm2',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1789': {'model': 'm2',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1792': {'model': 'm3',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1795': {'model': 'm1',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1798': {'model': 'm2',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0014',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1801': {'model': 'm2',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1804': {'model': 'm1',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1807': {'model': 'm2',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1810': {'model': 'm1',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1813': {'model': 'm3',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1816': {'model': 'm3',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1819': {'model': 'm3',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1822': {'model': 'm1',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1825': {'model': 'm2',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1828': {'model': 'm1',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1831': {'model': 'm3',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1834': {'model': 'm3',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1837': {'model': 'm1',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1840': {'model': 'm2',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1843': {'model': 'm1',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1846': {'model': 'm1',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1849': {'model': 'm1',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1852': {'model': 'm2',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1855': {'model': 'm3',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1858': {'model': 'm3',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1861': {'model': 'm2',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1864': {'model': 'm1',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1867': {'model': 'm1',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1870': {'model': 'm1',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1873': {'model': 'm3',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1876': {'model': 'm1',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1879': {'model': 'm3',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1882': {'model': 'm1',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1885': {'model': 'm3',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1888': {'model': 'm2',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1891': {'model': 'm1',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1894': {'model': 'm1',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1897': {'model': 'm1',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1900': {'model': 'm2',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1903': {'model': 'm3',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1906': {'model': 'm2',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1909': {'model': 'm3',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1912': {'model': 'm1',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1915': {'model': 'm3',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1918': {'model': 'm1',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1921': {'model': 'm2',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1924': {'model': 'm1',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1927': {'model': 'm3',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1930': {'model': 'm3',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1933': {'model': 'm1',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1936': {'model': 'm3',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1939': {'model': 'm2',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1942': {'model': 'm3',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1945': {'model': 'm3',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1948': {'model': 'm2',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1951': {'model': 'm3',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1954': {'model': 'm2',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1957': {'model': 'm3',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_1960': {'model': 'm2',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1963': {'model': 'm2',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1966': {'model': 'm3',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1969': {'model': 'm1',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1972': {'model': 'm1',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1975': {'model': 'm3',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1978': {'model': 'm1',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1981': {'model': 'm1',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1984': {'model': 'm2',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1987': {'model': 'm1',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1990': {'model': 'm1',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_1993': {'model': 'm1',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1996': {'model': 'm2',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_1999': {'model': 'm3',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2002': {'model': 'm1',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2005': {'model': 'm2',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2008': {'model': 'm2',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2011': {'model': 'm1',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2014': {'model': 'm1',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2017': {'model': 'm1',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2020': {'model': 'm1',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2023': {'model': 'm1',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2026': {'model': 'm2',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2029': {'model': 'm1',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2032': {'model': 'm2',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2035': {'model': 'm3',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2038': {'model': 'm3',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2041': {'model': 'm3',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2044': {'model': 'm1',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2047': {'model': 'm2',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2050': {'model': 'm1',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2053': {'model': 'm2',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2056': {'model': 'm2',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2059': {'model': 'm3',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2062': {'model': 'm2',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2065': {'model': 'm1',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2068': {'model': 'm2',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2071': {'model': 'm2',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2074': {'model': 'm1',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2077': {'model': 'm3',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2080': {'model': 'm3',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2083': {'model': 'm2',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2086': {'model': 'm1',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2089': {'model': 'm1',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2092': {'model': 'm2',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2095': {'model': 'm2',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2098': {'model': 'm2',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2101': {'model': 'm3',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2104': {'model': 'm1',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2107': {'model': 'm3',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2110': {'model': 'm2',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2113': {'model': 'm2',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2116': {'model': 'm1',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2119': {'model': 'm3',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2122': {'model': 'm1',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2125': {'model': 'm1',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2128': {'model': 'm2',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2131': {'model': 'm2',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2134': {'model': 'm1',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2137': {'model': 'm2',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2140': {'model': 'm3',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2143': {'model': 'm1',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2146': {'model': 'm1',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2149': {'model': 'm2',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2152': {'model': 'm2',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2155': {'model': 'm1',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2158': {'model': 'm2',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2161': {'model': 'm1',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2164': {'model': 'm2',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2167': {'model': 'm3',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2170': {'model': 'm2',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2173': {'model': 'm1',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2176': {'model': 'm3',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2179': {'model': 'm1',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2182': {'model': 'm3',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2185': {'model': 'm1',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2188': {'model': 'm1',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2191': {'model': 'm2',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2194': {'model': 'm2',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2197': {'model': 'm2',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2200': {'model': 'm1',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2203': {'model': 'm3',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2206': {'model': 'm2',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2209': {'model': 'm2',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2212': {'model': 'm3',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2215': {'model': 'm3',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2218': {'model': 'm2',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2221': {'model': 'm2',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2224': {'model': 'm3',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2227': {'model': 'm2',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2230': {'model': 'm3',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2233': {'model': 'm2',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2236': {'model': 'm2',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2239': {'model': 'm3',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2242': {'model': 'm1',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2245': {'model': 'm1',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2248': {'model': 'm2',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0015',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2251': {'model': 'm2',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2254': {'model': 'm3',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2257': {'model': 'm1',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2260': {'model': 'm1',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2263': {'model': 'm1',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2266': {'model': 'm3',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2269': {'model': 'm1',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2272': {'model': 'm3',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2275': {'model': 'm1',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2278': {'model': 'm1',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2281': {'model': 'm2',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2284': {'model': 'm2',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2287': {'model': 'm3',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2290': {'model': 'm2',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2293': {'model': 'm2',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2296': {'model': 'm2',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2299': {'model': 'm2',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2302': {'model': 'm1',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2305': {'model': 'm1',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2308': {'model': 'm3',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2311': {'model': 'm2',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2314': {'model': 'm2',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2317': {'model': 'm2',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2320': {'model': 'm1',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2323': {'model': 'm1',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2326': {'model': 'm2',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2329': {'model': 'm1',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2332': {'model': 'm2',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2335': {'model': 'm1',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2338': {'model': 'm2',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2341': {'model': 'm3',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2344': {'model': 'm2',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2347': {'model': 'm3',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2350': {'model': 'm2',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2353': {'model': 'm1',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2356': {'model': 'm3',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2359': {'model': 'm1',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2362': {'model': 'm2',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2365': {'model': 'm1',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2368': {'model': 'm3',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2371': {'model': 'm2',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2374': {'model': 'm3',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2377': {'model': 'm3',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2380': {'model': 'm3',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2383': {'model': 'm1',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2386': {'model': 'm1',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2389': {'model': 'm2',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2392': {'model': 'm3',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2395': {'model': 'm2',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2398': {'model': 'm2',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2401': {'model': 'm3',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2404': {'model': 'm3',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2407': {'model': 'm2',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2410': {'model': 'm3',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2413': {'model': 'm2',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2416': {'model': 'm2',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2419': {'model': 'm3',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2422': {'model': 'm2',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2425': {'model': 'm3',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2428': {'model': 'm2',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2431': {'model': 'm3',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2434': {'model': 'm3',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2437': {'model': 'm3',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2440': {'model': 'm1',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2443': {'model': 'm1',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2446': {'model': 'm3',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2449': {'model': 'm3',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2452': {'model': 'm3',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2455': {'model': 'm2',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2458': {'model': 'm3',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2461': {'model': 'm1',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2464': {'model': 'm1',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2467': {'model': 'm3',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2470': {'model': 'm1',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2473': {'model': 'm1',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2476': {'model': 'm2',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2479': {'model': 'm2',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2482': {'model': 'm3',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2485': {'model': 'm2',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2488': {'model': 'm3',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2491': {'model': 'm1',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2494': {'model': 'm1',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2497': {'model': 'm2',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2500': {'model': 'm3',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2503': {'model': 'm1',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2506': {'model': 'm1',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2509': {'model': 'm1',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2512': {'model': 'm2',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2515': {'model': 'm2',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2518': {'model': 'm3',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2521': {'model': 'm1',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2524': {'model': 'm1',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2527': {'model': 'm2',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2530': {'model': 'm2',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2533': {'model': 'm1',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2536': {'model': 'm1',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2539': {'model': 'm3',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2542': {'model': 'm3',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2545': {'model': 'm1',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2548': {'model': 'm2',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2551': {'model': 'm3',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2554': {'model': 'm3',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2557': {'model': 'm3',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2560': {'model': 'm3',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2563': {'model': 'm3',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2566': {'model': 'm2',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2569': {'model': 'm2',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2572': {'model': 'm3',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2575': {'model': 'm2',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2578': {'model': 'm1',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2581': {'model': 'm1',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2584': {'model': 'm3',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2587': {'model': 'm2',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2590': {'model': 'm2',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2593': {'model': 'm3',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2596': {'model': 'm3',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2599': {'model': 'm1',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2602': {'model': 'm2',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2605': {'model': 'm2',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2608': {'model': 'm3',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2611': {'model': 'm1',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2614': {'model': 'm2',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2617': {'model': 'm2',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2620': {'model': 'm2',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2623': {'model': 'm1',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2626': {'model': 'm2',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2629': {'model': 'm3',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2632': {'model': 'm2',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2635': {'model': 'm2',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2638': {'model': 'm1',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2641': {'model': 'm2',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2644': {'model': 'm1',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2647': {'model': 'm2',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2650': {'model': 'm3',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2653': {'model': 'm1',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2656': {'model': 'm2',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2659': {'model': 'm3',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2662': {'model': 'm3',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2665': {'model': 'm1',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2668': {'model': 'm2',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2671': {'model': 'm2',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2674': {'model': 'm3',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2677': {'model': 'm1',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2680': {'model': 'm3',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2683': {'model': 'm2',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2686': {'model': 'm1',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2689': {'model': 'm1',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2692': {'model': 'm2',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2695': {'model': 'm2',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2698': {'model': 'm1',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0016',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2701': {'model': 'm1',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2704': {'model': 'm2',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2707': {'model': 'm3',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2710': {'model': 'm1',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2713': {'model': 'm1',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2716': {'model': 'm3',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2719': {'model': 'm3',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2722': {'model': 'm3',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2725': {'model': 'm2',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2728': {'model': 'm3',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2731': {'model': 'm2',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2734': {'model': 'm1',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2737': {'model': 'm3',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2740': {'model': 'm3',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2743': {'model': 'm1',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2746': {'model': 'm3',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2749': {'model': 'm2',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2752': {'model': 'm3',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2755': {'model': 'm3',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2758': {'model': 'm3',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2761': {'model': 'm2',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2764': {'model': 'm1',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2767': {'model': 'm3',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2770': {'model': 'm3',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2773': {'model': 'm2',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2776': {'model': 'm1',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2779': {'model': 'm3',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2782': {'model': 'm2',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2785': {'model': 'm1',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2788': {'model': 'm2',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2791': {'model': 'm1',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2794': {'model': 'm3',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2797': {'model': 'm1',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2800': {'model': 'm2',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2803': {'model': 'm1',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2806': {'model': 'm3',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2809': {'model': 'm3',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2812': {'model': 'm1',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2815': {'model': 'm1',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2818': {'model': 'm1',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2821': {'model': 'm1',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2824': {'model': 'm3',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2827': {'model': 'm2',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2830': {'model': 'm2',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2833': {'model': 'm3',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2836': {'model': 'm2',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2839': {'model': 'm2',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2842': {'model': 'm3',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2845': {'model': 'm2',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2848': {'model': 'm2',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2851': {'model': 'm1',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2854': {'model': 'm3',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2857': {'model': 'm1',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2860': {'model': 'm3',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2863': {'model': 'm1',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2866': {'model': 'm2',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2869': {'model': 'm3',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2872': {'model': 'm2',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2875': {'model': 'm1',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2878': {'model': 'm2',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2881': {'model': 'm1',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2884': {'model': 'm2',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2887': {'model': 'm1',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2890': {'model': 'm3',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2893': {'model': 'm3',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2896': {'model': 'm3',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2899': {'model': 'm3',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2902': {'model': 'm1',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2905': {'model': 'm2',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2908': {'model': 'm3',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2911': {'model': 'm2',\n",
+ " 'sent_id': 19,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Luckily, this kind of collapse is relatively infrequent.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2914': {'model': 'm3',\n",
+ " 'sent_id': 2,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Fifty yards ahead of her were the first of the rocks .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2917': {'model': 'm2',\n",
+ " 'sent_id': 20,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it using language that caused their brains to develop?',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2920': {'model': 'm2',\n",
+ " 'sent_id': 21,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'If everyone followed a similar plan, the results would be impressive.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2923': {'model': 'm1',\n",
+ " 'sent_id': 22,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2926': {'model': 'm2',\n",
+ " 'sent_id': 23,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'For more than two hundred years the pessimists have been winning the public debate.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2929': {'model': 'm2',\n",
+ " 'sent_id': 24,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2932': {'model': 'm3',\n",
+ " 'sent_id': 25,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2935': {'model': 'm3',\n",
+ " 'sent_id': 26,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2938': {'model': 'm2',\n",
+ " 'sent_id': 27,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2941': {'model': 'm3',\n",
+ " 'sent_id': 28,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2944': {'model': 'm1',\n",
+ " 'sent_id': 29,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2947': {'model': 'm1',\n",
+ " 'sent_id': 3,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'It seemed the ordained order of things that dogs should work .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2950': {'model': 'm2',\n",
+ " 'sent_id': 30,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2953': {'model': 'm1',\n",
+ " 'sent_id': 4,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'The journey was continued at dawn .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2956': {'model': 'm3',\n",
+ " 'sent_id': 5,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Was it the rendezvous of those who were striving to work his ruin .',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2959': {'model': 'm3',\n",
+ " 'sent_id': 6,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'A dead man is of no use on a plantation .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2962': {'model': 'm3',\n",
+ " 'sent_id': 7,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'The Claudine was leaving next morning for Honolulu .',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2965': {'model': 'm2',\n",
+ " 'sent_id': 8,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2968': {'model': 'm2',\n",
+ " 'sent_id': 9,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2971': {'model': 'm1',\n",
+ " 'sent_id': 1,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'We got few vegetables and fruits , and became fish eaters .',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2974': {'model': 'm3',\n",
+ " 'sent_id': 10,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Humans also judge distance by using the relative sizes of objects.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2977': {'model': 'm3',\n",
+ " 'sent_id': 11,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'If this is true then those who tend to think creatively, really are somehow different.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2980': {'model': 'm2',\n",
+ " 'sent_id': 12,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'But really in the grand scheme of things, this information is insignificant.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2983': {'model': 'm3',\n",
+ " 'sent_id': 13,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2986': {'model': 'm3',\n",
+ " 'sent_id': 14,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
+ " 'nmistakes': 3,\n",
+ " 'pref_rank': 3},\n",
+ " 'id_2989': {'model': 'm1',\n",
+ " 'sent_id': 15,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " 'id_2992': {'model': 'm1',\n",
+ " 'sent_id': 16,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2995': {'model': 'm1',\n",
+ " 'sent_id': 17,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
+ " 'nmistakes': 1,\n",
+ " 'pref_rank': 1},\n",
+ " 'id_2998': {'model': 'm1',\n",
+ " 'sent_id': 18,\n",
+ " 'speaker': '0017',\n",
+ " 'accent': None,\n",
+ " 'text': 'Earthquakes damage all structures, including bridges.',\n",
+ " 'nmistakes': 2,\n",
+ " 'pref_rank': 2},\n",
+ " ...}"
+ ]
+ },
+ "execution_count": 21,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "for wav_id in meta.keys():\n",
+ " record_ = meta[wav_id]\n",
+ " record_.update(sentences[wav_id])\n",
+ " record_.update(scores[wav_id])\n",
+ " record_.update(pref[wav_id])\n",
+ "\n",
+ "meta"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 22,
+ "id": "479da0a9-6e49-40af-8e9c-dd6147df0f9f",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "4050"
+ ]
+ },
+ "execution_count": 22,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "len(pref)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 23,
+ "id": "fe728682-e40b-47cb-bc38-6864f7312cc5",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " model | \n",
+ " sent_id | \n",
+ " speaker | \n",
+ " accent | \n",
+ " text | \n",
+ " nmistakes | \n",
+ " pref_rank | \n",
+ " nwords | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " | id_3994 | \n",
+ " m2 | \n",
+ " 2 | \n",
+ " 0020 | \n",
+ " None | \n",
+ " Fifty yards ahead of her were the first of the rocks . | \n",
+ " 3 | \n",
+ " 3 | \n",
+ " 12 | \n",
+ "
\n",
+ " \n",
+ " | id_719 | \n",
+ " m1 | \n",
+ " 9 | \n",
+ " 0012 | \n",
+ " None | \n",
+ " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ " 3 | \n",
+ " 3 | \n",
+ " 11 | \n",
+ "
\n",
+ " \n",
+ " | id_4012 | \n",
+ " m3 | \n",
+ " 25 | \n",
+ " 0020 | \n",
+ " None | \n",
+ " Young people want to feel supported and appreciated by their company and their superiors. | \n",
+ " 2 | \n",
+ " 2 | \n",
+ " 14 | \n",
+ "
\n",
+ " \n",
+ " | id_3258 | \n",
+ " m3 | \n",
+ " 14 | \n",
+ " 0018 | \n",
+ " None | \n",
+ " When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town. | \n",
+ " 3 | \n",
+ " 3 | \n",
+ " 19 | \n",
+ "
\n",
+ " \n",
+ " | id_1331 | \n",
+ " m2 | \n",
+ " 30 | \n",
+ " 0013 | \n",
+ " None | \n",
+ " All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart. | \n",
+ " 1 | \n",
+ " 1 | \n",
+ " 23 | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " model sent_id speaker accent \\\n",
+ "id_3994 m2 2 0020 None \n",
+ "id_719 m1 9 0012 None \n",
+ "id_4012 m3 25 0020 None \n",
+ "id_3258 m3 14 0018 None \n",
+ "id_1331 m2 30 0013 None \n",
+ "\n",
+ " text \\\n",
+ "id_3994 Fifty yards ahead of her were the first of the rocks . \n",
+ "id_719 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ "id_4012 Young people want to feel supported and appreciated by their company and their superiors. \n",
+ "id_3258 When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town. \n",
+ "id_1331 All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart. \n",
+ "\n",
+ " nmistakes pref_rank nwords \n",
+ "id_3994 3 3 12 \n",
+ "id_719 3 3 11 \n",
+ "id_4012 2 2 14 \n",
+ "id_3258 3 3 19 \n",
+ "id_1331 1 1 23 "
+ ]
+ },
+ "execution_count": 23,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "df_meta = pd.DataFrame.from_dict(meta, orient='index')\n",
+ "df_meta['nwords'] = df_meta['text'].apply(lambda x: len(x.split(' ')))\n",
+ "df_meta.sample(5)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 24,
+ "id": "2d5a228d-2946-41bf-9a3e-ca699453171a",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " model | \n",
+ " sent_id | \n",
+ " speaker | \n",
+ " accent | \n",
+ " text | \n",
+ " nmistakes | \n",
+ " pref_rank | \n",
+ " nwords | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " | id_3107 | \n",
+ " m1 | \n",
+ " 23 | \n",
+ " 0017 | \n",
+ " None | \n",
+ " For more than two hundred years the pessimists have been winning the public debate. | \n",
+ " FAILED | \n",
+ " FAILED | \n",
+ " 14 | \n",
+ "
\n",
+ " \n",
+ " | id_3112 | \n",
+ " m1 | \n",
+ " 25 | \n",
+ " 0017 | \n",
+ " None | \n",
+ " Young people want to feel supported and appreciated by their company and their superiors. | \n",
+ " FAILED | \n",
+ " FAILED | \n",
+ " 14 | \n",
+ "
\n",
+ " \n",
+ " | id_3108 | \n",
+ " m2 | \n",
+ " 23 | \n",
+ " 0017 | \n",
+ " None | \n",
+ " For more than two hundred years the pessimists have been winning the public debate. | \n",
+ " FAILED | \n",
+ " FAILED | \n",
+ " 14 | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " model sent_id speaker accent \\\n",
+ "id_3107 m1 23 0017 None \n",
+ "id_3112 m1 25 0017 None \n",
+ "id_3108 m2 23 0017 None \n",
+ "\n",
+ " text \\\n",
+ "id_3107 For more than two hundred years the pessimists have been winning the public debate. \n",
+ "id_3112 Young people want to feel supported and appreciated by their company and their superiors. \n",
+ "id_3108 For more than two hundred years the pessimists have been winning the public debate. \n",
+ "\n",
+ " nmistakes pref_rank nwords \n",
+ "id_3107 FAILED FAILED 14 \n",
+ "id_3112 FAILED FAILED 14 \n",
+ "id_3108 FAILED FAILED 14 "
+ ]
+ },
+ "execution_count": 24,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "df_meta.loc[df_meta['nmistakes'] == 'FAILED'].sample(3)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 25,
+ "id": "aa54fcc9-7dcb-4371-bcd5-18d850e7e631",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# Filter bad speakers?\n",
+ "some_bad_speaker = 'scottish__scottish_male__cmu_us_awb_arctic'\n",
+ "df_failed = df_meta.loc[df_meta['speaker'] == some_bad_speaker]\n",
+ "df_good = df_meta.loc[df_meta['speaker'] != some_bad_speaker]\n",
+ "df_good = df_good.loc[df_good['nmistakes'] != \"FAILED\"]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 26,
+ "id": "48fdd680-684e-4331-929d-e03ea0519182",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " model | \n",
+ " sent_id | \n",
+ " speaker | \n",
+ " accent | \n",
+ " text | \n",
+ " nmistakes | \n",
+ " pref_rank | \n",
+ " nwords | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ "Empty DataFrame\n",
+ "Columns: [model, sent_id, speaker, accent, text, nmistakes, pref_rank, nwords]\n",
+ "Index: []"
+ ]
+ },
+ "execution_count": 26,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "df_failed_good_models = df_failed.loc[df_failed['nmistakes'] != 'FAILED', :]\n",
+ "df_failed_good_models"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 27,
+ "id": "b69770ea-64f8-4e59-a1b8-cccbd95dff2d",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " model | \n",
+ " sent_id | \n",
+ " speaker | \n",
+ " accent | \n",
+ " text | \n",
+ " nmistakes | \n",
+ " pref_rank | \n",
+ " nwords | \n",
+ " wer | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " | id_682 | \n",
+ " m2 | \n",
+ " 25 | \n",
+ " 0012 | \n",
+ " None | \n",
+ " Young people want to feel supported and appreciated by their company and their superiors. | \n",
+ " 1 | \n",
+ " 1 | \n",
+ " 14 | \n",
+ " 0.071429 | \n",
+ "
\n",
+ " \n",
+ " | id_1709 | \n",
+ " m2 | \n",
+ " 9 | \n",
+ " 0014 | \n",
+ " None | \n",
+ " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ " 2 | \n",
+ " 2 | \n",
+ " 11 | \n",
+ " 0.181818 | \n",
+ "
\n",
+ " \n",
+ " | id_3289 | \n",
+ " m2 | \n",
+ " 24 | \n",
+ " 0018 | \n",
+ " None | \n",
+ " It's wearing me out trying to juggle work with looking after my children and my family. | \n",
+ " 2 | \n",
+ " 2 | \n",
+ " 16 | \n",
+ " 0.125 | \n",
+ "
\n",
+ " \n",
+ " | id_3131 | \n",
+ " m1 | \n",
+ " 30 | \n",
+ " 0017 | \n",
+ " None | \n",
+ " All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart. | \n",
+ " 2 | \n",
+ " 2 | \n",
+ " 23 | \n",
+ " 0.086957 | \n",
+ "
\n",
+ " \n",
+ " | id_807 | \n",
+ " m3 | \n",
+ " 8 | \n",
+ " 0012 | \n",
+ " None | \n",
+ " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ " 2 | \n",
+ " 2 | \n",
+ " 14 | \n",
+ " 0.142857 | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " model sent_id speaker accent \\\n",
+ "id_682 m2 25 0012 None \n",
+ "id_1709 m2 9 0014 None \n",
+ "id_3289 m2 24 0018 None \n",
+ "id_3131 m1 30 0017 None \n",
+ "id_807 m3 8 0012 None \n",
+ "\n",
+ " text \\\n",
+ "id_682 Young people want to feel supported and appreciated by their company and their superiors. \n",
+ "id_1709 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ "id_3289 It's wearing me out trying to juggle work with looking after my children and my family. \n",
+ "id_3131 All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart. \n",
+ "id_807 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
+ "\n",
+ " nmistakes pref_rank nwords wer \n",
+ "id_682 1 1 14 0.071429 \n",
+ "id_1709 2 2 11 0.181818 \n",
+ "id_3289 2 2 16 0.125 \n",
+ "id_3131 2 2 23 0.086957 \n",
+ "id_807 2 2 14 0.142857 "
+ ]
+ },
+ "execution_count": 27,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "df_good['wer'] = df_good['nmistakes'] / df_good['nwords']\n",
+ "df_good.sample(5)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 28,
+ "id": "e1bf942e-a3e1-4849-b60f-9a049810aa66",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "df_full = df_good"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 29,
+ "id": "9eb31c09-902d-4628-b298-5ebc5a56d446",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "mean_wer = {}\n",
+ "std_wer = {}\n",
+ "stats = {}\n",
+ "for m, df in df_full.groupby('model'):\n",
+ " mean_wer[m] = df['wer'].mean()\n",
+ " std_wer[m] = df['wer'].std()\n",
+ " stats[m] = (mean_wer[m], std_wer[m])"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 30,
+ "id": "5ef9cbc8-0807-42ff-8a79-6eedb81b4531",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'m1': 0.15581893610424408, 'm2': 0.1551033686858993, 'm3': 0.1505934661339411}"
+ ]
+ },
+ "execution_count": 30,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "mean_wer"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 31,
+ "id": "cb6ed758-1050-4fb3-a505-6510423d92f5",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'m1': (0.15581893610424408, 0.0917370138172076),\n",
+ " 'm2': (0.1551033686858993, 0.08791329488553278),\n",
+ " 'm3': (0.1505934661339411, 0.08370192086698483)}"
+ ]
+ },
+ "execution_count": 31,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "stats"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 32,
+ "id": "1b749874-5078-49c9-96f1-af75c63998b1",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'m1': (0.06408192228703648, 0.2475559499214517),\n",
+ " 'm2': (0.06719007380036653, 0.2430166635714321),\n",
+ " 'm3': (0.06689154526695626, 0.23429538700092592)}"
+ ]
+ },
+ "execution_count": 32,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "conf_int = {}\n",
+ "for m in stats.keys():\n",
+ " conf_int[m] = (stats[m][0] - stats[m][1], stats[m][0] + stats[m][1])\n",
+ "\n",
+ "conf_int"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 33,
+ "id": "725bb813-96c7-4779-a2f6-e46b667c0b98",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'m1': 'generated_hifi/esd_tune/g_3164999',\n",
+ " 'm2': 'generated_hifi/esd_tune_reversal/g_3164999',\n",
+ " 'm3': 'generated_hifi/esd_tune_advloss0/g_3164999'}"
+ ]
+ },
+ "execution_count": 33,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "model2folder"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 34,
+ "id": "c49f11ee-55f9-477c-a749-8dffd176015a",
+ "metadata": {
+ "scrolled": true,
+ "tags": []
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'0011_m1': {'mean': 0.1649417562959747,\n",
+ " 'std': 0.09848066669836777,\n",
+ " 'conf_int': (0.06646108959760694, 0.2634224229943425)},\n",
+ " '0011_m2': {'mean': 0.15374506591006587,\n",
+ " 'std': 0.09372400140491297,\n",
+ " 'conf_int': (0.060021064505152905, 0.24746906731497884)},\n",
+ " '0011_m3': {'mean': 0.15757343048134242,\n",
+ " 'std': 0.09647052824930616,\n",
+ " 'conf_int': (0.061102902232036266, 0.25404395873064856)},\n",
+ " '0012_m1': {'mean': 0.15808598946517752,\n",
+ " 'std': 0.08908074500705088,\n",
+ " 'conf_int': (0.06900524445812664, 0.2471667344722284)},\n",
+ " '0012_m2': {'mean': 0.15953635163248103,\n",
+ " 'std': 0.09717079605964918,\n",
+ " 'conf_int': (0.062365555572831854, 0.2567071476921302)},\n",
+ " '0012_m3': {'mean': 0.1525969552657367,\n",
+ " 'std': 0.07814707979240157,\n",
+ " 'conf_int': (0.07444987547333512, 0.23074403505813826)},\n",
+ " '0013_m1': {'mean': 0.16239193389292073,\n",
+ " 'std': 0.09757158871850868,\n",
+ " 'conf_int': (0.06482034517441204, 0.2599635226114294)},\n",
+ " '0013_m2': {'mean': 0.16063079414164727,\n",
+ " 'std': 0.08754696864487832,\n",
+ " 'conf_int': (0.07308382549676895, 0.2481777627865256)},\n",
+ " '0013_m3': {'mean': 0.1519149953173421,\n",
+ " 'std': 0.08349049225936797,\n",
+ " 'conf_int': (0.06842450305797412, 0.23540548757671007)},\n",
+ " '0014_m1': {'mean': 0.15330570306335917,\n",
+ " 'std': 0.08736689982957992,\n",
+ " 'conf_int': (0.06593880323377925, 0.24067260289293907)},\n",
+ " '0014_m2': {'mean': 0.1426293068048946,\n",
+ " 'std': 0.07633868568249282,\n",
+ " 'conf_int': (0.06629062112240179, 0.2189679924873874)},\n",
+ " '0014_m3': {'mean': 0.1384163390987707,\n",
+ " 'std': 0.07469015107914477,\n",
+ " 'conf_int': (0.06372618801962594, 0.2131064901779155)},\n",
+ " '0015_m1': {'mean': 0.15765198768178051,\n",
+ " 'std': 0.09358788188396122,\n",
+ " 'conf_int': (0.06406410579781929, 0.25123986956574174)},\n",
+ " '0015_m2': {'mean': 0.1507825603221522,\n",
+ " 'std': 0.0814955191128956,\n",
+ " 'conf_int': (0.0692870412092566, 0.2322780794350478)},\n",
+ " '0015_m3': {'mean': 0.14636983260313963,\n",
+ " 'std': 0.0764192598427006,\n",
+ " 'conf_int': (0.06995057276043903, 0.22278909244584022)},\n",
+ " '0016_m1': {'mean': 0.15037814523110357,\n",
+ " 'std': 0.0914280222484199,\n",
+ " 'conf_int': (0.05895012298268368, 0.24180616747952347)},\n",
+ " '0016_m2': {'mean': 0.15052519785355048,\n",
+ " 'std': 0.08800983126453843,\n",
+ " 'conf_int': (0.06251536658901205, 0.2385350291180889)},\n",
+ " '0016_m3': {'mean': 0.15825089545714013,\n",
+ " 'std': 0.09284693977917047,\n",
+ " 'conf_int': (0.06540395567796967, 0.2510978352363106)},\n",
+ " '0017_m1': {'mean': 0.14841250241957357,\n",
+ " 'std': 0.08660737038257468,\n",
+ " 'conf_int': (0.06180513203699889, 0.23501987280214826)},\n",
+ " '0017_m2': {'mean': 0.16131369102962131,\n",
+ " 'std': 0.08667879676997356,\n",
+ " 'conf_int': (0.07463489425964775, 0.24799248779959487)},\n",
+ " '0017_m3': {'mean': 0.143035627614613,\n",
+ " 'std': 0.07708385493382297,\n",
+ " 'conf_int': (0.06595177268079003, 0.22011948254843597)},\n",
+ " '0018_m1': {'mean': 0.15305746660308842,\n",
+ " 'std': 0.0875897927244637,\n",
+ " 'conf_int': (0.06546767387862472, 0.2406472593275521)},\n",
+ " '0018_m2': {'mean': 0.1522211084782473,\n",
+ " 'std': 0.08686380874816599,\n",
+ " 'conf_int': (0.06535729973008131, 0.23908491722641328)},\n",
+ " '0018_m3': {'mean': 0.1490366761321364,\n",
+ " 'std': 0.07977764804299615,\n",
+ " 'conf_int': (0.06925902808914024, 0.22881432417513253)},\n",
+ " '0020_m1': {'mean': 0.15404618783608884,\n",
+ " 'std': 0.09415821387808693,\n",
+ " 'conf_int': (0.05988797395800191, 0.24820440171417577)},\n",
+ " '0020_m2': {'mean': 0.1645876441493875,\n",
+ " 'std': 0.09176936660138603,\n",
+ " 'conf_int': (0.07281827754800148, 0.25635701075077355)},\n",
+ " '0020_m3': {'mean': 0.15804567205498574,\n",
+ " 'std': 0.09105011689380604,\n",
+ " 'conf_int': (0.06699555516117969, 0.24909578894879178)}}"
+ ]
+ },
+ "execution_count": 34,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "mean_wer = {}\n",
+ "std_wer = {}\n",
+ "stats = {}\n",
+ "conf_int = {}\n",
+ "meta_speaker = {}\n",
+ "for speaker, df1 in df_full.groupby('speaker'):\n",
+ " for m, df in df1.groupby('model'):\n",
+ " mean_wer[m] = df['wer'].mean()\n",
+ " std_wer[m] = df['wer'].std()\n",
+ " stats[m] = (mean_wer[m], std_wer[m])\n",
+ " conf_int[m] = (stats[m][0] - stats[m][1], stats[m][0] + stats[m][1])\n",
+ " meta_speaker[speaker + '_' + m] = {\n",
+ " 'mean': mean_wer[m],\n",
+ " 'std': std_wer[m],\n",
+ " 'conf_int': conf_int[m]\n",
+ " }\n",
+ "\n",
+ "meta_speaker"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 35,
+ "id": "a48e203f-91fb-4018-bd4f-ab6628579def",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " mean | \n",
+ " std | \n",
+ " conf_int | \n",
+ " speaker_model | \n",
+ " speaker | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " | 0011_m1 | \n",
+ " 0.164942 | \n",
+ " 0.098481 | \n",
+ " (0.06646108959760694, 0.2634224229943425) | \n",
+ " 0011_m1 | \n",
+ " 0011 | \n",
+ "
\n",
+ " \n",
+ " | 0011_m2 | \n",
+ " 0.153745 | \n",
+ " 0.093724 | \n",
+ " (0.060021064505152905, 0.24746906731497884) | \n",
+ " 0011_m2 | \n",
+ " 0011 | \n",
+ "
\n",
+ " \n",
+ " | 0011_m3 | \n",
+ " 0.157573 | \n",
+ " 0.096471 | \n",
+ " (0.061102902232036266, 0.25404395873064856) | \n",
+ " 0011_m3 | \n",
+ " 0011 | \n",
+ "
\n",
+ " \n",
+ " | 0012_m1 | \n",
+ " 0.158086 | \n",
+ " 0.089081 | \n",
+ " (0.06900524445812664, 0.2471667344722284) | \n",
+ " 0012_m1 | \n",
+ " 0012 | \n",
+ "
\n",
+ " \n",
+ " | 0012_m2 | \n",
+ " 0.159536 | \n",
+ " 0.097171 | \n",
+ " (0.062365555572831854, 0.2567071476921302) | \n",
+ " 0012_m2 | \n",
+ " 0012 | \n",
+ "
\n",
+ " \n",
+ " | 0012_m3 | \n",
+ " 0.152597 | \n",
+ " 0.078147 | \n",
+ " (0.07444987547333512, 0.23074403505813826) | \n",
+ " 0012_m3 | \n",
+ " 0012 | \n",
+ "
\n",
+ " \n",
+ " | 0013_m1 | \n",
+ " 0.162392 | \n",
+ " 0.097572 | \n",
+ " (0.06482034517441204, 0.2599635226114294) | \n",
+ " 0013_m1 | \n",
+ " 0013 | \n",
+ "
\n",
+ " \n",
+ " | 0013_m2 | \n",
+ " 0.160631 | \n",
+ " 0.087547 | \n",
+ " (0.07308382549676895, 0.2481777627865256) | \n",
+ " 0013_m2 | \n",
+ " 0013 | \n",
+ "
\n",
+ " \n",
+ " | 0013_m3 | \n",
+ " 0.151915 | \n",
+ " 0.083490 | \n",
+ " (0.06842450305797412, 0.23540548757671007) | \n",
+ " 0013_m3 | \n",
+ " 0013 | \n",
+ "
\n",
+ " \n",
+ " | 0014_m1 | \n",
+ " 0.153306 | \n",
+ " 0.087367 | \n",
+ " (0.06593880323377925, 0.24067260289293907) | \n",
+ " 0014_m1 | \n",
+ " 0014 | \n",
+ "
\n",
+ " \n",
+ " | 0014_m2 | \n",
+ " 0.142629 | \n",
+ " 0.076339 | \n",
+ " (0.06629062112240179, 0.2189679924873874) | \n",
+ " 0014_m2 | \n",
+ " 0014 | \n",
+ "
\n",
+ " \n",
+ " | 0014_m3 | \n",
+ " 0.138416 | \n",
+ " 0.074690 | \n",
+ " (0.06372618801962594, 0.2131064901779155) | \n",
+ " 0014_m3 | \n",
+ " 0014 | \n",
+ "
\n",
+ " \n",
+ " | 0015_m1 | \n",
+ " 0.157652 | \n",
+ " 0.093588 | \n",
+ " (0.06406410579781929, 0.25123986956574174) | \n",
+ " 0015_m1 | \n",
+ " 0015 | \n",
+ "
\n",
+ " \n",
+ " | 0015_m2 | \n",
+ " 0.150783 | \n",
+ " 0.081496 | \n",
+ " (0.0692870412092566, 0.2322780794350478) | \n",
+ " 0015_m2 | \n",
+ " 0015 | \n",
+ "
\n",
+ " \n",
+ " | 0015_m3 | \n",
+ " 0.146370 | \n",
+ " 0.076419 | \n",
+ " (0.06995057276043903, 0.22278909244584022) | \n",
+ " 0015_m3 | \n",
+ " 0015 | \n",
+ "
\n",
+ " \n",
+ " | 0016_m1 | \n",
+ " 0.150378 | \n",
+ " 0.091428 | \n",
+ " (0.05895012298268368, 0.24180616747952347) | \n",
+ " 0016_m1 | \n",
+ " 0016 | \n",
+ "
\n",
+ " \n",
+ " | 0016_m2 | \n",
+ " 0.150525 | \n",
+ " 0.088010 | \n",
+ " (0.06251536658901205, 0.2385350291180889) | \n",
+ " 0016_m2 | \n",
+ " 0016 | \n",
+ "
\n",
+ " \n",
+ " | 0016_m3 | \n",
+ " 0.158251 | \n",
+ " 0.092847 | \n",
+ " (0.06540395567796967, 0.2510978352363106) | \n",
+ " 0016_m3 | \n",
+ " 0016 | \n",
+ "
\n",
+ " \n",
+ " | 0017_m1 | \n",
+ " 0.148413 | \n",
+ " 0.086607 | \n",
+ " (0.06180513203699889, 0.23501987280214826) | \n",
+ " 0017_m1 | \n",
+ " 0017 | \n",
+ "
\n",
+ " \n",
+ " | 0017_m2 | \n",
+ " 0.161314 | \n",
+ " 0.086679 | \n",
+ " (0.07463489425964775, 0.24799248779959487) | \n",
+ " 0017_m2 | \n",
+ " 0017 | \n",
+ "
\n",
+ " \n",
+ " | 0017_m3 | \n",
+ " 0.143036 | \n",
+ " 0.077084 | \n",
+ " (0.06595177268079003, 0.22011948254843597) | \n",
+ " 0017_m3 | \n",
+ " 0017 | \n",
+ "
\n",
+ " \n",
+ " | 0018_m1 | \n",
+ " 0.153057 | \n",
+ " 0.087590 | \n",
+ " (0.06546767387862472, 0.2406472593275521) | \n",
+ " 0018_m1 | \n",
+ " 0018 | \n",
+ "
\n",
+ " \n",
+ " | 0018_m2 | \n",
+ " 0.152221 | \n",
+ " 0.086864 | \n",
+ " (0.06535729973008131, 0.23908491722641328) | \n",
+ " 0018_m2 | \n",
+ " 0018 | \n",
+ "
\n",
+ " \n",
+ " | 0018_m3 | \n",
+ " 0.149037 | \n",
+ " 0.079778 | \n",
+ " (0.06925902808914024, 0.22881432417513253) | \n",
+ " 0018_m3 | \n",
+ " 0018 | \n",
+ "
\n",
+ " \n",
+ " | 0020_m1 | \n",
+ " 0.154046 | \n",
+ " 0.094158 | \n",
+ " (0.05988797395800191, 0.24820440171417577) | \n",
+ " 0020_m1 | \n",
+ " 0020 | \n",
+ "
\n",
+ " \n",
+ " | 0020_m2 | \n",
+ " 0.164588 | \n",
+ " 0.091769 | \n",
+ " (0.07281827754800148, 0.25635701075077355) | \n",
+ " 0020_m2 | \n",
+ " 0020 | \n",
+ "
\n",
+ " \n",
+ " | 0020_m3 | \n",
+ " 0.158046 | \n",
+ " 0.091050 | \n",
+ " (0.06699555516117969, 0.24909578894879178) | \n",
+ " 0020_m3 | \n",
+ " 0020 | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " mean std conf_int \\\n",
+ "0011_m1 0.164942 0.098481 (0.06646108959760694, 0.2634224229943425) \n",
+ "0011_m2 0.153745 0.093724 (0.060021064505152905, 0.24746906731497884) \n",
+ "0011_m3 0.157573 0.096471 (0.061102902232036266, 0.25404395873064856) \n",
+ "0012_m1 0.158086 0.089081 (0.06900524445812664, 0.2471667344722284) \n",
+ "0012_m2 0.159536 0.097171 (0.062365555572831854, 0.2567071476921302) \n",
+ "0012_m3 0.152597 0.078147 (0.07444987547333512, 0.23074403505813826) \n",
+ "0013_m1 0.162392 0.097572 (0.06482034517441204, 0.2599635226114294) \n",
+ "0013_m2 0.160631 0.087547 (0.07308382549676895, 0.2481777627865256) \n",
+ "0013_m3 0.151915 0.083490 (0.06842450305797412, 0.23540548757671007) \n",
+ "0014_m1 0.153306 0.087367 (0.06593880323377925, 0.24067260289293907) \n",
+ "0014_m2 0.142629 0.076339 (0.06629062112240179, 0.2189679924873874) \n",
+ "0014_m3 0.138416 0.074690 (0.06372618801962594, 0.2131064901779155) \n",
+ "0015_m1 0.157652 0.093588 (0.06406410579781929, 0.25123986956574174) \n",
+ "0015_m2 0.150783 0.081496 (0.0692870412092566, 0.2322780794350478) \n",
+ "0015_m3 0.146370 0.076419 (0.06995057276043903, 0.22278909244584022) \n",
+ "0016_m1 0.150378 0.091428 (0.05895012298268368, 0.24180616747952347) \n",
+ "0016_m2 0.150525 0.088010 (0.06251536658901205, 0.2385350291180889) \n",
+ "0016_m3 0.158251 0.092847 (0.06540395567796967, 0.2510978352363106) \n",
+ "0017_m1 0.148413 0.086607 (0.06180513203699889, 0.23501987280214826) \n",
+ "0017_m2 0.161314 0.086679 (0.07463489425964775, 0.24799248779959487) \n",
+ "0017_m3 0.143036 0.077084 (0.06595177268079003, 0.22011948254843597) \n",
+ "0018_m1 0.153057 0.087590 (0.06546767387862472, 0.2406472593275521) \n",
+ "0018_m2 0.152221 0.086864 (0.06535729973008131, 0.23908491722641328) \n",
+ "0018_m3 0.149037 0.079778 (0.06925902808914024, 0.22881432417513253) \n",
+ "0020_m1 0.154046 0.094158 (0.05988797395800191, 0.24820440171417577) \n",
+ "0020_m2 0.164588 0.091769 (0.07281827754800148, 0.25635701075077355) \n",
+ "0020_m3 0.158046 0.091050 (0.06699555516117969, 0.24909578894879178) \n",
+ "\n",
+ " speaker_model speaker \n",
+ "0011_m1 0011_m1 0011 \n",
+ "0011_m2 0011_m2 0011 \n",
+ "0011_m3 0011_m3 0011 \n",
+ "0012_m1 0012_m1 0012 \n",
+ "0012_m2 0012_m2 0012 \n",
+ "0012_m3 0012_m3 0012 \n",
+ "0013_m1 0013_m1 0013 \n",
+ "0013_m2 0013_m2 0013 \n",
+ "0013_m3 0013_m3 0013 \n",
+ "0014_m1 0014_m1 0014 \n",
+ "0014_m2 0014_m2 0014 \n",
+ "0014_m3 0014_m3 0014 \n",
+ "0015_m1 0015_m1 0015 \n",
+ "0015_m2 0015_m2 0015 \n",
+ "0015_m3 0015_m3 0015 \n",
+ "0016_m1 0016_m1 0016 \n",
+ "0016_m2 0016_m2 0016 \n",
+ "0016_m3 0016_m3 0016 \n",
+ "0017_m1 0017_m1 0017 \n",
+ "0017_m2 0017_m2 0017 \n",
+ "0017_m3 0017_m3 0017 \n",
+ "0018_m1 0018_m1 0018 \n",
+ "0018_m2 0018_m2 0018 \n",
+ "0018_m3 0018_m3 0018 \n",
+ "0020_m1 0020_m1 0020 \n",
+ "0020_m2 0020_m2 0020 \n",
+ "0020_m3 0020_m3 0020 "
+ ]
+ },
+ "execution_count": 35,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "df_meta_speakers = pd.DataFrame.from_dict(meta_speaker, orient='index')\n",
+ "df_meta_speakers['speaker_model'] = df_meta_speakers.index\n",
+ "df_meta_speakers['speaker'] = df_meta_speakers['speaker_model'].apply(lambda x: x.split('_')[0])\n",
+ "df_meta_speakers"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 36,
+ "id": "9c44e9ac-7f96-401a-9e5a-499824ad08a9",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'m1': 'generated_hifi/esd_tune/g_3164999',\n",
+ " 'm2': 'generated_hifi/esd_tune_reversal/g_3164999',\n",
+ " 'm3': 'generated_hifi/esd_tune_advloss0/g_3164999'}"
+ ]
+ },
+ "execution_count": 36,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "model2folder"
+ ]
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "Python 3 (ipykernel)",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.8.12"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
From b86c4c18f3853eb4d845b387f577ac5e037fa725 Mon Sep 17 00:00:00 2001
From: ruk0sh <43880105+ruk0sh@users.noreply.github.com>
Date: Tue, 17 May 2022 21:54:34 +0300
Subject: [PATCH 14/17] Update for new emo references
---
generate_samples hifi.ipynb | 13 +++++++------
1 file changed, 7 insertions(+), 6 deletions(-)
diff --git a/generate_samples hifi.ipynb b/generate_samples hifi.ipynb
index 4ee370c..22d9c34 100644
--- a/generate_samples hifi.ipynb
+++ b/generate_samples hifi.ipynb
@@ -26,7 +26,7 @@
"metadata": {},
"outputs": [],
"source": [
- "config = load_config(\"configs/esd_tune.yml\")"
+ "config = load_config(\"configs/esd_tune_reversal.yml\")"
]
},
{
@@ -36,7 +36,7 @@
"metadata": {},
"outputs": [],
"source": [
- "device = config.device"
+ "device = \"cuda:0\" # config.device"
]
},
{
@@ -404,6 +404,7 @@
"):\n",
" text_lengths_tensor = torch.LongTensor([len(phonemes_ids)])\n",
" reference = (reference - mels_mean) / mels_std\n",
+ " reference = reference.unsqueeze(0)\n",
" reference = reference.permute(0, 2, 1).to(device)\n",
" phonemes_ids_tensor = torch.LongTensor(phonemes_ids).unsqueeze(0).to(device)\n",
" speaker_ids_tensor = torch.LongTensor([speaker_id]).to(device)\n",
@@ -448,8 +449,8 @@
"metadata": {},
"outputs": [],
"source": [
- "mels_mean = torch.load(checkpoint_path / \"feature\" / \"mels_mean.pth\").float()\n",
- "mels_std = torch.load(checkpoint_path / \"feature\" / \"mels_std.pth\").float()"
+ "mels_mean = torch.load(checkpoint_path / \"feature\" / \"mels_mean.pth\", map_location=device).float()\n",
+ "mels_std = torch.load(checkpoint_path / \"feature\" / \"mels_std.pth\", map_location=device).float()"
]
},
{
@@ -461,7 +462,7 @@
{
"data": {
"application/vnd.jupyter.widget-view+json": {
- "model_id": "5a3b446ba486467ca5044574aa77436a",
+ "model_id": "de26e6fa134d4392b0ca0e332da61123",
"version_major": 2,
"version_minor": 0
},
@@ -477,7 +478,7 @@
"for reference in tqdm(list(reference_pathes.rglob(\"*.pkl\"))):\n",
" speaker = reference.parent.name\n",
" speaker_id = speaker_to_id[speaker]\n",
- " ref_mel = torch.load(reference)\n",
+ " ref_mel = torch.load(reference, map_location=device)\n",
" for i, phonemes in enumerate(phonemes_list):\n",
" batch = get_tacotron_batch(phonemes, ref_mel, speaker_id, device, mels_mean, mels_std)\n",
" with torch.no_grad():\n",
From c33cad7b9e2d312501427be298185356922401cb Mon Sep 17 00:00:00 2001
From: ruk0sh <43880105+ruk0sh@users.noreply.github.com>
Date: Wed, 18 May 2022 16:49:54 +0300
Subject: [PATCH 15/17] Update HTML's notebook
---
generate_listener_html.ipynb | 560 +++++++++++++++++------------------
1 file changed, 280 insertions(+), 280 deletions(-)
diff --git a/generate_listener_html.ipynb b/generate_listener_html.ipynb
index 36192f4..e6404dd 100644
--- a/generate_listener_html.ipynb
+++ b/generate_listener_html.ipynb
@@ -28,36 +28,35 @@
"outputs": [],
"source": [
"texts = [\n",
- " 'We got few vegetables and fruits , and became fish eaters .',\n",
- " 'Fifty yards ahead of her were the first of the rocks .',\n",
- " 'It seemed the ordained order of things that dogs should work .',\n",
- " 'The journey was continued at dawn .',\n",
- " 'Was it the rendezvous of those who were striving to work his ruin .',\n",
- " 'A dead man is of no use on a plantation .',\n",
- " 'The Claudine was leaving next morning for Honolulu .',\n",
- " 'Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting.',\n",
- " 'Different telescope designs perform differently, and have different strengths and weaknesses.',\n",
- " 'Humans also judge distance by using the relative sizes of objects.',\n",
- " 'If this is true then those who tend to think creatively, really are somehow different.',\n",
- " 'But really in the grand scheme of things, this information is insignificant.',\n",
- " 'He had a private jet with three king-size beds, expensive rugs, porcelain vases and a dining area.',\n",
- " 'When I reached Atlanta my steadily increasing disappointment was not lessened. I found it a big, dull, red town.',\n",
- " 'She woke Meg with a \"Merry Christmas\", and bade her see what was under her pillow. A green–covered book appeared, with the same picture inside, and a few words written by their mother, which made their one present very precious in their eyes.',\n",
- " \"Does Jane know about your new job? No, and don't you dare tell her! She will be furious!\",\n",
- " 'Does she like ice cream or sweets? She likes any kind of ice cream. Chocolate, vanilla, strawberry, banana, the one with caramel, coconut, any you can think of!',\n",
- " 'Earthquakes damage all structures, including bridges.',\n",
- " 'Luckily, this kind of collapse is relatively infrequent.',\n",
- " 'Was it using language that caused their brains to develop?',\n",
- " 'If everyone followed a similar plan, the results would be impressive.',\n",
- " 'Next, the hero overcomes obstacles on the way to facing their greatest challenge.',\n",
- " 'For more than two hundred years the pessimists have been winning the public debate.',\n",
- " \"It's wearing me out trying to juggle work with looking after my children and my family.\",\n",
- " 'Young people want to feel supported and appreciated by their company and their superiors.',\n",
- " 'We start to see the evidence of early human civilisation, through cave paintings for example.',\n",
- " 'In this culture a so-called \"smile of respect\" is seen as insincere and often regarded with suspicion.',\n",
- " 'We can express complex thoughts, convey subtle emotions and communicate about some abstract concepts.',\n",
- " 'The activists send a clear message to companies that people are no longer willing to accept the environmental and human cost of overconsumption.',\n",
- " 'All this is thanks to his childhood in the mountains and to genetics, but it is his mental strength that sets him apart.'\n",
+ " 'Do you realize what time it is?',\n",
+ " 'He comes back to the valley.',\n",
+ " 'This dress does not look worth much!',\n",
+ " 'What happened tonight has nothing to do with Henry.',\n",
+ " 'Today, five years later, we are facing a similar situation.',\n",
+ " 'When I saw you kissing, you looked really happy.',\n",
+ " 'Only one vehicle may be allowed to park at any given time.',\n",
+ " 'The deadlines are indeed very tight.',\n",
+ " \"I'm glad you enjoyed yourself.\", 'What are you still doing here?',\n",
+ " 'This is an animal that is admired for its whiteness and cleanliness. ',\n",
+ " 'Perhaps there is another way to pose these issues.',\n",
+ " \"Your students' test scores drop lower and lower every year.\",\n",
+ " 'Wherever her tears fell, a fruit tree grew.',\n",
+ " 'I was about to head back to my hotel and go to sleep.',\n",
+ " 'You said she really helped last time.',\n",
+ " 'My favorite season, spring, is here.',\n",
+ " \"He's the rich guy who built the airplanes.\",\n",
+ " 'Otto and Elizabeth gave it to us, for the wedding - incredibly generous.',\n",
+ " 'Look, the police said that there was nothing stolen from the house.',\n",
+ " 'And I suppose we can thank your brother for that.',\n",
+ " \"That's a pretty dangerous thing you're doing.\",\n",
+ " 'He arrived in Japan for the first time at the age of twenty six.',\n",
+ " 'Sam thought we were having fun being together.',\n",
+ " \"Well, the true value of something isn't always determined by its price.\",\n",
+ " \"No, it's not polite to discuss a lady's age.\",\n",
+ " \"Just another quarter-mile and I don't have to be tolerant ever again.\",\n",
+ " \"But Jones' apartment had only been rented out for a week.\",\n",
+ " 'What your perfect day would have been like?',\n",
+ " 'Not a very useful skill, especially when the money runs out.',\n",
"]"
]
},
@@ -69,36 +68,36 @@
"outputs": [],
"source": [
"huawei_phones = [\n",
- " ' W IY1 G AA1 T F Y UW1 V EH1 JH T AH0 B AH0 L Z AH0 N D F R UW1 T S AH0 N D B IH0 K EY1 M F IH1 SH IY1 T ER0 Z ',\n",
- " ' F IH1 F T IY0 Y AA1 R D Z AH0 HH EH1 D AH1 V HH ER1 W ER1 DH AH0 F ER1 S T AH1 V DH AH0 R AA1 K S ',\n",
- " ' IH1 T S IY1 M D DH IY0 AO0 R D EY1 N D AO1 R D ER0 AH1 V TH IH1 NG Z DH AE1 T D AA1 G Z SH UH1 D W ER1 K ',\n",
- " ' DH AH0 JH ER1 N IY0 W AA1 Z K AH0 N T IH1 N Y UW0 D AE1 T D AO1 N ',\n",
- " ' W AA1 Z IH1 T DH AH0 R AA1 N D IH0 V UW2 AH1 V DH OW1 Z HH UW1 W ER1 S T R AY1 V IH0 NG T UW1 W ER1 K HH IH1 Z R UW1 AH0 N ',\n",
- " ' AH0 D EH1 D M AE1 N IH1 Z AH1 V N OW1 Y UW1 S AA1 N AH0 P L AE2 N T EY1 SH AH0 N ',\n",
- " ' DH AH0 K L AO0 D IY1 N W AA1 Z L IY1 V IH0 NG N EH1 K S T M AO1 R N IH0 NG F AO1 R HH AA2 N AH0 L UW1 L UW0 ',\n",
- " ' P R AA1 S IH0 K Y UW2 T ER0 Z HH AE1 V OW1 P AH0 N D AH0 M AE1 S IH0 V IH2 N V EH2 S T AH0 G EY1 SH AH0 N IH1 N T UW0 AE2 L AH0 G EY1 SH AH0 N Z AH1 V F IH1 K S IH0 NG G EY1 M Z AH0 N D IH2 L IY1 G AH0 L B EH1 T IH0 NG ',\n",
- " ' D IH1 F ER0 AH0 N T T EH1 L AH0 S K OW2 P D IH0 Z AY1 N Z P ER0 F AO1 R M D IH1 F R AH0 N T L IY0 AH0 N D HH AE1 V D IH1 F ER0 AH0 N T S T R EH1 NG K TH S AH0 N D W IY1 K N AH0 S AH0 Z ',\n",
- " ' HH Y UW1 M AH0 N Z AO1 L S OW0 JH AH1 JH D IH1 S T AH0 N S B AY1 Y UW1 Z IH0 NG DH AH0 R EH1 L AH0 T IH0 V S AY1 Z AH0 Z AH1 V AA1 B JH EH0 K T S ',\n",
- " ' IH1 F DH IH1 S IH1 Z T R UW1 DH EH1 N DH OW1 Z HH UW1 T EH1 N D T UW1 TH IH1 NG K K R IY0 EY1 T IH0 V L IY0 R IH1 L IY0 AA1 R S AH1 M HH AW2 D IH1 F ER0 AH0 N T ',\n",
- " ' B AH1 T R IH1 L IY0 IH0 N DH AH0 G R AE1 N D S K IY1 M AH1 V TH IH1 NG Z DH IH1 S IH2 N F ER0 M EY1 SH AH0 N IH1 Z IH2 N S IH0 G N Y IH1 F IH0 K AH0 N T ',\n",
- " ' HH IY1 HH AE1 D AH0 P R AY1 V AH0 T JH EH1 T W IH1 DH TH R IY1 K IH1 NG S AY1 Z B EH1 D Z IH0 K S P EH1 N S IH0 V R AH1 G Z P AO1 R S AH0 L AH0 N V EY1 S AH0 Z AH0 N D AH0 D AY1 N IH0 NG EH1 R IY0 AH0 ',\n",
- " ' W EH1 N AY1 R IY1 CH T AE0 T L AE1 N T AH0 M AY1 S T EH1 D AH0 L IY0 IH2 N K R IY1 S IH0 NG D IH2 S AH0 P OY1 N T M AH0 N T W AA1 Z N AA1 T L EH1 S AH0 N D AY1 F AW1 N D IH1 T AH0 B IH1 G D AH1 L R EH1 D T AW1 N ',\n",
- " ' SH IY1 W OW1 K M EH1 G W IH1 DH AH0 M EH1 R IY0 K R IH1 S M AH0 S AH0 N D B EY1 D HH ER1 S IY1 W AH1 T W AA1 Z AH1 N D ER0 HH ER1 P IH1 L OW0 AH0 G R IY1 N K AH1 V ER0 D B UH1 K AH0 P IH1 R D W IH1 DH DH AH0 S EY1 M P IH1 K CH ER0 IH2 N S AY1 D AH0 N D AH0 F Y UW1 W ER1 D Z R IH1 T AH0 N B AY1 DH EH1 R M AH1 DH ER0 W IH1 CH M EY1 D DH EH1 R W AH1 N P R EH1 Z AH0 N T V EH1 R IY0 P R EH1 SH AH0 S IH0 N DH EH1 R AY1 Z ',\n",
- " ' D AH1 Z JH EY1 N N OW1 AH0 B AW1 T Y AO1 R N UW1 JH AA1 B N OW1 AH0 N D D OW1 N T Y UW1 D EH1 R T EH1 L HH ER1 SH IY1 W IH1 L B IY1 F Y UH1 R IY0 AH0 S ',\n",
- " ' D AH1 Z SH IY1 L AY1 K AY1 S K R IY1 M AO1 R S W IY1 T S SH IY1 L AY1 K S EH1 N IY0 K AY1 N D AH1 V AY1 S K R IY1 M CH AO1 K L AH0 T V AH0 N IH1 L AH0 S T R AO1 B EH2 R IY0 B AH0 N AE1 N AH0 DH AH0 W AH1 N W IH1 DH K EH1 R AH0 M AH0 L K OW1 K AH0 N AH2 T EH1 N IY0 Y UW1 K AE1 N TH IH1 NG K AH1 V ',\n",
- " ' ER1 TH K W EY2 K S D AE1 M AH0 JH AO1 L S T R AH1 K CH ER0 Z IH2 N K L UW1 D IH0 NG B R IH1 JH AH0 Z ',\n",
- " ' L AH1 K AH0 L IY0 DH IH1 S K AY1 N D AH1 V K AH0 L AE1 P S IH1 Z R EH1 L AH0 T IH0 V L IY0 IH2 N F R IY1 K W AH0 N T ',\n",
- " ' W AA1 Z IH1 T Y UW1 Z IH0 NG L AE1 NG G W AH0 JH DH AE1 T K AA1 Z D DH EH1 R B R EY1 N Z T UW1 D IH0 V EH1 L AH0 P ',\n",
- " ' IH1 F EH1 V R IY0 W AH2 N F AA1 L OW0 D AH0 S IH1 M AH0 L ER0 P L AE1 N DH AH0 R IH0 Z AH1 L T S W UH1 D B IY1 IH2 M P R EH1 S IH0 V ',\n",
- " ' N EH1 K S T DH AH0 HH IH1 R OW0 OW1 V ER0 K AH2 M Z AA1 B S T AH0 K AH0 L Z AA1 N DH AH0 W EY1 T UW1 F EY1 S IH0 NG DH EH1 R G R EY1 T AH0 S T CH AE1 L AH0 N JH ',\n",
- " ' F AO1 R M AO1 R DH AE1 N T UW1 HH AH1 N D R AH0 D Y IH1 R Z DH AH0 P EH1 S AH0 M IH0 S T S HH AE1 V B IH1 N W IH1 N IH0 NG DH AH0 P AH1 B L IH0 K D AH0 B EY1 T ',\n",
- " ' IH1 T S W EH1 R IH0 NG M IY1 AW1 T T R AY1 IH0 NG T UW1 JH AH1 G AH0 L W ER1 K W IH1 DH L UH1 K IH0 NG AE1 F T ER0 M AY1 CH IH1 L D R AH0 N AH0 N D M AY1 F AE1 M AH0 L IY0 ',\n",
- " ' Y AH1 NG P IY1 P AH0 L W AA1 N T T UW1 F IY1 L S AH0 P AO1 R T IH0 D AH0 N D AH0 P R IY1 SH IY0 EY2 T IH0 D B AY1 DH EH1 R K AH1 M P AH0 N IY2 AH0 N D DH EH1 R S UW0 P IH1 R IY0 ER0 Z ',\n",
- " ' W IY1 S T AA1 R T T UW1 S IY1 DH IY0 EH1 V AH0 D AH0 N S AH1 V ER1 L IY0 HH Y UW1 M AH0 N S IH1 V AH0 L IH0 S EY1 SH AH0 N TH R UW1 K EY1 V P EY1 N T IH0 NG Z F AO1 R IH0 G Z AE1 M P AH0 L ',\n",
- " ' IH0 N DH IH1 S K AH1 L CH ER0 AH0 S OW1 K AO1 L D S M AY1 L AH1 V R IH0 S P EH1 K T IH1 Z S IY1 N AE1 Z IH2 N S IH0 N S IH1 R AH0 N D AO1 F AH0 N R IH0 G AA1 R D IH0 D W IH1 DH S AH0 S P IH1 SH AH0 N ',\n",
- " ' W IY1 K AE1 N IH0 K S P R EH1 S K AA1 M P L EH0 K S TH AO1 T S K AH0 N V EY1 S AH1 T AH0 L IH0 M OW1 SH AH0 N Z AH0 N D K AH0 M Y UW1 N AH0 K EY2 T AH0 B AW1 T S AH1 M AE1 B S T R AE0 K T K AA1 N S EH0 P T S ',\n",
- " ' DH IY0 AE1 K T AH0 V AH0 S T S S EH1 N D AH0 K L IH1 R M EH1 S AH0 JH T UW1 K AH1 M P AH0 N IY2 Z DH AE1 T P IY1 P AH0 L AA1 R N OW1 L AO1 NG G ER0 W IH1 L IH0 NG T UW1 AE0 K S EH1 P T DH IY0 IH0 N V AY2 R AH0 N M EH1 N T AH0 L AH0 N D HH Y UW1 M AH0 N K AA1 S T AH1 V OW1 V ER0 K AH0 N S AH2 M P SH AH0 N ',\n",
- " ' AO1 L DH IH1 S IH1 Z TH AE1 NG K S T UW1 HH IH1 Z CH AY1 L D HH UH2 D IH0 N DH AH0 M AW1 N T AH0 N Z AH0 N D T UW1 JH AH0 N EH1 T IH0 K S B AH1 T IH1 T IH1 Z HH IH1 Z M EH1 N T AH0 L S T R EH1 NG K TH DH AE1 T S EH1 T S HH IH1 M AH0 P AA1 R T '\n",
+ " 'D UW1 Y UW1 R IY1 AH0 L AY2 Z W AH1 T T AY1 M IH1 T IH1 Z ',\n",
+ " 'HH IY1 K AH1 M Z B AE1 K T UW1 DH AH0 V AE1 L IY0 ',\n",
+ " 'DH IH1 S D R EH1 S D AH1 Z N AA1 T L UH1 K W ER1 TH M AH1 CH ',\n",
+ " 'W AH1 T HH AE1 P AH0 N D T AH0 N AY1 T HH AE1 Z N AH1 TH IH0 NG T UW1 D UW1 W IH1 DH HH EH1 N R IY0 ',\n",
+ " 'T AH0 D EY1 F AY1 V Y IH1 R Z L EY1 T ER0 W IY1 AA1 R F EY1 S IH0 NG AH0 S IH1 M AH0 L ER0 S IH2 CH UW0 EY1 SH AH0 N ',\n",
+ " 'W EH1 N AY1 S AO1 Y UW1 K IH1 S IH0 NG Y UW1 L UH1 K T R IH1 L IY0 HH AE1 P IY0 ',\n",
+ " 'OW1 N L IY0 W AH1 N V IY1 HH IH0 K AH0 L M EY1 B IY1 AH0 L AW1 D T UW1 P AA1 R K AE1 T EH1 N IY0 G IH1 V AH0 N T AY1 M ',\n",
+ " 'DH AH0 D EH1 D L AY2 N Z AA1 R IH2 N D IY1 D V EH1 R IY0 T AY1 T ',\n",
+ " 'AY1 EH1 M G L AE1 D Y UW1 EH2 N JH OY1 D Y ER0 S EH1 L F ',\n",
+ " 'W AH1 T AA1 R Y UW1 S T IH1 L D UW1 IH0 NG HH IY1 R ',\n",
+ " 'DH IH1 S IH1 Z AE1 N AE1 N AH0 M AH0 L DH AE1 T IH1 Z AH0 D M AY1 ER0 D F AO1 R IH1 T S W AY1 T N AH0 S AH0 N D K L EH1 N L IY0 N IH0 S ',\n",
+ " 'P ER0 HH AE1 P S DH EH1 R IH1 Z AH0 N AH1 DH ER0 W EY1 T UW1 P OW1 Z DH IY1 Z IH1 SH UW0 Z ',\n",
+ " 'Y AO1 R S T UW1 D AH0 N T S T EH1 S T S K AO1 R Z D R AA1 P L OW1 ER0 AH0 N D L OW1 ER0 EH1 V ER0 IY0 Y IH1 R ',\n",
+ " 'W EH0 R EH1 V ER0 HH ER1 T IH1 R Z F EH1 L AH0 F R UW1 T T R IY1 G R UW1 ',\n",
+ " 'AY1 W AA1 Z AH0 B AW1 T T UW1 HH EH1 D B AE1 K T UW1 M AY1 HH OW0 T EH1 L AH0 N D G OW1 T UW1 S L IY1 P ',\n",
+ " 'Y UW1 S EH1 D SH IY1 R IH1 L IY0 HH EH1 L P T L AE1 S T T AY1 M ',\n",
+ " 'M AY1 F EY1 V ER0 IH0 T S IY1 Z AH0 N S P R IH1 NG IH1 Z HH IY1 R ',\n",
+ " 'HH IY1 EH1 S DH AH0 R IH1 CH G AY1 HH UW1 B IH1 L T DH IY0 EH1 R P L EY0 N Z ',\n",
+ " 'AA1 T OW2 AH0 N D IH0 L IH1 Z AH0 B AH0 TH G EY1 V IH1 T T UW1 AH1 S F AO1 R DH AH0 W EH1 D IH0 NG IH2 N K R EH1 D AH0 B L IY0 JH EH1 N ER0 AH0 S ',\n",
+ " 'L UH1 K DH AH0 P AH0 L IY1 S S EH1 D DH AE1 T DH EH1 R W AA1 Z N AH1 TH IH0 NG S T OW1 L AH0 N F R AH1 M DH AH0 HH AW1 S ',\n",
+ " 'AH0 N D AY1 S AH0 P OW1 Z W IY1 K AE1 N TH AE1 NG K Y AO1 R B R AH1 DH ER0 F AO1 R DH AE1 T ',\n",
+ " 'DH AE1 T EH1 S EY0 P R IH1 T IY0 D EY1 N JH ER0 AH0 S TH IH1 NG Y UW1 R EY1 D UW1 IH0 NG ',\n",
+ " 'HH IY1 ER0 AY1 V D IH0 N JH AH0 P AE1 N F AO1 R DH AH0 F ER1 S T T AY1 M AE1 T DH IY0 EY1 JH AH1 V T W EH1 N T IY0 S IH1 K S ',\n",
+ " 'S AE1 M TH AO1 T W IY1 W ER1 HH AE1 V IH0 NG F AH1 N B IY1 IH0 NG T AH0 G EH1 DH ER0 ',\n",
+ " 'W EH1 L DH AH0 T R UW1 V AE1 L Y UW0 AH1 V S AH1 M TH IH0 NG IH1 S N T IY1 AO1 L W EY2 Z D IH0 T ER1 M AH0 N D B AY1 IH1 T S P R AY1 S ',\n",
+ " 'N OW1 IH1 T EH1 S N AA1 T P AH0 L AY1 T T UW1 D IH0 S K AH1 S AH0 L EY1 D IY0 EH1 S EY1 JH ',\n",
+ " 'JH AH1 S T AH0 N AH1 DH ER0 K W AO1 R T ER0 M AY1 L AH0 N D AY1 D AA1 N T IY1 HH AE1 V T UW1 B IY1 T AA1 L ER0 AH0 N T EH1 V ER0 AH0 G EH1 N ',\n",
+ " 'B AH1 T JH OW1 N Z AH0 P AA1 R T M AH0 N T HH AE1 D OW1 N L IY0 B IH1 N R EH1 N T IH0 D AW1 T F AO1 R AH0 W IY1 K ',\n",
+ " 'W AH1 T Y AO1 R P ER1 F IH1 K T D EY1 W UH1 D HH AE1 V B IH1 N L AY1 K ',\n",
+ " 'N AA1 T AH0 V EH1 R IY0 Y UW1 S F AH0 L S K IH1 L AH0 S P EH1 SH L IY0 W EH1 N DH AH0 M AH1 N IY0 R AH1 N Z AW1 T ',\n",
"]"
]
},
@@ -111,9 +110,9 @@
"source": [
"## NOTE: all model keys need to be composed of a single letter followed by a number\n",
"model2folder = {\n",
- " \"m1\": 'generated_hifi/esd_tune/g_3164999',\n",
- " \"m2\": 'generated_hifi/esd_tune_reversal/g_3164999',\n",
- " \"m3\": 'generated_hifi/esd_tune_advloss0/g_3164999',\n",
+ " \"m1\": 'generated_hifi/esd_tune/g_2669999',\n",
+ " \"m2\": 'generated_hifi/esd_tune_reversal/g_2669999',\n",
+ " \"m3\": 'generated_hifi/esd_tune_advloss0/g_2669999',\n",
"}"
]
},
@@ -507,18 +506,18 @@
" \n",
" \n",
" | 1 | \n",
- " generated_hifi/esd_tune/g_3164999/0011/angry/1.wav | \n",
- " generated_hifi/esd_tune_reversal/g_3164999/0011/angry/1.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune/g_2669999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/1.wav | \n",
" 1.wav | \n",
" 0011 | \n",
- " We got few vegetables and fruits , and became fish eaters . | \n",
+ " Do you realize what time it is? | \n",
" 1.wav | \n",
" 0011 | \n",
- " We got few vegetables and fruits , and became fish eaters . | \n",
+ " Do you realize what time it is? | \n",
" 1.wav | \n",
" 0011 | \n",
- " We got few vegetables and fruits , and became fish eaters . | \n",
+ " Do you realize what time it is? | \n",
"
\n",
" \n",
" | 2 | \n",
@@ -537,18 +536,18 @@
"
\n",
" \n",
" | 3 | \n",
- " generated_hifi/esd_tune/g_3164999/0011/angry/10.wav | \n",
- " generated_hifi/esd_tune_reversal/g_3164999/0011/angry/10.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune/g_2669999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/10.wav | \n",
" 10.wav | \n",
" 0011 | \n",
- " Humans also judge distance by using the relative sizes of objects. | \n",
+ " What are you still doing here? | \n",
" 10.wav | \n",
" 0011 | \n",
- " Humans also judge distance by using the relative sizes of objects. | \n",
+ " What are you still doing here? | \n",
" 10.wav | \n",
" 0011 | \n",
- " Humans also judge distance by using the relative sizes of objects. | \n",
+ " What are you still doing here? | \n",
"
\n",
" \n",
" | 4 | \n",
@@ -582,18 +581,18 @@
"
\n",
" \n",
" | 2695 | \n",
- " generated_hifi/esd_tune/g_3164999/0020/surprise/7.wav | \n",
- " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/7.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune/g_2669999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/7.wav | \n",
" 7.wav | \n",
" 0020 | \n",
- " The Claudine was leaving next morning for Honolulu . | \n",
+ " Only one vehicle may be allowed to park at any given time. | \n",
" 7.wav | \n",
" 0020 | \n",
- " The Claudine was leaving next morning for Honolulu . | \n",
+ " Only one vehicle may be allowed to park at any given time. | \n",
" 7.wav | \n",
" 0020 | \n",
- " The Claudine was leaving next morning for Honolulu . | \n",
+ " Only one vehicle may be allowed to park at any given time. | \n",
"
\n",
" \n",
" | 2696 | \n",
@@ -612,18 +611,18 @@
"
\n",
" \n",
" | 2697 | \n",
- " generated_hifi/esd_tune/g_3164999/0020/surprise/8.wav | \n",
- " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/8.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune/g_2669999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/8.wav | \n",
" 8.wav | \n",
" 0020 | \n",
- " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ " The deadlines are indeed very tight. | \n",
" 8.wav | \n",
" 0020 | \n",
- " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ " The deadlines are indeed very tight. | \n",
" 8.wav | \n",
" 0020 | \n",
- " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ " The deadlines are indeed very tight. | \n",
"
\n",
" \n",
" | 2698 | \n",
@@ -642,18 +641,18 @@
"
\n",
" \n",
" | 2699 | \n",
- " generated_hifi/esd_tune/g_3164999/0020/surprise/9.wav | \n",
- " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/9.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune/g_2669999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/9.wav | \n",
" 9.wav | \n",
" 0020 | \n",
- " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ " I'm glad you enjoyed yourself. | \n",
" 9.wav | \n",
" 0020 | \n",
- " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ " I'm glad you enjoyed yourself. | \n",
" 9.wav | \n",
" 0020 | \n",
- " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ " I'm glad you enjoyed yourself. | \n",
"
\n",
" \n",
"\n",
@@ -663,42 +662,42 @@
"text/plain": [
" m1 \\\n",
"0 id_1 \n",
- "1 generated_hifi/esd_tune/g_3164999/0011/angry/1.wav \n",
+ "1 generated_hifi/esd_tune/g_2669999/0011/angry/1.wav \n",
"2 id_4 \n",
- "3 generated_hifi/esd_tune/g_3164999/0011/angry/10.wav \n",
+ "3 generated_hifi/esd_tune/g_2669999/0011/angry/10.wav \n",
"4 id_7 \n",
"... ... \n",
- "2695 generated_hifi/esd_tune/g_3164999/0020/surprise/7.wav \n",
+ "2695 generated_hifi/esd_tune/g_2669999/0020/surprise/7.wav \n",
"2696 id_4045 \n",
- "2697 generated_hifi/esd_tune/g_3164999/0020/surprise/8.wav \n",
+ "2697 generated_hifi/esd_tune/g_2669999/0020/surprise/8.wav \n",
"2698 id_4048 \n",
- "2699 generated_hifi/esd_tune/g_3164999/0020/surprise/9.wav \n",
+ "2699 generated_hifi/esd_tune/g_2669999/0020/surprise/9.wav \n",
"\n",
" m2 \\\n",
"0 id_2 \n",
- "1 generated_hifi/esd_tune_reversal/g_3164999/0011/angry/1.wav \n",
+ "1 generated_hifi/esd_tune_reversal/g_2669999/0011/angry/1.wav \n",
"2 id_5 \n",
- "3 generated_hifi/esd_tune_reversal/g_3164999/0011/angry/10.wav \n",
+ "3 generated_hifi/esd_tune_reversal/g_2669999/0011/angry/10.wav \n",
"4 id_8 \n",
"... ... \n",
- "2695 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/7.wav \n",
+ "2695 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/7.wav \n",
"2696 id_4046 \n",
- "2697 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/8.wav \n",
+ "2697 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/8.wav \n",
"2698 id_4049 \n",
- "2699 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/9.wav \n",
+ "2699 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/9.wav \n",
"\n",
" m3 \\\n",
"0 id_3 \n",
- "1 generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/1.wav \n",
+ "1 generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/1.wav \n",
"2 id_6 \n",
- "3 generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/10.wav \n",
+ "3 generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/10.wav \n",
"4 id_9 \n",
"... ... \n",
- "2695 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/7.wav \n",
+ "2695 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/7.wav \n",
"2696 id_4047 \n",
- "2697 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/8.wav \n",
+ "2697 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/8.wav \n",
"2698 id_4050 \n",
- "2699 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wav \n",
+ "2699 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/9.wav \n",
"\n",
" m1_wavbasename m1_accent_speaker \\\n",
"0 None None \n",
@@ -713,18 +712,18 @@
"2698 None None \n",
"2699 9.wav 0020 \n",
"\n",
- " m1_text \\\n",
- "0 None \n",
- "1 We got few vegetables and fruits , and became fish eaters . \n",
- "2 None \n",
- "3 Humans also judge distance by using the relative sizes of objects. \n",
- "4 None \n",
- "... ... \n",
- "2695 The Claudine was leaving next morning for Honolulu . \n",
- "2696 None \n",
- "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
- "2698 None \n",
- "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ " m1_text \\\n",
+ "0 None \n",
+ "1 Do you realize what time it is? \n",
+ "2 None \n",
+ "3 What are you still doing here? \n",
+ "4 None \n",
+ "... ... \n",
+ "2695 Only one vehicle may be allowed to park at any given time. \n",
+ "2696 None \n",
+ "2697 The deadlines are indeed very tight. \n",
+ "2698 None \n",
+ "2699 I'm glad you enjoyed yourself. \n",
"\n",
" m2_wavbasename m2_accent_speaker \\\n",
"0 None None \n",
@@ -739,18 +738,18 @@
"2698 None None \n",
"2699 9.wav 0020 \n",
"\n",
- " m2_text \\\n",
- "0 None \n",
- "1 We got few vegetables and fruits , and became fish eaters . \n",
- "2 None \n",
- "3 Humans also judge distance by using the relative sizes of objects. \n",
- "4 None \n",
- "... ... \n",
- "2695 The Claudine was leaving next morning for Honolulu . \n",
- "2696 None \n",
- "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
- "2698 None \n",
- "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ " m2_text \\\n",
+ "0 None \n",
+ "1 Do you realize what time it is? \n",
+ "2 None \n",
+ "3 What are you still doing here? \n",
+ "4 None \n",
+ "... ... \n",
+ "2695 Only one vehicle may be allowed to park at any given time. \n",
+ "2696 None \n",
+ "2697 The deadlines are indeed very tight. \n",
+ "2698 None \n",
+ "2699 I'm glad you enjoyed yourself. \n",
"\n",
" m3_wavbasename m3_accent_speaker \\\n",
"0 None None \n",
@@ -765,18 +764,18 @@
"2698 None None \n",
"2699 9.wav 0020 \n",
"\n",
- " m3_text \n",
- "0 None \n",
- "1 We got few vegetables and fruits , and became fish eaters . \n",
- "2 None \n",
- "3 Humans also judge distance by using the relative sizes of objects. \n",
- "4 None \n",
- "... ... \n",
- "2695 The Claudine was leaving next morning for Honolulu . \n",
- "2696 None \n",
- "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
- "2698 None \n",
- "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ " m3_text \n",
+ "0 None \n",
+ "1 Do you realize what time it is? \n",
+ "2 None \n",
+ "3 What are you still doing here? \n",
+ "4 None \n",
+ "... ... \n",
+ "2695 Only one vehicle may be allowed to park at any given time. \n",
+ "2696 None \n",
+ "2697 The deadlines are indeed very tight. \n",
+ "2698 None \n",
+ "2699 I'm glad you enjoyed yourself. \n",
"\n",
"[2700 rows x 12 columns]"
]
@@ -925,12 +924,12 @@
" \n",
" \n",
" | 1 | \n",
- " We got few vegetables and fruits , and became fish eaters . | \n",
+ " Do you realize what time it is? | \n",
" 0011 | \n",
- " generated_hifi/esd_tune/g_3164999/0011/angry/1.wav | \n",
- " generated_hifi/esd_tune_reversal/g_3164999/0011/angry/1.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/1.wav | \n",
- " We got few vegetables and fruits , and became fish eaters . | \n",
+ " generated_hifi/esd_tune/g_2669999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/1.wav | \n",
+ " Do you realize what time it is? | \n",
"
\n",
" \n",
" | 2 | \n",
@@ -943,12 +942,12 @@
"
\n",
" \n",
" | 3 | \n",
- " Humans also judge distance by using the relative sizes of objects. | \n",
+ " What are you still doing here? | \n",
" 0011 | \n",
- " generated_hifi/esd_tune/g_3164999/0011/angry/10.wav | \n",
- " generated_hifi/esd_tune_reversal/g_3164999/0011/angry/10.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/10.wav | \n",
- " Humans also judge distance by using the relative sizes of objects. | \n",
+ " generated_hifi/esd_tune/g_2669999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/10.wav | \n",
+ " What are you still doing here? | \n",
"
\n",
" \n",
" | 4 | \n",
@@ -970,12 +969,12 @@
"
\n",
" \n",
" | 2695 | \n",
- " The Claudine was leaving next morning for Honolulu . | \n",
+ " Only one vehicle may be allowed to park at any given time. | \n",
" 0020 | \n",
- " generated_hifi/esd_tune/g_3164999/0020/surprise/7.wav | \n",
- " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/7.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/7.wav | \n",
- " The Claudine was leaving next morning for Honolulu . | \n",
+ " generated_hifi/esd_tune/g_2669999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/7.wav | \n",
+ " Only one vehicle may be allowed to park at any given time. | \n",
"
\n",
" \n",
" | 2696 | \n",
@@ -988,12 +987,12 @@
"
\n",
" \n",
" | 2697 | \n",
- " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ " The deadlines are indeed very tight. | \n",
" 0020 | \n",
- " generated_hifi/esd_tune/g_3164999/0020/surprise/8.wav | \n",
- " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/8.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/8.wav | \n",
- " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ " generated_hifi/esd_tune/g_2669999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/8.wav | \n",
+ " The deadlines are indeed very tight. | \n",
"
\n",
" \n",
" | 2698 | \n",
@@ -1006,12 +1005,12 @@
"
\n",
" \n",
" | 2699 | \n",
- " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ " I'm glad you enjoyed yourself. | \n",
" 0020 | \n",
- " generated_hifi/esd_tune/g_3164999/0020/surprise/9.wav | \n",
- " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/9.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wav | \n",
- " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ " generated_hifi/esd_tune/g_2669999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/9.wav | \n",
+ " I'm glad you enjoyed yourself. | \n",
"
\n",
" \n",
"\n",
@@ -1019,70 +1018,70 @@
""
],
"text/plain": [
- " m1_text \\\n",
- "0 None \n",
- "1 We got few vegetables and fruits , and became fish eaters . \n",
- "2 None \n",
- "3 Humans also judge distance by using the relative sizes of objects. \n",
- "4 None \n",
- "... ... \n",
- "2695 The Claudine was leaving next morning for Honolulu . \n",
- "2696 None \n",
- "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
- "2698 None \n",
- "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ " m1_text \\\n",
+ "0 None \n",
+ "1 Do you realize what time it is? \n",
+ "2 None \n",
+ "3 What are you still doing here? \n",
+ "4 None \n",
+ "... ... \n",
+ "2695 Only one vehicle may be allowed to park at any given time. \n",
+ "2696 None \n",
+ "2697 The deadlines are indeed very tight. \n",
+ "2698 None \n",
+ "2699 I'm glad you enjoyed yourself. \n",
"\n",
" m1_accent_speaker m1 \\\n",
"0 None id_1 \n",
- "1 0011 generated_hifi/esd_tune/g_3164999/0011/angry/1.wav \n",
+ "1 0011 generated_hifi/esd_tune/g_2669999/0011/angry/1.wav \n",
"2 None id_4 \n",
- "3 0011 generated_hifi/esd_tune/g_3164999/0011/angry/10.wav \n",
+ "3 0011 generated_hifi/esd_tune/g_2669999/0011/angry/10.wav \n",
"4 None id_7 \n",
"... ... ... \n",
- "2695 0020 generated_hifi/esd_tune/g_3164999/0020/surprise/7.wav \n",
+ "2695 0020 generated_hifi/esd_tune/g_2669999/0020/surprise/7.wav \n",
"2696 None id_4045 \n",
- "2697 0020 generated_hifi/esd_tune/g_3164999/0020/surprise/8.wav \n",
+ "2697 0020 generated_hifi/esd_tune/g_2669999/0020/surprise/8.wav \n",
"2698 None id_4048 \n",
- "2699 0020 generated_hifi/esd_tune/g_3164999/0020/surprise/9.wav \n",
+ "2699 0020 generated_hifi/esd_tune/g_2669999/0020/surprise/9.wav \n",
"\n",
" m2 \\\n",
"0 id_2 \n",
- "1 generated_hifi/esd_tune_reversal/g_3164999/0011/angry/1.wav \n",
+ "1 generated_hifi/esd_tune_reversal/g_2669999/0011/angry/1.wav \n",
"2 id_5 \n",
- "3 generated_hifi/esd_tune_reversal/g_3164999/0011/angry/10.wav \n",
+ "3 generated_hifi/esd_tune_reversal/g_2669999/0011/angry/10.wav \n",
"4 id_8 \n",
"... ... \n",
- "2695 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/7.wav \n",
+ "2695 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/7.wav \n",
"2696 id_4046 \n",
- "2697 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/8.wav \n",
+ "2697 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/8.wav \n",
"2698 id_4049 \n",
- "2699 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/9.wav \n",
+ "2699 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/9.wav \n",
"\n",
" m3 \\\n",
"0 id_3 \n",
- "1 generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/1.wav \n",
+ "1 generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/1.wav \n",
"2 id_6 \n",
- "3 generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/10.wav \n",
+ "3 generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/10.wav \n",
"4 id_9 \n",
"... ... \n",
- "2695 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/7.wav \n",
+ "2695 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/7.wav \n",
"2696 id_4047 \n",
- "2697 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/8.wav \n",
+ "2697 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/8.wav \n",
"2698 id_4050 \n",
- "2699 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wav \n",
+ "2699 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/9.wav \n",
"\n",
- " m2_text \n",
- "0 None \n",
- "1 We got few vegetables and fruits , and became fish eaters . \n",
- "2 None \n",
- "3 Humans also judge distance by using the relative sizes of objects. \n",
- "4 None \n",
- "... ... \n",
- "2695 The Claudine was leaving next morning for Honolulu . \n",
- "2696 None \n",
- "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
- "2698 None \n",
- "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ " m2_text \n",
+ "0 None \n",
+ "1 Do you realize what time it is? \n",
+ "2 None \n",
+ "3 What are you still doing here? \n",
+ "4 None \n",
+ "... ... \n",
+ "2695 Only one vehicle may be allowed to park at any given time. \n",
+ "2696 None \n",
+ "2697 The deadlines are indeed very tight. \n",
+ "2698 None \n",
+ "2699 I'm glad you enjoyed yourself. \n",
"\n",
"[2700 rows x 6 columns]"
]
@@ -1150,12 +1149,12 @@
" \n",
" \n",
" | 1 | \n",
- " We got few vegetables and fruits , and became fish eaters . | \n",
+ " Do you realize what time it is? | \n",
" 0011 | \n",
- " generated_hifi/esd_tune_reversal/g_3164999/0011/angry/1.wav | \n",
- " generated_hifi/esd_tune/g_3164999/0011/angry/1.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/1.wav | \n",
- " We got few vegetables and fruits , and became fish eaters . | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune/g_2669999/0011/angry/1.wav | \n",
+ " Do you realize what time it is? | \n",
"
\n",
" \n",
" | 2 | \n",
@@ -1168,12 +1167,12 @@
"
\n",
" \n",
" | 3 | \n",
- " Humans also judge distance by using the relative sizes of objects. | \n",
+ " What are you still doing here? | \n",
" 0011 | \n",
- " generated_hifi/esd_tune_reversal/g_3164999/0011/angry/10.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/10.wav | \n",
- " generated_hifi/esd_tune/g_3164999/0011/angry/10.wav | \n",
- " Humans also judge distance by using the relative sizes of objects. | \n",
+ " generated_hifi/esd_tune/g_2669999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/10.wav | \n",
+ " What are you still doing here? | \n",
"
\n",
" \n",
" | 4 | \n",
@@ -1195,12 +1194,12 @@
"
\n",
" \n",
" | 2695 | \n",
- " The Claudine was leaving next morning for Honolulu . | \n",
+ " Only one vehicle may be allowed to park at any given time. | \n",
" 0020 | \n",
- " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/7.wav | \n",
- " generated_hifi/esd_tune/g_3164999/0020/surprise/7.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/7.wav | \n",
- " The Claudine was leaving next morning for Honolulu . | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune/g_2669999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/7.wav | \n",
+ " Only one vehicle may be allowed to park at any given time. | \n",
"
\n",
" \n",
" | 2696 | \n",
@@ -1213,12 +1212,12 @@
"
\n",
" \n",
" | 2697 | \n",
- " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ " The deadlines are indeed very tight. | \n",
" 0020 | \n",
- " generated_hifi/esd_tune/g_3164999/0020/surprise/8.wav | \n",
- " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/8.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/8.wav | \n",
- " Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune/g_2669999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/8.wav | \n",
+ " The deadlines are indeed very tight. | \n",
"
\n",
" \n",
" | 2698 | \n",
@@ -1231,12 +1230,12 @@
"
\n",
" \n",
" | 2699 | \n",
- " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ " I'm glad you enjoyed yourself. | \n",
" 0020 | \n",
- " generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wav | \n",
- " generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/9.wav | \n",
- " generated_hifi/esd_tune/g_3164999/0020/surprise/9.wav | \n",
- " Different telescope designs perform differently, and have different strengths and weaknesses. | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune/g_2669999/0020/surprise/9.wav | \n",
+ " I'm glad you enjoyed yourself. | \n",
"
\n",
" \n",
"\n",
@@ -1244,18 +1243,18 @@
""
],
"text/plain": [
- " m1_text \\\n",
- "0 - \n",
- "1 We got few vegetables and fruits , and became fish eaters . \n",
- "2 - \n",
- "3 Humans also judge distance by using the relative sizes of objects. \n",
- "4 - \n",
- "... ... \n",
- "2695 The Claudine was leaving next morning for Honolulu . \n",
- "2696 - \n",
- "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
- "2698 - \n",
- "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ " m1_text \\\n",
+ "0 - \n",
+ "1 Do you realize what time it is? \n",
+ "2 - \n",
+ "3 What are you still doing here? \n",
+ "4 - \n",
+ "... ... \n",
+ "2695 Only one vehicle may be allowed to park at any given time. \n",
+ "2696 - \n",
+ "2697 The deadlines are indeed very tight. \n",
+ "2698 - \n",
+ "2699 I'm glad you enjoyed yourself. \n",
"\n",
" m1_accent_speaker \\\n",
"0 - \n",
@@ -1272,55 +1271,55 @@
"\n",
" m1 \\\n",
"0 id_1 \n",
- "1 generated_hifi/esd_tune_reversal/g_3164999/0011/angry/1.wav \n",
+ "1 generated_hifi/esd_tune_reversal/g_2669999/0011/angry/1.wav \n",
"2 id_4 \n",
- "3 generated_hifi/esd_tune_reversal/g_3164999/0011/angry/10.wav \n",
+ "3 generated_hifi/esd_tune/g_2669999/0011/angry/10.wav \n",
"4 id_7 \n",
"... ... \n",
- "2695 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/7.wav \n",
+ "2695 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/7.wav \n",
"2696 id_4045 \n",
- "2697 generated_hifi/esd_tune/g_3164999/0020/surprise/8.wav \n",
+ "2697 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/8.wav \n",
"2698 id_4048 \n",
- "2699 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/9.wav \n",
+ "2699 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/9.wav \n",
"\n",
" m2 \\\n",
"0 id_2 \n",
- "1 generated_hifi/esd_tune/g_3164999/0011/angry/1.wav \n",
+ "1 generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/1.wav \n",
"2 id_5 \n",
- "3 generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/10.wav \n",
+ "3 generated_hifi/esd_tune_reversal/g_2669999/0011/angry/10.wav \n",
"4 id_8 \n",
"... ... \n",
- "2695 generated_hifi/esd_tune/g_3164999/0020/surprise/7.wav \n",
+ "2695 generated_hifi/esd_tune/g_2669999/0020/surprise/7.wav \n",
"2696 id_4046 \n",
- "2697 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/8.wav \n",
+ "2697 generated_hifi/esd_tune/g_2669999/0020/surprise/8.wav \n",
"2698 id_4049 \n",
- "2699 generated_hifi/esd_tune_reversal/g_3164999/0020/surprise/9.wav \n",
+ "2699 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/9.wav \n",
"\n",
" m3 \\\n",
"0 id_3 \n",
- "1 generated_hifi/esd_tune_advloss0/g_3164999/0011/angry/1.wav \n",
+ "1 generated_hifi/esd_tune/g_2669999/0011/angry/1.wav \n",
"2 id_6 \n",
- "3 generated_hifi/esd_tune/g_3164999/0011/angry/10.wav \n",
+ "3 generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/10.wav \n",
"4 id_9 \n",
"... ... \n",
- "2695 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/7.wav \n",
+ "2695 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/7.wav \n",
"2696 id_4047 \n",
- "2697 generated_hifi/esd_tune_advloss0/g_3164999/0020/surprise/8.wav \n",
+ "2697 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/8.wav \n",
"2698 id_4050 \n",
- "2699 generated_hifi/esd_tune/g_3164999/0020/surprise/9.wav \n",
+ "2699 generated_hifi/esd_tune/g_2669999/0020/surprise/9.wav \n",
"\n",
- " m2_text \n",
- "0 - \n",
- "1 We got few vegetables and fruits , and became fish eaters . \n",
- "2 - \n",
- "3 Humans also judge distance by using the relative sizes of objects. \n",
- "4 - \n",
- "... ... \n",
- "2695 The Claudine was leaving next morning for Honolulu . \n",
- "2696 - \n",
- "2697 Prosecutors have opened a massive investigation into allegations of fixing games and illegal betting. \n",
- "2698 - \n",
- "2699 Different telescope designs perform differently, and have different strengths and weaknesses. \n",
+ " m2_text \n",
+ "0 - \n",
+ "1 Do you realize what time it is? \n",
+ "2 - \n",
+ "3 What are you still doing here? \n",
+ "4 - \n",
+ "... ... \n",
+ "2695 Only one vehicle may be allowed to park at any given time. \n",
+ "2696 - \n",
+ "2697 The deadlines are indeed very tight. \n",
+ "2698 - \n",
+ "2699 I'm glad you enjoyed yourself. \n",
"\n",
"[2700 rows x 6 columns]"
]
@@ -1347,11 +1346,12 @@
},
{
"cell_type": "code",
- "execution_count": 14,
+ "execution_count": 15,
"id": "eef3b325-c26e-457a-b575-eb6b210aff7f",
"metadata": {},
"outputs": [],
"source": [
+ "Path('reports').mkdir(exist_ok=True)\n",
"df_permuted.to_csv(\n",
" 'reports/eval_map.csv',\n",
" sep = \"\\t\",\n",
@@ -1363,7 +1363,7 @@
},
{
"cell_type": "code",
- "execution_count": 15,
+ "execution_count": 16,
"id": "d32630c2-aca7-4ee9-b44c-a949d0fd17c4",
"metadata": {},
"outputs": [],
@@ -1380,7 +1380,7 @@
},
{
"cell_type": "code",
- "execution_count": 16,
+ "execution_count": 17,
"id": "2c11c3ca-abe4-4bbd-930f-8a4f62c9dc8f",
"metadata": {},
"outputs": [],
@@ -1403,7 +1403,7 @@
},
{
"cell_type": "code",
- "execution_count": 17,
+ "execution_count": 18,
"id": "11d84c76-841a-4215-a45f-268076e4ae21",
"metadata": {},
"outputs": [],
@@ -1415,7 +1415,7 @@
},
{
"cell_type": "code",
- "execution_count": 18,
+ "execution_count": 19,
"id": "26b577fe-3957-4902-8758-e5501f5d81a0",
"metadata": {},
"outputs": [],
@@ -1426,7 +1426,7 @@
},
{
"cell_type": "code",
- "execution_count": 19,
+ "execution_count": 20,
"id": "f37b7fb3-93eb-448c-a8a3-a23cb0d165ae",
"metadata": {},
"outputs": [],
@@ -1437,7 +1437,7 @@
},
{
"cell_type": "code",
- "execution_count": 20,
+ "execution_count": 21,
"id": "24aef771-215a-4fe6-82cb-1ff375681189",
"metadata": {
"scrolled": true,
@@ -1530,7 +1530,7 @@
},
{
"cell_type": "code",
- "execution_count": 21,
+ "execution_count": 22,
"id": "49a60285-31bf-4263-9162-c3d928aa9068",
"metadata": {},
"outputs": [
From 8b4a95e7a90f3845ec6715cfb956c4173297c9b7 Mon Sep 17 00:00:00 2001
From: ruk0sh <43880105+ruk0sh@users.noreply.github.com>
Date: Wed, 18 May 2022 18:51:44 +0300
Subject: [PATCH 16/17] Update test phrases
---
generate_listener_html.ipynb | 173 ++++++++++++++++++-----------------
1 file changed, 87 insertions(+), 86 deletions(-)
diff --git a/generate_listener_html.ipynb b/generate_listener_html.ipynb
index e6404dd..a23ed4d 100644
--- a/generate_listener_html.ipynb
+++ b/generate_listener_html.ipynb
@@ -28,35 +28,36 @@
"outputs": [],
"source": [
"texts = [\n",
- " 'Do you realize what time it is?',\n",
- " 'He comes back to the valley.',\n",
- " 'This dress does not look worth much!',\n",
- " 'What happened tonight has nothing to do with Henry.',\n",
- " 'Today, five years later, we are facing a similar situation.',\n",
- " 'When I saw you kissing, you looked really happy.',\n",
- " 'Only one vehicle may be allowed to park at any given time.',\n",
- " 'The deadlines are indeed very tight.',\n",
- " \"I'm glad you enjoyed yourself.\", 'What are you still doing here?',\n",
- " 'This is an animal that is admired for its whiteness and cleanliness. ',\n",
- " 'Perhaps there is another way to pose these issues.',\n",
- " \"Your students' test scores drop lower and lower every year.\",\n",
- " 'Wherever her tears fell, a fruit tree grew.',\n",
- " 'I was about to head back to my hotel and go to sleep.',\n",
- " 'You said she really helped last time.',\n",
- " 'My favorite season, spring, is here.',\n",
- " \"He's the rich guy who built the airplanes.\",\n",
- " 'Otto and Elizabeth gave it to us, for the wedding - incredibly generous.',\n",
- " 'Look, the police said that there was nothing stolen from the house.',\n",
- " 'And I suppose we can thank your brother for that.',\n",
- " \"That's a pretty dangerous thing you're doing.\",\n",
- " 'He arrived in Japan for the first time at the age of twenty six.',\n",
- " 'Sam thought we were having fun being together.',\n",
- " \"Well, the true value of something isn't always determined by its price.\",\n",
- " \"No, it's not polite to discuss a lady's age.\",\n",
- " \"Just another quarter-mile and I don't have to be tolerant ever again.\",\n",
- " \"But Jones' apartment had only been rented out for a week.\",\n",
- " 'What your perfect day would have been like?',\n",
- " 'Not a very useful skill, especially when the money runs out.',\n",
+ " 'Do you realize what time it is?',\n",
+ " 'He comes back to the valley.',\n",
+ " 'This dress does not look worth much!',\n",
+ " 'What happened tonight has nothing to do with Henry.',\n",
+ " 'Today, five years later, we are facing a similar situation.',\n",
+ " 'When I saw you kissing, you looked really happy.',\n",
+ " 'Only one vehicle may be allowed to park at any given time.',\n",
+ " 'The deadlines are indeed very tight.',\n",
+ " \"I'm glad you enjoyed yourself.\",\n",
+ " 'What are you still doing here?',\n",
+ " 'This is an animal that is admired for its whiteness and cleanliness. ',\n",
+ " 'Perhaps there is another way to pose these issues.',\n",
+ " \"Your students' test scores drop lower and lower every year.\",\n",
+ " 'Wherever her tears fell, a fruit tree grew.',\n",
+ " 'I was about to head back to my hotel and go to sleep.',\n",
+ " 'You said she really helped last time.',\n",
+ " 'My favorite season, spring, is here.',\n",
+ " \"He's the rich guy who built the airplanes.\",\n",
+ " 'Otto and Elizabeth gave it to us, for the wedding - incredibly generous.',\n",
+ " 'Look, the police said that there was nothing stolen from the house.',\n",
+ " 'And I suppose we can thank your brother for that.',\n",
+ " \"That's a pretty dangerous thing you're doing.\",\n",
+ " 'He arrived in Japan for the first time at the age of twenty six.',\n",
+ " 'Sam thought we were having fun being together.',\n",
+ " \"Well, the true value of something isn't always determined by its price.\",\n",
+ " \"No, it's not polite to discuss a lady's age.\",\n",
+ " \"Just another quarter-mile and I don't have to be tolerant ever again.\",\n",
+ " \"But Jones' apartment had only been rented out for a week.\",\n",
+ " 'What your perfect day would have been like?',\n",
+ " 'Not a very useful skill, especially when the money runs out.',\n",
"]"
]
},
@@ -68,36 +69,36 @@
"outputs": [],
"source": [
"huawei_phones = [\n",
- " 'D UW1 Y UW1 R IY1 AH0 L AY2 Z W AH1 T T AY1 M IH1 T IH1 Z ',\n",
- " 'HH IY1 K AH1 M Z B AE1 K T UW1 DH AH0 V AE1 L IY0 ',\n",
- " 'DH IH1 S D R EH1 S D AH1 Z N AA1 T L UH1 K W ER1 TH M AH1 CH ',\n",
- " 'W AH1 T HH AE1 P AH0 N D T AH0 N AY1 T HH AE1 Z N AH1 TH IH0 NG T UW1 D UW1 W IH1 DH HH EH1 N R IY0 ',\n",
- " 'T AH0 D EY1 F AY1 V Y IH1 R Z L EY1 T ER0 W IY1 AA1 R F EY1 S IH0 NG AH0 S IH1 M AH0 L ER0 S IH2 CH UW0 EY1 SH AH0 N ',\n",
- " 'W EH1 N AY1 S AO1 Y UW1 K IH1 S IH0 NG Y UW1 L UH1 K T R IH1 L IY0 HH AE1 P IY0 ',\n",
- " 'OW1 N L IY0 W AH1 N V IY1 HH IH0 K AH0 L M EY1 B IY1 AH0 L AW1 D T UW1 P AA1 R K AE1 T EH1 N IY0 G IH1 V AH0 N T AY1 M ',\n",
- " 'DH AH0 D EH1 D L AY2 N Z AA1 R IH2 N D IY1 D V EH1 R IY0 T AY1 T ',\n",
- " 'AY1 EH1 M G L AE1 D Y UW1 EH2 N JH OY1 D Y ER0 S EH1 L F ',\n",
- " 'W AH1 T AA1 R Y UW1 S T IH1 L D UW1 IH0 NG HH IY1 R ',\n",
- " 'DH IH1 S IH1 Z AE1 N AE1 N AH0 M AH0 L DH AE1 T IH1 Z AH0 D M AY1 ER0 D F AO1 R IH1 T S W AY1 T N AH0 S AH0 N D K L EH1 N L IY0 N IH0 S ',\n",
- " 'P ER0 HH AE1 P S DH EH1 R IH1 Z AH0 N AH1 DH ER0 W EY1 T UW1 P OW1 Z DH IY1 Z IH1 SH UW0 Z ',\n",
- " 'Y AO1 R S T UW1 D AH0 N T S T EH1 S T S K AO1 R Z D R AA1 P L OW1 ER0 AH0 N D L OW1 ER0 EH1 V ER0 IY0 Y IH1 R ',\n",
- " 'W EH0 R EH1 V ER0 HH ER1 T IH1 R Z F EH1 L AH0 F R UW1 T T R IY1 G R UW1 ',\n",
- " 'AY1 W AA1 Z AH0 B AW1 T T UW1 HH EH1 D B AE1 K T UW1 M AY1 HH OW0 T EH1 L AH0 N D G OW1 T UW1 S L IY1 P ',\n",
- " 'Y UW1 S EH1 D SH IY1 R IH1 L IY0 HH EH1 L P T L AE1 S T T AY1 M ',\n",
- " 'M AY1 F EY1 V ER0 IH0 T S IY1 Z AH0 N S P R IH1 NG IH1 Z HH IY1 R ',\n",
- " 'HH IY1 EH1 S DH AH0 R IH1 CH G AY1 HH UW1 B IH1 L T DH IY0 EH1 R P L EY0 N Z ',\n",
- " 'AA1 T OW2 AH0 N D IH0 L IH1 Z AH0 B AH0 TH G EY1 V IH1 T T UW1 AH1 S F AO1 R DH AH0 W EH1 D IH0 NG IH2 N K R EH1 D AH0 B L IY0 JH EH1 N ER0 AH0 S ',\n",
- " 'L UH1 K DH AH0 P AH0 L IY1 S S EH1 D DH AE1 T DH EH1 R W AA1 Z N AH1 TH IH0 NG S T OW1 L AH0 N F R AH1 M DH AH0 HH AW1 S ',\n",
- " 'AH0 N D AY1 S AH0 P OW1 Z W IY1 K AE1 N TH AE1 NG K Y AO1 R B R AH1 DH ER0 F AO1 R DH AE1 T ',\n",
- " 'DH AE1 T EH1 S EY0 P R IH1 T IY0 D EY1 N JH ER0 AH0 S TH IH1 NG Y UW1 R EY1 D UW1 IH0 NG ',\n",
- " 'HH IY1 ER0 AY1 V D IH0 N JH AH0 P AE1 N F AO1 R DH AH0 F ER1 S T T AY1 M AE1 T DH IY0 EY1 JH AH1 V T W EH1 N T IY0 S IH1 K S ',\n",
- " 'S AE1 M TH AO1 T W IY1 W ER1 HH AE1 V IH0 NG F AH1 N B IY1 IH0 NG T AH0 G EH1 DH ER0 ',\n",
- " 'W EH1 L DH AH0 T R UW1 V AE1 L Y UW0 AH1 V S AH1 M TH IH0 NG IH1 S N T IY1 AO1 L W EY2 Z D IH0 T ER1 M AH0 N D B AY1 IH1 T S P R AY1 S ',\n",
- " 'N OW1 IH1 T EH1 S N AA1 T P AH0 L AY1 T T UW1 D IH0 S K AH1 S AH0 L EY1 D IY0 EH1 S EY1 JH ',\n",
- " 'JH AH1 S T AH0 N AH1 DH ER0 K W AO1 R T ER0 M AY1 L AH0 N D AY1 D AA1 N T IY1 HH AE1 V T UW1 B IY1 T AA1 L ER0 AH0 N T EH1 V ER0 AH0 G EH1 N ',\n",
- " 'B AH1 T JH OW1 N Z AH0 P AA1 R T M AH0 N T HH AE1 D OW1 N L IY0 B IH1 N R EH1 N T IH0 D AW1 T F AO1 R AH0 W IY1 K ',\n",
- " 'W AH1 T Y AO1 R P ER1 F IH1 K T D EY1 W UH1 D HH AE1 V B IH1 N L AY1 K ',\n",
- " 'N AA1 T AH0 V EH1 R IY0 Y UW1 S F AH0 L S K IH1 L AH0 S P EH1 SH L IY0 W EH1 N DH AH0 M AH1 N IY0 R AH1 N Z AW1 T ',\n",
+ " ' D UW1 Y UW1 R IY1 AH0 L AY2 Z W AH1 T T AY1 M IH1 T IH1 Z ',\n",
+ " ' HH IY1 K AH1 M Z B AE1 K T UW1 DH AH0 V AE1 L IY0 ',\n",
+ " ' DH IH1 S D R EH1 S D AH1 Z N AA1 T L UH1 K W ER1 TH M AH1 CH ',\n",
+ " ' W AH1 T HH AE1 P AH0 N D T AH0 N AY1 T HH AE1 Z N AH1 TH IH0 NG T UW1 D UW1 W IH1 DH HH EH1 N R IY0 ',\n",
+ " ' T AH0 D EY1 F AY1 V Y IH1 R Z L EY1 T ER0 W IY1 AA1 R F EY1 S IH0 NG AH0 S IH1 M AH0 L ER0 S IH2 CH UW0 EY1 SH AH0 N ',\n",
+ " ' W EH1 N AY1 S AO1 Y UW1 K IH1 S IH0 NG Y UW1 L UH1 K T R IH1 L IY0 HH AE1 P IY0 ',\n",
+ " ' OW1 N L IY0 W AH1 N V IY1 HH IH0 K AH0 L M EY1 B IY1 AH0 L AW1 D T UW1 P AA1 R K AE1 T EH1 N IY0 G IH1 V AH0 N T AY1 M ',\n",
+ " ' DH AH0 D EH1 D L AY2 N Z AA1 R IH2 N D IY1 D V EH1 R IY0 T AY1 T ',\n",
+ " ' AY1 EH1 M G L AE1 D Y UW1 EH2 N JH OY1 D Y ER0 S EH1 L F ',\n",
+ " ' W AH1 T AA1 R Y UW1 S T IH1 L D UW1 IH0 NG HH IY1 R ',\n",
+ " ' DH IH1 S IH1 Z AE1 N AE1 N AH0 M AH0 L DH AE1 T IH1 Z AH0 D M AY1 ER0 D F AO1 R IH1 T S W AY1 T N AH0 S AH0 N D K L EH1 N L IY0 N IH0 S ',\n",
+ " ' P ER0 HH AE1 P S DH EH1 R IH1 Z AH0 N AH1 DH ER0 W EY1 T UW1 P OW1 Z DH IY1 Z IH1 SH UW0 Z ',\n",
+ " ' Y AO1 R S T UW1 D AH0 N T S T EH1 S T S K AO1 R Z D R AA1 P L OW1 ER0 AH0 N D L OW1 ER0 EH1 V ER0 IY0 Y IH1 R ',\n",
+ " ' W EH0 R EH1 V ER0 HH ER1 T IH1 R Z F EH1 L AH0 F R UW1 T T R IY1 G R UW1 ',\n",
+ " ' AY1 W AA1 Z AH0 B AW1 T T UW1 HH EH1 D B AE1 K T UW1 M AY1 HH OW0 T EH1 L AH0 N D G OW1 T UW1 S L IY1 P ',\n",
+ " ' Y UW1 S EH1 D SH IY1 R IH1 L IY0 HH EH1 L P T L AE1 S T T AY1 M ',\n",
+ " ' M AY1 F EY1 V ER0 IH0 T S IY1 Z AH0 N S P R IH1 NG IH1 Z HH IY1 R ',\n",
+ " ' HH IY1 EH1 S DH AH0 R IH1 CH G AY1 HH UW1 B IH1 L T DH IY0 EH1 R P L EY0 N Z ',\n",
+ " ' AA1 T OW2 AH0 N D IH0 L IH1 Z AH0 B AH0 TH G EY1 V IH1 T T UW1 AH1 S F AO1 R DH AH0 W EH1 D IH0 NG IH2 N K R EH1 D AH0 B L IY0 JH EH1 N ER0 AH0 S ',\n",
+ " ' L UH1 K DH AH0 P AH0 L IY1 S S EH1 D DH AE1 T DH EH1 R W AA1 Z N AH1 TH IH0 NG S T OW1 L AH0 N F R AH1 M DH AH0 HH AW1 S ',\n",
+ " ' AH0 N D AY1 S AH0 P OW1 Z W IY1 K AE1 N TH AE1 NG K Y AO1 R B R AH1 DH ER0 F AO1 R DH AE1 T ',\n",
+ " ' DH AE1 T EH1 S EY0 P R IH1 T IY0 D EY1 N JH ER0 AH0 S TH IH1 NG Y UW1 R EY1 D UW1 IH0 NG ',\n",
+ " ' HH IY1 ER0 AY1 V D IH0 N JH AH0 P AE1 N F AO1 R DH AH0 F ER1 S T T AY1 M AE1 T DH IY0 EY1 JH AH1 V T W EH1 N T IY0 S IH1 K S ',\n",
+ " ' S AE1 M TH AO1 T W IY1 W ER1 HH AE1 V IH0 NG F AH1 N B IY1 IH0 NG T AH0 G EH1 DH ER0 ',\n",
+ " ' W EH1 L DH AH0 T R UW1 V AE1 L Y UW0 AH1 V S AH1 M TH IH0 NG IH1 S N T IY1 AO1 L W EY2 Z D IH0 T ER1 M AH0 N D B AY1 IH1 T S P R AY1 S ',\n",
+ " ' N OW1 IH1 T EH1 S N AA1 T P AH0 L AY1 T T UW1 D IH0 S K AH1 S AH0 L EY1 D IY0 EH1 S EY1 JH ',\n",
+ " ' JH AH1 S T AH0 N AH1 DH ER0 K W AO1 R T ER0 M AY1 L AH0 N D AY1 D AA1 N T IY1 HH AE1 V T UW1 B IY1 T AA1 L ER0 AH0 N T EH1 V ER0 AH0 G EH1 N ',\n",
+ " ' B AH1 T JH OW1 N Z AH0 P AA1 R T M AH0 N T HH AE1 D OW1 N L IY0 B IH1 N R EH1 N T IH0 D AW1 T F AO1 R AH0 W IY1 K ',\n",
+ " ' W AH1 T Y AO1 R P ER1 F IH1 K T D EY1 W UH1 D HH AE1 V B IH1 N L AY1 K ',\n",
+ " ' N AA1 T AH0 V EH1 R IY0 Y UW1 S F AH0 L S K IH1 L AH0 S P EH1 SH L IY0 W EH1 N DH AH0 M AH1 N IY0 R AH1 N Z AW1 T ',\n",
"]"
]
},
@@ -1151,9 +1152,9 @@
" 1 | \n",
" Do you realize what time it is? | \n",
" 0011 | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0011/angry/1.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/1.wav | \n",
" generated_hifi/esd_tune/g_2669999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0011/angry/1.wav | \n",
" Do you realize what time it is? | \n",
" \n",
" \n",
@@ -1169,9 +1170,9 @@
" | 3 | \n",
" What are you still doing here? | \n",
" 0011 | \n",
- " generated_hifi/esd_tune/g_2669999/0011/angry/10.wav | \n",
" generated_hifi/esd_tune_reversal/g_2669999/0011/angry/10.wav | \n",
" generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune/g_2669999/0011/angry/10.wav | \n",
" What are you still doing here? | \n",
"
\n",
" \n",
@@ -1196,9 +1197,9 @@
" | 2695 | \n",
" Only one vehicle may be allowed to park at any given time. | \n",
" 0020 | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/7.wav | \n",
- " generated_hifi/esd_tune/g_2669999/0020/surprise/7.wav | \n",
" generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune/g_2669999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/7.wav | \n",
" Only one vehicle may be allowed to park at any given time. | \n",
"
\n",
" \n",
@@ -1214,9 +1215,9 @@
" | 2697 | \n",
" The deadlines are indeed very tight. | \n",
" 0020 | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/8.wav | \n",
" generated_hifi/esd_tune/g_2669999/0020/surprise/8.wav | \n",
" generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/8.wav | \n",
" The deadlines are indeed very tight. | \n",
"
\n",
" \n",
@@ -1232,8 +1233,8 @@
" | 2699 | \n",
" I'm glad you enjoyed yourself. | \n",
" 0020 | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/9.wav | \n",
" generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/9.wav | \n",
" generated_hifi/esd_tune/g_2669999/0020/surprise/9.wav | \n",
" I'm glad you enjoyed yourself. | \n",
"
\n",
@@ -1271,40 +1272,40 @@
"\n",
" m1 \\\n",
"0 id_1 \n",
- "1 generated_hifi/esd_tune_reversal/g_2669999/0011/angry/1.wav \n",
+ "1 generated_hifi/esd_tune/g_2669999/0011/angry/1.wav \n",
"2 id_4 \n",
- "3 generated_hifi/esd_tune/g_2669999/0011/angry/10.wav \n",
+ "3 generated_hifi/esd_tune_reversal/g_2669999/0011/angry/10.wav \n",
"4 id_7 \n",
"... ... \n",
- "2695 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/7.wav \n",
+ "2695 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/7.wav \n",
"2696 id_4045 \n",
- "2697 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/8.wav \n",
+ "2697 generated_hifi/esd_tune/g_2669999/0020/surprise/8.wav \n",
"2698 id_4048 \n",
- "2699 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/9.wav \n",
+ "2699 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/9.wav \n",
"\n",
" m2 \\\n",
"0 id_2 \n",
"1 generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/1.wav \n",
"2 id_5 \n",
- "3 generated_hifi/esd_tune_reversal/g_2669999/0011/angry/10.wav \n",
+ "3 generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/10.wav \n",
"4 id_8 \n",
"... ... \n",
"2695 generated_hifi/esd_tune/g_2669999/0020/surprise/7.wav \n",
"2696 id_4046 \n",
- "2697 generated_hifi/esd_tune/g_2669999/0020/surprise/8.wav \n",
+ "2697 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/8.wav \n",
"2698 id_4049 \n",
- "2699 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/9.wav \n",
+ "2699 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/9.wav \n",
"\n",
" m3 \\\n",
"0 id_3 \n",
- "1 generated_hifi/esd_tune/g_2669999/0011/angry/1.wav \n",
+ "1 generated_hifi/esd_tune_reversal/g_2669999/0011/angry/1.wav \n",
"2 id_6 \n",
- "3 generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/10.wav \n",
+ "3 generated_hifi/esd_tune/g_2669999/0011/angry/10.wav \n",
"4 id_9 \n",
"... ... \n",
- "2695 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/7.wav \n",
+ "2695 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/7.wav \n",
"2696 id_4047 \n",
- "2697 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/8.wav \n",
+ "2697 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/8.wav \n",
"2698 id_4050 \n",
"2699 generated_hifi/esd_tune/g_2669999/0020/surprise/9.wav \n",
"\n",
@@ -1346,7 +1347,7 @@
},
{
"cell_type": "code",
- "execution_count": 15,
+ "execution_count": 14,
"id": "eef3b325-c26e-457a-b575-eb6b210aff7f",
"metadata": {},
"outputs": [],
@@ -1363,7 +1364,7 @@
},
{
"cell_type": "code",
- "execution_count": 16,
+ "execution_count": 15,
"id": "d32630c2-aca7-4ee9-b44c-a949d0fd17c4",
"metadata": {},
"outputs": [],
@@ -1380,7 +1381,7 @@
},
{
"cell_type": "code",
- "execution_count": 17,
+ "execution_count": 16,
"id": "2c11c3ca-abe4-4bbd-930f-8a4f62c9dc8f",
"metadata": {},
"outputs": [],
@@ -1403,7 +1404,7 @@
},
{
"cell_type": "code",
- "execution_count": 18,
+ "execution_count": 17,
"id": "11d84c76-841a-4215-a45f-268076e4ae21",
"metadata": {},
"outputs": [],
@@ -1415,7 +1416,7 @@
},
{
"cell_type": "code",
- "execution_count": 19,
+ "execution_count": 18,
"id": "26b577fe-3957-4902-8758-e5501f5d81a0",
"metadata": {},
"outputs": [],
@@ -1426,7 +1427,7 @@
},
{
"cell_type": "code",
- "execution_count": 20,
+ "execution_count": 19,
"id": "f37b7fb3-93eb-448c-a8a3-a23cb0d165ae",
"metadata": {},
"outputs": [],
@@ -1437,7 +1438,7 @@
},
{
"cell_type": "code",
- "execution_count": 21,
+ "execution_count": 20,
"id": "24aef771-215a-4fe6-82cb-1ff375681189",
"metadata": {
"scrolled": true,
@@ -1530,7 +1531,7 @@
},
{
"cell_type": "code",
- "execution_count": 22,
+ "execution_count": 21,
"id": "49a60285-31bf-4263-9162-c3d928aa9068",
"metadata": {},
"outputs": [
From 72b7bb953d81a2b2e43cac7c5c343bc75d9d67e0 Mon Sep 17 00:00:00 2001
From: ruk0sh <43880105+ruk0sh@users.noreply.github.com>
Date: Sat, 28 May 2022 10:52:53 +0300
Subject: [PATCH 17/17] Update HTML generation notebook
---
generate_listener_html.ipynb | 454 ++++++++++++++++++-----------------
1 file changed, 236 insertions(+), 218 deletions(-)
diff --git a/generate_listener_html.ipynb b/generate_listener_html.ipynb
index a23ed4d..3cf7791 100644
--- a/generate_listener_html.ipynb
+++ b/generate_listener_html.ipynb
@@ -17,7 +17,12 @@
"\n",
"\n",
"pd.set_option('display.max_colwidth', None)\n",
- "pd.set_option('display.colheader_justify', 'center')"
+ "pd.set_option('display.colheader_justify', 'center')\n",
+ "\n",
+ "\n",
+ "REPORTS_DIR = Path('reports')\n",
+ "REPORT_NAME = 'esd_tune_1-2-7'\n",
+ "OUTPUT_DIR = REPORTS_DIR / REPORT_NAME"
]
},
{
@@ -63,7 +68,7 @@
},
{
"cell_type": "code",
- "execution_count": 3,
+ "execution_count": null,
"id": "f0871808-7396-4a82-b529-404babb6be8d",
"metadata": {},
"outputs": [],
@@ -104,22 +109,22 @@
},
{
"cell_type": "code",
- "execution_count": 4,
+ "execution_count": 3,
"id": "d7942da8-a539-4a50-98ef-d93cbdcec403",
"metadata": {},
"outputs": [],
"source": [
"## NOTE: all model keys need to be composed of a single letter followed by a number\n",
"model2folder = {\n",
- " \"m1\": 'generated_hifi/esd_tune/g_2669999',\n",
- " \"m2\": 'generated_hifi/esd_tune_reversal/g_2669999',\n",
- " \"m3\": 'generated_hifi/esd_tune_advloss0/g_2669999',\n",
+ " \"m1\": 'generated_hifi/esd_tune_1/g_2879999',\n",
+ " \"m2\": 'generated_hifi/esd_tune_2/g_2939999',\n",
+ " \"m3\": 'generated_hifi/esd_tune_7/g_3059999',\n",
"}"
]
},
{
"cell_type": "code",
- "execution_count": 5,
+ "execution_count": 4,
"id": "d4d44f9e-525a-4e3d-bb5c-679b64bd7861",
"metadata": {},
"outputs": [],
@@ -129,7 +134,7 @@
},
{
"cell_type": "code",
- "execution_count": 6,
+ "execution_count": 5,
"id": "51e4eae6-ea64-4d69-947c-2a0c7b15678b",
"metadata": {},
"outputs": [
@@ -154,7 +159,7 @@
},
{
"cell_type": "code",
- "execution_count": 7,
+ "execution_count": 6,
"id": "e2031149-e1e8-421f-983c-83833c1b67ad",
"metadata": {},
"outputs": [],
@@ -166,7 +171,7 @@
},
{
"cell_type": "code",
- "execution_count": 8,
+ "execution_count": 7,
"id": "f60b3404-269a-407e-bedd-898b754c5651",
"metadata": {},
"outputs": [
@@ -419,7 +424,7 @@
"[2700 rows x 12 columns]"
]
},
- "execution_count": 8,
+ "execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
@@ -450,7 +455,7 @@
},
{
"cell_type": "code",
- "execution_count": 9,
+ "execution_count": 8,
"id": "2b88d46e-c3af-43eb-8af7-282492147a1f",
"metadata": {},
"outputs": [
@@ -507,9 +512,9 @@
" \n",
" \n",
" | 1 | \n",
- " generated_hifi/esd_tune/g_2669999/0011/angry/1.wav | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0011/angry/1.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_1/g_2879999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_2/g_2939999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_7/g_3059999/0011/angry/1.wav | \n",
" 1.wav | \n",
" 0011 | \n",
" Do you realize what time it is? | \n",
@@ -537,9 +542,9 @@
"
\n",
" \n",
" | 3 | \n",
- " generated_hifi/esd_tune/g_2669999/0011/angry/10.wav | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0011/angry/10.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_1/g_2879999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_2/g_2939999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_7/g_3059999/0011/angry/10.wav | \n",
" 10.wav | \n",
" 0011 | \n",
" What are you still doing here? | \n",
@@ -582,9 +587,9 @@
"
\n",
" \n",
" | 2695 | \n",
- " generated_hifi/esd_tune/g_2669999/0020/surprise/7.wav | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/7.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_1/g_2879999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_2/g_2939999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_7/g_3059999/0020/surprise/7.wav | \n",
" 7.wav | \n",
" 0020 | \n",
" Only one vehicle may be allowed to park at any given time. | \n",
@@ -612,9 +617,9 @@
"
\n",
" \n",
" | 2697 | \n",
- " generated_hifi/esd_tune/g_2669999/0020/surprise/8.wav | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/8.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_1/g_2879999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_2/g_2939999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_7/g_3059999/0020/surprise/8.wav | \n",
" 8.wav | \n",
" 0020 | \n",
" The deadlines are indeed very tight. | \n",
@@ -642,9 +647,9 @@
"
\n",
" \n",
" | 2699 | \n",
- " generated_hifi/esd_tune/g_2669999/0020/surprise/9.wav | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/9.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_1/g_2879999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_2/g_2939999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_7/g_3059999/0020/surprise/9.wav | \n",
" 9.wav | \n",
" 0020 | \n",
" I'm glad you enjoyed yourself. | \n",
@@ -661,57 +666,57 @@
""
],
"text/plain": [
- " m1 \\\n",
- "0 id_1 \n",
- "1 generated_hifi/esd_tune/g_2669999/0011/angry/1.wav \n",
- "2 id_4 \n",
- "3 generated_hifi/esd_tune/g_2669999/0011/angry/10.wav \n",
- "4 id_7 \n",
- "... ... \n",
- "2695 generated_hifi/esd_tune/g_2669999/0020/surprise/7.wav \n",
- "2696 id_4045 \n",
- "2697 generated_hifi/esd_tune/g_2669999/0020/surprise/8.wav \n",
- "2698 id_4048 \n",
- "2699 generated_hifi/esd_tune/g_2669999/0020/surprise/9.wav \n",
+ " m1 \\\n",
+ "0 id_1 \n",
+ "1 generated_hifi/esd_tune_1/g_2879999/0011/angry/1.wav \n",
+ "2 id_4 \n",
+ "3 generated_hifi/esd_tune_1/g_2879999/0011/angry/10.wav \n",
+ "4 id_7 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune_1/g_2879999/0020/surprise/7.wav \n",
+ "2696 id_4045 \n",
+ "2697 generated_hifi/esd_tune_1/g_2879999/0020/surprise/8.wav \n",
+ "2698 id_4048 \n",
+ "2699 generated_hifi/esd_tune_1/g_2879999/0020/surprise/9.wav \n",
"\n",
- " m2 \\\n",
- "0 id_2 \n",
- "1 generated_hifi/esd_tune_reversal/g_2669999/0011/angry/1.wav \n",
- "2 id_5 \n",
- "3 generated_hifi/esd_tune_reversal/g_2669999/0011/angry/10.wav \n",
- "4 id_8 \n",
- "... ... \n",
- "2695 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/7.wav \n",
- "2696 id_4046 \n",
- "2697 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/8.wav \n",
- "2698 id_4049 \n",
- "2699 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/9.wav \n",
+ " m2 \\\n",
+ "0 id_2 \n",
+ "1 generated_hifi/esd_tune_2/g_2939999/0011/angry/1.wav \n",
+ "2 id_5 \n",
+ "3 generated_hifi/esd_tune_2/g_2939999/0011/angry/10.wav \n",
+ "4 id_8 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune_2/g_2939999/0020/surprise/7.wav \n",
+ "2696 id_4046 \n",
+ "2697 generated_hifi/esd_tune_2/g_2939999/0020/surprise/8.wav \n",
+ "2698 id_4049 \n",
+ "2699 generated_hifi/esd_tune_2/g_2939999/0020/surprise/9.wav \n",
"\n",
- " m3 \\\n",
- "0 id_3 \n",
- "1 generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/1.wav \n",
- "2 id_6 \n",
- "3 generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/10.wav \n",
- "4 id_9 \n",
- "... ... \n",
- "2695 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/7.wav \n",
- "2696 id_4047 \n",
- "2697 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/8.wav \n",
- "2698 id_4050 \n",
- "2699 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/9.wav \n",
+ " m3 m1_wavbasename \\\n",
+ "0 id_3 None \n",
+ "1 generated_hifi/esd_tune_7/g_3059999/0011/angry/1.wav 1.wav \n",
+ "2 id_6 None \n",
+ "3 generated_hifi/esd_tune_7/g_3059999/0011/angry/10.wav 10.wav \n",
+ "4 id_9 None \n",
+ "... ... ... \n",
+ "2695 generated_hifi/esd_tune_7/g_3059999/0020/surprise/7.wav 7.wav \n",
+ "2696 id_4047 None \n",
+ "2697 generated_hifi/esd_tune_7/g_3059999/0020/surprise/8.wav 8.wav \n",
+ "2698 id_4050 None \n",
+ "2699 generated_hifi/esd_tune_7/g_3059999/0020/surprise/9.wav 9.wav \n",
"\n",
- " m1_wavbasename m1_accent_speaker \\\n",
- "0 None None \n",
- "1 1.wav 0011 \n",
- "2 None None \n",
- "3 10.wav 0011 \n",
- "4 None None \n",
- "... ... ... \n",
- "2695 7.wav 0020 \n",
- "2696 None None \n",
- "2697 8.wav 0020 \n",
- "2698 None None \n",
- "2699 9.wav 0020 \n",
+ " m1_accent_speaker \\\n",
+ "0 None \n",
+ "1 0011 \n",
+ "2 None \n",
+ "3 0011 \n",
+ "4 None \n",
+ "... ... \n",
+ "2695 0020 \n",
+ "2696 None \n",
+ "2697 0020 \n",
+ "2698 None \n",
+ "2699 0020 \n",
"\n",
" m1_text \\\n",
"0 None \n",
@@ -781,7 +786,7 @@
"[2700 rows x 12 columns]"
]
},
- "execution_count": 9,
+ "execution_count": 8,
"metadata": {},
"output_type": "execute_result"
}
@@ -828,7 +833,7 @@
},
{
"cell_type": "code",
- "execution_count": 10,
+ "execution_count": 9,
"id": "efc3b273-7b7d-4165-aef8-38da88cfc154",
"metadata": {
"tags": []
@@ -858,7 +863,7 @@
},
{
"cell_type": "code",
- "execution_count": 11,
+ "execution_count": 10,
"id": "e3f303a2-0923-4b6a-802c-11c497fe5e58",
"metadata": {},
"outputs": [
@@ -868,7 +873,7 @@
"['m1', 'm2', 'm3']"
]
},
- "execution_count": 11,
+ "execution_count": 10,
"metadata": {},
"output_type": "execute_result"
}
@@ -880,7 +885,7 @@
},
{
"cell_type": "code",
- "execution_count": 12,
+ "execution_count": 11,
"id": "d1b37dd4-39c3-4956-adf0-22cf45b49f85",
"metadata": {},
"outputs": [
@@ -927,9 +932,9 @@
" 1 | \n",
" Do you realize what time it is? | \n",
" 0011 | \n",
- " generated_hifi/esd_tune/g_2669999/0011/angry/1.wav | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0011/angry/1.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_1/g_2879999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_2/g_2939999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_7/g_3059999/0011/angry/1.wav | \n",
" Do you realize what time it is? | \n",
"
\n",
" \n",
@@ -945,9 +950,9 @@
" | 3 | \n",
" What are you still doing here? | \n",
" 0011 | \n",
- " generated_hifi/esd_tune/g_2669999/0011/angry/10.wav | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0011/angry/10.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_1/g_2879999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_2/g_2939999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_7/g_3059999/0011/angry/10.wav | \n",
" What are you still doing here? | \n",
"
\n",
" \n",
@@ -972,9 +977,9 @@
" | 2695 | \n",
" Only one vehicle may be allowed to park at any given time. | \n",
" 0020 | \n",
- " generated_hifi/esd_tune/g_2669999/0020/surprise/7.wav | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/7.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_1/g_2879999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_2/g_2939999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_7/g_3059999/0020/surprise/7.wav | \n",
" Only one vehicle may be allowed to park at any given time. | \n",
"
\n",
" \n",
@@ -990,9 +995,9 @@
" | 2697 | \n",
" The deadlines are indeed very tight. | \n",
" 0020 | \n",
- " generated_hifi/esd_tune/g_2669999/0020/surprise/8.wav | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/8.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_1/g_2879999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_2/g_2939999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_7/g_3059999/0020/surprise/8.wav | \n",
" The deadlines are indeed very tight. | \n",
"
\n",
" \n",
@@ -1008,9 +1013,9 @@
" | 2699 | \n",
" I'm glad you enjoyed yourself. | \n",
" 0020 | \n",
- " generated_hifi/esd_tune/g_2669999/0020/surprise/9.wav | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/9.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_1/g_2879999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_2/g_2939999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_7/g_3059999/0020/surprise/9.wav | \n",
" I'm glad you enjoyed yourself. | \n",
"
\n",
" \n",
@@ -1032,44 +1037,57 @@
"2698 None \n",
"2699 I'm glad you enjoyed yourself. \n",
"\n",
- " m1_accent_speaker m1 \\\n",
- "0 None id_1 \n",
- "1 0011 generated_hifi/esd_tune/g_2669999/0011/angry/1.wav \n",
- "2 None id_4 \n",
- "3 0011 generated_hifi/esd_tune/g_2669999/0011/angry/10.wav \n",
- "4 None id_7 \n",
- "... ... ... \n",
- "2695 0020 generated_hifi/esd_tune/g_2669999/0020/surprise/7.wav \n",
- "2696 None id_4045 \n",
- "2697 0020 generated_hifi/esd_tune/g_2669999/0020/surprise/8.wav \n",
- "2698 None id_4048 \n",
- "2699 0020 generated_hifi/esd_tune/g_2669999/0020/surprise/9.wav \n",
+ " m1_accent_speaker \\\n",
+ "0 None \n",
+ "1 0011 \n",
+ "2 None \n",
+ "3 0011 \n",
+ "4 None \n",
+ "... ... \n",
+ "2695 0020 \n",
+ "2696 None \n",
+ "2697 0020 \n",
+ "2698 None \n",
+ "2699 0020 \n",
+ "\n",
+ " m1 \\\n",
+ "0 id_1 \n",
+ "1 generated_hifi/esd_tune_1/g_2879999/0011/angry/1.wav \n",
+ "2 id_4 \n",
+ "3 generated_hifi/esd_tune_1/g_2879999/0011/angry/10.wav \n",
+ "4 id_7 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune_1/g_2879999/0020/surprise/7.wav \n",
+ "2696 id_4045 \n",
+ "2697 generated_hifi/esd_tune_1/g_2879999/0020/surprise/8.wav \n",
+ "2698 id_4048 \n",
+ "2699 generated_hifi/esd_tune_1/g_2879999/0020/surprise/9.wav \n",
"\n",
- " m2 \\\n",
- "0 id_2 \n",
- "1 generated_hifi/esd_tune_reversal/g_2669999/0011/angry/1.wav \n",
- "2 id_5 \n",
- "3 generated_hifi/esd_tune_reversal/g_2669999/0011/angry/10.wav \n",
- "4 id_8 \n",
- "... ... \n",
- "2695 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/7.wav \n",
- "2696 id_4046 \n",
- "2697 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/8.wav \n",
- "2698 id_4049 \n",
- "2699 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/9.wav \n",
+ " m2 \\\n",
+ "0 id_2 \n",
+ "1 generated_hifi/esd_tune_2/g_2939999/0011/angry/1.wav \n",
+ "2 id_5 \n",
+ "3 generated_hifi/esd_tune_2/g_2939999/0011/angry/10.wav \n",
+ "4 id_8 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune_2/g_2939999/0020/surprise/7.wav \n",
+ "2696 id_4046 \n",
+ "2697 generated_hifi/esd_tune_2/g_2939999/0020/surprise/8.wav \n",
+ "2698 id_4049 \n",
+ "2699 generated_hifi/esd_tune_2/g_2939999/0020/surprise/9.wav \n",
"\n",
- " m3 \\\n",
- "0 id_3 \n",
- "1 generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/1.wav \n",
- "2 id_6 \n",
- "3 generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/10.wav \n",
- "4 id_9 \n",
- "... ... \n",
- "2695 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/7.wav \n",
- "2696 id_4047 \n",
- "2697 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/8.wav \n",
- "2698 id_4050 \n",
- "2699 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/9.wav \n",
+ " m3 \\\n",
+ "0 id_3 \n",
+ "1 generated_hifi/esd_tune_7/g_3059999/0011/angry/1.wav \n",
+ "2 id_6 \n",
+ "3 generated_hifi/esd_tune_7/g_3059999/0011/angry/10.wav \n",
+ "4 id_9 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune_7/g_3059999/0020/surprise/7.wav \n",
+ "2696 id_4047 \n",
+ "2697 generated_hifi/esd_tune_7/g_3059999/0020/surprise/8.wav \n",
+ "2698 id_4050 \n",
+ "2699 generated_hifi/esd_tune_7/g_3059999/0020/surprise/9.wav \n",
"\n",
" m2_text \n",
"0 None \n",
@@ -1087,7 +1105,7 @@
"[2700 rows x 6 columns]"
]
},
- "execution_count": 12,
+ "execution_count": 11,
"metadata": {},
"output_type": "execute_result"
}
@@ -1105,7 +1123,7 @@
},
{
"cell_type": "code",
- "execution_count": 13,
+ "execution_count": 12,
"id": "a9915d2e-01e5-40c0-923b-4bf6bf7389cf",
"metadata": {},
"outputs": [
@@ -1152,9 +1170,9 @@
" 1 | \n",
" Do you realize what time it is? | \n",
" 0011 | \n",
- " generated_hifi/esd_tune/g_2669999/0011/angry/1.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/1.wav | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_2/g_2939999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_7/g_3059999/0011/angry/1.wav | \n",
+ " generated_hifi/esd_tune_1/g_2879999/0011/angry/1.wav | \n",
" Do you realize what time it is? | \n",
" \n",
" \n",
@@ -1170,9 +1188,9 @@
" | 3 | \n",
" What are you still doing here? | \n",
" 0011 | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0011/angry/10.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/10.wav | \n",
- " generated_hifi/esd_tune/g_2669999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_7/g_3059999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_2/g_2939999/0011/angry/10.wav | \n",
+ " generated_hifi/esd_tune_1/g_2879999/0011/angry/10.wav | \n",
" What are you still doing here? | \n",
"
\n",
" \n",
@@ -1197,9 +1215,9 @@
" | 2695 | \n",
" Only one vehicle may be allowed to park at any given time. | \n",
" 0020 | \n",
- " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/7.wav | \n",
- " generated_hifi/esd_tune/g_2669999/0020/surprise/7.wav | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_2/g_2939999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_7/g_3059999/0020/surprise/7.wav | \n",
+ " generated_hifi/esd_tune_1/g_2879999/0020/surprise/7.wav | \n",
" Only one vehicle may be allowed to park at any given time. | \n",
"
\n",
" \n",
@@ -1215,9 +1233,9 @@
" | 2697 | \n",
" The deadlines are indeed very tight. | \n",
" 0020 | \n",
- " generated_hifi/esd_tune/g_2669999/0020/surprise/8.wav | \n",
- " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/8.wav | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_7/g_3059999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_1/g_2879999/0020/surprise/8.wav | \n",
+ " generated_hifi/esd_tune_2/g_2939999/0020/surprise/8.wav | \n",
" The deadlines are indeed very tight. | \n",
"
\n",
" \n",
@@ -1233,9 +1251,9 @@
" | 2699 | \n",
" I'm glad you enjoyed yourself. | \n",
" 0020 | \n",
- " generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/9.wav | \n",
- " generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/9.wav | \n",
- " generated_hifi/esd_tune/g_2669999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_2/g_2939999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_1/g_2879999/0020/surprise/9.wav | \n",
+ " generated_hifi/esd_tune_7/g_3059999/0020/surprise/9.wav | \n",
" I'm glad you enjoyed yourself. | \n",
"
\n",
" \n",
@@ -1270,44 +1288,44 @@
"2698 - \n",
"2699 0020 \n",
"\n",
- " m1 \\\n",
- "0 id_1 \n",
- "1 generated_hifi/esd_tune/g_2669999/0011/angry/1.wav \n",
- "2 id_4 \n",
- "3 generated_hifi/esd_tune_reversal/g_2669999/0011/angry/10.wav \n",
- "4 id_7 \n",
- "... ... \n",
- "2695 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/7.wav \n",
- "2696 id_4045 \n",
- "2697 generated_hifi/esd_tune/g_2669999/0020/surprise/8.wav \n",
- "2698 id_4048 \n",
- "2699 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/9.wav \n",
+ " m1 \\\n",
+ "0 id_1 \n",
+ "1 generated_hifi/esd_tune_2/g_2939999/0011/angry/1.wav \n",
+ "2 id_4 \n",
+ "3 generated_hifi/esd_tune_7/g_3059999/0011/angry/10.wav \n",
+ "4 id_7 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune_2/g_2939999/0020/surprise/7.wav \n",
+ "2696 id_4045 \n",
+ "2697 generated_hifi/esd_tune_7/g_3059999/0020/surprise/8.wav \n",
+ "2698 id_4048 \n",
+ "2699 generated_hifi/esd_tune_2/g_2939999/0020/surprise/9.wav \n",
"\n",
- " m2 \\\n",
- "0 id_2 \n",
- "1 generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/1.wav \n",
- "2 id_5 \n",
- "3 generated_hifi/esd_tune_advloss0/g_2669999/0011/angry/10.wav \n",
- "4 id_8 \n",
- "... ... \n",
- "2695 generated_hifi/esd_tune/g_2669999/0020/surprise/7.wav \n",
- "2696 id_4046 \n",
- "2697 generated_hifi/esd_tune_advloss0/g_2669999/0020/surprise/8.wav \n",
- "2698 id_4049 \n",
- "2699 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/9.wav \n",
+ " m2 \\\n",
+ "0 id_2 \n",
+ "1 generated_hifi/esd_tune_7/g_3059999/0011/angry/1.wav \n",
+ "2 id_5 \n",
+ "3 generated_hifi/esd_tune_2/g_2939999/0011/angry/10.wav \n",
+ "4 id_8 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune_7/g_3059999/0020/surprise/7.wav \n",
+ "2696 id_4046 \n",
+ "2697 generated_hifi/esd_tune_1/g_2879999/0020/surprise/8.wav \n",
+ "2698 id_4049 \n",
+ "2699 generated_hifi/esd_tune_1/g_2879999/0020/surprise/9.wav \n",
"\n",
- " m3 \\\n",
- "0 id_3 \n",
- "1 generated_hifi/esd_tune_reversal/g_2669999/0011/angry/1.wav \n",
- "2 id_6 \n",
- "3 generated_hifi/esd_tune/g_2669999/0011/angry/10.wav \n",
- "4 id_9 \n",
- "... ... \n",
- "2695 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/7.wav \n",
- "2696 id_4047 \n",
- "2697 generated_hifi/esd_tune_reversal/g_2669999/0020/surprise/8.wav \n",
- "2698 id_4050 \n",
- "2699 generated_hifi/esd_tune/g_2669999/0020/surprise/9.wav \n",
+ " m3 \\\n",
+ "0 id_3 \n",
+ "1 generated_hifi/esd_tune_1/g_2879999/0011/angry/1.wav \n",
+ "2 id_6 \n",
+ "3 generated_hifi/esd_tune_1/g_2879999/0011/angry/10.wav \n",
+ "4 id_9 \n",
+ "... ... \n",
+ "2695 generated_hifi/esd_tune_1/g_2879999/0020/surprise/7.wav \n",
+ "2696 id_4047 \n",
+ "2697 generated_hifi/esd_tune_2/g_2939999/0020/surprise/8.wav \n",
+ "2698 id_4050 \n",
+ "2699 generated_hifi/esd_tune_7/g_3059999/0020/surprise/9.wav \n",
"\n",
" m2_text \n",
"0 - \n",
@@ -1325,7 +1343,7 @@
"[2700 rows x 6 columns]"
]
},
- "execution_count": 13,
+ "execution_count": 12,
"metadata": {},
"output_type": "execute_result"
}
@@ -1352,9 +1370,9 @@
"metadata": {},
"outputs": [],
"source": [
- "Path('reports').mkdir(exist_ok=True)\n",
+ "OUTPUT_DIR.mkdir(exist_ok=True, parents=True)\n",
"df_permuted.to_csv(\n",
- " 'reports/eval_map.csv',\n",
+ " OUTPUT_DIR / 'eval_map.csv',\n",
" sep = \"\\t\",\n",
" header = False,\n",
" index = False,\n",
@@ -1432,7 +1450,7 @@
"metadata": {},
"outputs": [],
"source": [
- "output_folder = Path('reports/html')\n",
+ "output_folder = OUTPUT_DIR / 'html'\n",
"output_folder.mkdir(parents=True, exist_ok=True)"
]
},
@@ -1450,59 +1468,59 @@
"output_type": "stream",
"text": [
"0 100\n",
- "reports/html/nat_vctk_esd_tune_test_1.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_1.html\n",
"100 200\n",
- "reports/html/nat_vctk_esd_tune_test_2.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_2.html\n",
"200 300\n",
- "reports/html/nat_vctk_esd_tune_test_3.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_3.html\n",
"300 400\n",
- "reports/html/nat_vctk_esd_tune_test_4.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_4.html\n",
"400 500\n",
- "reports/html/nat_vctk_esd_tune_test_5.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_5.html\n",
"500 600\n",
- "reports/html/nat_vctk_esd_tune_test_6.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_6.html\n",
"600 700\n",
- "reports/html/nat_vctk_esd_tune_test_7.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_7.html\n",
"700 800\n",
- "reports/html/nat_vctk_esd_tune_test_8.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_8.html\n",
"800 900\n",
- "reports/html/nat_vctk_esd_tune_test_9.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_9.html\n",
"900 1000\n",
- "reports/html/nat_vctk_esd_tune_test_10.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_10.html\n",
"1000 1100\n",
- "reports/html/nat_vctk_esd_tune_test_11.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_11.html\n",
"1100 1200\n",
- "reports/html/nat_vctk_esd_tune_test_12.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_12.html\n",
"1200 1300\n",
- "reports/html/nat_vctk_esd_tune_test_13.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_13.html\n",
"1300 1400\n",
- "reports/html/nat_vctk_esd_tune_test_14.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_14.html\n",
"1400 1500\n",
- "reports/html/nat_vctk_esd_tune_test_15.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_15.html\n",
"1500 1600\n",
- "reports/html/nat_vctk_esd_tune_test_16.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_16.html\n",
"1600 1700\n",
- "reports/html/nat_vctk_esd_tune_test_17.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_17.html\n",
"1700 1800\n",
- "reports/html/nat_vctk_esd_tune_test_18.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_18.html\n",
"1800 1900\n",
- "reports/html/nat_vctk_esd_tune_test_19.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_19.html\n",
"1900 2000\n",
- "reports/html/nat_vctk_esd_tune_test_20.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_20.html\n",
"2000 2100\n",
- "reports/html/nat_vctk_esd_tune_test_21.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_21.html\n",
"2100 2200\n",
- "reports/html/nat_vctk_esd_tune_test_22.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_22.html\n",
"2200 2300\n",
- "reports/html/nat_vctk_esd_tune_test_23.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_23.html\n",
"2300 2400\n",
- "reports/html/nat_vctk_esd_tune_test_24.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_24.html\n",
"2400 2500\n",
- "reports/html/nat_vctk_esd_tune_test_25.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_25.html\n",
"2500 2600\n",
- "reports/html/nat_vctk_esd_tune_test_26.html\n",
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_26.html\n",
"2600 2700\n",
- "reports/html/nat_vctk_esd_tune_test_27.html\n"
+ "reports/esd_tune_1-2-7/html/nat_vctk_esd_tune_test_27.html\n"
]
}
],
@@ -1539,8 +1557,8 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "reports/scores/scores.csv\n",
- "reports/scores/scores.xlsx\n"
+ "reports/esd_tune_1-2-7/scores/scores.csv\n",
+ "reports/esd_tune_1-2-7/scores/scores.xlsx\n"
]
}
],
@@ -1569,7 +1587,7 @@
" print(excel_path)\n",
"\n",
"\n",
- "create_scores_file(df_permuted, \"reports/scores\")"
+ "create_scores_file(df_permuted, OUTPUT_DIR / \"scores\")"
]
}
],