diff --git a/.dvc/.gitignore b/.dvc/.gitignore new file mode 100644 index 0000000..62a67db --- /dev/null +++ b/.dvc/.gitignore @@ -0,0 +1,8 @@ +/lock +/config.local +/updater +/updater.lock +/state-journal +/state-wal +/state +/cache diff --git a/.dvc/config b/.dvc/config new file mode 100644 index 0000000..fb0bf91 --- /dev/null +++ b/.dvc/config @@ -0,0 +1,4 @@ +['remote "jsde"'] +url = ssh://me@janek-schleicher.de:/home/me/data/ocrd_segments +[core] +remote = jsde diff --git a/.gitignore b/.gitignore index fb78ca3..272bb42 100644 --- a/.gitignore +++ b/.gitignore @@ -106,3 +106,8 @@ venv.bak/ # vim tmp *.swp *.swo + +# Input files +/input +/downscale* +/masks* diff --git a/README.md b/README.md index 6755a56..dfd61f6 100644 --- a/README.md +++ b/README.md @@ -6,3 +6,26 @@ This repository aims to provide a number of OCR-D-compliant processors for layou - data-driven segmentation aka. `ocrd-segment-via-model` (input file groups N=1, based on a statistical model, e.g. Neural Network) - comparing different layout segmentations aka. `ocrd-segment-evaluate` (input file groups N = 2, compute the distance between two segmentations, e.g. automatic vs. manual) - repairing of layout segmentations aka. 
`ocrd-segment-repair` (input file groups N >= 1, based on heuristics implemented using Shapely) + + +## Installation + +### Requirements + + $ virtualenv env --python=python3.7 # 3.8 did not yet work with all needed libraries as of 2019-08-21 + $ source env/bin/activate + (env) pip install -r requirements.txt # TODO(js): Pin requirements + +### Jupyter Notebook Kernel preparation (to use the virtualenv) + + # XXX(js): Not sure whether we'll need it for a + (env) ipython kernel install --user ocrd-segmentations + +#### For those who like Vim key bindings + + (env) jupyter nbextension install https://raw.githubusercontent.com/lambdalisue/jupyter-vim-binding/master/vim_binding.js --nbextensions=$(jupyter --data-dir)/nbextensions/vim_binding + (env) jupyter nbextension enable vim_binding/vim_binding + +#### Run the Jupyter notebook + + (env) jupyter notebook diff --git a/downscale_to_4th/.gitignore b/downscale_to_4th/.gitignore new file mode 100644 index 0000000..f633594 --- /dev/null +++ b/downscale_to_4th/.gitignore @@ -0,0 +1 @@ +/models diff --git a/downscale_to_4th/models.dvc b/downscale_to_4th/models.dvc new file mode 100644 index 0000000..2b9eff0 --- /dev/null +++ b/downscale_to_4th/models.dvc @@ -0,0 +1,8 @@ +md5: 028b7fab56f70c52f962fad0d19ed1a2 +wdir: . 
+outs: +- md5: 7dac48b7918bc02e6b49b56daade5fad.dir + path: models + cache: true + metric: false + persist: false diff --git a/notebooks/1stOverview.ipynb b/notebooks/1stOverview.ipynb new file mode 100644 index 0000000..013d90f --- /dev/null +++ b/notebooks/1stOverview.ipynb @@ -0,0 +1,4956 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# OCRD - A 1st Overview \n", + "\n", + "Here I'll look into the data and train a model following https://towardsdatascience.com/fastai-image-segmentation-eacad8543f6f\n", + "\n", + "## Imports" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": { + "ExecuteTime": { + "end_time": "2019-09-09T12:13:59.305777Z", + "start_time": "2019-09-09T12:13:59.160423Z" + }, + "init_cell": true + }, + "outputs": [], + "source": [ + "import hashlib\n", + "import imghdr\n", + "import os\n", + "from pathlib import PosixPath\n", + "import re\n", + "from tqdm import tqdm_notebook\n", + "from zipfile import ZipFile\n", + "import xml.etree.ElementTree as ET\n", + "\n", + "from PIL import ImageDraw\n", + "from display_xml import XML\n", + "from fastai.vision import *\n", + "import seaborn as sns\n", + "from shapely.geometry import Polygon as ShapelyPolygon\n", + "\n", + "from loguru import logger\n", + "\n", + "!mkdir -p ../input\n", + "BAGS = PosixPath(os.path.expanduser('~/Dropbox/0bags'))\n", + "INPUT = PosixPath('../input/')\n", + "\n", + "RESIZE_FACTOR = 4 # 1/4th of the original images should be good enough to get a first idea\n", + "INPUT_RESIZED = PosixPath(f'../downscale_to_{RESIZE_FACTOR}th')\n", + "\n", + "MASKS = PosixPath('../masks')\n", + "MASKS_RESIZED = PosixPath(f'../masks_downscale_to{RESIZE_FACTOR}th')" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "ExecuteTime": { + "end_time": "2019-09-07T17:19:13.997979Z", + "start_time": "2019-09-07T17:19:13.995193Z" + } + }, + "source": [ + "## Unzip input data from the (Dropbox) folder" + ] + }, + { + "cell_type": "code", + 
"execution_count": 4, + "metadata": { + "ExecuteTime": { + "end_time": "2019-09-09T12:13:59.419255Z", + "start_time": "2019-09-09T12:13:59.307212Z" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[PosixPath('/home/janek/Dropbox/0bags/stein_verwaltungslehre07_1868.zip'), PosixPath('/home/janek/Dropbox/0bags/buesch_handlung01_1792.zip'), PosixPath('/home/janek/Dropbox/0bags/brunner_rechtsgeschichte01_1887.zip'), PosixPath('/home/janek/Dropbox/0bags/karsch_gedichte_1792.zip'), PosixPath('/home/janek/Dropbox/0bags/steinen_naturvoelker_1894.zip')] 211\n", + "2,9G\t/home/janek/Dropbox/0bags\r\n" + ] + } + ], + "source": [ + "zip_archives = BAGS.ls()\n", + "print(zip_archives[:5], len(zip_archives))\n", + "!du -sh ~/Dropbox/0bags" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": { + "ExecuteTime": { + "end_time": "2019-09-09T12:14:12.164355Z", + "start_time": "2019-09-09T12:13:59.421101Z" + } + }, + "outputs": [ + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "63e1c3a9caff4de2b89107b9b8350d3d", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "HBox(children=(IntProgress(value=1, bar_style='info', max=1), HTML(value='')))" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n" + ] + } + ], + "source": [ + "for f in tqdm_notebook(filter(lambda f: f.name.endswith('.zip'), BAGS.ls())):\n", + " dest = INPUT / f.name.replace('.zip', '')\n", + " ZipFile(f, 'r').extractall(dest)" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "ExecuteTime": { + "end_time": "2019-09-07T17:20:13.290332Z", + "start_time": "2019-09-07T17:20:13.285400Z" + } + }, + "source": [ + "## Give image files a .jpeg or whatever suffix\n", + "\n", + "fastai atm needs it to work correctly (but it's also a nice check of the data integrity, too)" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + 
"metadata": { + "ExecuteTime": { + "end_time": "2019-09-09T12:14:13.115681Z", + "start_time": "2019-09-09T12:14:12.165973Z" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Found image files [PosixPath('fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0009.jpeg'), PosixPath('fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0011.jpeg'), PosixPath('fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0014.jpeg'), PosixPath('fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0014.jpeg'), PosixPath('fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0013.jpeg')] ... [PosixPath('mohr_fachwerk02_1875/data/OCR-D-IMG/OCR-D-IMG_0020.jpeg'), PosixPath('gerber_staatsrecht_1865/data/OCR-D-IMG/OCR-D-IMG_0020.jpeg'), PosixPath('gerber_staatsrecht_1865/data/OCR-D-IMG/OCR-D-IMG_0020.jpeg'), PosixPath('dahlmann_politik_1835/data/OCR-D-IMG/OCR-D-IMG_0020.jpeg'), PosixPath('dahlmann_politik_1835/data/OCR-D-IMG/OCR-D-IMG_0020.jpeg')]\n", + "Found image types {'.jpeg'}\n" + ] + } + ], + "source": [ + "imgfiles = []\n", + "imgtypes = set()\n", + "\n", + "for root, dirs, files in os.walk(INPUT):\n", + " path = PosixPath(root)\n", + " if path.name != \"OCR-D-IMG\": continue\n", + " for imgf in [PosixPath(f) for f in files]:\n", + " if not imgf.suffix:\n", + " imgtype = imghdr.what(path / imgf.name)\n", + " file_with_jpeg_or_whatever = (imgf.name + \".\" + imgtype)\n", + " os.rename(path / imgf, path / file_with_jpeg_or_whatever)\n", + " imgf = PosixPath(file_with_jpeg_or_whatever)\n", + " imgtypes.add(imgf.suffix)\n", + " imgfiles.append((path / imgf).relative_to(INPUT))\n", + "print(\"Found image files\", imgfiles[:5], \"...\", imgfiles[-5:])\n", + "print(\"Found image types\", imgtypes)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Get an overview of original resolutions" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": { + "ExecuteTime": { + 
"end_time": "2019-09-09T12:14:13.478098Z", + "start_time": "2019-09-09T12:14:13.116898Z" + } + }, + "outputs": [ + { + "data": { + "text/html": [ + "
| \n", + " | orig | \n", + "res | \n", + "width | \n", + "height | \n", + "ratio | \n", + "
|---|---|---|---|---|---|
| 0 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0009.jpeg | \n", + "(2724, 3578) | \n", + "2724 | \n", + "3578 | \n", + "1.31351 | \n", + "
| 1 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0011.jpeg | \n", + "(2724, 3578) | \n", + "2724 | \n", + "3578 | \n", + "1.31351 | \n", + "
| 2 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0014.jpeg | \n", + "(2724, 3578) | \n", + "2724 | \n", + "3578 | \n", + "1.31351 | \n", + "
| 3 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0014.jpeg | \n", + "(2724, 3578) | \n", + "2724 | \n", + "3578 | \n", + "1.31351 | \n", + "
| 4 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0013.jpeg | \n", + "(2724, 3578) | \n", + "2724 | \n", + "3578 | \n", + "1.31351 | \n", + "
| \n", + " | width | \n", + "height | \n", + "orig | \n", + "res | \n", + "ratio | \n", + "
|---|---|---|---|---|---|
| 0 | \n", + "2486 | \n", + "3404 | \n", + "118 | \n", + "118 | \n", + "118 | \n", + "
| 1 | \n", + "1560 | \n", + "2241 | \n", + "40 | \n", + "40 | \n", + "40 | \n", + "
| 2 | \n", + "2328 | \n", + "3177 | \n", + "38 | \n", + "38 | \n", + "38 | \n", + "
| 3 | \n", + "1611 | \n", + "2421 | \n", + "38 | \n", + "38 | \n", + "38 | \n", + "
| 4 | \n", + "1563 | \n", + "2304 | \n", + "28 | \n", + "28 | \n", + "28 | \n", + "
| \n", + " | orig | \n", + "res | \n", + "width | \n", + "height | \n", + "ratio | \n", + "ann | \n", + "
|---|---|---|---|---|---|---|
| 0 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0009.jpeg | \n", + "(2724, 3578) | \n", + "2724 | \n", + "3578 | \n", + "1.31351 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-GT-SEG-BLOCK/OCR-D-GT-SEG-BLOCK_0009 | \n", + "
| 1 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0011.jpeg | \n", + "(2724, 3578) | \n", + "2724 | \n", + "3578 | \n", + "1.31351 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-GT-SEG-BLOCK/OCR-D-GT-SEG-BLOCK_0011 | \n", + "
| 2 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0014.jpeg | \n", + "(2724, 3578) | \n", + "2724 | \n", + "3578 | \n", + "1.31351 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-GT-SEG-BLOCK/OCR-D-GT-SEG-BLOCK_0014 | \n", + "
| 3 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0014.jpeg | \n", + "(2724, 3578) | \n", + "2724 | \n", + "3578 | \n", + "1.31351 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-GT-SEG-BLOCK/OCR-D-GT-SEG-BLOCK_0014 | \n", + "
| 4 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0013.jpeg | \n", + "(2724, 3578) | \n", + "2724 | \n", + "3578 | \n", + "1.31351 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-GT-SEG-BLOCK/OCR-D-GT-SEG-BLOCK_0013 | \n", + "
<PcGts xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://schema.primaresearch.org/PAGE/gts/pagecontent/2019-07-15 http://schema.primaresearch.org/PAGE/gts/pagecontent/2019-07-15/pagecontent.xsd">\n",
+ " <Metadata>\n",
+ " <Creator>Deutsches Textarchiv</Creator>\n",
+ " <Created>2018-03-22T09:11:30</Created>\n",
+ " <LastChange>2019-07-23T11:28:33</LastChange>\n",
+ " </Metadata>\n",
+ " <Page imageFilename="fischer_werkzeugmaschinen01_1900_0023.jpg" imageWidth="2724" imageHeight="3578" type="content">\n",
+ " <Border>\n",
+ " <Coords points="13,260 13,3421 2217,3421 2217,260"/>\n",
+ " </Border>\n",
+ " <ReadingOrder>\n",
+ " <OrderedGroup id="ro357564684568544579089" caption="Regions reading order">\n",
+ " <RegionRefIndexed regionRef="region_1" index="0"/>\n",
+ " <RegionRefIndexed regionRef="region_2" index="1"/>\n",
+ " <RegionRefIndexed regionRef="r1" index="2"/>\n",
+ " <RegionRefIndexed regionRef="r5" index="3"/>\n",
+ " <RegionRefIndexed regionRef="region_5" index="4"/>\n",
+ " <RegionRefIndexed regionRef="r7" index="5"/>\n",
+ " </OrderedGroup>\n",
+ " </ReadingOrder>\n",
+ " <TextRegion id="region_1" type="header">\n",
+ " <Coords points="526,440 1475,440 1475,535 526,535"/>\n",
+ " <TextEquiv>\n",
+ " <Unicode/>\n",
+ " </TextEquiv>\n",
+ " </TextRegion>\n",
+ " <TextRegion id="region_2" type="page-number">\n",
+ " <Coords points="1686,450 1775,450 1775,532 1686,532"/>\n",
+ " <TextEquiv>\n",
+ " <Unicode/>\n",
+ " </TextEquiv>\n",
+ " </TextRegion>\n",
+ " <GraphicRegion id="region_4">\n",
+ " <Coords points="306,1253 1740,1253 1740,2205 306,2205"/>\n",
+ " </GraphicRegion>\n",
+ " <TextRegion id="region_5" type="caption">\n",
+ " <Coords points="890,2203 1082,2203 1082,2253 890,2253"/>\n",
+ " <TextEquiv>\n",
+ " <Unicode/>\n",
+ " </TextEquiv>\n",
+ " </TextRegion>\n",
+ " <TextRegion id="r1" type="paragraph">\n",
+ " <Coords points="1802,546 1802,799 1712,799 1712,798 1531,798 1531,797 1349,797 1349,796 1168,796 1168,795 987,795 987,794 805,794 805,793 624,793 624,792 443,792 443,791 261,791 261,790 170,790 170,546"/>\n",
+ " <TextEquiv>\n",
+ " <Unicode/>\n",
+ " </TextEquiv>\n",
+ " </TextRegion>\n",
+ " <TextRegion id="r5" type="paragraph">\n",
+ " <Coords points="260,792 260,793 442,793 442,794 623,794 623,795 804,795 804,796 986,796 986,797 1167,797 1167,798 1348,798 1348,799 1530,799 1530,800 1711,800 1711,801 1802,801 1802,2838 1779,2838 1779,2837 1733,2837 1733,2836 1686,2836 1686,2835 1639,2835 1639,2834 1593,2834 1593,2833 1546,2833 1546,2832 1499,2832 1499,2831 1453,2831 1453,2830 1406,2830 1406,2829 1360,2829 1360,2828 1313,2828 1313,2827 1266,2827 1266,2826 1220,2826 1220,2825 1173,2825 1173,2824 1126,2824 1126,2823 1080,2823 1080,2822 1033,2822 1033,2821 987,2821 987,2820 940,2820 940,2819 893,2819 893,2818 847,2818 847,2817 800,2817 800,2816 753,2816 753,2815 707,2815 707,2814 660,2814 660,2813 613,2813 613,2812 567,2812 567,2811 520,2811 520,2810 474,2810 474,2809 427,2809 427,2808 380,2808 380,2807 334,2807 334,2806 287,2806 287,2805 240,2805 240,2804 194,2804 194,2803 170,2803 170,792"/>\n",
+ " <TextEquiv>\n",
+ " <Unicode/>\n",
+ " </TextEquiv>\n",
+ " </TextRegion>\n",
+ " <TextRegion id="r7" type="paragraph">\n",
+ " <Coords points="193,2805 193,2806 239,2806 239,2807 286,2807 286,2808 333,2808 333,2809 379,2809 379,2810 426,2810 426,2811 473,2811 473,2812 519,2812 519,2813 566,2813 566,2814 612,2814 612,2815 659,2815 659,2816 706,2816 706,2817 752,2817 752,2818 799,2818 799,2819 846,2819 846,2820 892,2820 892,2821 939,2821 939,2822 986,2822 986,2823 1032,2823 1032,2824 1079,2824 1079,2825 1125,2825 1125,2826 1172,2826 1172,2827 1219,2827 1219,2828 1265,2828 1265,2829 1312,2829 1312,2830 1359,2830 1359,2831 1405,2831 1405,2832 1452,2832 1452,2833 1498,2833 1498,2834 1545,2834 1545,2835 1592,2835 1592,2836 1638,2836 1638,2837 1685,2837 1685,2838 1732,2838 1732,2839 1778,2839 1778,2840 1802,2840 1802,3076 170,3076 170,2805"/>\n",
+ " <TextEquiv>\n",
+ " <Unicode/>\n",
+ " </TextEquiv>\n",
+ " </TextRegion>\n",
+ " </Page>\n",
+ "</PcGts>\n",
+ "| \n", + " | path | \n", + "label | \n", + "points | \n", + "is_node | \n", + "
|---|---|---|---|---|
| 0 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0009.jpeg | \n", + "Border | \n", + "13 260 13 3421 2217 3421 2217 260 | \n", + "False | \n", + "
| 1 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0009.jpeg | \n", + "TextRegion-header | \n", + "526 440 1475 440 1475 535 526 535 | \n", + "True | \n", + "
| 2 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0009.jpeg | \n", + "TextRegion-page-number | \n", + "1686 450 1775 450 1775 532 1686 532 | \n", + "True | \n", + "
| 3 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0009.jpeg | \n", + "GraphicRegion | \n", + "306 1253 1740 1253 1740 2205 306 2205 | \n", + "True | \n", + "
| 4 | \n", + "fischer_werkzeugmaschinen01_1900/data/OCR-D-IMG/OCR-D-IMG_0009.jpeg | \n", + "TextRegion-caption | \n", + "890 2203 1082 2203 1082 2253 890 2253 | \n", + "True | \n", + "
| is_node | \n", + "False | \n", + "True | \n", + "
|---|---|---|
| label | \n", + "\n", + " | \n", + " |
| Border | \n", + "2098 | \n", + "26 | \n", + "
| GraphicRegion | \n", + "4 | \n", + "436 | \n", + "
| GraphicRegion-barcode | \n", + "0 | \n", + "114 | \n", + "
| GraphicRegion-decoration | \n", + "0 | \n", + "2 | \n", + "
| GraphicRegion-handwritten-annotation | \n", + "0 | \n", + "56 | \n", + "
| GraphicRegion-other | \n", + "0 | \n", + "10 | \n", + "
| GraphicRegion-stamp | \n", + "0 | \n", + "54 | \n", + "
| MathsRegion | \n", + "0 | \n", + "270 | \n", + "
| NoiseRegion | \n", + "0 | \n", + "42 | \n", + "
| PrintSpace | \n", + "12 | \n", + "0 | \n", + "
| SeparatorRegion | \n", + "0 | \n", + "990 | \n", + "
| TableRegion | \n", + "4 | \n", + "392 | \n", + "
| TextRegion-caption | \n", + "0 | \n", + "306 | \n", + "
| TextRegion-catch-word | \n", + "0 | \n", + "270 | \n", + "
| TextRegion-drop-capital | \n", + "0 | \n", + "26 | \n", + "
| TextRegion-endnote | \n", + "2 | \n", + "54 | \n", + "
| TextRegion-footnote | \n", + "42 | \n", + "660 | \n", + "
| TextRegion-footnote-continued | \n", + "30 | \n", + "132 | \n", + "
| TextRegion-header | \n", + "0 | \n", + "664 | \n", + "
| TextRegion-heading | \n", + "16 | \n", + "782 | \n", + "
| TextRegion-marginalia | \n", + "0 | \n", + "76 | \n", + "
| TextRegion-other | \n", + "10 | \n", + "36 | \n", + "
| TextRegion-page-number | \n", + "0 | \n", + "1702 | \n", + "
| TextRegion-paragraph | \n", + "130 | \n", + "6204 | \n", + "
| TextRegion-signature-mark | \n", + "0 | \n", + "430 | \n", + "
| epoch | \n", + "train_loss | \n", + "valid_loss | \n", + "acc_page_seg | \n", + "time | \n", + "
|---|---|---|---|---|
| 0 | \n", + "2.452248 | \n", + "1.807067 | \n", + "0.545857 | \n", + "00:02 | \n", + "
| 1 | \n", + "1.769129 | \n", + "1.071561 | \n", + "0.627103 | \n", + "00:02 | \n", + "
| 2 | \n", + "1.495252 | \n", + "1.182628 | \n", + "0.610088 | \n", + "00:02 | \n", + "
| 3 | \n", + "1.315170 | \n", + "0.915134 | \n", + "0.641344 | \n", + "00:02 | \n", + "
| 4 | \n", + "1.200313 | \n", + "0.984348 | \n", + "0.630071 | \n", + "00:02 | \n", + "
| 5 | \n", + "1.141517 | \n", + "1.070440 | \n", + "0.606206 | \n", + "00:02 | \n", + "
| 6 | \n", + "1.089557 | \n", + "0.870575 | \n", + "0.699404 | \n", + "00:02 | \n", + "
| 7 | \n", + "1.031176 | \n", + "0.958292 | \n", + "0.650068 | \n", + "00:02 | \n", + "
| 8 | \n", + "0.982741 | \n", + "1.379658 | \n", + "0.548396 | \n", + "00:02 | \n", + "
| 9 | \n", + "0.982213 | \n", + "1.001716 | \n", + "0.614245 | \n", + "00:02 | \n", + "
| 10 | \n", + "0.951769 | \n", + "0.883827 | \n", + "0.644286 | \n", + "00:02 | \n", + "
| 11 | \n", + "0.918825 | \n", + "0.819393 | \n", + "0.681505 | \n", + "00:02 | \n", + "
| 12 | \n", + "0.888211 | \n", + "0.861060 | \n", + "0.648050 | \n", + "00:02 | \n", + "
| 13 | \n", + "0.853995 | \n", + "0.758634 | \n", + "0.766083 | \n", + "00:02 | \n", + "
| 14 | \n", + "0.822879 | \n", + "0.754266 | \n", + "0.714894 | \n", + "00:02 | \n", + "
| 15 | \n", + "0.787230 | \n", + "0.735747 | \n", + "0.720275 | \n", + "00:02 | \n", + "
| 16 | \n", + "0.757013 | \n", + "0.722201 | \n", + "0.758523 | \n", + "00:02 | \n", + "
| 17 | \n", + "0.730336 | \n", + "0.725784 | \n", + "0.744105 | \n", + "00:02 | \n", + "
| 18 | \n", + "0.709491 | \n", + "0.723612 | \n", + "0.738678 | \n", + "00:02 | \n", + "
| 19 | \n", + "0.684921 | \n", + "0.725369 | \n", + "0.738656 | \n", + "00:02 | \n", + "
| epoch | \n", + "train_loss | \n", + "valid_loss | \n", + "acc_page_seg | \n", + "time | \n", + "
|---|---|---|---|---|
| 0 | \n", + "0.584415 | \n", + "0.717265 | \n", + "0.732786 | \n", + "00:02 | \n", + "
| 1 | \n", + "0.596830 | \n", + "0.717026 | \n", + "0.733570 | \n", + "00:02 | \n", + "
| 2 | \n", + "0.601436 | \n", + "0.709002 | \n", + "0.736122 | \n", + "00:02 | \n", + "
| 3 | \n", + "0.599550 | \n", + "0.713888 | \n", + "0.736920 | \n", + "00:02 | \n", + "
| 4 | \n", + "0.600833 | \n", + "0.717822 | \n", + "0.738619 | \n", + "00:02 | \n", + "
| 5 | \n", + "0.598980 | \n", + "0.708948 | \n", + "0.741125 | \n", + "00:02 | \n", + "
| 6 | \n", + "0.595457 | \n", + "0.718515 | \n", + "0.739681 | \n", + "00:02 | \n", + "
| 7 | \n", + "0.596278 | \n", + "0.707717 | \n", + "0.742567 | \n", + "00:02 | \n", + "
| 8 | \n", + "0.596528 | \n", + "0.706706 | \n", + "0.743171 | \n", + "00:02 | \n", + "
| 9 | \n", + "0.594696 | \n", + "0.722052 | \n", + "0.740183 | \n", + "00:02 | \n", + "
| 10 | \n", + "0.596291 | \n", + "0.724721 | \n", + "0.746806 | \n", + "00:02 | \n", + "
| 11 | \n", + "0.592152 | \n", + "0.723754 | \n", + "0.742798 | \n", + "00:02 | \n", + "
| 12 | \n", + "0.590340 | \n", + "0.718343 | \n", + "0.738748 | \n", + "00:02 | \n", + "
| 13 | \n", + "0.588927 | \n", + "0.720416 | \n", + "0.741374 | \n", + "00:02 | \n", + "
| 14 | \n", + "0.587207 | \n", + "0.742684 | \n", + "0.744403 | \n", + "00:02 | \n", + "
| 15 | \n", + "0.581254 | \n", + "0.720121 | \n", + "0.733174 | \n", + "00:02 | \n", + "
| 16 | \n", + "0.574009 | \n", + "0.731865 | \n", + "0.744466 | \n", + "00:02 | \n", + "
| 17 | \n", + "0.567083 | \n", + "0.752474 | \n", + "0.721190 | \n", + "00:02 | \n", + "
| 18 | \n", + "0.557811 | \n", + "0.754703 | \n", + "0.726039 | \n", + "00:02 | \n", + "
| 19 | \n", + "0.546790 | \n", + "0.758058 | \n", + "0.734499 | \n", + "00:02 | \n", + "
| 20 | \n", + "0.539660 | \n", + "0.848547 | \n", + "0.682513 | \n", + "00:02 | \n", + "
| 21 | \n", + "0.525566 | \n", + "0.831548 | \n", + "0.702605 | \n", + "00:02 | \n", + "
| 22 | \n", + "0.519638 | \n", + "0.850751 | \n", + "0.677162 | \n", + "00:02 | \n", + "
| 23 | \n", + "0.509766 | \n", + "0.764902 | \n", + "0.694895 | \n", + "00:02 | \n", + "
| 24 | \n", + "0.499675 | \n", + "0.747176 | \n", + "0.715577 | \n", + "00:02 | \n", + "
| 25 | \n", + "0.488455 | \n", + "0.803307 | \n", + "0.702361 | \n", + "00:02 | \n", + "
| 26 | \n", + "0.470106 | \n", + "0.816956 | \n", + "0.691701 | \n", + "00:02 | \n", + "
| 27 | \n", + "0.466768 | \n", + "0.905624 | \n", + "0.665994 | \n", + "00:02 | \n", + "
| 28 | \n", + "0.453087 | \n", + "0.889961 | \n", + "0.663313 | \n", + "00:02 | \n", + "
| 29 | \n", + "0.434629 | \n", + "0.997205 | \n", + "0.665704 | \n", + "00:02 | \n", + "
| 30 | \n", + "0.422546 | \n", + "1.024793 | \n", + "0.662768 | \n", + "00:02 | \n", + "
| 31 | \n", + "0.410276 | \n", + "0.977791 | \n", + "0.690631 | \n", + "00:02 | \n", + "
| 32 | \n", + "0.407085 | \n", + "0.961790 | \n", + "0.692910 | \n", + "00:02 | \n", + "
| 33 | \n", + "0.402581 | \n", + "0.994130 | \n", + "0.683384 | \n", + "00:02 | \n", + "
| 34 | \n", + "0.389217 | \n", + "0.915918 | \n", + "0.682508 | \n", + "00:02 | \n", + "
| 35 | \n", + "0.375071 | \n", + "0.932147 | \n", + "0.684412 | \n", + "00:02 | \n", + "
| 36 | \n", + "0.358268 | \n", + "0.949784 | \n", + "0.686377 | \n", + "00:02 | \n", + "
| 37 | \n", + "0.341819 | \n", + "1.001307 | \n", + "0.686088 | \n", + "00:02 | \n", + "
| 38 | \n", + "0.326092 | \n", + "0.962453 | \n", + "0.682144 | \n", + "00:02 | \n", + "
| 39 | \n", + "0.312033 | \n", + "1.052761 | \n", + "0.682430 | \n", + "00:02 | \n", + "
| 40 | \n", + "0.299613 | \n", + "1.072640 | \n", + "0.672414 | \n", + "00:02 | \n", + "
| 41 | \n", + "0.288199 | \n", + "1.148553 | \n", + "0.674857 | \n", + "00:02 | \n", + "
| 42 | \n", + "0.274632 | \n", + "1.035845 | \n", + "0.682885 | \n", + "00:02 | \n", + "
| 43 | \n", + "0.262653 | \n", + "1.093239 | \n", + "0.673860 | \n", + "00:02 | \n", + "
| 44 | \n", + "0.251882 | \n", + "1.144466 | \n", + "0.684527 | \n", + "00:02 | \n", + "
| 45 | \n", + "0.241090 | \n", + "1.081552 | \n", + "0.681381 | \n", + "00:02 | \n", + "
| 46 | \n", + "0.232027 | \n", + "1.137870 | \n", + "0.676815 | \n", + "00:02 | \n", + "
| 47 | \n", + "0.222400 | \n", + "1.059747 | \n", + "0.680603 | \n", + "00:02 | \n", + "
| 48 | \n", + "0.216543 | \n", + "1.093719 | \n", + "0.683317 | \n", + "00:02 | \n", + "
| 49 | \n", + "0.210396 | \n", + "1.078966 | \n", + "0.689360 | \n", + "00:02 | \n", + "
| 50 | \n", + "0.202654 | \n", + "1.176466 | \n", + "0.686023 | \n", + "00:02 | \n", + "
| 51 | \n", + "0.193870 | \n", + "1.090814 | \n", + "0.689503 | \n", + "00:02 | \n", + "
| 52 | \n", + "0.185870 | \n", + "1.166513 | \n", + "0.689029 | \n", + "00:02 | \n", + "
| 53 | \n", + "0.178427 | \n", + "1.195029 | \n", + "0.683093 | \n", + "00:02 | \n", + "
| 54 | \n", + "0.171827 | \n", + "1.352738 | \n", + "0.677118 | \n", + "00:02 | \n", + "
| 55 | \n", + "0.169687 | \n", + "1.206098 | \n", + "0.693255 | \n", + "00:02 | \n", + "
| 56 | \n", + "0.166883 | \n", + "1.345477 | \n", + "0.658244 | \n", + "00:02 | \n", + "
| 57 | \n", + "0.163432 | \n", + "1.143228 | \n", + "0.694070 | \n", + "00:02 | \n", + "
| 58 | \n", + "0.158609 | \n", + "1.290022 | \n", + "0.663227 | \n", + "00:02 | \n", + "
| 59 | \n", + "0.155161 | \n", + "1.204916 | \n", + "0.675036 | \n", + "00:02 | \n", + "
| 60 | \n", + "0.150644 | \n", + "1.310703 | \n", + "0.673433 | \n", + "00:02 | \n", + "
| 61 | \n", + "0.145060 | \n", + "1.367506 | \n", + "0.678924 | \n", + "00:02 | \n", + "
| 62 | \n", + "0.140208 | \n", + "1.417464 | \n", + "0.675184 | \n", + "00:02 | \n", + "
| 63 | \n", + "0.135288 | \n", + "1.396392 | \n", + "0.674062 | \n", + "00:02 | \n", + "
| 64 | \n", + "0.130873 | \n", + "1.446485 | \n", + "0.677602 | \n", + "00:02 | \n", + "
| 65 | \n", + "0.126517 | \n", + "1.438383 | \n", + "0.676009 | \n", + "00:02 | \n", + "
| 66 | \n", + "0.122561 | \n", + "1.507830 | \n", + "0.680516 | \n", + "00:02 | \n", + "
| 67 | \n", + "0.119320 | \n", + "1.512994 | \n", + "0.675355 | \n", + "00:02 | \n", + "
| 68 | \n", + "0.115656 | \n", + "1.530193 | \n", + "0.677173 | \n", + "00:02 | \n", + "
| 69 | \n", + "0.112271 | \n", + "1.507552 | \n", + "0.683999 | \n", + "00:02 | \n", + "
| 70 | \n", + "0.109169 | \n", + "1.532348 | \n", + "0.681316 | \n", + "00:02 | \n", + "
| 71 | \n", + "0.107039 | \n", + "1.545915 | \n", + "0.680736 | \n", + "00:02 | \n", + "
| 72 | \n", + "0.104084 | \n", + "1.606340 | \n", + "0.676586 | \n", + "00:02 | \n", + "
| 73 | \n", + "0.102230 | \n", + "1.675215 | \n", + "0.672759 | \n", + "00:02 | \n", + "
| 74 | \n", + "0.099569 | \n", + "1.669022 | \n", + "0.671782 | \n", + "00:02 | \n", + "
| 75 | \n", + "0.098015 | \n", + "1.739677 | \n", + "0.673263 | \n", + "00:02 | \n", + "
| 76 | \n", + "0.095821 | \n", + "1.745798 | \n", + "0.669763 | \n", + "00:02 | \n", + "
| 77 | \n", + "0.094164 | \n", + "1.792201 | \n", + "0.670788 | \n", + "00:02 | \n", + "
| 78 | \n", + "0.092015 | \n", + "1.670760 | \n", + "0.677348 | \n", + "00:02 | \n", + "
| 79 | \n", + "0.090487 | \n", + "1.871062 | \n", + "0.670030 | \n", + "00:02 | \n", + "
| 80 | \n", + "0.089011 | \n", + "1.742501 | \n", + "0.674114 | \n", + "00:02 | \n", + "
| 81 | \n", + "0.087762 | \n", + "1.734340 | \n", + "0.676448 | \n", + "00:02 | \n", + "
| 82 | \n", + "0.087055 | \n", + "1.749249 | \n", + "0.675374 | \n", + "00:02 | \n", + "
| 83 | \n", + "0.086178 | \n", + "1.836990 | \n", + "0.668237 | \n", + "00:02 | \n", + "
| 84 | \n", + "0.085120 | \n", + "1.813544 | \n", + "0.672152 | \n", + "00:02 | \n", + "
| 85 | \n", + "0.084130 | \n", + "1.837068 | \n", + "0.675424 | \n", + "00:02 | \n", + "
| 86 | \n", + "0.082992 | \n", + "1.794075 | \n", + "0.677985 | \n", + "00:02 | \n", + "
| 87 | \n", + "0.082330 | \n", + "1.866639 | \n", + "0.673701 | \n", + "00:02 | \n", + "
| 88 | \n", + "0.081188 | \n", + "1.866591 | \n", + "0.675407 | \n", + "00:02 | \n", + "
| 89 | \n", + "0.081002 | \n", + "1.813551 | \n", + "0.679702 | \n", + "00:02 | \n", + "
| 90 | \n", + "0.080118 | \n", + "1.853538 | \n", + "0.671507 | \n", + "00:02 | \n", + "
| 91 | \n", + "0.078552 | \n", + "1.871848 | \n", + "0.672015 | \n", + "00:02 | \n", + "
| 92 | \n", + "0.077982 | \n", + "1.822861 | \n", + "0.677151 | \n", + "00:02 | \n", + "
| 93 | \n", + "0.077675 | \n", + "1.832665 | \n", + "0.678824 | \n", + "00:02 | \n", + "
| 94 | \n", + "0.077136 | \n", + "1.883268 | \n", + "0.670086 | \n", + "00:02 | \n", + "
| 95 | \n", + "0.076905 | \n", + "1.862414 | \n", + "0.673040 | \n", + "00:02 | \n", + "
| 96 | \n", + "0.076868 | \n", + "1.865319 | \n", + "0.677376 | \n", + "00:02 | \n", + "
| 97 | \n", + "0.076203 | \n", + "1.877391 | \n", + "0.676732 | \n", + "00:02 | \n", + "
| 98 | \n", + "0.075612 | \n", + "1.860847 | \n", + "0.676449 | \n", + "00:02 | \n", + "
| 99 | \n", + "0.075313 | \n", + "1.855111 | \n", + "0.677605 | \n", + "00:02 | \n", + "
| epoch | \n", + "train_loss | \n", + "valid_loss | \n", + "acc_page_seg | \n", + "time | \n", + "
|---|---|---|---|---|
| 0 | \n", + "2.856553 | \n", + "1.764640 | \n", + "0.386858 | \n", + "00:37 | \n", + "
| 1 | \n", + "1.011970 | \n", + "1.242398 | \n", + "0.537656 | \n", + "00:38 | \n", + "
| 2 | \n", + "0.881037 | \n", + "1.057869 | \n", + "0.591275 | \n", + "00:38 | \n", + "
| 3 | \n", + "0.780716 | \n", + "0.875322 | \n", + "0.647184 | \n", + "00:38 | \n", + "
| epoch | \n", + "train_loss | \n", + "valid_loss | \n", + "acc_page_seg | \n", + "time | \n", + "
|---|---|---|---|---|
| 0 | \n", + "0.791178 | \n", + "0.877857 | \n", + "0.649679 | \n", + "00:43 | \n", + "
| 1 | \n", + "0.776143 | \n", + "0.887879 | \n", + "0.645416 | \n", + "00:43 | \n", + "
| 2 | \n", + "0.752719 | \n", + "0.898631 | \n", + "0.647036 | \n", + "00:43 | \n", + "
| 3 | \n", + "0.778018 | \n", + "0.834483 | \n", + "0.660419 | \n", + "00:43 | \n", + "
| 4 | \n", + "0.764870 | \n", + "0.797916 | \n", + "0.671497 | \n", + "00:43 | \n", + "
| 5 | \n", + "0.697720 | \n", + "0.790384 | \n", + "0.678465 | \n", + "00:43 | \n", + "
| 6 | \n", + "0.699789 | \n", + "0.758683 | \n", + "0.680566 | \n", + "00:43 | \n", + "
| 7 | \n", + "0.703927 | \n", + "0.768043 | \n", + "0.686201 | \n", + "00:43 | \n", + "
| 8 | \n", + "0.655529 | \n", + "0.787109 | \n", + "0.681620 | \n", + "00:43 | \n", + "
| 9 | \n", + "0.657443 | \n", + "0.710124 | \n", + "0.697478 | \n", + "00:43 | \n", + "
| 10 | \n", + "0.616673 | \n", + "0.757702 | \n", + "0.690379 | \n", + "00:43 | \n", + "
| 11 | \n", + "0.625324 | \n", + "0.686489 | \n", + "0.702605 | \n", + "00:43 | \n", + "
| 12 | \n", + "0.561288 | \n", + "0.696584 | \n", + "0.701316 | \n", + "00:43 | \n", + "
| 13 | \n", + "0.581710 | \n", + "0.700619 | \n", + "0.691927 | \n", + "00:43 | \n", + "
| 14 | \n", + "0.573933 | \n", + "0.699397 | \n", + "0.703273 | \n", + "00:43 | \n", + "
| 15 | \n", + "0.583466 | \n", + "0.705659 | \n", + "0.698243 | \n", + "00:43 | \n", + "
| 16 | \n", + "0.560208 | \n", + "0.696428 | \n", + "0.708472 | \n", + "00:43 | \n", + "
| 17 | \n", + "0.561483 | \n", + "0.671468 | \n", + "0.712517 | \n", + "00:43 | \n", + "
| 18 | \n", + "0.558307 | \n", + "0.711836 | \n", + "0.707913 | \n", + "00:43 | \n", + "
| 19 | \n", + "0.551497 | \n", + "0.702919 | \n", + "0.707181 | \n", + "00:43 | \n", + "
| epoch | \n", + "train_loss | \n", + "valid_loss | \n", + "acc_page_seg | \n", + "time | \n", + "
|---|---|---|---|---|
| 0 | \n", + "0.553777 | \n", + "0.667121 | \n", + "0.713071 | \n", + "00:41 | \n", + "
| 1 | \n", + "0.563154 | \n", + "0.638373 | \n", + "0.726345 | \n", + "00:42 | \n", + "
| 2 | \n", + "0.577944 | \n", + "0.694615 | \n", + "0.708609 | \n", + "00:43 | \n", + "
| 3 | \n", + "0.569093 | \n", + "0.673788 | \n", + "0.712787 | \n", + "00:43 | \n", + "
| 4 | \n", + "0.558459 | \n", + "0.660285 | \n", + "0.719369 | \n", + "00:43 | \n", + "
| 5 | \n", + "0.548331 | \n", + "0.675057 | \n", + "0.720175 | \n", + "00:43 | \n", + "
| 6 | \n", + "0.591937 | \n", + "0.669174 | \n", + "0.711785 | \n", + "00:43 | \n", + "
| 7 | \n", + "0.555726 | \n", + "0.653117 | \n", + "0.719579 | \n", + "00:43 | \n", + "
| 8 | \n", + "0.555221 | \n", + "0.692150 | \n", + "0.713082 | \n", + "00:43 | \n", + "
| 9 | \n", + "0.519693 | \n", + "0.664135 | \n", + "0.719941 | \n", + "00:43 | \n", + "
| 10 | \n", + "0.527356 | \n", + "0.660036 | \n", + "0.719104 | \n", + "00:43 | \n", + "
| 11 | \n", + "0.508473 | \n", + "0.609909 | \n", + "0.737036 | \n", + "00:43 | \n", + "
| 12 | \n", + "0.522851 | \n", + "0.633663 | \n", + "0.717664 | \n", + "00:43 | \n", + "
| 13 | \n", + "0.497258 | \n", + "0.631335 | \n", + "0.737905 | \n", + "00:43 | \n", + "
| 14 | \n", + "0.476837 | \n", + "0.631778 | \n", + "0.738951 | \n", + "00:43 | \n", + "
| 15 | \n", + "0.498999 | \n", + "0.658445 | \n", + "0.723294 | \n", + "00:43 | \n", + "
| 16 | \n", + "0.475062 | \n", + "0.644178 | \n", + "0.735008 | \n", + "00:43 | \n", + "
| 17 | \n", + "0.480955 | \n", + "0.638388 | \n", + "0.736090 | \n", + "00:43 | \n", + "
| 18 | \n", + "0.445013 | \n", + "0.686541 | \n", + "0.723129 | \n", + "00:43 | \n", + "
| 19 | \n", + "0.471052 | \n", + "0.638118 | \n", + "0.741390 | \n", + "00:43 | \n", + "
| 20 | \n", + "0.448041 | \n", + "0.660593 | \n", + "0.731921 | \n", + "00:43 | \n", + "
| 21 | \n", + "0.457920 | \n", + "0.664917 | \n", + "0.730958 | \n", + "00:43 | \n", + "
| 22 | \n", + "0.451702 | \n", + "0.614046 | \n", + "0.741799 | \n", + "00:43 | \n", + "
| 23 | \n", + "0.466195 | \n", + "0.643465 | \n", + "0.736834 | \n", + "00:43 | \n", + "
| 24 | \n", + "0.449672 | \n", + "0.639777 | \n", + "0.737823 | \n", + "00:43 | \n", + "
| epoch | \n", + "train_loss | \n", + "valid_loss | \n", + "acc_page_seg | \n", + "time | \n", + "
|---|---|---|---|---|
| 0 | \n", + "0.458690 | \n", + "0.667569 | \n", + "0.728455 | \n", + "00:41 | \n", + "
| 1 | \n", + "0.450500 | \n", + "0.668234 | \n", + "0.733412 | \n", + "00:42 | \n", + "
| 2 | \n", + "0.447065 | \n", + "0.672303 | \n", + "0.725600 | \n", + "00:43 | \n", + "
| 3 | \n", + "0.457847 | \n", + "0.648830 | \n", + "0.736870 | \n", + "00:43 | \n", + "
| 4 | \n", + "0.437371 | \n", + "0.673808 | \n", + "0.735051 | \n", + "00:43 | \n", + "
| 5 | \n", + "0.466091 | \n", + "0.625616 | \n", + "0.742644 | \n", + "00:43 | \n", + "
| 6 | \n", + "0.475065 | \n", + "0.661551 | \n", + "0.732031 | \n", + "00:43 | \n", + "
| 7 | \n", + "0.452820 | \n", + "0.699153 | \n", + "0.725094 | \n", + "00:43 | \n", + "
| 8 | \n", + "0.479388 | \n", + "0.580281 | \n", + "0.746229 | \n", + "00:43 | \n", + "
| 9 | \n", + "0.487792 | \n", + "0.666369 | \n", + "0.728635 | \n", + "00:43 | \n", + "
| 10 | \n", + "0.460888 | \n", + "0.592563 | \n", + "0.743074 | \n", + "00:43 | \n", + "
| 11 | \n", + "0.453660 | \n", + "0.672159 | \n", + "0.724699 | \n", + "00:43 | \n", + "
| 12 | \n", + "0.466425 | \n", + "0.630584 | \n", + "0.738822 | \n", + "00:43 | \n", + "
| 13 | \n", + "0.451497 | \n", + "0.647101 | \n", + "0.728689 | \n", + "00:43 | \n", + "
| 14 | \n", + "0.442216 | \n", + "0.669773 | \n", + "0.728026 | \n", + "00:43 | \n", + "
| 15 | \n", + "0.423354 | \n", + "0.826278 | \n", + "0.696161 | \n", + "00:43 | \n", + "
| 16 | \n", + "0.411646 | \n", + "0.676306 | \n", + "0.733011 | \n", + "00:43 | \n", + "
| 17 | \n", + "0.416743 | \n", + "0.660450 | \n", + "0.745354 | \n", + "00:43 | \n", + "
| 18 | \n", + "0.429740 | \n", + "0.696473 | \n", + "0.736148 | \n", + "00:43 | \n", + "
| 19 | \n", + "0.413014 | \n", + "0.682398 | \n", + "0.734040 | \n", + "00:43 | \n", + "
| 20 | \n", + "0.403385 | \n", + "0.758630 | \n", + "0.740318 | \n", + "00:43 | \n", + "
| 21 | \n", + "0.415805 | \n", + "0.667512 | \n", + "0.731291 | \n", + "00:43 | \n", + "
| 22 | \n", + "0.412937 | \n", + "0.587587 | \n", + "0.753787 | \n", + "00:43 | \n", + "
| 23 | \n", + "0.403023 | \n", + "0.616789 | \n", + "0.756837 | \n", + "00:43 | \n", + "
| 24 | \n", + "0.383011 | \n", + "0.641458 | \n", + "0.746141 | \n", + "00:43 | \n", + "
| 25 | \n", + "0.368889 | \n", + "0.664418 | \n", + "0.743073 | \n", + "00:43 | \n", + "
| 26 | \n", + "0.367368 | \n", + "0.646991 | \n", + "0.751930 | \n", + "00:43 | \n", + "
| 27 | \n", + "0.360869 | \n", + "0.660852 | \n", + "0.756417 | \n", + "00:43 | \n", + "
| 28 | \n", + "0.357260 | \n", + "0.655095 | \n", + "0.748200 | \n", + "00:43 | \n", + "
| 29 | \n", + "0.344741 | \n", + "0.707433 | \n", + "0.743539 | \n", + "00:43 | \n", + "
| 30 | \n", + "0.368345 | \n", + "0.619674 | \n", + "0.751244 | \n", + "00:43 | \n", + "
| 31 | \n", + "0.354804 | \n", + "0.660078 | \n", + "0.748415 | \n", + "00:43 | \n", + "
| 32 | \n", + "0.341516 | \n", + "0.663558 | \n", + "0.751447 | \n", + "00:43 | \n", + "
| 33 | \n", + "0.345136 | \n", + "0.657692 | \n", + "0.753073 | \n", + "00:43 | \n", + "
| 34 | \n", + "0.352449 | \n", + "0.634947 | \n", + "0.755203 | \n", + "00:43 | \n", + "
| 35 | \n", + "0.349426 | \n", + "0.649608 | \n", + "0.749845 | \n", + "00:43 | \n", + "
| 36 | \n", + "0.341926 | \n", + "0.673897 | \n", + "0.744076 | \n", + "00:43 | \n", + "
| 37 | \n", + "0.332530 | \n", + "0.635248 | \n", + "0.754299 | \n", + "00:43 | \n", + "
| 38 | \n", + "0.328841 | \n", + "0.661589 | \n", + "0.752353 | \n", + "00:43 | \n", + "
| 39 | \n", + "0.335154 | \n", + "0.649349 | \n", + "0.753004 | \n", + "00:43 | \n", + "
| epoch | \n", + "train_loss | \n", + "valid_loss | \n", + "acc_page_seg | \n", + "time | \n", + "
|---|---|---|---|---|
| 0 | \n", + "0.340665 | \n", + "0.640903 | \n", + "0.752394 | \n", + "00:41 | \n", + "
| 1 | \n", + "0.340666 | \n", + "0.626288 | \n", + "0.755166 | \n", + "00:42 | \n", + "
| 2 | \n", + "0.354699 | \n", + "0.654450 | \n", + "0.750507 | \n", + "00:42 | \n", + "
| 3 | \n", + "0.347179 | \n", + "0.686929 | \n", + "0.742491 | \n", + "00:42 | \n", + "
| 4 | \n", + "0.333216 | \n", + "0.653608 | \n", + "0.748903 | \n", + "00:42 | \n", + "
| 5 | \n", + "0.348731 | \n", + "0.657692 | \n", + "0.752562 | \n", + "00:42 | \n", + "
| 6 | \n", + "0.336454 | \n", + "0.628097 | \n", + "0.760422 | \n", + "00:43 | \n", + "
| 7 | \n", + "0.336751 | \n", + "0.651409 | \n", + "0.754049 | \n", + "00:43 | \n", + "
| 8 | \n", + "0.330902 | \n", + "0.653401 | \n", + "0.751645 | \n", + "00:43 | \n", + "
| 9 | \n", + "0.337558 | \n", + "0.669145 | \n", + "0.747862 | \n", + "00:43 | \n", + "
| 10 | \n", + "0.340558 | \n", + "0.652793 | \n", + "0.755198 | \n", + "00:43 | \n", + "
| 11 | \n", + "0.332919 | \n", + "0.657051 | \n", + "0.751085 | \n", + "00:43 | \n", + "
| 12 | \n", + "0.357514 | \n", + "0.667554 | \n", + "0.750962 | \n", + "00:43 | \n", + "
| 13 | \n", + "0.338747 | \n", + "0.660037 | \n", + "0.758884 | \n", + "00:43 | \n", + "
| 14 | \n", + "0.324783 | \n", + "0.670047 | \n", + "0.752970 | \n", + "00:43 | \n", + "
| 15 | \n", + "0.324635 | \n", + "0.663691 | \n", + "0.753103 | \n", + "00:43 | \n", + "
| 16 | \n", + "0.339759 | \n", + "0.643322 | \n", + "0.757580 | \n", + "00:43 | \n", + "
| 17 | \n", + "0.331939 | \n", + "0.667661 | \n", + "0.758993 | \n", + "00:43 | \n", + "
| 18 | \n", + "0.335830 | \n", + "0.655666 | \n", + "0.755442 | \n", + "00:43 | \n", + "
| 19 | \n", + "0.317954 | \n", + "0.679512 | \n", + "0.750495 | \n", + "00:43 | \n", + "
| 20 | \n", + "0.318587 | \n", + "0.654577 | \n", + "0.755742 | \n", + "00:43 | \n", + "
| 21 | \n", + "0.334466 | \n", + "0.647457 | \n", + "0.758164 | \n", + "00:43 | \n", + "
| 22 | \n", + "0.327888 | \n", + "0.645103 | \n", + "0.756676 | \n", + "00:43 | \n", + "
| 23 | \n", + "0.338331 | \n", + "0.710371 | \n", + "0.741083 | \n", + "00:44 | \n", + "
| 24 | \n", + "0.338002 | \n", + "0.707149 | \n", + "0.746945 | \n", + "00:43 | \n", + "
| 25 | \n", + "0.329532 | \n", + "0.708207 | \n", + "0.744364 | \n", + "00:43 | \n", + "
| 26 | \n", + "0.316733 | \n", + "0.709328 | \n", + "0.746489 | \n", + "00:43 | \n", + "
| 27 | \n", + "0.342932 | \n", + "0.751107 | \n", + "0.729875 | \n", + "00:43 | \n", + "
| 28 | \n", + "0.321316 | \n", + "0.709101 | \n", + "0.747497 | \n", + "00:43 | \n", + "
| 29 | \n", + "0.320944 | \n", + "0.706521 | \n", + "0.750620 | \n", + "00:44 | \n", + "
| 30 | \n", + "0.333289 | \n", + "0.687682 | \n", + "0.747933 | \n", + "00:44 | \n", + "
| 31 | \n", + "0.324104 | \n", + "0.731090 | \n", + "0.738172 | \n", + "00:43 | \n", + "
| 32 | \n", + "0.327663 | \n", + "0.694947 | \n", + "0.747116 | \n", + "00:43 | \n", + "
| 33 | \n", + "0.342412 | \n", + "0.722905 | \n", + "0.743069 | \n", + "00:44 | \n", + "
| 34 | \n", + "0.322976 | \n", + "0.680949 | \n", + "0.751069 | \n", + "00:43 | \n", + "
| 35 | \n", + "0.344508 | \n", + "0.724165 | \n", + "0.743796 | \n", + "00:44 | \n", + "
| 36 | \n", + "0.324619 | \n", + "0.666214 | \n", + "0.754821 | \n", + "00:44 | \n", + "
| 37 | \n", + "0.324873 | \n", + "0.674529 | \n", + "0.755849 | \n", + "00:44 | \n", + "
| 38 | \n", + "0.336385 | \n", + "0.647311 | \n", + "0.757676 | \n", + "00:43 | \n", + "
| 39 | \n", + "0.324603 | \n", + "0.678114 | \n", + "0.751366 | \n", + "00:44 | \n", + "
| 40 | \n", + "0.327351 | \n", + "0.722076 | \n", + "0.739368 | \n", + "00:43 | \n", + "
| 41 | \n", + "0.329192 | \n", + "0.720409 | \n", + "0.741318 | \n", + "00:43 | \n", + "
| 42 | \n", + "0.329325 | \n", + "0.728129 | \n", + "0.742389 | \n", + "00:44 | \n", + "
| 43 | \n", + "0.323234 | \n", + "0.711010 | \n", + "0.740416 | \n", + "00:44 | \n", + "
| 44 | \n", + "0.331323 | \n", + "0.711525 | \n", + "0.740923 | \n", + "00:44 | \n", + "
| 45 | \n", + "0.328257 | \n", + "0.723079 | \n", + "0.748594 | \n", + "00:43 | \n", + "
| 46 | \n", + "0.324943 | \n", + "0.718138 | \n", + "0.745262 | \n", + "00:43 | \n", + "
| 47 | \n", + "0.330193 | \n", + "0.686637 | \n", + "0.748900 | \n", + "00:44 | \n", + "
| 48 | \n", + "0.327443 | \n", + "0.691969 | \n", + "0.751834 | \n", + "00:43 | \n", + "
| 49 | \n", + "0.322917 | \n", + "0.679349 | \n", + "0.751797 | \n", + "00:44 | \n", + "
| 50 | \n", + "0.327654 | \n", + "0.709463 | \n", + "0.745563 | \n", + "00:43 | \n", + "
| 51 | \n", + "0.321733 | \n", + "0.701408 | \n", + "0.749177 | \n", + "00:43 | \n", + "
| 52 | \n", + "0.327361 | \n", + "0.677181 | \n", + "0.753340 | \n", + "00:43 | \n", + "
| 53 | \n", + "0.328119 | \n", + "0.683346 | \n", + "0.747560 | \n", + "00:44 | \n", + "
| 54 | \n", + "0.327353 | \n", + "0.676381 | \n", + "0.754274 | \n", + "00:43 | \n", + "
| 55 | \n", + "0.328135 | \n", + "0.710322 | \n", + "0.744036 | \n", + "00:44 | \n", + "
| 56 | \n", + "0.316283 | \n", + "0.709335 | \n", + "0.744395 | \n", + "00:43 | \n", + "
| 57 | \n", + "0.326782 | \n", + "0.678383 | \n", + "0.753343 | \n", + "00:43 | \n", + "
| 58 | \n", + "0.309789 | \n", + "0.691221 | \n", + "0.752644 | \n", + "00:44 | \n", + "
| 59 | \n", + "0.335518 | \n", + "0.705034 | \n", + "0.749208 | \n", + "00:44 | \n", + "
| \n", + " | img | \n", + "bin | \n", + "ann | \n", + "
|---|---|---|---|
| 0 | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0002.png | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0002.bin.png | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0002.json | \n", + "
| 1 | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0003.png | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0003.bin.png | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0003.json | \n", + "
| 2 | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0004.png | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0004.bin.png | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0004.json | \n", + "
| 3 | \n", + "arnim_wunderhorn03_1808_OCR-D-IMG-CROP2_0001.png | \n", + "arnim_wunderhorn03_1808_OCR-D-IMG-CROP2_0001.bin.png | \n", + "arnim_wunderhorn03_1808_OCR-D-IMG-CROP2_0001.json | \n", + "
| 4 | \n", + "arnim_wunderhorn03_1808_OCR-D-IMG-CROP2_0002.png | \n", + "arnim_wunderhorn03_1808_OCR-D-IMG-CROP2_0002.bin.png | \n", + "arnim_wunderhorn03_1808_OCR-D-IMG-CROP2_0002.json | \n", + "
| \n", + " | img | \n", + "bin | \n", + "ann | \n", + "ann_json | \n", + "
|---|---|---|---|---|
| 0 | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0002.png | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0002.bin.png | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0002.json | \n", + "{'angle': None, 'regions': [{'coords': [[890, 245], [890, 62], [504, 62], [5... | \n", + "
| 1 | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0003.png | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0003.bin.png | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0003.json | \n", + "{'angle': None, 'regions': [{'coords': [[1110, 1661], [1110, 1223], [566, 12... | \n", + "
| 2 | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0004.png | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0004.bin.png | \n", + "arent_dichtercharaktere_1885_OCR-D-IMG-CROP2_0004.json | \n", + "{'angle': None, 'regions': [{'coords': [[1065, 1116], [1065, 922], [319, 922... | \n", + "
| 3 | \n", + "arnim_wunderhorn03_1808_OCR-D-IMG-CROP2_0001.png | \n", + "arnim_wunderhorn03_1808_OCR-D-IMG-CROP2_0001.bin.png | \n", + "arnim_wunderhorn03_1808_OCR-D-IMG-CROP2_0001.json | \n", + "{'regions': [{'type': 'text', 'coords': [[574, 126], [574, 52], [449, 52], [... | \n", + "
| 4 | \n", + "arnim_wunderhorn03_1808_OCR-D-IMG-CROP2_0002.png | \n", + "arnim_wunderhorn03_1808_OCR-D-IMG-CROP2_0002.bin.png | \n", + "arnim_wunderhorn03_1808_OCR-D-IMG-CROP2_0002.json | \n", + "{'regions': [{'type': 'graphic', 'coords': [[1282, 2253], [1282, 11], [0, 11... | \n", + "