@inproceedings{b479a72fea264456bb74f71f68e608bd,
title = "Experimental application of a Japanese historical document image synthesis method to text line segmentation",
abstract = "We plan to use a text line segmentation method based on machine learning in our transcription support system for handwritten Japanese historical document in Kana, and are searching for a data synthesis method of annotated document images because it is time consuming to manually annotate a large set of document images for training data for machine learning. In this paper, we report our synthesis method of annotated document images designed for a Japanese historical document. To compare manually annotated Japanese historical document images and annotated document images synthesized by the method as training data for an object detection algorithm YOLOv3, we conducted text line segmentation experiments using the object detection algorithm. The experimental results show that a model trained by the synthetic annotated document images are competitive with that trained by the manually annotated document images from the view point of a metric intersection-over-union.",
keywords = "Data synthesis, Deep learning, Historical document, Text line segmentation",
author = "Naoto Inuzuka and Tetsuya Suzuki",
note = "Publisher Copyright: {\textcopyright} 2021 by SCITEPRESS - Science and Technology Publications, Lda. All rights reserved; 10th International Conference on Pattern Recognition Applications and Methods, ICPRAM 2021 ; Conference date: 04-02-2021 Through 06-02-2021",
year = "2021",
language = "English",
series = "ICPRAM 2021 - Proceedings of the 10th International Conference on Pattern Recognition Applications and Methods",
publisher = "SciTePress",
pages = "628--634",
editor = "{De Marsico}, Maria and {di Baja}, {Gabriella Sanniti} and Ana Fred",
booktitle = "ICPRAM 2021 - Proceedings of the 10th International Conference on Pattern Recognition Applications and Methods",
}