% Conference paper (SPIE Electronic Imaging, Image Quality and System
% Performance X, 2013) on producing PDFs with vector symbols from scans.
% Names are stored uniformly as "Last, First" so styles can derive initials;
% acronyms are brace-protected against sentence-casing styles.
@inproceedings{1231b992fd6a46dd873478d655f6626e,
  author    = {Kurilin, Ilya V. and Safonov, Ilia V. and Rychagov, Michael N. and Lee, Hokeun and Kim, Sang Ho and Choi, Donchul},
  title     = {Generation of {PDF} with vector symbols from scanned document},
  booktitle = {Proceedings of {SPIE}-{IS\&T} Electronic Imaging - Image Quality and System Performance X},
  series    = {Proceedings of {SPIE} - The International Society for Optical Engineering},
  year      = 2013,
  doi       = {10.1117/12.2000527},
  isbn      = {9780819494269},
  language  = {English},
  keywords  = {Text vectorization, contour approximation, vectorization quality metrics},
  abstract  = {The paper is devoted to the algorithm for generation of PDF with vector symbols from scanned documents. The complex multi-stage technique includes segmentation of the document to text/drawing areas and background, conversion of symbols to lines and Bezier curves, storing compressed background and foreground. In the paper we concentrate on symbol conversion that comprises segmentation of symbol bodies with resolution enhancement, contour tracing and approximation. Presented method outperforms competitive solutions and secures the best compression rate/quality ratio. Scaling of initial document to other sizes as well as several printing/scanning-to-PDF iterations expose advantages of proposed way for handling with document images. Numerical vectorization quality metric was elaborated. The outcomes of OCR software and user opinion survey confirm high quality of proposed method.},
  note      = {Image Quality and System Performance X ; Conference date: 05-02-2013 Through 07-02-2013},
}