% Conference paper by Yibing Yang and Hong Yan in the ICPR 2000 proceedings
% (volume 4, pages 519--522).
% NOTE(review): the address field holds a country rather than the publisher's
% city -- confirm the city against the proceedings front matter and replace.
@inproceedings{2103f74338fb45228376bafd37d6fbdd,
  title     = "A Robust Document Processing System Combining Image Segmentation with Content-based Document Compression",
  abstract  = "A document processing system combining image segmentation with content-based document compression is proposed in the paper. Firstly, a grayscale document image is divided into small blocks and analysed. Then, a modified logical thresholding method based on local structure analysis and the adaptive logical level technique is used to transform the grayscale document into a binary image. We extract all patterns from the binary document and use a multistage matching method to extract representative patterns. A decomposition method is used to deal with relatively large patterns. Finally, high ratio compression is achieved by coding the relative positions of symbols, extracted representative patterns and other decomposed patterns using the adaptive arithmetic coder and Q-Coder respectively. {\textcopyright} 2000 IEEE.",
  author    = "Yibing Yang and Hong Yan",
  year      = "2000",
  month     = sep,
  doi       = "10.1109/ICPR.2000.902971",
  language  = "English",
  isbn      = "0769507506",
  volume    = "4",
  series    = "International Conference on Pattern Recognition",
  publisher = "IEEE",
  pages     = "519--522",
  editor    = "Sanfeliu, A. and Villanueva, J. J. and Vanrell, M. and Alqu{\'e}zar, R. and Crowley, J. and Shirai, Y.",
  booktitle = "Proceedings 15th International Conference on Pattern Recognition, ICPR 2000",
  address   = "United States",
  note      = "15th International Conference on Pattern Recognition, ICPR 2000 ; Conference date: 03-09-2000 Through 07-09-2000",
}