A pattern-oriented segmentation method for optical character recognition
that leads to document structure analysis is presented. As a first
example, segmentation of handwritten numerals that touch are treated.
Connected pattern components are extracted, and spatial interrelations
between components are measured and grouped into meaningful character
patterns. Stroke shapes are analyzed and a method of finding the
touching positions that separates about 95% of connected numerals
correctly is described. Ambiguities are handled by multiple hypotheses
and verification by recognition. An extended form of pattern-oriented
segmentation, tabular form recognition, is considered. Images of
tabular forms are analyzed, and frames in the tabular structure are
extracted. By identifying semantic relationships between label frames
and data frames, information on the form can be properly recognized
%0 Journal Article
%1 FujisawaJul1992
%A Fujisawa, H.
%A Nakano, Y.
%A Kurino, K.
%D Jul 1992
%J Proceedings of the IEEE
%K analysis, character components, connected data document form frames, handwritten hypotheses, image interrelations, label multiple numerals, optical pattern patterns, positions processing, recognition, recognitionOCR, relationships, segmentation, semantic spatial structure tabular touching
%N 7
%P 1079-1092
%R 10.1109/5.156471
%T Segmentation methods for character recognition: from segmentation
to document structure analysis
%V 80
%X A pattern-oriented segmentation method for optical character recognition
that leads to document structure analysis is presented. As a first
example, segmentation of handwritten numerals that touch are treated.
Connected pattern components are extracted, and spatial interrelations
between components are measured and grouped into meaningful character
patterns. Stroke shapes are analyzed and a method of finding the
touching positions that separates about 95% of connected numerals
correctly is described. Ambiguities are handled by multiple hypotheses
and verification by recognition. An extended form of pattern-oriented
segmentation, tabular form recognition, is considered. Images of
tabular forms are analyzed, and frames in the tabular structure are
extracted. By identifying semantic relationships between label frames
and data frames, information on the form can be properly recognized
@article{FujisawaJul1992,
abstract = {A pattern-oriented segmentation method for optical character recognition
that leads to document structure analysis is presented. As a first
example, segmentation of handwritten numerals that touch are treated.
Connected pattern components are extracted, and spatial interrelations
between components are measured and grouped into meaningful character
patterns. Stroke shapes are analyzed and a method of finding the
touching positions that separates about 95% of connected numerals
correctly is described. Ambiguities are handled by multiple hypotheses
and verification by recognition. An extended form of pattern-oriented
segmentation, tabular form recognition, is considered. Images of
tabular forms are analyzed, and frames in the tabular structure are
extracted. By identifying semantic relationships between label frames
and data frames, information on the form can be properly recognized},
added-at = {2011-03-27T19:47:06.000+0200},
author = {Fujisawa, H. and Nakano, Y. and Kurino, K.},
biburl = {https://www.bibsonomy.org/bibtex/26579e538281aca5c1f0d8b0023d7af12/cocus},
doi = {10.1109/5.156471},
file = {:./Fujisawa.pdf:PDF},
interhash = {03a467e1d7430e57eb29da7ab9fe77a3},
intrahash = {6579e538281aca5c1f0d8b0023d7af12},
issn = {0018-9219},
journal = {Proceedings of the IEEE},
keywords = {analysis, character components, connected data document form frames, handwritten hypotheses, image interrelations, label multiple numerals, optical pattern patterns, positions processing, recognition, recognitionOCR, relationships, segmentation, semantic spatial structure tabular touching},
number = 7,
pages = {1079-1092},
review = {touching characters},
timestamp = {2011-03-27T19:47:07.000+0200},
title = {Segmentation methods for character recognition: from segmentation
to document structure analysis},
volume = 80,
year = {Jul 1992}
}