Text Documents present a great challenge to the field of document recognition. Automatic segmentation and layout analysis of documents is used for interpretation and machine translation of documents. Document such as research papers, address book, news etc. is available in the form of un-structured format. Extracting relevant Knowledge from this document has been recognized as promising task. Extracting interesting rules form it is complex and tedious process. Conditional random fields (CRFs) utilizing contextual information, hand-coded wrappers to label the text (such as Name, Phone number and Address etc). In this paper we propose a novel approach to infer grammar rules using alignment similarity and discriminative context-free grammar. It helps in extracting desired information from the document.
%0 Journal Article
%1 Thakur_2015
%A Thakur, Ramesh
%D 2015
%I Auricle Technologies, Pvt., Ltd.
%J International Journal on Recent and Innovation Trends in Computing and Communication
%K Alignment Extraction Information Labeling Profiling document
%N 4
%P 2269--2272
%R 10.17762/ijritcc2321-8169.1504109
%T Segmentation of Document Using Discriminative Contextfree Grammar Inference and Alignment Similarities
%U http://dx.doi.org/10.17762/ijritcc2321-8169.1504109
%V 3
%X Text Documents present a great challenge to the field of document recognition. Automatic segmentation and layout analysis of documents is used for interpretation and machine translation of documents. Document such as research papers, address book, news etc. is available in the form of un-structured format. Extracting relevant Knowledge from this document has been recognized as promising task. Extracting interesting rules form it is complex and tedious process. Conditional random fields (CRFs) utilizing contextual information, hand-coded wrappers to label the text (such as Name, Phone number and Address etc). In this paper we propose a novel approach to infer grammar rules using alignment similarity and discriminative context-free grammar. It helps in extracting desired information from the document.
@article{Thakur_2015,
abstract = {Text Documents present a great challenge to the field of document recognition. Automatic segmentation and layout analysis of documents is used for interpretation and machine translation of documents. Document such as research papers, address book, news etc. is available in the form of un-structured format. Extracting relevant Knowledge from this document has been recognized as promising task. Extracting interesting rules form it is complex and tedious process. Conditional random fields (CRFs) utilizing contextual information, hand-coded wrappers to label the text (such as Name, Phone number and Address etc). In this paper we propose a novel approach to infer grammar rules using alignment similarity and discriminative context-free grammar. It helps in extracting desired information from the document.},
added-at = {2015-08-26T10:20:56.000+0200},
author = {Thakur, Ramesh},
biburl = {https://www.bibsonomy.org/bibtex/219cf688e73b06c5925cfa78463a6f673/ijritcc},
doi = {10.17762/ijritcc2321-8169.1504109},
interhash = {73b214093913f5bae90f1596506e88a1},
intrahash = {19cf688e73b06c5925cfa78463a6f673},
journal = {International Journal on Recent and Innovation Trends in Computing and Communication},
keywords = {Alignment Extraction Information Labeling Profiling document},
month = {april},
number = 4,
pages = {2269--2272},
publisher = {Auricle Technologies, Pvt., Ltd.},
timestamp = {2015-08-26T10:20:56.000+0200},
title = {Segmentation of Document Using Discriminative Contextfree Grammar Inference and Alignment Similarities},
url = {http://dx.doi.org/10.17762/ijritcc2321-8169.1504109},
volume = 3,
year = 2015
}