Automated document content characterization for a multimedia document retrieval system. Koivusaari M, S., J., &., P., M. In 1997.
abstract   bibtex   
We propose a new approach to automate document image layout extraction for an object-oriented database feature population using rapid low level feature analysis, preclassification and predictive coding. The layout information comprised of region location and classification data is transformed into `feature object(s)'. The information is then fed into an intelligent document image retrieval system (IDIR) to be utilized in document retrieval schemes. The IDIR system consists of user interface, object-oriented database and a variety of document image analysis algo- rithms. In this paper the object-oriented storage model and the database system are presented in formal and functional domains. Moreover, the graphical user interface and a visual document image browser are described. The document analysis techniques used at document characterization are also presented. In this context the documents consist of text, picture and other media (possibly embedded) data. Documents are stored in the database as document, page and region objects. Our test system has been implemented and tested using a document database of 10000 documents.
@inProceedings{
 title = {Automated document content characterization for a multimedia document retrieval system.},
 type = {inProceedings},
 year = {1997},
 id = {f63aae5b-39ee-349f-bb33-a2ce2b1f7a72},
 created = {2019-11-19T13:01:26.822Z},
 file_attached = {false},
 profile_id = {bddcf02d-403b-3b06-9def-6d15cc293e20},
 group_id = {17585b85-df99-3a34-98c2-c73e593397d7},
 last_modified = {2019-11-19T13:45:25.659Z},
 read = {false},
 starred = {false},
 authored = {false},
 confirmed = {true},
 hidden = {false},
 citation_key = {mvg:35},
 source_type = {inproceedings},
 notes = {Proc. SPIE Vol. 3229, Multimedia Storage and Archiving Systems II, Dallas, TX, 148 - 159.},
 private_publication = {false},
 abstract = {We propose a new approach to automate document image layout extraction for an object-oriented database feature population using rapid low level feature analysis, preclassification and
predictive coding. The layout information comprised of region location and classification data is transformed into `feature object(s)'. The information is then fed into an intelligent document image retrieval system (IDIR) to be utilized in document retrieval schemes. The IDIR system consists of user interface, object-oriented database and a variety of document image analysis algo-
rithms. In this paper the object-oriented storage model and the database system are presented in formal and functional domains. Moreover, the graphical user interface and a visual document image browser are described. The document analysis techniques used at document characterization are also
presented. In this context the documents consist of text, picture and other media (possibly embedded) data. Documents are stored in the database as document, page and region objects. Our test system has been implemented and tested using a document database of 10000 documents.},
 bibtype = {inProceedings},
 author = {Koivusaari M, Sauvola J & Pietikäinen M}
}

Downloads: 0