Correcting OCR errors for German in Fraktur font. Généreux, M., Stemle, E. W., Nicolas, L., & Lyding, V. December 2014. abstract bibtex In this paper, we present ongoing experiments for correcting OCR errors on German newspapers in Fraktur font. Our approach borrows from techniques for spelling correction in context using a probabilistic edit-operation error model and lexical resources. We highlight conditions in which high error reduction rates can be obtained and where the approach currently stands with real data.
@comment{Talk at CLiC-it 2014, Pisa. The entry key is taken from the
  citation_key field of this record. The fields from type onward appear to be
  export metadata from a reference manager; standard styles ignore unknown
  field names. The editors value is a serialization artifact, not a list of
  names: the real editor names are absent from this record and need to be
  re-entered from the proceedings.}
@misc{GenereuxStemleNicolasLyding2014,
  author        = {Généreux, Michel and Stemle, Egon W. and Nicolas, Lionel and Lyding, Verena},
  title         = {Correcting {OCR} errors for {German} in {Fraktur} font},
  howpublished  = {Talk at the First Italian Conference on Computational Linguistics (CLiC-it 2014)},
  year          = {2014},
  month         = dec,
  pages         = {2--5},
  url           = {http://clic.humnet.unipi.it/proceedings/vol1/CLICIT2014136.pdf},
  city          = {Pisa, Italy},
  abstract      = {In this paper, we present ongoing experiments for correcting OCR errors on German newspapers in Fraktur font. Our approach borrows from techniques for spelling correction in context using a probabilistic edit-operation error model and lexical resources. We highlight conditions in which high error reduction rates can be obtained and where the approach currently stands with real data.},
  type          = {misc},
  editors       = {[object Object],[object Object],[object Object]},
  id            = {0df2463b-0a0e-3297-96a8-5969b86fbd4b},
  created       = {2015-09-14T10:58:45.000Z},
  file_attached = {false},
  profile_id    = {94be607e-c433-369f-af1e-99020f3fddbe},
  group_id      = {336b6408-ac60-3ac5-acc3-f17c991bd54f},
  last_modified = {2015-09-23T10:56:34.000Z},
  tags          = {LT},
  read          = {true},
  starred       = {false},
  authored      = {false},
  confirmed     = {true},
  hidden        = {false},
  citation_key  = {GenereuxStemleNicolasLyding2014},
  source_type   = {TALK},
  user_context  = {talk},
  bibtype       = {misc},
}
Downloads: 0
{"_id":"yNNhENpaC94vPr5Wr","bibbaseid":"gnreux-stemle-nicolas-lyding-correctingocrerrorsforgermaninfrakturfont-2014","downloads":0,"creationDate":"2015-09-02T16:29:26.329Z","title":"Correcting OCR errors for German in Fraktur font","author_short":["Généreux, M.","Stemle, E., W.","Nicolas, L.","Lyding, V."],"year":2014,"bibtype":"misc","biburl":null,"bibdata":{"title":"Correcting OCR errors for German in Fraktur font","type":"misc","year":"2014","source":"Talk at the First Italian Conference on Computational Linguistics (CLiC-it 2014)","pages":"2-5","websites":"http://clic.humnet.unipi.it/proceedings/vol1/CLICIT2014136.pdf","month":"12","city":"Pisa, Italy","editors":"[object Object],[object Object],[object Object]","id":"0df2463b-0a0e-3297-96a8-5969b86fbd4b","created":"2015-09-14T10:58:45.000Z","file_attached":false,"profile_id":"94be607e-c433-369f-af1e-99020f3fddbe","group_id":"336b6408-ac60-3ac5-acc3-f17c991bd54f","last_modified":"2015-09-23T10:56:34.000Z","tags":"LT","read":"true","starred":false,"authored":false,"confirmed":"true","hidden":false,"citation_key":"GenereuxStemleNicolasLyding2014","source_type":"TALK","user_context":"talk","abstract":"In this paper, we present ongoing experiments for correcting OCR errors on German newspapers in Fraktur font. Our approach borrows from techniques for spelling correction in context using a probabilistic edit-operation error model and lexical resources. We highlight conditions in which high error reduction rates can be obtained and where the approach currently stands with real data.","bibtype":"misc","author":"Généreux, Michel and Stemle, Egon W. 
and Nicolas, Lionel and Lyding, Verena","bibtex":"@misc{\n title = {Correcting OCR errors for German in Fraktur font},\n type = {misc},\n year = {2014},\n source = {Talk at the First Italian Conference on Computational Linguistics (CLiC-it 2014)},\n pages = {2-5},\n websites = {http://clic.humnet.unipi.it/proceedings/vol1/CLICIT2014136.pdf},\n month = {12},\n city = {Pisa, Italy},\n editors = {[object Object],[object Object],[object Object]},\n id = {0df2463b-0a0e-3297-96a8-5969b86fbd4b},\n created = {2015-09-14T10:58:45.000Z},\n file_attached = {false},\n profile_id = {94be607e-c433-369f-af1e-99020f3fddbe},\n group_id = {336b6408-ac60-3ac5-acc3-f17c991bd54f},\n last_modified = {2015-09-23T10:56:34.000Z},\n tags = {LT},\n read = {true},\n starred = {false},\n authored = {false},\n confirmed = {true},\n hidden = {false},\n citation_key = {GenereuxStemleNicolasLyding2014},\n source_type = {TALK},\n user_context = {talk},\n abstract = {In this paper, we present ongoing experiments for correcting OCR errors on German newspapers in Fraktur font. Our approach borrows from techniques for spelling correction in context using a probabilistic edit-operation error model and lexical resources. We highlight conditions in which high error reduction rates can be obtained and where the approach currently stands with real data.},\n bibtype = {misc},\n author = {Généreux, Michel and Stemle, Egon W. and Nicolas, Lionel and Lyding, Verena}\n}","author_short":["Généreux, M.","Stemle, E., W.","Nicolas, L.","Lyding, V."],"bibbaseid":"gnreux-stemle-nicolas-lyding-correctingocrerrorsforgermaninfrakturfont-2014","role":"author","urls":{},"downloads":0},"search_terms":["correcting","ocr","errors","german","fraktur","font","généreux","stemle","nicolas","lyding"],"keywords":[],"authorIDs":[]}