% BibTeX bibliography database.
% Book on character recognition systems (library catalogue export).
% NOTE(review): the export lists one author and no publisher -- confirm any
% co-authors and the publisher against the catalogue record.
@book{2007Crs,
  author   = {Cheriet, Mohamed},
  title    = {Character recognition systems: a guide for students and practitioners},
  year     = {2007},
  isbn     = {9780471415701},
  url      = {https://permalink.obvsg.at/fho/AC06408992},
  urldate  = {2024-02-12},
  language = {english},
  keywords = {Optical character recognition devices},
}
|
|
% Conference proceedings volume (ICSCSP 2021), catalogued as a book.
% NOTE(review): Reddy is presumably the volume editor rather than the author --
% confirm and switch to an editor field if so.
@book{2022Scas,
  author   = {Reddy, V. Sivakumar},
  title    = {Soft computing and signal processing: proceedings of 4th {ICSCSP} 2021},
  year     = {2022},
  series   = {Advances in Intelligent Systems and Computing},
  isbn     = {981-16-7088-9},
  url      = {https://search-fho.obvsg.at/permalink/f/19351jn/FHO_alma5134174850004527},
  urldate  = {2024-02-12},
  language = {english},
  keywords = {Signal processing, Congresses},
}
|
|
% UML user guide (library catalogue export).
% The catalogue's "3. print.." denotes a printing, not an edition, so it is
% recorded as a note instead of in the edition field.
% NOTE(review): only one author and no publisher are given -- confirm both.
@book{BoochGrady1999Tuml,
  author   = {Booch, Grady},
  title    = {The unified modeling language user guide: {UML}},
  year     = {1999},
  series   = {Addison-Wesley object technology series},
  isbn     = {0201571684},
  url      = {https://permalink.obvsg.at/fho/AC08768402},
  urldate  = {2024-02-12},
  note     = {3rd printing},
  language = {english},
  keywords = {Computer software, Development},
}
|
|
% Book in the "Studies in Fuzziness and Soft Computing" series; the series
% number lives in its own field so styles can format it.
% NOTE(review): only the first author is listed -- confirm co-authors.
@book{ChaudhuriArindam2017OCRS,
  author   = {Chaudhuri, Arindam},
  title    = {Optical Character Recognition Systems for Different Languages with Soft Computing},
  year     = {2017},
  series   = {Studies in Fuzziness and Soft Computing},
  number   = {352},
  isbn     = {9783319502526},
  url      = {https://permalink.obvsg.at/fho/AC12323924},
  urldate  = {2024-02-12},
  language = {english},
  keywords = {Engineering},
}
|
|
% Open-access book published by IntechOpen.
% NOTE(review): Ding may be the volume editor rather than the author -- confirm.
@book{DingXiaoqing2012AiCR,
  author    = {Ding, Xiaoqing},
  title     = {Advances in Character Recognition},
  year      = {2012},
  publisher = {IntechOpen},
  isbn      = {953-51-5669-1},
  doi       = {10.5772/2575},
  url       = {https://www.intechopen.com/books/2182},
  urldate   = {2024-02-12},
  language  = {english},
  keywords  = {Optical character recognition},
}
|
|
% Conference paper describing the Tesseract OCR engine.
% The author is written in "Last, First" form so "Smith" is parsed as the
% surname; langid is english because the paper is written in English.
% NOTE(review): given name, booktitle and DOI were added from memory of the
% IEEE record -- verify against the url below.
@inproceedings{Smith2007,
  author    = {Smith, Ray},
  title     = {An Overview of the {Tesseract} {OCR} Engine},
  booktitle = {Ninth International Conference on Document Analysis and Recognition ({ICDAR} 2007)},
  date      = {2007},
  doi       = {10.1109/ICDAR.2007.4376991},
  url       = {https://ieeexplore.ieee.org/document/4376991},
  urldate   = {2024-02-12},
  langid    = {english},
}
|
|
% Web page: Tesseract documentation site.
@online{tessdoc,
  title    = {Tesseract Documentation},
  date     = {2023-05-23},
  url      = {https://tesseract-ocr.github.io/},
  urldate  = {2024-02-12},
  language = {english},
}
|
|
% Web page: ImageMagick project homepage.
@online{imagemagick,
  title    = {ImageMagick Homepage},
  date     = {2023-05-23},
  url      = {https://www.imagemagick.org/},
  urldate  = {2024-02-12},
  language = {english},
}
|
|
% Web page: Amazon Textract pricing.
@online{textract_pricing,
  title    = {Amazon Textract - Pricing},
  date     = {2023-05-23},
  url      = {https://aws.amazon.com/textract/pricing/},
  urldate  = {2024-02-12},
  language = {english},
}
|
|
% Web page: Amazon Textract product homepage.
@online{textract_home,
  title    = {Amazon Textract - Homepage},
  date     = {2023-05-23},
  url      = {https://aws.amazon.com/textract},
  urldate  = {2024-02-12},
  language = {english},
}
|
|
% Web page: Google Cloud Vision pricing.
@online{gcv_pricing,
  title    = {Google Cloud Vision - Pricing},
  date     = {2023-05-23},
  url      = {https://cloud.google.com/vision/pricing},
  urldate  = {2024-02-12},
  language = {english},
}
|
|
% Web page: Google Cloud Vision product homepage.
@online{gcv_home,
  title    = {Google Cloud Vision - Homepage},
  date     = {2023-05-23},
  url      = {https://cloud.google.com/vision},
  urldate  = {2024-02-12},
  language = {english},
}
|
|
% Web page: Azure AI Vision pricing.
@online{azurevision_pricing,
  title    = {Azure AI Vision - Pricing},
  date     = {2023-05-23},
  url      = {https://azure.microsoft.com/en-gb/pricing/details/cognitive-services/computer-vision/},
  urldate  = {2024-02-12},
  language = {english},
}
|
|
% Web page: Azure AI Vision product homepage.
@online{azurevision_home,
  title    = {Azure AI Vision - Homepage},
  date     = {2023-05-23},
  url      = {https://azure.microsoft.com/en-us/products/ai-services/ai-vision},
  urldate  = {2024-02-12},
  language = {english},
}
|
|
% Web page: IronOCR for .NET product homepage.
@online{ironocr_home,
  title    = {IronOCR for .NET - Homepage},
  date     = {2023-05-23},
  url      = {https://ironsoftware.com/csharp/ocr/},
  urldate  = {2024-02-12},
  language = {english},
}
|
|
% Web page: COPA-DATA zenon product homepage.
@online{copa-data_zenon,
  title    = {COPA-DATA zenon - Homepage},
  date     = {2023-05-23},
  url      = {https://www.copadata.com/en/product/zenon-software-platform-for-industrial-automation-energy-automation/},
  urldate  = {2024-02-12},
  language = {english},
}
|
|
% Web page: Tesseract source repository on GitHub.
@online{tessrepo,
  title    = {Tesseract Repository},
  date     = {2023-05-23},
  url      = {https://github.com/tesseract-ocr/tesseract},
  urldate  = {2024-01-04},
  language = {english},
}
|
|
% Journal article giving an overview of OCR and its applications.
% The first author's initials are spaced so each one is parsed separately.
% NOTE(review): the journal name is an abbreviation -- replace it with the
% full title once confirmed.
@article{asif2014overview,
  author  = {Asif, A. M. A. M. and Hannan, Shaikh Abdul and Perwej, Yusuf and Vithalrao, Mane Arjun},
  title   = {An overview and applications of optical character recognition},
  journal = {Int. J. Adv. Res. Sci. Eng.},
  year    = {2014},
  volume  = {3},
  number  = {7},
}
|
|
% Book chapter comparing cloud computing platforms for data analytics.
% Quotation marks are left to the bibliography style, not stored in the title.
% NOTE(review): the host book's title and publisher are missing from the
% record -- look them up via the DOI.
@inbook{cc_platforms_comparison,
  author = {Gupta, Urvashi and Sharma, Rohit},
  title  = {Comparison of Different Cloud Computing Platforms for Data Analytics},
  year   = {2023},
  month  = sep,
  doi    = {10.1007/978-981-99-3716-5_7},
  isbn   = {978-981-99-3715-8},
}
|
|
% Duplicate "tessdoc" entry removed here: an identical entry with the same
% citation key is defined earlier in this file, and a repeated key makes
% BibTeX/Biber report a "repeated entry" problem.
|
|
% Conference paper benchmarking cloud OCR services on Old Bailey page images.
% Both authors use "Last, First" form; the former year/month/day triple is
% folded into one ISO date because "day" is not a standard field.
% NOTE(review): booktitle was added from memory of the DOI record -- verify.
@inproceedings{the_old_bailey_and_ocr,
  author    = {Ughetta, William and Kernighan, Brian W.},
  title     = {The {Old Bailey} and {OCR}: Benchmarking {AWS}, {Azure}, and {GCP} with 180,000 Page Images},
  booktitle = {Proceedings of the {ACM} Symposium on Document Engineering 2020},
  date      = {2020-09-29},
  publisher = {Association for Computing Machinery},
  doi       = {10.1145/3395027.3419595},
  keywords  = {Amazon Web Services, Google Cloud Platform, Historical Documents, Microsoft Azure, Old Bailey, Optical Character Recognition},
  language  = {english},
}
|
|
% Overview text on optical character recognition.
% The scraped record had a CiteSeer address mangled into the journal field and
% a volume of 26 that belongs to no journal; the address is restored as a url
% and the volume dropped.
% NOTE(review): this looks like an institutional report -- confirm the real
% venue and upgrade the entry type accordingly.
@misc{eikvil1993optical,
  author = {Eikvil, Line},
  title  = {Optical character recognition},
  year   = {1993},
  url    = {http://citeseer.ist.psu.edu/142042.html},
}
|
|
% arXiv preprint surveying OCR systems.
% Authors are separated with "and"; the original comma list was parsed as a
% single person. The arXiv identifier is stored in the eprint fields.
% NOTE(review): given names were recalled from the arXiv record -- verify.
@online{islam2017survey,
  author     = {Islam, Noman and Islam, Zeeshan and Noor, Nazia},
  title      = {A survey on optical character recognition systems},
  year       = {2017},
  eprint     = {1710.05703},
  eprinttype = {arXiv},
}
|
|
% Chapter on natural language processing in a Springer book.
% The scraped author list repeated the author with a junk "KR1442" token, and
% the book title was stored as a journal name.
% NOTE(review): confirm that the chapter author also wrote the whole book;
% otherwise use incollection with an editor.
@inbook{chowdhary2020natural,
  author    = {Chowdhary, K. R.},
  title     = {Natural language processing},
  booktitle = {Fundamentals of Artificial Intelligence},
  year      = {2020},
  publisher = {Springer},
}
|
|
% Journal article on commercial applications of natural language processing.
% The url field only repeated the DOI resolver link, so the doi alone is kept;
% the journal name is written out in full.
@article{10.1145/219717.219778,
  author    = {Church, Kenneth W. and Rau, Lisa F.},
  title     = {Commercial Applications of Natural Language Processing},
  journal   = {Communications of the {ACM}},
  year      = {1995},
  volume    = {38},
  number    = {11},
  publisher = {Association for Computing Machinery},
  address   = {New York, NY, USA},
  issn      = {0001-0782},
  doi       = {10.1145/219717.219778},
  numpages  = {9},
}
|
|
% Journal survey of natural language processing research trends and tools.
% Single-letter given names carry a period so they print as initials.
@article{kalyanathaya2019advances,
  author  = {Kalyanathaya, Krishna Prakash and Akila, D. and Rajesh, P.},
  title   = {Advances in natural language processing: a survey of current research trends, development tools and industry applications},
  journal = {International Journal of Recent Technology and Engineering},
  year    = {2019},
  volume  = {7},
  number  = {5C},
}
|
|
% Workshop paper on statistical OCR error correction.
% TODO: complete this record (the original carried an inline todo marker,
% which is moved out here because a percent sign is not a comment inside an
% entry body).
@inproceedings{tong1996statistical,
  author    = {Tong, Xiang and Evans, David A.},
  title     = {A statistical approach to automatic {OCR} error correction in context},
  booktitle = {Fourth Workshop on Very Large Corpora},
  year      = {1996},
}
|
|
% Conference paper on metrics for evaluating OCR performance.
% The acronym is upper-cased and brace-protected so styles keep its case.
@inproceedings{karpinski2018metrics,
  author    = {Karpinski, Romain and Lohani, Devashish and Belaid, Abdel},
  title     = {Metrics for complete evaluation of {OCR} performance},
  booktitle = {{IPCV}'18-The 22nd Int'l Conf on Image Processing, Computer Vision, \& Pattern Recognition},
  year      = {2018},
}
|
|
% Survey article on approximate string matching.
% NOTE(review): the scraped record said year 2000, month 04, which conflicts
% with volume 33; year, month and issue below were recalled for that volume --
% verify against the DOI record.
@article{approximate_string_matching,
  author  = {Navarro, Gonzalo},
  title   = {A Guided Tour to Approximate String Matching},
  journal = {{ACM} Computing Surveys},
  year    = {2001},
  month   = mar,
  volume  = {33},
  number  = {1},
  doi     = {10.1145/375360.375365},
}
|
|
% Levenshtein's paper on codes correcting deletions, insertions and reversals.
% Completes the former todo stub, which had only a title and a surname.
% NOTE(review): author given name, journal, volume and number were recalled
% from the commonly cited English translation -- verify before publication.
@article{levenshtein1966binary,
  author  = {Levenshtein, Vladimir I.},
  title   = {Binary codes capable of correcting deletions, insertions, and reversals},
  journal = {Soviet Physics Doklady},
  year    = {1966},
  volume  = {10},
  number  = {8},
}
|
|
% Workshop paper on word error rate versus spoken language understanding.
% The IEEE catalogue number is dropped from the proceedings title.
@inproceedings{wang2003word,
  author       = {Wang, Ye-Yi and Acero, Alex and Chelba, Ciprian},
  title        = {Is word error rate a good indicator for spoken language understanding accuracy},
  booktitle    = {2003 {IEEE} Workshop on Automatic Speech Recognition and Understanding},
  year         = {2003},
  organization = {IEEE},
}
|
|
% Interspeech paper analysing word error rate and keyword error rate.
% The title's trailing period is removed because styles add punctuation; the
% former volume of 2008 merely repeated the year and is dropped.
@inproceedings{park2008empirical,
  author    = {Park, Youngja and Patwardhan, Siddharth and Visweswariah, Karthik and Gates, Stephen C.},
  title     = {An empirical analysis of word error rate and keyword error rate},
  booktitle = {Interspeech},
  year      = {2008},
}
|
|
% Journal article on convolution-based preprocessing for Tesseract 4.0.
% Product name and acronym are brace-protected against style recasing.
@article{sporici2020improving,
  author    = {Sporici, Dan and Cușnir, Elena and Boiangiu, Costin-Anton},
  title     = {Improving the accuracy of {Tesseract} 4.0 {OCR} engine using convolution-based preprocessing},
  journal   = {Symmetry},
  year      = {2020},
  volume    = {12},
  number    = {5},
  publisher = {MDPI},
}
|
|
% Journal article on image preprocessing for handwriting OCR with Tesseract.
% Product name and acronym are brace-protected against style recasing.
@article{mursari2021effectiveness,
  author  = {Mursari, Lily Rojabiyati and Wibowo, Antoni},
  title   = {The effectiveness of image preprocessing on digital handwritten scripts recognition with the implementation of {OCR} {Tesseract}},
  journal = {Computer Engineering and Applications Journal},
  year    = {2021},
  volume  = {10},
  number  = {3},
}
|
|
% Image source: histogram figure hosted on Wikimedia Commons.
% The corporate author is double-braced so it is not split into first/last name.
@image{unimodal-histogram,
  author  = {{Wikimedia Commons}},
  title   = {Histogram of tips given in a restaurant},
  year    = {2014},
  url     = {https://commons.wikimedia.org/wiki/File:Tips-histogram1.png},
  urldate = {2024-02-12},
}
|
|
% Image source: bimodal histogram figure hosted on Wikimedia Commons.
% The corporate author is double-braced so it is not split into first/last name.
@image{bimodal-histogram,
  author  = {{Wikimedia Commons}},
  title   = {Example of a histogram exhibiting bimodality},
  year    = {2014},
  url     = {https://commons.wikimedia.org/wiki/File:Bimodal-histogram.png},
  urldate = {2024-02-12},
}
|
|
% Journal article on measuring sister chromatid exchange frequency.
% The scraped publisher string fused publisher and city; they are split, and
% the title's trailing period is removed because styles add punctuation.
@article{zack1977automatic,
  author    = {Zack, Gregory W. and Rogers, William E. and Latt, Samuel A.},
  title     = {Automatic measurement of sister chromatid exchange frequency},
  journal   = {Journal of Histochemistry \& Cytochemistry},
  year      = {1977},
  volume    = {25},
  number    = {7},
  publisher = {SAGE Publications},
  address   = {Los Angeles, CA},
}
|
|
% Journal article on entropy-based gray-level thresholding.
% The journal name is capitalised as a proper title, and glued initials are
% spaced so each one is parsed separately.
@article{kapur1985new,
  author    = {Kapur, Jagat Narain and Sahoo, Prasanna K. and Wong, Andrew K. C.},
  title     = {A new method for gray-level picture thresholding using the entropy of the histogram},
  journal   = {Computer Vision, Graphics, and Image Processing},
  year      = {1985},
  volume    = {29},
  number    = {3},
  publisher = {Elsevier},
}
|
|
% Journal article on threshold selection from gray-level histograms.
% The journal name is capitalised as a proper title with its acronym protected.
@article{otsu1979threshold,
  author    = {Otsu, Nobuyuki},
  title     = {A threshold selection method from gray-level histograms},
  journal   = {{IEEE} Transactions on Systems, Man, and Cybernetics},
  year      = {1979},
  volume    = {9},
  number    = {1},
  publisher = {IEEE},
}
|
|
% Journal survey of thresholding techniques.
% The journal name is capitalised as a proper title, and glued initials are
% spaced so each one is parsed separately.
@article{sahoo1988survey,
  author    = {Sahoo, Prasanna K. and Soltani, S. A. K. C. and Wong, Andrew K. C.},
  title     = {A survey of thresholding techniques},
  journal   = {Computer Vision, Graphics, and Image Processing},
  year      = {1988},
  volume    = {41},
  number    = {2},
  publisher = {Elsevier},
}
|
|
% Journal article on automatic identification of stop words.
% The scraped publisher string fused publisher and city; they are split, and
% the journal name is capitalised as a proper title.
@article{wilbur1992automatic,
  author    = {Wilbur, W. John and Sirotkin, Karl},
  title     = {The automatic identification of stop words},
  journal   = {Journal of Information Science},
  year      = {1992},
  volume    = {18},
  number    = {1},
  publisher = {SAGE Publications},
  address   = {Thousand Oaks, CA},
}
|