Patch for references.bib: completes author, venue, page and identifier
metadata for existing entries. Corporate authors are double-braced so they
are treated as a single literal name; month uses the bare three-letter macro.
Field indentation inside hunks is reconstructed (original whitespace was lost).

diff --git a/references.bib b/references.bib
index ed9f20e..8588955 100644
--- a/references.bib
+++ b/references.bib
@@ -2,12 +2,13 @@
   title = {An overview and applications of optical character recognition},
   author = {Asif, AMAM and Hannan, Shaikh Abdul and Perwej, Yusuf and Vithalrao, Mane Arjun},
   year = 2014,
-  journal = {Int. J. Adv. Res. Sci. Eng},
+  journal = {International Journal of Advance Research In Science And Engineering},
   volume = 3,
   number = 7
 }
 @online{azurevision_home,
   title = {Azure AI Vision - Homepage},
+  author = {{Microsoft Corporation}},
   url = {https://azure.microsoft.com/en-us/products/ai-services/ai-vision},
   urldate = {2024-02-12},
   date = {2023-05-23},
@@ -15,6 +16,7 @@
 }
 @online{azurevision_pricing,
   title = {Azure AI Vision - Pricing},
+  author = {{Microsoft Corporation}},
   url = {https://azure.microsoft.com/en-gb/pricing/details/cognitive-services/computer-vision/},
   urldate = {2024-02-12},
   date = {2023-05-23},
@@ -37,7 +39,7 @@
 }
 @article{chowdhary2020natural,
   title = {Natural language processing},
-  author = {Chowdhary, KR1442 and Chowdhary, KR},
+  author = {Chowdhary, K. R.},
   year = 2020,
   journal = {Fundamentals of artificial intelligence},
   publisher = {Springer}
@@ -58,6 +60,7 @@
 }
 @online{copa-data_zenon,
   title = {COPA-DATA zenon - Homepage},
+  author = {{Ing. Punzenberger COPA-DATA GmbH}},
   url = {https://www.copadata.com/en/product/zenon-software-platform-for-industrial-automation-energy-automation/},
   urldate = {2024-02-12},
   date = {2023-05-23},
@@ -84,6 +87,7 @@
 }
 @online{gcv_home,
   title = {Google Cloud Vision - Homepage},
+  author = {{Google LLC}},
   url = {https://cloud.google.com/vision},
   urldate = {2024-02-12},
   date = {2023-05-23},
@@ -91,6 +95,7 @@
 }
 @online{gcv_pricing,
   title = {Google Cloud Vision - Pricing},
+  author = {{Google LLC}},
   url = {https://cloud.google.com/vision/pricing},
   urldate = {2024-02-12},
   date = {2023-05-23},
@@ -98,6 +103,7 @@
 }
 @online{imagemagick,
   title = {ImageMagick Homepage},
+  author = {{ImageMagick Studio LLC}},
   url = {https://www.imagemagick.org/},
   urldate = {2024-02-12},
   date = {2023-05-23},
@@ -105,6 +111,7 @@
 }
 @online{ironocr_home,
   title = {IronOCR for .NET - Homepage},
+  author = {{Iron Software LLC}},
   url = {https://ironsoftware.com/csharp/ocr/},
   urldate = {2024-02-12},
   date = {2023-05-23},
@@ -112,9 +119,10 @@
 }
 @article{islam2017survey,
   title = {A survey on optical character recognition systems},
-  author = {Islam, Islam, Noor},
+  author = {Islam, Noman and Islam, Zeeshan and Noor, Nazia},
+  doi = {10.48550/arXiv.1710.05703},
   year = 2017,
-  journal = {arXiv preprint arXiv:1710.05703}
+  journal = {arXiv preprint}
 }
 @article{kalyanathaya2019advances,
   title = {Advances in natural language processing: a survey of current research trends, development tools and industry applications},
@@ -137,11 +145,18 @@
   title = {Metrics for complete evaluation of ocr performance},
   author = {Karpinski, Romain and Lohani, Devashish and Belaid, Abdel},
   year = 2018,
-  booktitle = {IPCV'18-The 22nd Int'l Conf on Image Processing, Computer Vision, \& Pattern Recognition}
+  booktitle = {IPCV'18 - The 22nd Int'l Conf on Image Processing, Computer Vision, \& Pattern Recognition},
+  url = {https://inria.hal.science/hal-01981731}
 }
 @inproceedings{levenshtein1966binary,
-  title = {Binary codes capable of correcting deletions, insertions, and reversals},
-  author = {Levenshtein}
+  title = {Binary codes capable of correcting deletions, insertions, and reversals},
+  author = {Levenshtein, Vladimir I.},
+  booktitle = {Soviet physics doklady},
+  volume = 10,
+  number = 8,
+  pages = {707--710},
+  year = 1966,
+  organization = {Soviet Union}
 }
 @article{mursari2021effectiveness,
   title = {The effectiveness of image preprocessing on digital handwritten scripts recognition with the implementation of OCR Tesseract},
@@ -157,6 +172,8 @@
   year = 1979,
   journal = {IEEE transactions on systems, man, and cybernetics},
   publisher = {IEEE},
+  doi = {10.1109/TSMC.1979.4310076},
+  url = {https://ieeexplore.ieee.org/document/4310076},
   volume = 9,
   number = 1
 }
@@ -164,8 +181,9 @@
   title = {An empirical analysis of word error rate and keyword error rate.},
   author = {Park, Youngja and Patwardhan, Siddharth and Visweswariah, Karthik and Gates, Stephen C},
   year = 2008,
   booktitle = {Interspeech},
-  volume = 2008
+  month = 9,
+  doi = {10.21437/Interspeech.2008-537}
 }
 @article{sahoo1988survey,
   title = {A survey of thresholding techniques},
@@ -178,10 +196,13 @@
 }
 @inproceedings{Smith2007,
   title = {An Overview of the Tesseract OCR Engine},
-  author = {Smith R.},
+  author = {Smith, Ray},
+  booktitle = {Ninth international conference on document analysis and recognition (ICDAR 2007)},
   url = {https://ieeexplore.ieee.org/document/4376991},
   urldate = {2024-02-12},
   date = 2007,
+  organization = {IEEE},
+  volume = 2,
   langid = {ngerman}
 }
 @article{sporici2020improving,
@@ -202,6 +223,7 @@
 }
 @online{tessrepo,
   title = {Tesseract Repository},
+  author = {{tesseract-ocr}},
   url = {https://github.com/tesseract-ocr/tesseract},
   urldate = {2024-01-04},
   date = {2023-05-23},
@@ -210,6 +232,7 @@
 @online{textract_home,
   title = {Amazon Textract - Homepage},
   url = {https://aws.amazon.com/textract},
+  author = {{Amazon Web Services, Inc.}},
   urldate = {2024-02-12},
   date = {2023-05-23},
   language = {eng}
@@ -217,6 +240,7 @@
 @online{textract_pricing,
   title = {Amazon Textract - Pricing},
   url = {https://aws.amazon.com/textract/pricing/},
+  author = {{Amazon Web Services, Inc.}},
   urldate = {2024-02-12},
   date = {2023-05-23},
   language = {eng}
@@ -232,12 +256,18 @@
   keywords = {Amazon Web Services, Google Cloud Platform, Historical Documents, Microsoft Azure, Old Bailey, Optical Character Recognition},
   language = {English (US)}
 }
-@inproceedings{tong1996statistical,
-  title = {A statistical approach to automatic OCR error correction in context},
-  author = {Tong, Xiang and Evans, David A},
-  year = 1996,
-  booktitle = {Fourth workshop on very large corpora}
+@inproceedings{tong1996statistical,
+  title = {A Statistical Approach to Automatic OCR Error Correction in Context},
+  author = {Tong, Xiang and Evans, David A.},
+  editor = {Scott, Donia},
+  booktitle = {Fourth Workshop on Very Large Corpora},
+  month = jun,
+  year = 1996,
+  address = {Herstmonceux Castle, Sussex, UK},
+  publisher = {Association for Computational Linguistics},
+  url = {https://aclanthology.org/W96-0108},
 }
+
 @image{unimodal-histogram,
   title = {Histogram of tips given in a restaurant},
   author = {Wikimedia Commons},
@@ -250,6 +280,7 @@
   author = {Wang, Ye-Yi and Acero, Alex and Chelba, Ciprian},
   year = 2003,
   booktitle = {2003 IEEE workshop on automatic speech recognition and understanding (IEEE Cat. No. 03EX721)},
+  pages = {577--582},
   organization = {IEEE}
 }
 @article{wilbur1992automatic,