mirror of
https://gitlab.ub.uni-bielefeld.de/sfb1288inf/ocr.git
synced 2024-12-26 04:54:18 +00:00
Some cosmetics
This commit is contained in:
parent
880f0efcf9
commit
c1f5252633
9
ocr
9
ocr
@ -16,12 +16,17 @@ import os
|
||||
import re
|
||||
import sys
|
||||
from pyflow import WorkflowRunner
|
||||
from zipfile import ZipFile
|
||||
|
||||
|
||||
def parse_arguments():
|
||||
parser = argparse.ArgumentParser(
|
||||
description='Performs OCR of (historical) documents utilizing OCRopus for preprocessing and Tesseract OCR for OCR. The results are served as hOCR, PDF, raw text and TEI compliant XML files.\nSoftware requirements: imagemagick, ocropus, pdftoppm, pdfunite, poppler-utils, pyflow, python2.7, python3.5, tesseract'
|
||||
description='''Performs OCR of (historical) documents utilizing OCRopus
|
||||
for preprocessing and Tesseract OCR for OCR. The results
|
||||
are served as hOCR, PDF, raw text and TEI compliant XML
|
||||
files.\n
|
||||
Software requirements: imagemagick, ocropus, pdftoppm,
|
||||
pdfunite, poppler-utils, pyflow, python2.7, python3.5,
|
||||
tesseract'''
|
||||
)
|
||||
parser.add_argument(
|
||||
'-i',
|
||||
|
Loading…
Reference in New Issue
Block a user