diff --git a/ocr_pyflow b/ocr_pyflow index 849c00c..3bb6bde 100755 --- a/ocr_pyflow +++ b/ocr_pyflow @@ -31,10 +31,6 @@ from pyflow import WorkflowRunner -ocropusnlbin_bin = "/usr/local/bin/ocropus-nlbin" - - - def parse_arguments(): parser = argparse.ArgumentParser( "Performs OCR of (historical) documents utilizing OCRopus for preprocessing and Tesseract OCR \ @@ -212,8 +208,7 @@ class OCRWorkflow(WorkflowRunner): ocropusnlbin_job_number = 0 for job in self.pdfImageJobs["images"] + self.pdfImageJobs["pdf"]: ocropusnlbin_job_number += 1 - cmd = "%s -Q %i -o %s %s" % ( - ocropusnlbin_bin, + cmd = "ocropus-nlbin -Q %i -o %s %s" % ( self.nCores, os.path.join(job["output_dir"], "tmp", "ocropus-nlbin"), os.path.join(job["output_dir"], "tmp", "tiff_files", os.path.basename(job["path"]).rsplit(".", 1)[0] + "-*.tif"))