From 708da35a196bbc3e53b92f3beb38fdce173f9cdf Mon Sep 17 00:00:00 2001 From: Patrick Jentsch Date: Wed, 13 Mar 2019 19:47:14 +0100 Subject: [PATCH] Update tei. --- hocrtotei | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/hocrtotei b/hocrtotei index 0da6f89..b2ba5d6 100755 --- a/hocrtotei +++ b/hocrtotei @@ -25,7 +25,7 @@ output_file.write('\n' + for input_file in input_files: tree = ET.parse(os.path.join(sys.argv[1], input_file)) - output_file.write(' \n' % (input_file.split(".")[0], input_file.split(".")[0])) + output_file.write(' \n' % (input_file.split(".")[0].split("-")[1])) for para in tree.findall(".//*[@class='ocr_par']"): output_file.write('

\n') for line in para.findall(".//*[@class='ocr_line']"):