diff --git a/hocrtotei b/hocrtotei index b2ba5d6..ee492d7 100755 --- a/hocrtotei +++ b/hocrtotei @@ -25,7 +25,7 @@ output_file.write('\n' + for input_file in input_files: tree = ET.parse(os.path.join(sys.argv[1], input_file)) - output_file.write(' \n' % (input_file.split(".")[0].split("-")[1])) + output_file.write(' \n' % (input_file.split(".")[0])) for para in tree.findall(".//*[@class='ocr_par']"): output_file.write('

\n') for line in para.findall(".//*[@class='ocr_line']"):