diff --git a/spacy-nlp b/spacy-nlp
index 7dde3ac..d55bfa0 100755
--- a/spacy-nlp
+++ b/spacy-nlp
@@ -27,14 +27,12 @@ parser.add_argument('-c', '--check-encoding',
                     help='Check encoding of the input file, UTF-8 is used instead')  # noqa
 args = parser.parse_args()
 
-if args.check_encoding:
-    with open(args.input, "rb") as text_file:
-        if args.check_encoding:
-            encoding = chardet.detect(text_file.read())['encoding']
-        else:
-            encoding = 'utf-8'
-
 with open(args.input, "rb") as text_file:
+    if args.check_encoding:
+        encoding = chardet.detect(text_file.read())['encoding']
+    else:
+        encoding = 'utf-8'
+    text_file.seek(0)
     text_md5 = hashlib.md5()
     for chunk in iter(lambda: text_file.read(128 * text_md5.block_size), b''):
         text_md5.update(chunk)