fixed data for markup

This commit is contained in:
Stephan Porada
2019-02-22 23:52:59 +01:00
parent 4b670ac98c
commit cd9016f2b1
6 changed files with 13968 additions and 408377 deletions

View File

@@ -31,17 +31,8 @@ date_string = [\d\t ]*Deutscher Bundestag (?:|—|-|--) \d{1,2} ?\. Wahlperio
multiline_comment = \B\([^\(\)]* ; [^\(\)]*\)\B ; kommentar
[File paths]
nlp_output = /home/stephan/Desktop/tmp_test/nlp_output
nlp_input = /home/stephan/Desktop/tmp_test/nlp_output/nlp_beuatiful_xml/
nlp_lemmatized_tokenized = /home/stephan/Desktop/tmp_test/nlp_output/lemmatized
tmp_path = /home/stephan/Desktop/tmp_test/nlp_output/lemmatized/tmp
nlp_beuatiful_xml = /home/stephan/Desktop/tmp_test/nlp_output/nlp_beuatiful_xml
input_folder_xmls = /home/stephan/Desktop/18_Wahlperiode_2013-2017/
output_folder = /home/stephan/Desktop/output
input_folder_xmls = /home/stephan/Desktop/18_Wahlperiode_2013-2017/
new_metadata = /home/stephan/Desktop/output/new_metadata
new_simple_markup = /home/stephan/Desktop/output/simple_xml
complex_markup = /home/stephan/Desktop/tmp_test/output/complex_markup
clear_speech_markup = /home/stephan/Desktop/tmp_test/output/clear_speech_markup
beautiful_xml = /home/stephan/Desktop/tmp_test/output/beautiful_xml
fixed_markup = /home/stephan/Repos/master_thesis/data/working_data/id_fixed/fixed_markup

File diff suppressed because it is too large. (Load Diff)