mirror of
				https://gitlab.ub.uni-bielefeld.de/sfb1288inf/nlp.git
				synced 2025-10-31 10:52:46 +00:00 
			
		
		
		
	Fix check_encoding functionality
This commit is contained in:
		
							
								
								
									
										8
									
								
								nlp
									
									
									
									
									
								
							
							
						
						
									
										8
									
								
								nlp
									
									
									
									
									
								
							| @@ -45,7 +45,7 @@ def parse_arguments(): | |||||||
|                         action='store_true', |                         action='store_true', | ||||||
|                         default=False, |                         default=False, | ||||||
|                         dest="check_encoding", |                         dest="check_encoding", | ||||||
|                         help='''if used the nlp process will know hat the encoding of  |                         help='''if used the nlp process will know hat the encoding of | ||||||
|                         the input files is unkown and thus != utf-8. The process will |                         the input files is unkown and thus != utf-8. The process will | ||||||
|                         try to determine the encoding of the input files and use this. |                         try to determine the encoding of the input files and use this. | ||||||
|                         encoding.''' |                         encoding.''' | ||||||
| @@ -60,7 +60,7 @@ class NLPWorkflow(WorkflowRunner): | |||||||
|         self.n_cores = args.n_cores |         self.n_cores = args.n_cores | ||||||
|         self.output_dir = args.output_dir |         self.output_dir = args.output_dir | ||||||
|         self.zip = args.zip |         self.zip = args.zip | ||||||
|         self.check_encoding |         self.check_encoding = args.check_encoding | ||||||
|  |  | ||||||
|     def workflow(self): |     def workflow(self): | ||||||
|         if len(self.jobs) == 0: |         if len(self.jobs) == 0: | ||||||
| @@ -95,8 +95,8 @@ class NLPWorkflow(WorkflowRunner): | |||||||
|             cmd = 'spacy_nlp -l "{}" "{}" "{}" "{}"'.format( |             cmd = 'spacy_nlp -l "{}" "{}" "{}" "{}"'.format( | ||||||
|                 self.lang, |                 self.lang, | ||||||
|                 job['path'], |                 job['path'], | ||||||
|                 os.path.join(job['output_dir'], job['name'] + '.vrt', |                 os.path.join(job['output_dir'], job['name'] + '.vrt'), | ||||||
|                 if self.check_encoding "--check-encoding" else "") |                 "--check-encoding" if self.check_encoding else "" | ||||||
|             ) |             ) | ||||||
|             nlp_jobs.append( |             nlp_jobs.append( | ||||||
|                 self.addTask( |                 self.addTask( | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user