Rework corpus analysis list building part 1

This commit is contained in:
Stephan Porada
2020-01-23 16:00:48 +01:00
parent 88873c8aee
commit 87d6380e22
4 changed files with 650 additions and 162 deletions

View File

@ -45,7 +45,7 @@ def corpus_analysis(message):
# Prepare and execute a query
corpus_name = 'CORPUS'
query = str(message['query'])
result_len = 100
result_len = 200
context_len = int(message['context'])
result_offset = 0
client.select_corpus(corpus_name)
@ -60,19 +60,20 @@ def corpus_analysis(message):
context_len=context_len,
result_offset=result_offset)
result_offset += result_len # initial offset is advanced by result_len because client.show_query_results has already been executed once
socketio.emit('corpus_analysis', results, room=request.sid)
while result_offset < client.total_nr_matches:
logger.warning('====== While loop start for {} ======'.format(query))
logger.warning('result_offset: {}'.format(result_offset))
results_append = client.show_query_results(result_len=result_len,
context_len=context_len,
result_offset=result_offset)
results['matches'].extend(results_append['matches'])
results['cpos_lookup'].update(results_append['cpos_lookup'])
results['text_lookup'].update(results_append['text_lookup'])
results = client.show_query_results(result_len=result_len,
context_len=context_len,
result_offset=result_offset)
# results['matches'].extend(results_append['matches'])
# results['cpos_lookup'].update(results_append['cpos_lookup'])
# results['text_lookup'].update(results_append['text_lookup'])
result_offset += result_len
result_offset = min(result_offset, client.total_nr_matches)
logger.warning('result_offset end of while loop: {}'.format(result_offset))
socketio.emit('corpus_analysis', results, room=request.sid)
socketio.emit('corpus_analysis', results, room=request.sid)
@socketio.on('inspect_match')