mirror of
https://gitlab.ub.uni-bielefeld.de/sfb1288inf/nopaque.git
synced 2025-01-17 13:30:34 +00:00
Compare commits
6 Commits
07103ee4e5
...
912bd7da07
Author | SHA1 | Date | |
---|---|---|---|
|
912bd7da07 | ||
|
e21ef2422d | ||
|
c52c966863 | ||
|
a7a948908f | ||
|
3a97b1a07a | ||
|
315b538c30 |
@ -16,5 +16,4 @@ def before_request():
|
|||||||
pass
|
pass
|
||||||
|
|
||||||
|
|
||||||
from . import cli, cqi_over_socketio, files, followers, routes, json_routes
|
from . import cli, cqi_over_sio, files, followers, routes, json_routes
|
||||||
from . import cqi_over_sio
|
|
||||||
|
@ -8,6 +8,14 @@ from typing import Callable, Dict, List
|
|||||||
from app import socketio
|
from app import socketio
|
||||||
from app.decorators import socketio_login_required
|
from app.decorators import socketio_login_required
|
||||||
from . import NAMESPACE as ns
|
from . import NAMESPACE as ns
|
||||||
|
from .extensions import (
|
||||||
|
corpus_update_db,
|
||||||
|
corpus_static_data,
|
||||||
|
corpus_paginate_corpus,
|
||||||
|
cqp_paginate_subcorpus,
|
||||||
|
cqp_partial_export_subcorpus,
|
||||||
|
cqp_export_subcorpus,
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
CQI_API_FUNCTIONS: List[str] = [
|
CQI_API_FUNCTIONS: List[str] = [
|
||||||
@ -56,15 +64,21 @@ CQI_API_FUNCTIONS: List[str] = [
|
|||||||
'ctrl_ping',
|
'ctrl_ping',
|
||||||
'ctrl_user_abort'
|
'ctrl_user_abort'
|
||||||
]
|
]
|
||||||
|
CQI_NOPAQUE_FUNCTIONS: Dict[str, Callable] = {
|
||||||
|
'nopaque_corpus_update_db': corpus_update_db,
|
||||||
|
'nopaque_corpus_static_data': corpus_static_data,
|
||||||
|
'nopaque_corpus_paginate_corpus': corpus_paginate_corpus,
|
||||||
|
'nopaque_cqp_paginate_subcorpus': cqp_paginate_subcorpus,
|
||||||
|
'nopaque_cqp_partial_export_subcorpus': cqp_partial_export_subcorpus,
|
||||||
|
'nopaque_cqp_export_subcorpus': cqp_export_subcorpus,
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi_client.api', namespace=ns)
|
@socketio.on('cqi', namespace=ns)
|
||||||
@socketio_login_required
|
@socketio_login_required
|
||||||
def cqi_over_sio(fn_data):
|
def cqi_over_sio(fn_data):
|
||||||
try:
|
try:
|
||||||
fn_name: str = fn_data['fn_name']
|
fn_name: str = fn_data['fn_name']
|
||||||
if fn_name not in CQI_API_FUNCTIONS:
|
|
||||||
raise KeyError
|
|
||||||
except KeyError:
|
except KeyError:
|
||||||
return {'code': 400, 'msg': 'Bad Request'}
|
return {'code': 400, 'msg': 'Bad Request'}
|
||||||
fn_name: str = fn_data['fn_name']
|
fn_name: str = fn_data['fn_name']
|
||||||
@ -74,7 +88,13 @@ def cqi_over_sio(fn_data):
|
|||||||
cqi_client_lock: Lock = session['cqi_over_sio']['cqi_client_lock']
|
cqi_client_lock: Lock = session['cqi_over_sio']['cqi_client_lock']
|
||||||
except KeyError:
|
except KeyError:
|
||||||
return {'code': 424, 'msg': 'Failed Dependency'}
|
return {'code': 424, 'msg': 'Failed Dependency'}
|
||||||
|
if fn_name in CQI_API_FUNCTIONS:
|
||||||
fn: Callable = getattr(cqi_client.api, fn_name)
|
fn: Callable = getattr(cqi_client.api, fn_name)
|
||||||
|
elif fn_name in CQI_NOPAQUE_FUNCTIONS:
|
||||||
|
fn_args['cqi_client'] = cqi_client
|
||||||
|
fn: Callable = CQI_NOPAQUE_FUNCTIONS[fn_name]
|
||||||
|
else:
|
||||||
|
return {'code': 400, 'msg': 'Bad Request'}
|
||||||
for param in signature(fn).parameters.values():
|
for param in signature(fn).parameters.values():
|
||||||
if param.default is param.empty:
|
if param.default is param.empty:
|
||||||
if param.name not in fn_args:
|
if param.name not in fn_args:
|
||||||
|
243
app/corpora/cqi_over_sio/extensions/__init__.py
Normal file
243
app/corpora/cqi_over_sio/extensions/__init__.py
Normal file
@ -0,0 +1,243 @@
|
|||||||
|
from collections import Counter
|
||||||
|
from cqi import CQiClient
|
||||||
|
from cqi.status import StatusOk
|
||||||
|
from flask import session
|
||||||
|
from typing import Dict
|
||||||
|
import json
|
||||||
|
import math
|
||||||
|
import os
|
||||||
|
from app import db
|
||||||
|
from app.models import Corpus
|
||||||
|
from .utils import lookups_by_cpos, export_subcorpus, partial_export_subcorpus
|
||||||
|
|
||||||
|
|
||||||
|
def corpus_update_db(cqi_client: CQiClient, corpus: str):
|
||||||
|
db_corpus = Corpus.query.get(session['cqi_over_sio']['corpus_id'])
|
||||||
|
cqi_corpus = cqi_client.corpora.get(corpus)
|
||||||
|
db_corpus.num_tokens = cqi_corpus.size
|
||||||
|
db.session.commit()
|
||||||
|
return StatusOk()
|
||||||
|
|
||||||
|
|
||||||
|
def corpus_static_data(cqi_client: CQiClient, corpus: str) -> Dict:
|
||||||
|
db_corpus = Corpus.query.get(session['cqi_over_sio']['corpus_id'])
|
||||||
|
static_corpus_data_file = os.path.join(db_corpus.path, 'cwb', 'static.json')
|
||||||
|
if os.path.exists(static_corpus_data_file):
|
||||||
|
with open(static_corpus_data_file, 'r') as f:
|
||||||
|
return json.load(f)
|
||||||
|
cqi_corpus = cqi_client.corpora.get(corpus)
|
||||||
|
##########################################################################
|
||||||
|
# A faster way to get cpos boundaries for smaller s_attrs #
|
||||||
|
##########################################################################
|
||||||
|
# cqi_corpus.query('Last', '<s> []* </s>;')
|
||||||
|
# cqi_subcorpus = cqi_corpus.subcorpora.get('Last')
|
||||||
|
# print(cqi_subcorpus.size)
|
||||||
|
# first_match = 0
|
||||||
|
# last_match = cqi_subcorpus.attrs['size'] - 1
|
||||||
|
# match_boundaries = zip(
|
||||||
|
# list(range(first_match, last_match + 1)),
|
||||||
|
# cqi_subcorpus.dump(cqi_subcorpus.attrs['fields']['match'], first_match, last_match),
|
||||||
|
# cqi_subcorpus.dump(cqi_subcorpus.attrs['fields']['matchend'], first_match, last_match)
|
||||||
|
# )
|
||||||
|
# for x in match_boundaries:
|
||||||
|
# print(x)
|
||||||
|
cqi_p_attrs = {
|
||||||
|
p_attr.name: p_attr
|
||||||
|
for p_attr in cqi_corpus.positional_attributes.list()
|
||||||
|
}
|
||||||
|
cqi_s_attrs = {
|
||||||
|
s_attr.name: s_attr
|
||||||
|
for s_attr in cqi_corpus.structural_attributes.list()
|
||||||
|
}
|
||||||
|
static_corpus_data = {
|
||||||
|
'corpus': {
|
||||||
|
'bounds': [0, cqi_corpus.size - 1],
|
||||||
|
'counts': {
|
||||||
|
'token': cqi_corpus.size
|
||||||
|
},
|
||||||
|
'freqs': {}
|
||||||
|
},
|
||||||
|
'p_attrs': {},
|
||||||
|
's_attrs': {},
|
||||||
|
'values': {'p_attrs': {}, 's_attrs': {}}
|
||||||
|
}
|
||||||
|
for p_attr in cqi_p_attrs.values():
|
||||||
|
static_corpus_data['corpus']['freqs'][p_attr.name] = dict(
|
||||||
|
zip(
|
||||||
|
range(0, p_attr.lexicon_size),
|
||||||
|
p_attr.freqs_by_ids(list(range(0, p_attr.lexicon_size)))
|
||||||
|
)
|
||||||
|
)
|
||||||
|
static_corpus_data['p_attrs'][p_attr.name] = dict(
|
||||||
|
zip(
|
||||||
|
range(0, cqi_corpus.size),
|
||||||
|
p_attr.ids_by_cpos(list(range(0, cqi_corpus.size)))
|
||||||
|
)
|
||||||
|
)
|
||||||
|
static_corpus_data['values']['p_attrs'][p_attr.name] = dict(
|
||||||
|
zip(
|
||||||
|
range(0, p_attr.lexicon_size),
|
||||||
|
p_attr.values_by_ids(list(range(0, p_attr.lexicon_size)))
|
||||||
|
)
|
||||||
|
)
|
||||||
|
for s_attr in cqi_s_attrs.values():
|
||||||
|
if s_attr.has_values:
|
||||||
|
continue
|
||||||
|
static_corpus_data['corpus']['counts'][s_attr.name] = s_attr.size
|
||||||
|
static_corpus_data['s_attrs'][s_attr.name] = {'lexicon': {}, 'values': None}
|
||||||
|
static_corpus_data['values']['s_attrs'][s_attr.name] = {}
|
||||||
|
for id in range(0, s_attr.size):
|
||||||
|
static_corpus_data['s_attrs'][s_attr.name]['lexicon'][id] = {}
|
||||||
|
lbound, rbound = s_attr.cpos_by_id(id)
|
||||||
|
static_corpus_data['s_attrs'][s_attr.name]['lexicon'][id]['bounds'] = [lbound, rbound]
|
||||||
|
static_corpus_data['s_attrs'][s_attr.name]['lexicon'][id]['counts'] = {}
|
||||||
|
static_corpus_data['s_attrs'][s_attr.name]['lexicon'][id]['counts']['token'] = rbound - lbound + 1
|
||||||
|
if s_attr.name not in ['text', 's']:
|
||||||
|
continue
|
||||||
|
cpos_range = range(lbound, rbound + 1)
|
||||||
|
static_corpus_data['s_attrs'][s_attr.name]['lexicon'][id]['counts']['ent'] = len({x for x in cqi_s_attrs['ent'].ids_by_cpos(list(cpos_range)) if x != -1})
|
||||||
|
if s_attr.name != 'text':
|
||||||
|
continue
|
||||||
|
static_corpus_data['s_attrs'][s_attr.name]['lexicon'][id]['counts']['s'] = len({x for x in cqi_s_attrs['s'].ids_by_cpos(list(cpos_range)) if x != -1})
|
||||||
|
static_corpus_data['s_attrs'][s_attr.name]['lexicon'][id]['freqs'] = {}
|
||||||
|
for p_attr in cqi_p_attrs.values():
|
||||||
|
static_corpus_data['s_attrs'][s_attr.name]['lexicon'][id]['freqs'][p_attr.name] = dict(Counter(p_attr.ids_by_cpos(list(cpos_range))))
|
||||||
|
sub_s_attrs = cqi_corpus.structural_attributes.list(filters={'part_of': s_attr})
|
||||||
|
s_attr_value_names = [
|
||||||
|
sub_s_attr.name[(len(s_attr.name) + 1):]
|
||||||
|
for sub_s_attr in sub_s_attrs
|
||||||
|
]
|
||||||
|
sub_s_attr_values = [
|
||||||
|
sub_s_attr.values_by_ids(list(range(0, s_attr.size)))
|
||||||
|
for sub_s_attr in sub_s_attrs
|
||||||
|
]
|
||||||
|
static_corpus_data['s_attrs'][s_attr.name]['values'] = s_attr_value_names
|
||||||
|
static_corpus_data['values']['s_attrs'][s_attr.name] = {
|
||||||
|
s_attr_id: {
|
||||||
|
s_attr_value_name: sub_s_attr_values[s_attr_value_name_idx][s_attr_id_idx]
|
||||||
|
for s_attr_value_name_idx, s_attr_value_name in enumerate(
|
||||||
|
static_corpus_data['s_attrs'][s_attr.name]['values']
|
||||||
|
)
|
||||||
|
} for s_attr_id_idx, s_attr_id in enumerate(range(0, s_attr.size))
|
||||||
|
}
|
||||||
|
with open(static_corpus_data_file, 'w') as f:
|
||||||
|
json.dump(static_corpus_data, f)
|
||||||
|
return static_corpus_data
|
||||||
|
|
||||||
|
|
||||||
|
def corpus_paginate_corpus(
|
||||||
|
cqi_client: CQiClient,
|
||||||
|
corpus: str,
|
||||||
|
page: int = 1,
|
||||||
|
per_page: int = 20
|
||||||
|
) -> Dict:
|
||||||
|
cqi_corpus = cqi_client.corpora.get(corpus)
|
||||||
|
# Sanity checks
|
||||||
|
if (
|
||||||
|
per_page < 1
|
||||||
|
or page < 1
|
||||||
|
or (
|
||||||
|
cqi_corpus.size > 0
|
||||||
|
and page > math.ceil(cqi_corpus.size / per_page)
|
||||||
|
)
|
||||||
|
):
|
||||||
|
return {'code': 416, 'msg': 'Range Not Satisfiable'}
|
||||||
|
first_cpos = (page - 1) * per_page
|
||||||
|
last_cpos = min(cqi_corpus.size, first_cpos + per_page)
|
||||||
|
cpos_list = [*range(first_cpos, last_cpos)]
|
||||||
|
lookups = lookups_by_cpos(cqi_corpus, cpos_list)
|
||||||
|
payload = {}
|
||||||
|
# the items for the current page
|
||||||
|
payload['items'] = [cpos_list]
|
||||||
|
# the lookups for the items
|
||||||
|
payload['lookups'] = lookups
|
||||||
|
# the total number of items matching the query
|
||||||
|
payload['total'] = cqi_corpus.size
|
||||||
|
# the number of items to be displayed on a page.
|
||||||
|
payload['per_page'] = per_page
|
||||||
|
# The total number of pages
|
||||||
|
payload['pages'] = math.ceil(payload['total'] / payload['per_page'])
|
||||||
|
# the current page number (1 indexed)
|
||||||
|
payload['page'] = page if payload['pages'] > 0 else None
|
||||||
|
# True if a previous page exists
|
||||||
|
payload['has_prev'] = payload['page'] > 1 if payload['page'] else False
|
||||||
|
# True if a next page exists.
|
||||||
|
payload['has_next'] = payload['page'] < payload['pages'] if payload['page'] else False # noqa
|
||||||
|
# Number of the previous page.
|
||||||
|
payload['prev_num'] = payload['page'] - 1 if payload['has_prev'] else None
|
||||||
|
# Number of the next page
|
||||||
|
payload['next_num'] = payload['page'] + 1 if payload['has_next'] else None
|
||||||
|
return payload
|
||||||
|
|
||||||
|
|
||||||
|
def cqp_paginate_subcorpus(
|
||||||
|
cqi_client: CQiClient,
|
||||||
|
subcorpus: str,
|
||||||
|
context: int = 50,
|
||||||
|
page: int = 1,
|
||||||
|
per_page: int = 20
|
||||||
|
) -> Dict:
|
||||||
|
corpus_name, subcorpus_name = subcorpus.split(':', 1)
|
||||||
|
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
||||||
|
cqi_subcorpus = cqi_corpus.subcorpora.get(subcorpus_name)
|
||||||
|
# Sanity checks
|
||||||
|
if (
|
||||||
|
per_page < 1
|
||||||
|
or page < 1
|
||||||
|
or (
|
||||||
|
cqi_subcorpus.size > 0
|
||||||
|
and page > math.ceil(cqi_subcorpus.size / per_page)
|
||||||
|
)
|
||||||
|
):
|
||||||
|
return {'code': 416, 'msg': 'Range Not Satisfiable'}
|
||||||
|
offset = (page - 1) * per_page
|
||||||
|
cutoff = per_page
|
||||||
|
cqi_results_export = export_subcorpus(
|
||||||
|
cqi_subcorpus, context=context, cutoff=cutoff, offset=offset)
|
||||||
|
payload = {}
|
||||||
|
# the items for the current page
|
||||||
|
payload['items'] = cqi_results_export.pop('matches')
|
||||||
|
# the lookups for the items
|
||||||
|
payload['lookups'] = cqi_results_export
|
||||||
|
# the total number of items matching the query
|
||||||
|
payload['total'] = cqi_subcorpus.size
|
||||||
|
# the number of items to be displayed on a page.
|
||||||
|
payload['per_page'] = per_page
|
||||||
|
# The total number of pages
|
||||||
|
payload['pages'] = math.ceil(payload['total'] / payload['per_page'])
|
||||||
|
# the current page number (1 indexed)
|
||||||
|
payload['page'] = page if payload['pages'] > 0 else None
|
||||||
|
# True if a previous page exists
|
||||||
|
payload['has_prev'] = payload['page'] > 1 if payload['page'] else False
|
||||||
|
# True if a next page exists.
|
||||||
|
payload['has_next'] = payload['page'] < payload['pages'] if payload['page'] else False # noqa
|
||||||
|
# Number of the previous page.
|
||||||
|
payload['prev_num'] = payload['page'] - 1 if payload['has_prev'] else None
|
||||||
|
# Number of the next page
|
||||||
|
payload['next_num'] = payload['page'] + 1 if payload['has_next'] else None
|
||||||
|
return payload
|
||||||
|
|
||||||
|
|
||||||
|
def cqp_partial_export_subcorpus(
|
||||||
|
cqi_client: CQiClient,
|
||||||
|
subcorpus: str,
|
||||||
|
match_id_list: list,
|
||||||
|
context: int = 50
|
||||||
|
) -> Dict:
|
||||||
|
corpus_name, subcorpus_name = subcorpus.split(':', 1)
|
||||||
|
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
||||||
|
cqi_subcorpus = cqi_corpus.subcorpora.get(subcorpus_name)
|
||||||
|
cqi_subcorpus_partial_export = partial_export_subcorpus(cqi_subcorpus, match_id_list, context=context)
|
||||||
|
return cqi_subcorpus_partial_export
|
||||||
|
|
||||||
|
|
||||||
|
def cqp_export_subcorpus(
|
||||||
|
cqi_client: CQiClient,
|
||||||
|
subcorpus: str,
|
||||||
|
context: int = 50
|
||||||
|
) -> Dict:
|
||||||
|
corpus_name, subcorpus_name = subcorpus.split(':', 1)
|
||||||
|
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
||||||
|
cqi_subcorpus = cqi_corpus.subcorpora.get(subcorpus_name)
|
||||||
|
cqi_subcorpus_export = export_subcorpus(cqi_subcorpus, context=context)
|
||||||
|
return cqi_subcorpus_export
|
@ -1,64 +1,9 @@
|
|||||||
from flask import session
|
from typing import Dict, List
|
||||||
from functools import wraps
|
from cqi.models.corpora import Corpus
|
||||||
from inspect import signature
|
from cqi.models.subcorpora import Subcorpus
|
||||||
import cqi
|
|
||||||
|
|
||||||
|
|
||||||
def cqi_over_socketio(f):
|
def lookups_by_cpos(corpus: Corpus, cpos_list: List[int]) -> Dict:
|
||||||
@wraps(f)
|
|
||||||
def wrapped(*args):
|
|
||||||
if 'd' not in session:
|
|
||||||
return {'code': 424, 'msg': 'Failed Dependency'}
|
|
||||||
f_args = {}
|
|
||||||
# Check for missing args and if all provided args are of the right type
|
|
||||||
for param in signature(f).parameters.values():
|
|
||||||
if param.name == 'corpus_name':
|
|
||||||
f_args[param.name] = f'NOPAQUE_{session["d"]["corpus_id"]}'
|
|
||||||
continue
|
|
||||||
if param.name == 'cqi_client':
|
|
||||||
f_args[param.name] = session['d']['cqi_client']
|
|
||||||
continue
|
|
||||||
if param.default is param.empty:
|
|
||||||
# args
|
|
||||||
if param.name not in args[0]:
|
|
||||||
return {'code': 400, 'msg': 'Bad Request'}
|
|
||||||
arg = args[0][param.name]
|
|
||||||
if type(arg) is not param.annotation:
|
|
||||||
return {'code': 400, 'msg': 'Bad Request'}
|
|
||||||
f_args[param.name] = arg
|
|
||||||
else:
|
|
||||||
# kwargs
|
|
||||||
if param.name not in args[0]:
|
|
||||||
continue
|
|
||||||
arg = args[0][param.name]
|
|
||||||
if type(arg) is not param.annotation:
|
|
||||||
return {'code': 400, 'msg': 'Bad Request'}
|
|
||||||
f_args[param.name] = arg
|
|
||||||
session['d']['cqi_client_lock'].acquire()
|
|
||||||
try:
|
|
||||||
return_value = f(**f_args)
|
|
||||||
except BrokenPipeError:
|
|
||||||
return_value = {
|
|
||||||
'code': 500,
|
|
||||||
'msg': 'Internal Server Error'
|
|
||||||
}
|
|
||||||
except cqi.errors.CQiException as e:
|
|
||||||
return_value = {
|
|
||||||
'code': 500,
|
|
||||||
'msg': 'Internal Server Error',
|
|
||||||
'payload': {
|
|
||||||
'code': e.code,
|
|
||||||
'desc': e.description,
|
|
||||||
'msg': e.__class__.__name__
|
|
||||||
}
|
|
||||||
}
|
|
||||||
finally:
|
|
||||||
session['d']['cqi_client_lock'].release()
|
|
||||||
return return_value
|
|
||||||
return wrapped
|
|
||||||
|
|
||||||
|
|
||||||
def lookups_by_cpos(corpus, cpos_list):
|
|
||||||
lookups = {}
|
lookups = {}
|
||||||
lookups['cpos_lookup'] = {cpos: {} for cpos in cpos_list}
|
lookups['cpos_lookup'] = {cpos: {} for cpos in cpos_list}
|
||||||
for attr in corpus.positional_attributes.list():
|
for attr in corpus.positional_attributes.list():
|
||||||
@ -93,18 +38,22 @@ def lookups_by_cpos(corpus, cpos_list):
|
|||||||
return lookups
|
return lookups
|
||||||
|
|
||||||
|
|
||||||
def partial_export_subcorpus(subcorpus, match_id_list, context=25):
|
def partial_export_subcorpus(
|
||||||
if subcorpus.attrs['size'] == 0:
|
subcorpus: Subcorpus,
|
||||||
|
match_id_list: List[int],
|
||||||
|
context: int = 25
|
||||||
|
) -> Dict:
|
||||||
|
if subcorpus.size == 0:
|
||||||
return {"matches": []}
|
return {"matches": []}
|
||||||
match_boundaries = []
|
match_boundaries = []
|
||||||
for match_id in match_id_list:
|
for match_id in match_id_list:
|
||||||
if match_id < 0 or match_id >= subcorpus.attrs['size']:
|
if match_id < 0 or match_id >= subcorpus.size:
|
||||||
continue
|
continue
|
||||||
match_boundaries.append(
|
match_boundaries.append(
|
||||||
(
|
(
|
||||||
match_id,
|
match_id,
|
||||||
subcorpus.dump(subcorpus.attrs['fields']['match'], match_id, match_id)[0],
|
subcorpus.dump(subcorpus.fields['match'], match_id, match_id)[0],
|
||||||
subcorpus.dump(subcorpus.attrs['fields']['matchend'], match_id, match_id)[0]
|
subcorpus.dump(subcorpus.fields['matchend'], match_id, match_id)[0]
|
||||||
)
|
)
|
||||||
)
|
)
|
||||||
cpos_set = set()
|
cpos_set = set()
|
||||||
@ -120,14 +69,14 @@ def partial_export_subcorpus(subcorpus, match_id_list, context=25):
|
|||||||
lc_rbound = match_start - 1
|
lc_rbound = match_start - 1
|
||||||
lc = (lc_lbound, lc_rbound)
|
lc = (lc_lbound, lc_rbound)
|
||||||
cpos_list_lbound = lc_lbound
|
cpos_list_lbound = lc_lbound
|
||||||
if match_end == (subcorpus.collection.corpus.attrs['size'] - 1) or context == 0:
|
if match_end == (subcorpus.collection.corpus.size - 1) or context == 0:
|
||||||
rc = None
|
rc = None
|
||||||
cpos_list_rbound = match_end
|
cpos_list_rbound = match_end
|
||||||
else:
|
else:
|
||||||
rc_lbound = match_end + 1
|
rc_lbound = match_end + 1
|
||||||
rc_rbound = min(
|
rc_rbound = min(
|
||||||
(match_end + context),
|
(match_end + context),
|
||||||
(subcorpus.collection.corpus.attrs['size'] - 1)
|
(subcorpus.collection.corpus.size - 1)
|
||||||
)
|
)
|
||||||
rc = (rc_lbound, rc_rbound)
|
rc = (rc_lbound, rc_rbound)
|
||||||
cpos_list_rbound = rc_rbound
|
cpos_list_rbound = rc_rbound
|
||||||
@ -138,15 +87,20 @@ def partial_export_subcorpus(subcorpus, match_id_list, context=25):
|
|||||||
return {'matches': matches, **lookups}
|
return {'matches': matches, **lookups}
|
||||||
|
|
||||||
|
|
||||||
def export_subcorpus(subcorpus, context=25, cutoff=float('inf'), offset=0):
|
def export_subcorpus(
|
||||||
if subcorpus.attrs['size'] == 0:
|
subcorpus: Subcorpus,
|
||||||
|
context: int = 25,
|
||||||
|
cutoff: float = float('inf'),
|
||||||
|
offset: int = 0
|
||||||
|
) -> Dict:
|
||||||
|
if subcorpus.size == 0:
|
||||||
return {"matches": []}
|
return {"matches": []}
|
||||||
first_match = max(0, offset)
|
first_match = max(0, offset)
|
||||||
last_match = min((offset + cutoff - 1), (subcorpus.attrs['size'] - 1))
|
last_match = min((offset + cutoff - 1), (subcorpus.size - 1))
|
||||||
match_boundaries = zip(
|
match_boundaries = zip(
|
||||||
list(range(first_match, last_match + 1)),
|
range(first_match, last_match + 1),
|
||||||
subcorpus.dump(subcorpus.attrs['fields']['match'], first_match, last_match),
|
subcorpus.dump(subcorpus.fields['match'], first_match, last_match),
|
||||||
subcorpus.dump(subcorpus.attrs['fields']['matchend'], first_match, last_match)
|
subcorpus.dump(subcorpus.fields['matchend'], first_match, last_match)
|
||||||
)
|
)
|
||||||
cpos_set = set()
|
cpos_set = set()
|
||||||
matches = []
|
matches = []
|
||||||
@ -160,14 +114,14 @@ def export_subcorpus(subcorpus, context=25, cutoff=float('inf'), offset=0):
|
|||||||
lc_rbound = match_start - 1
|
lc_rbound = match_start - 1
|
||||||
lc = (lc_lbound, lc_rbound)
|
lc = (lc_lbound, lc_rbound)
|
||||||
cpos_list_lbound = lc_lbound
|
cpos_list_lbound = lc_lbound
|
||||||
if match_end == (subcorpus.collection.corpus.attrs['size'] - 1) or context == 0:
|
if match_end == (subcorpus.collection.corpus.size - 1) or context == 0:
|
||||||
rc = None
|
rc = None
|
||||||
cpos_list_rbound = match_end
|
cpos_list_rbound = match_end
|
||||||
else:
|
else:
|
||||||
rc_lbound = match_end + 1
|
rc_lbound = match_end + 1
|
||||||
rc_rbound = min(
|
rc_rbound = min(
|
||||||
(match_end + context),
|
(match_end + context),
|
||||||
(subcorpus.collection.corpus.attrs['size'] - 1)
|
(subcorpus.collection.corpus.size - 1)
|
||||||
)
|
)
|
||||||
rc = (rc_lbound, rc_rbound)
|
rc = (rc_lbound, rc_rbound)
|
||||||
cpos_list_rbound = rc_rbound
|
cpos_list_rbound = rc_rbound
|
@ -1,115 +0,0 @@
|
|||||||
from flask import session
|
|
||||||
from flask_login import current_user
|
|
||||||
from flask_socketio import ConnectionRefusedError
|
|
||||||
from threading import Lock
|
|
||||||
import cqi
|
|
||||||
from app import db, hashids, socketio
|
|
||||||
from app.decorators import socketio_login_required
|
|
||||||
from app.models import Corpus, CorpusStatus
|
|
||||||
|
|
||||||
|
|
||||||
'''
|
|
||||||
This package tunnels the Corpus Query interface (CQi) protocol through
|
|
||||||
Socket.IO (SIO) by wrapping each CQi function in a seperate SIO event.
|
|
||||||
|
|
||||||
This module only handles the SIO connect/disconnect, which handles the setup
|
|
||||||
and teardown of necessary ressources for later use. Each CQi function has a
|
|
||||||
corresponding SIO event. The event handlers are spread across the different
|
|
||||||
modules within this package.
|
|
||||||
|
|
||||||
Basic concept:
|
|
||||||
1. A client connects to the SIO namespace and provides the id of a corpus to be
|
|
||||||
analysed.
|
|
||||||
1.1 The analysis session counter of the corpus is incremented.
|
|
||||||
1.2 A CQiClient and a (Mutex) Lock belonging to it is created.
|
|
||||||
1.3 Wait until the CQP server is running.
|
|
||||||
1.4 Connect the CQiClient to the server.
|
|
||||||
1.5 Save the CQiClient and the Lock in the session for subsequential use.
|
|
||||||
2. A client emits an event and may provide a single json object with necessary
|
|
||||||
arguments for the targeted CQi function.
|
|
||||||
3. A SIO event handler (decorated with cqi_over_socketio) gets executed.
|
|
||||||
- The event handler function defines all arguments. Hence the client
|
|
||||||
is sent as a single json object, the decorator decomposes it to fit
|
|
||||||
the functions signature. This also includes type checking and proper
|
|
||||||
use of the lock (acquire/release) mechanism.
|
|
||||||
4. Wait for more events
|
|
||||||
5. The client disconnects from the SIO namespace
|
|
||||||
1.1 The analysis session counter of the corpus is decremented.
|
|
||||||
1.2 The CQiClient and (Mutex) Lock belonging to it are teared down.
|
|
||||||
'''
|
|
||||||
|
|
||||||
|
|
||||||
NAMESPACE = '/corpora/corpus/corpus_analysis'
|
|
||||||
|
|
||||||
|
|
||||||
# Import all CQi over Socket.IO event handlers
|
|
||||||
from .cqi_corpora_corpus_subcorpora import * # noqa
|
|
||||||
from .cqi_corpora_corpus_structural_attributes import * # noqa
|
|
||||||
from .cqi_corpora_corpus_positional_attributes import * # noqa
|
|
||||||
from .cqi_corpora_corpus_alignment_attributes import * # noqa
|
|
||||||
from .cqi_corpora_corpus import * # noqa
|
|
||||||
from .cqi_corpora import * # noqa
|
|
||||||
from .cqi import * # noqa
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('connect', namespace=NAMESPACE)
|
|
||||||
@socketio_login_required
|
|
||||||
def connect(auth):
|
|
||||||
# the auth variable is used in a hacky way. It contains the corpus id for
|
|
||||||
# which a corpus analysis session should be started.
|
|
||||||
corpus_id = hashids.decode(auth['corpus_id'])
|
|
||||||
corpus = Corpus.query.get(corpus_id)
|
|
||||||
if corpus is None:
|
|
||||||
# return {'code': 404, 'msg': 'Not Found'}
|
|
||||||
raise ConnectionRefusedError('Not Found')
|
|
||||||
if not (corpus.user == current_user
|
|
||||||
or current_user.is_following_corpus(corpus)
|
|
||||||
or current_user.is_administrator()):
|
|
||||||
# return {'code': 403, 'msg': 'Forbidden'}
|
|
||||||
raise ConnectionRefusedError('Forbidden')
|
|
||||||
if corpus.status not in [
|
|
||||||
CorpusStatus.BUILT,
|
|
||||||
CorpusStatus.STARTING_ANALYSIS_SESSION,
|
|
||||||
CorpusStatus.RUNNING_ANALYSIS_SESSION,
|
|
||||||
CorpusStatus.CANCELING_ANALYSIS_SESSION
|
|
||||||
]:
|
|
||||||
# return {'code': 424, 'msg': 'Failed Dependency'}
|
|
||||||
raise ConnectionRefusedError('Failed Dependency')
|
|
||||||
if corpus.num_analysis_sessions is None:
|
|
||||||
corpus.num_analysis_sessions = 0
|
|
||||||
db.session.commit()
|
|
||||||
corpus.num_analysis_sessions = Corpus.num_analysis_sessions + 1
|
|
||||||
db.session.commit()
|
|
||||||
retry_counter = 20
|
|
||||||
while corpus.status != CorpusStatus.RUNNING_ANALYSIS_SESSION:
|
|
||||||
if retry_counter == 0:
|
|
||||||
corpus.num_analysis_sessions = Corpus.num_analysis_sessions - 1
|
|
||||||
db.session.commit()
|
|
||||||
return {'code': 408, 'msg': 'Request Timeout'}
|
|
||||||
socketio.sleep(3)
|
|
||||||
retry_counter -= 1
|
|
||||||
db.session.refresh(corpus)
|
|
||||||
cqi_client = cqi.CQiClient(f'cqpserver_{corpus_id}')
|
|
||||||
session['d'] = {
|
|
||||||
'corpus_id': corpus_id,
|
|
||||||
'cqi_client': cqi_client,
|
|
||||||
'cqi_client_lock': Lock(),
|
|
||||||
}
|
|
||||||
# return {'code': 200, 'msg': 'OK'}
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('disconnect', namespace=NAMESPACE)
|
|
||||||
def disconnect():
|
|
||||||
if 'd' not in session:
|
|
||||||
return
|
|
||||||
session['d']['cqi_client_lock'].acquire()
|
|
||||||
try:
|
|
||||||
session['d']['cqi_client'].disconnect()
|
|
||||||
except (BrokenPipeError, cqi.errors.CQiException):
|
|
||||||
pass
|
|
||||||
session['d']['cqi_client_lock'].release()
|
|
||||||
corpus = Corpus.query.get(session['d']['corpus_id'])
|
|
||||||
corpus.num_analysis_sessions = Corpus.num_analysis_sessions - 1
|
|
||||||
db.session.commit()
|
|
||||||
session.pop('d')
|
|
||||||
# return {'code': 200, 'msg': 'OK'}
|
|
@ -1,43 +0,0 @@
|
|||||||
from socket import gaierror
|
|
||||||
import cqi
|
|
||||||
from app import socketio
|
|
||||||
from app.decorators import socketio_login_required
|
|
||||||
from . import NAMESPACE as ns
|
|
||||||
from .utils import cqi_over_socketio
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.connect', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_connect(cqi_client: cqi.CQiClient):
|
|
||||||
try:
|
|
||||||
cqi_status = cqi_client.connect()
|
|
||||||
except gaierror as e:
|
|
||||||
return {
|
|
||||||
'code': 500,
|
|
||||||
'msg': 'Internal Server Error',
|
|
||||||
'payload': {'code': e.args[0], 'desc': e.args[1]}
|
|
||||||
}
|
|
||||||
payload = {'code': cqi_status.code,
|
|
||||||
'msg': cqi_status.__class__.__name__}
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.disconnect', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_disconnect(cqi_client: cqi.CQiClient):
|
|
||||||
cqi_status = cqi_client.disconnect()
|
|
||||||
payload = {'code': cqi_status.code,
|
|
||||||
'msg': cqi_status.__class__.__name__}
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.ping', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_ping(cqi_client: cqi.CQiClient):
|
|
||||||
cqi_status = cqi_client.ping()
|
|
||||||
payload = {'code': cqi_status.code,
|
|
||||||
'msg': cqi_status.__class__.__name__}
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
@ -1,22 +0,0 @@
|
|||||||
import cqi
|
|
||||||
from app import socketio
|
|
||||||
from app.decorators import socketio_login_required
|
|
||||||
from . import NAMESPACE as ns
|
|
||||||
from .utils import cqi_over_socketio
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.get', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_get(cqi_client: cqi.CQiClient, corpus_name: str):
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
payload = {**cqi_corpus.attrs}
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.list', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_list(cqi_client: cqi.CQiClient):
|
|
||||||
payload = [{**x.attrs} for x in cqi_client.corpora.list()]
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
@ -1,199 +0,0 @@
|
|||||||
from collections import Counter
|
|
||||||
from flask import session
|
|
||||||
import cqi
|
|
||||||
import json
|
|
||||||
import math
|
|
||||||
import os
|
|
||||||
from app import db, socketio
|
|
||||||
from app.decorators import socketio_login_required
|
|
||||||
from app.models import Corpus
|
|
||||||
from . import NAMESPACE as ns
|
|
||||||
from .utils import cqi_over_socketio, lookups_by_cpos
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.drop', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_drop(cqi_client: cqi.CQiClient, corpus_name: str):
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
cqi_status = cqi_corpus.drop()
|
|
||||||
payload = {'code': cqi_status.code,
|
|
||||||
'msg': cqi_status.__class__.__name__}
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.query', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_query(cqi_client: cqi.CQiClient, corpus_name: str, subcorpus_name: str, query: str): # noqa
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
cqi_status = cqi_corpus.query(subcorpus_name, query)
|
|
||||||
payload = {'code': cqi_status.code,
|
|
||||||
'msg': cqi_status.__class__.__name__}
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
||||||
|
|
||||||
|
|
||||||
###############################################################################
|
|
||||||
# nopaque specific CQi extensions #
|
|
||||||
###############################################################################
|
|
||||||
@socketio.on('cqi.corpora.corpus.update_db', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_update_db(cqi_client: cqi.CQiClient, corpus_name: str):
|
|
||||||
corpus = Corpus.query.get(session['d']['corpus_id'])
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
corpus.num_tokens = cqi_corpus.size
|
|
||||||
db.session.commit()
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.get_visualization_data', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_get_visualization_data(cqi_client: cqi.CQiClient, corpus_name: str):
|
|
||||||
corpus = Corpus.query.get(session['d']['corpus_id'])
|
|
||||||
visualization_data_file_path = os.path.join(corpus.path, 'cwb', 'visualization_data.json')
|
|
||||||
if os.path.exists(visualization_data_file_path):
|
|
||||||
with open(visualization_data_file_path, 'r') as f:
|
|
||||||
payload = json.load(f)
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
##########################################################################
|
|
||||||
# A faster way to get cpos boundaries for smaller s_attrs #
|
|
||||||
##########################################################################
|
|
||||||
# cqi_corpus.query('Last', '<s> []* </s>;')
|
|
||||||
# cqi_subcorpus = cqi_corpus.subcorpora.get('Last')
|
|
||||||
# print(cqi_subcorpus.size)
|
|
||||||
# first_match = 0
|
|
||||||
# last_match = cqi_subcorpus.attrs['size'] - 1
|
|
||||||
# match_boundaries = zip(
|
|
||||||
# list(range(first_match, last_match + 1)),
|
|
||||||
# cqi_subcorpus.dump(cqi_subcorpus.attrs['fields']['match'], first_match, last_match),
|
|
||||||
# cqi_subcorpus.dump(cqi_subcorpus.attrs['fields']['matchend'], first_match, last_match)
|
|
||||||
# )
|
|
||||||
# for x in match_boundaries:
|
|
||||||
# print(x)
|
|
||||||
cqi_p_attrs = {
|
|
||||||
p_attr.name: p_attr
|
|
||||||
for p_attr in cqi_corpus.positional_attributes.list()
|
|
||||||
}
|
|
||||||
cqi_s_attrs = {
|
|
||||||
s_attr.name: s_attr
|
|
||||||
for s_attr in cqi_corpus.structural_attributes.list()
|
|
||||||
}
|
|
||||||
payload = {
|
|
||||||
'corpus': {
|
|
||||||
'bounds': [0, cqi_corpus.size - 1],
|
|
||||||
'counts': {
|
|
||||||
'token': cqi_corpus.size
|
|
||||||
},
|
|
||||||
'freqs': {}
|
|
||||||
},
|
|
||||||
'p_attrs': {},
|
|
||||||
's_attrs': {},
|
|
||||||
'values': {'p_attrs': {}, 's_attrs': {}}
|
|
||||||
}
|
|
||||||
for p_attr in cqi_p_attrs.values():
|
|
||||||
payload['corpus']['freqs'][p_attr.name] = dict(
|
|
||||||
zip(
|
|
||||||
range(0, p_attr.lexicon_size),
|
|
||||||
p_attr.freqs_by_ids(list(range(0, p_attr.lexicon_size)))
|
|
||||||
)
|
|
||||||
)
|
|
||||||
payload['p_attrs'][p_attr.name] = dict(
|
|
||||||
zip(
|
|
||||||
range(0, cqi_corpus.size),
|
|
||||||
p_attr.ids_by_cpos(list(range(0, cqi_corpus.size)))
|
|
||||||
)
|
|
||||||
)
|
|
||||||
payload['values']['p_attrs'][p_attr.name] = dict(
|
|
||||||
zip(
|
|
||||||
range(0, p_attr.lexicon_size),
|
|
||||||
p_attr.values_by_ids(list(range(0, p_attr.lexicon_size)))
|
|
||||||
)
|
|
||||||
)
|
|
||||||
for s_attr in cqi_s_attrs.values():
|
|
||||||
if s_attr.has_values:
|
|
||||||
continue
|
|
||||||
payload['corpus']['counts'][s_attr.name] = s_attr.size
|
|
||||||
payload['s_attrs'][s_attr.name] = {'lexicon': {}, 'values': None}
|
|
||||||
payload['values']['s_attrs'][s_attr.name] = {}
|
|
||||||
for id in range(0, s_attr.size):
|
|
||||||
payload['s_attrs'][s_attr.name]['lexicon'][id] = {}
|
|
||||||
lbound, rbound = s_attr.cpos_by_id(id)
|
|
||||||
payload['s_attrs'][s_attr.name]['lexicon'][id]['bounds'] = [lbound, rbound]
|
|
||||||
payload['s_attrs'][s_attr.name]['lexicon'][id]['counts'] = {}
|
|
||||||
payload['s_attrs'][s_attr.name]['lexicon'][id]['counts']['token'] = rbound - lbound + 1
|
|
||||||
if s_attr.name not in ['text', 's']:
|
|
||||||
continue
|
|
||||||
cpos_range = range(lbound, rbound + 1)
|
|
||||||
payload['s_attrs'][s_attr.name]['lexicon'][id]['counts']['ent'] = len({x for x in cqi_s_attrs['ent'].ids_by_cpos(list(cpos_range)) if x != -1})
|
|
||||||
if s_attr.name != 'text':
|
|
||||||
continue
|
|
||||||
payload['s_attrs'][s_attr.name]['lexicon'][id]['counts']['s'] = len({x for x in cqi_s_attrs['s'].ids_by_cpos(list(cpos_range)) if x != -1})
|
|
||||||
payload['s_attrs'][s_attr.name]['lexicon'][id]['freqs'] = {}
|
|
||||||
for p_attr in cqi_p_attrs.values():
|
|
||||||
payload['s_attrs'][s_attr.name]['lexicon'][id]['freqs'][p_attr.name] = dict(Counter(p_attr.ids_by_cpos(list(cpos_range))))
|
|
||||||
sub_s_attrs = cqi_corpus.structural_attributes.list(filters={'part_of': s_attr})
|
|
||||||
s_attr_value_names = [
|
|
||||||
sub_s_attr.name[(len(s_attr.name) + 1):]
|
|
||||||
for sub_s_attr in sub_s_attrs
|
|
||||||
]
|
|
||||||
sub_s_attr_values = [
|
|
||||||
sub_s_attr.values_by_ids(list(range(0, s_attr.size)))
|
|
||||||
for sub_s_attr in sub_s_attrs
|
|
||||||
]
|
|
||||||
payload['s_attrs'][s_attr.name]['values'] = s_attr_value_names
|
|
||||||
payload['values']['s_attrs'][s_attr.name] = {
|
|
||||||
s_attr_id: {
|
|
||||||
s_attr_value_name: sub_s_attr_values[s_attr_value_name_idx][s_attr_id_idx]
|
|
||||||
for s_attr_value_name_idx, s_attr_value_name in enumerate(
|
|
||||||
payload['s_attrs'][s_attr.name]['values']
|
|
||||||
)
|
|
||||||
} for s_attr_id_idx, s_attr_id in enumerate(range(0, s_attr.size))
|
|
||||||
}
|
|
||||||
with open(visualization_data_file_path, 'w') as f:
|
|
||||||
json.dump(payload, f)
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.paginate', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_paginate(cqi_client: cqi.CQiClient, corpus_name: str, page: int = 1, per_page: int = 20): # noqa
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
# Sanity checks
|
|
||||||
if (
|
|
||||||
per_page < 1
|
|
||||||
or page < 1
|
|
||||||
or (
|
|
||||||
cqi_corpus.size > 0
|
|
||||||
and page > math.ceil(cqi_corpus.size / per_page)
|
|
||||||
)
|
|
||||||
):
|
|
||||||
return {'code': 416, 'msg': 'Range Not Satisfiable'}
|
|
||||||
first_cpos = (page - 1) * per_page
|
|
||||||
last_cpos = min(cqi_corpus.size, first_cpos + per_page)
|
|
||||||
cpos_list = [*range(first_cpos, last_cpos)]
|
|
||||||
lookups = lookups_by_cpos(cqi_corpus, cpos_list)
|
|
||||||
payload = {}
|
|
||||||
# the items for the current page
|
|
||||||
payload['items'] = [cpos_list]
|
|
||||||
# the lookups for the items
|
|
||||||
payload['lookups'] = lookups
|
|
||||||
# the total number of items matching the query
|
|
||||||
payload['total'] = cqi_corpus.size
|
|
||||||
# the number of items to be displayed on a page.
|
|
||||||
payload['per_page'] = per_page
|
|
||||||
# The total number of pages
|
|
||||||
payload['pages'] = math.ceil(payload['total'] / payload['per_page'])
|
|
||||||
# the current page number (1 indexed)
|
|
||||||
payload['page'] = page if payload['pages'] > 0 else None
|
|
||||||
# True if a previous page exists
|
|
||||||
payload['has_prev'] = payload['page'] > 1 if payload['page'] else False
|
|
||||||
# True if a next page exists.
|
|
||||||
payload['has_next'] = payload['page'] < payload['pages'] if payload['page'] else False # noqa
|
|
||||||
# Number of the previous page.
|
|
||||||
payload['prev_num'] = payload['page'] - 1 if payload['has_prev'] else None
|
|
||||||
# Number of the next page
|
|
||||||
payload['next_num'] = payload['page'] + 1 if payload['has_next'] else None
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
@ -1,24 +0,0 @@
|
|||||||
import cqi
|
|
||||||
from app import socketio
|
|
||||||
from app.decorators import socketio_login_required
|
|
||||||
from . import NAMESPACE as ns
|
|
||||||
from .utils import cqi_over_socketio
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.alignment_attributes.get', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_alignment_attributes_get(cqi_client: cqi.CQiClient, corpus_name: str, alignment_attribute_name: str): # noqa
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
cqi_alignment_attribute = cqi_corpus.alignment_attributes.get(alignment_attribute_name) # noqa
|
|
||||||
payload = {**cqi_alignment_attribute.attrs}
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.alignment_attributes.list', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_alignment_attributes_list(cqi_client: cqi.CQiClient, corpus_name: str): # noqa
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
payload = [{**x.attrs} for x in cqi_corpus.alignment_attributes.list()]
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
@ -1,24 +0,0 @@
|
|||||||
import cqi
|
|
||||||
from app import socketio
|
|
||||||
from app.decorators import socketio_login_required
|
|
||||||
from . import NAMESPACE as ns
|
|
||||||
from .utils import cqi_over_socketio
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.positional_attributes.get', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_positional_attributes_get(cqi_client: cqi.CQiClient, corpus_name: str, positional_attribute_name: str): # noqa
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
cqi_positional_attribute = cqi_corpus.positional_attributes.get(positional_attribute_name) # noqa
|
|
||||||
payload = {**cqi_positional_attribute.attrs}
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.positional_attributes.list', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_positional_attributes_list(cqi_client: cqi.CQiClient, corpus_name: str): # noqa
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
payload = [{**x.attrs} for x in cqi_corpus.positional_attributes.list()]
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
@ -1,24 +0,0 @@
|
|||||||
import cqi
|
|
||||||
from app import socketio
|
|
||||||
from app.decorators import socketio_login_required
|
|
||||||
from . import NAMESPACE as ns
|
|
||||||
from .utils import cqi_over_socketio
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.structural_attributes.get', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_structural_attributes_get(cqi_client: cqi.CQiClient, corpus_name: str, structural_attribute_name: str): # noqa
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
cqi_structural_attribute = cqi_corpus.structural_attributes.get(structural_attribute_name) # noqa
|
|
||||||
payload = {**cqi_structural_attribute.attrs}
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.structural_attributes.list', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_structural_attributes_list(cqi_client: cqi.CQiClient, corpus_name: str): # noqa
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
payload = [{**x.attrs} for x in cqi_corpus.structural_attributes.list()]
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
@ -1,140 +0,0 @@
|
|||||||
import cqi
|
|
||||||
import math
|
|
||||||
from app import socketio
|
|
||||||
from app.decorators import socketio_login_required
|
|
||||||
from . import NAMESPACE as ns
|
|
||||||
from .utils import cqi_over_socketio, export_subcorpus, partial_export_subcorpus
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.subcorpora.get', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_subcorpora_get(cqi_client: cqi.CQiClient, corpus_name: str, subcorpus_name: str): # noqa
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
cqi_subcorpus = cqi_corpus.subcorpora.get(subcorpus_name)
|
|
||||||
payload = {**cqi_subcorpus.attrs}
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.subcorpora.list', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_subcorpora_list(cqi_client: cqi.CQiClient, corpus_name: str): # noqa
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
payload = [{**x.attrs} for x in cqi_corpus.subcorpora.list()]
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.subcorpora.subcorpus.drop', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_subcorpora_subcorpus_drop(cqi_client: cqi.CQiClient, corpus_name: str, subcorpus_name: str): # noqa
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
cqi_subcorpus = cqi_corpus.subcorpora.get(subcorpus_name)
|
|
||||||
cqi_status = cqi_subcorpus.drop()
|
|
||||||
payload = {'code': cqi_status.code,
|
|
||||||
'msg': cqi_status.__class__.__name__}
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.subcorpora.subcorpus.dump', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_subcorpora_subcorpus_dump(cqi_client: cqi.CQiClient, corpus_name: str, subcorpus_name: str, field: int, first: int, last: int): # noqa
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
cqi_subcorpus = cqi_corpus.subcorpora.get(subcorpus_name)
|
|
||||||
payload = cqi_subcorpus.dump(field, first, last)
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.subcorpora.subcorpus.fdist_1', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_subcorpora_subcorpus_fdist_1(cqi_client: cqi.CQiClient, corpus_name: str, subcorpus_name: str, cutoff: int, field_name: str, positional_attribute_name: str): # noqa
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
cqi_subcorpus = cqi_corpus.subcorpora.get(subcorpus_name)
|
|
||||||
field = cqi_subcorpus.fields[field_name]
|
|
||||||
pos_attr = cqi_corpus.positional_attributes.get(positional_attribute_name)
|
|
||||||
payload = cqi_subcorpus.fdist_1(cutoff, field, pos_attr)
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.subcorpora.subcorpus.fdist_2', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_subcorpora_subcorpus_fdist_2(cqi_client: cqi.CQiClient, corpus_name: str, subcorpus_name: str, cutoff: int, field_1_name: str, positional_attribute_1_name: str, field_2_name: str, positional_attribute_2_name: str): # noqa
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
cqi_subcorpus = cqi_corpus.subcorpora.get(subcorpus_name)
|
|
||||||
field_1 = cqi_subcorpus.fields[field_1_name]
|
|
||||||
pos_attr_1 = cqi_corpus.positional_attributes.get(positional_attribute_1_name)
|
|
||||||
field_2 = cqi_subcorpus.fields[field_2_name]
|
|
||||||
pos_attr_2 = cqi_corpus.positional_attributes.get(positional_attribute_2_name)
|
|
||||||
payload = cqi_subcorpus.fdist_2(cutoff, field_1, pos_attr_1, field_2, pos_attr_2)
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
||||||
|
|
||||||
|
|
||||||
###############################################################################
|
|
||||||
# nopaque specific CQi extensions #
|
|
||||||
###############################################################################
|
|
||||||
@socketio.on('cqi.corpora.corpus.subcorpora.subcorpus.paginate', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_subcorpora_subcorpus_paginate(cqi_client: cqi.CQiClient, corpus_name: str, subcorpus_name: str, context: int = 50, page: int = 1, per_page: int = 20): # noqa
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
cqi_subcorpus = cqi_corpus.subcorpora.get(subcorpus_name)
|
|
||||||
# Sanity checks
|
|
||||||
if (
|
|
||||||
per_page < 1
|
|
||||||
or page < 1
|
|
||||||
or (
|
|
||||||
cqi_subcorpus.attrs['size'] > 0
|
|
||||||
and page > math.ceil(cqi_subcorpus.attrs['size'] / per_page)
|
|
||||||
)
|
|
||||||
):
|
|
||||||
return {'code': 416, 'msg': 'Range Not Satisfiable'}
|
|
||||||
offset = (page - 1) * per_page
|
|
||||||
cutoff = per_page
|
|
||||||
cqi_results_export = export_subcorpus(
|
|
||||||
cqi_subcorpus, context=context, cutoff=cutoff, offset=offset)
|
|
||||||
payload = {}
|
|
||||||
# the items for the current page
|
|
||||||
payload['items'] = cqi_results_export.pop('matches')
|
|
||||||
# the lookups for the items
|
|
||||||
payload['lookups'] = cqi_results_export
|
|
||||||
# the total number of items matching the query
|
|
||||||
payload['total'] = cqi_subcorpus.attrs['size']
|
|
||||||
# the number of items to be displayed on a page.
|
|
||||||
payload['per_page'] = per_page
|
|
||||||
# The total number of pages
|
|
||||||
payload['pages'] = math.ceil(payload['total'] / payload['per_page'])
|
|
||||||
# the current page number (1 indexed)
|
|
||||||
payload['page'] = page if payload['pages'] > 0 else None
|
|
||||||
# True if a previous page exists
|
|
||||||
payload['has_prev'] = payload['page'] > 1 if payload['page'] else False
|
|
||||||
# True if a next page exists.
|
|
||||||
payload['has_next'] = payload['page'] < payload['pages'] if payload['page'] else False # noqa
|
|
||||||
# Number of the previous page.
|
|
||||||
payload['prev_num'] = payload['page'] - 1 if payload['has_prev'] else None
|
|
||||||
# Number of the next page
|
|
||||||
payload['next_num'] = payload['page'] + 1 if payload['has_next'] else None
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': payload}
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.subcorpora.subcorpus.partial_export', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_subcorpora_subcorpus_partial_export(cqi_client: cqi.CQiClient, corpus_name: str, subcorpus_name: str, match_id_list: list, context: int = 50): # noqa
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
cqi_subcorpus = cqi_corpus.subcorpora.get(subcorpus_name)
|
|
||||||
cqi_subcorpus_partial_export = partial_export_subcorpus(cqi_subcorpus, match_id_list, context=context)
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': cqi_subcorpus_partial_export}
|
|
||||||
|
|
||||||
|
|
||||||
@socketio.on('cqi.corpora.corpus.subcorpora.subcorpus.export', namespace=ns)
|
|
||||||
@socketio_login_required
|
|
||||||
@cqi_over_socketio
|
|
||||||
def cqi_corpora_corpus_subcorpora_subcorpus_export(cqi_client: cqi.CQiClient, corpus_name: str, subcorpus_name: str, context: int = 50): # noqa
|
|
||||||
cqi_corpus = cqi_client.corpora.get(corpus_name)
|
|
||||||
cqi_subcorpus = cqi_corpus.subcorpora.get(subcorpus_name)
|
|
||||||
cqi_subcorpus_export = export_subcorpus(cqi_subcorpus, context=context)
|
|
||||||
return {'code': 200, 'msg': 'OK', 'payload': cqi_subcorpus_export}
|
|
File diff suppressed because it is too large
Load Diff
@ -26,25 +26,19 @@ class CorpusAnalysisApp {
|
|||||||
this.disableActionElements();
|
this.disableActionElements();
|
||||||
this.elements.m.initModal.open();
|
this.elements.m.initModal.open();
|
||||||
// Init data
|
// Init data
|
||||||
this.data.cQiClient = new CQiClient(this.settings.corpusId);
|
this.data.cqiClient = new cqi.CQiClient('/cqi_over_sio', this.settings.corpusId);
|
||||||
this.data.cQiClient.connect()
|
this.data.cqiClient.connect('anonymous', '')
|
||||||
.then(cQiStatus => {
|
.then((cqiStatus) => {
|
||||||
return this.data.cQiClient.corpora.get(`NOPAQUE_${this.settings.corpusId}`);
|
return this.data.cqiClient.corpora.list();
|
||||||
})
|
})
|
||||||
.then(
|
.then((cqiCorpora) => {
|
||||||
cQiCorpus => {
|
this.data.corpus = {o: cqiCorpora[0]};
|
||||||
this.data.corpus = {o: cQiCorpus};
|
console.log(this.data.corpus.o.staticData);
|
||||||
this.data.corpus.o.getVisualizationData()
|
this.renderGeneralCorpusInfo(this.data.corpus.o.staticData);
|
||||||
.then(
|
this.renderTextInfoList(this.data.corpus.o.staticData);
|
||||||
(data) => {
|
this.renderTextProportionsGraphic(this.data.corpus.o.staticData);
|
||||||
console.log(data);
|
this.renderFrequenciesGraphic(this.data.corpus.o.staticData);
|
||||||
this.renderGeneralCorpusInfo(data);
|
this.renderBoundsGraphic(this.data.corpus.o.staticData);
|
||||||
this.renderTextInfoList(data);
|
|
||||||
this.renderTextProportionsGraphic(data);
|
|
||||||
this.renderFrequenciesGraphic(data);
|
|
||||||
this.renderBoundsGraphic(data);
|
|
||||||
}
|
|
||||||
);
|
|
||||||
// this.data.corpus.o.getCorpusData()
|
// this.data.corpus.o.getCorpusData()
|
||||||
// .then(corpusData => {
|
// .then(corpusData => {
|
||||||
// console.log(corpusData);
|
// console.log(corpusData);
|
||||||
@ -55,19 +49,19 @@ class CorpusAnalysisApp {
|
|||||||
// this.renderBoundsGraphic(corpusData);
|
// this.renderBoundsGraphic(corpusData);
|
||||||
// });
|
// });
|
||||||
// TODO: Don't do this hgere
|
// TODO: Don't do this hgere
|
||||||
cQiCorpus.updateDb();
|
this.data.corpus.o.updateDb();
|
||||||
this.enableActionElements();
|
this.enableActionElements();
|
||||||
for (let extension of Object.values(this.extensions)) {extension.init();}
|
for (let extension of Object.values(this.extensions)) {extension.init();}
|
||||||
this.elements.m.initModal.close();
|
this.elements.m.initModal.close();
|
||||||
},
|
},
|
||||||
cQiError => {
|
(cqiError) => {
|
||||||
let errorsElement = this.elements.initModal.querySelector('.errors');
|
let errorsElement = this.elements.initModal.querySelector('.errors');
|
||||||
let progressElement = this.elements.initModal.querySelector('.progress');
|
let progressElement = this.elements.initModal.querySelector('.progress');
|
||||||
errorsElement.innerText = JSON.stringify(cQiError);
|
errorsElement.innerText = JSON.stringify(cqiError);
|
||||||
errorsElement.classList.remove('hide');
|
errorsElement.classList.remove('hide');
|
||||||
progressElement.classList.add('hide');
|
progressElement.classList.add('hide');
|
||||||
if ('payload' in cQiError && 'code' in cQiError.payload && 'msg' in cQiError.payload) {
|
if ('payload' in cqiError && 'code' in cqiError.payload && 'msg' in cqiError.payload) {
|
||||||
app.flash(`${cQiError.payload.code}: ${cQiError.payload.msg}`, 'error');
|
app.flash(`${cqiError.payload.code}: ${cqiError.payload.msg}`, 'error');
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
);
|
);
|
||||||
|
@ -45,18 +45,18 @@ class CorpusAnalysisConcordance {
|
|||||||
this.elements.progress.classList.remove('hide');
|
this.elements.progress.classList.remove('hide');
|
||||||
let subcorpus = {};
|
let subcorpus = {};
|
||||||
this.data.corpus.o.query(subcorpusName, query)
|
this.data.corpus.o.query(subcorpusName, query)
|
||||||
.then(cQiStatus => {
|
.then((cqiStatus) => {
|
||||||
subcorpus.q = query;
|
subcorpus.q = query;
|
||||||
subcorpus.selectedItems = new Set();
|
subcorpus.selectedItems = new Set();
|
||||||
if (subcorpusName !== 'Last') {this.data.subcorpora.Last = subcorpus;}
|
if (subcorpusName !== 'Last') {this.data.subcorpora.Last = subcorpus;}
|
||||||
return this.data.corpus.o.subcorpora.get(subcorpusName);
|
return this.data.corpus.o.subcorpora.get(subcorpusName);
|
||||||
})
|
})
|
||||||
.then(cQiSubcorpus => {
|
.then((cqiSubcorpus) => {
|
||||||
subcorpus.o = cQiSubcorpus;
|
subcorpus.o = cqiSubcorpus;
|
||||||
return cQiSubcorpus.paginate(1, this.settings.perPage, this.settings.context);
|
return cqiSubcorpus.paginate(this.settings.context, 1, this.settings.perPage);
|
||||||
})
|
})
|
||||||
.then(
|
.then(
|
||||||
paginatedSubcorpus => {
|
(paginatedSubcorpus) => {
|
||||||
subcorpus.p = paginatedSubcorpus;
|
subcorpus.p = paginatedSubcorpus;
|
||||||
this.data.subcorpora[subcorpusName] = subcorpus;
|
this.data.subcorpora[subcorpusName] = subcorpus;
|
||||||
this.settings.selectedSubcorpus = subcorpusName;
|
this.settings.selectedSubcorpus = subcorpusName;
|
||||||
@ -68,11 +68,12 @@ class CorpusAnalysisConcordance {
|
|||||||
this.elements.progress.classList.add('hide');
|
this.elements.progress.classList.add('hide');
|
||||||
this.app.enableActionElements();
|
this.app.enableActionElements();
|
||||||
},
|
},
|
||||||
cQiError => {
|
(cqiStatus) => {
|
||||||
this.elements.error.innerText = JSON.stringify(cQiError);
|
// TODDO: CHECK THIS!
|
||||||
|
this.elements.error.innerText = JSON.stringify(cqiStatus);
|
||||||
this.elements.error.classList.remove('hide');
|
this.elements.error.classList.remove('hide');
|
||||||
if ('payload' in cQiError && 'code' in cQiError.payload && 'msg' in cQiError.payload) {
|
if ('payload' in cqiStatus && 'code' in cqiStatus.payload && 'msg' in cqiStatus.payload) {
|
||||||
app.flash(`${cQiError.payload.code}: ${cQiError.payload.msg}`, 'error');
|
app.flash(`${cqiStatus.payload.code}: ${cqiStatus.payload.msg}`, 'error');
|
||||||
}
|
}
|
||||||
this.elements.progress.classList.add('hide');
|
this.elements.progress.classList.add('hide');
|
||||||
this.app.enableActionElements();
|
this.app.enableActionElements();
|
||||||
@ -236,7 +237,7 @@ class CorpusAnalysisConcordance {
|
|||||||
app.flash('No matches selected', 'error');
|
app.flash('No matches selected', 'error');
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
promise = subcorpus.o.partial_export([...subcorpus.selectedItems], 50);
|
promise = subcorpus.o.partialExport([...subcorpus.selectedItems], 50);
|
||||||
} else {
|
} else {
|
||||||
promise = subcorpus.o.export(50);
|
promise = subcorpus.o.export(50);
|
||||||
}
|
}
|
||||||
@ -291,7 +292,7 @@ class CorpusAnalysisConcordance {
|
|||||||
event.preventDefault();
|
event.preventDefault();
|
||||||
let subcorpus = this.data.subcorpora[this.settings.selectedSubcorpus];
|
let subcorpus = this.data.subcorpora[this.settings.selectedSubcorpus];
|
||||||
subcorpus.o.drop().then(
|
subcorpus.o.drop().then(
|
||||||
cQiStatus => {
|
(cQiStatus) => {
|
||||||
app.flash(`${subcorpus.o.name} deleted`, 'corpus');
|
app.flash(`${subcorpus.o.name} deleted`, 'corpus');
|
||||||
delete this.data.subcorpora[subcorpus.o.name];
|
delete this.data.subcorpora[subcorpus.o.name];
|
||||||
this.settings.selectedSubcorpus = undefined;
|
this.settings.selectedSubcorpus = undefined;
|
||||||
@ -312,7 +313,7 @@ class CorpusAnalysisConcordance {
|
|||||||
this.clearSubcorpusPagination();
|
this.clearSubcorpusPagination();
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
cQiError => {
|
(cQiError) => {
|
||||||
app.flash(`${cQiError.payload.code}: ${cQiError.payload.msg}`, 'error');
|
app.flash(`${cQiError.payload.code}: ${cQiError.payload.msg}`, 'error');
|
||||||
}
|
}
|
||||||
);
|
);
|
||||||
|
@ -28,7 +28,6 @@ class CorpusAnalysisReader {
|
|||||||
init() {
|
init() {
|
||||||
// Init data
|
// Init data
|
||||||
this.data.corpus = this.app.data.corpus;
|
this.data.corpus = this.app.data.corpus;
|
||||||
this.data.subcorpora = {};
|
|
||||||
// Add event listeners
|
// Add event listeners
|
||||||
this.elements.form.addEventListener('submit', (event) => {
|
this.elements.form.addEventListener('submit', (event) => {
|
||||||
event.preventDefault();
|
event.preventDefault();
|
||||||
@ -38,14 +37,14 @@ class CorpusAnalysisReader {
|
|||||||
this.elements.progress.classList.remove('hide');
|
this.elements.progress.classList.remove('hide');
|
||||||
this.data.corpus.o.paginate(1, this.settings.perPage)
|
this.data.corpus.o.paginate(1, this.settings.perPage)
|
||||||
.then(
|
.then(
|
||||||
paginatedCorpus => {
|
(paginatedCorpus) => {
|
||||||
this.data.corpus.p = paginatedCorpus;
|
this.data.corpus.p = paginatedCorpus;
|
||||||
this.renderCorpus();
|
this.renderCorpus();
|
||||||
this.renderCorpusPagination();
|
this.renderCorpusPagination();
|
||||||
this.elements.progress.classList.add('hide');
|
this.elements.progress.classList.add('hide');
|
||||||
this.app.enableActionElements();
|
this.app.enableActionElements();
|
||||||
},
|
},
|
||||||
error => {
|
(cqiError) => {
|
||||||
this.elements.error.innerText = JSON.stringify(error);
|
this.elements.error.innerText = JSON.stringify(error);
|
||||||
this.elements.error.classList.remove('hide');
|
this.elements.error.classList.remove('hide');
|
||||||
if ('payload' in error && 'code' in error.payload && 'msg' in error.payload) {
|
if ('payload' in error && 'code' in error.payload && 'msg' in error.payload) {
|
||||||
@ -247,7 +246,7 @@ class CorpusAnalysisReader {
|
|||||||
this.elements.progress.classList.remove('hide');
|
this.elements.progress.classList.remove('hide');
|
||||||
this.data.corpus.o.paginate(pageNum, this.settings.perPage)
|
this.data.corpus.o.paginate(pageNum, this.settings.perPage)
|
||||||
.then(
|
.then(
|
||||||
paginatedCorpus => {
|
(paginatedCorpus) => {
|
||||||
this.data.corpus.p = paginatedCorpus;
|
this.data.corpus.p = paginatedCorpus;
|
||||||
this.renderCorpus();
|
this.renderCorpus();
|
||||||
this.renderCorpusPagination();
|
this.renderCorpusPagination();
|
||||||
|
@ -1,6 +1,13 @@
|
|||||||
cqi.api.APIClient = class APIClient {
|
cqi.api.APIClient = class APIClient {
|
||||||
constructor(host, corpus_id, version = '0.1') {
|
/**
|
||||||
|
* @param {string} host
|
||||||
|
* @param {string} corpusId
|
||||||
|
* @param {number} [timeout=60] timeout
|
||||||
|
* @param {string} [version=0.1] version
|
||||||
|
*/
|
||||||
|
constructor(host, corpus_id, timeout = 60, version = '0.1') {
|
||||||
this.host = host;
|
this.host = host;
|
||||||
|
this.timeout = timeout * 1000; // convert seconds to milliseconds
|
||||||
this.version = version;
|
this.version = version;
|
||||||
this.socket = io(
|
this.socket = io(
|
||||||
this.host,
|
this.host,
|
||||||
@ -19,7 +26,10 @@ cqi.api.APIClient = class APIClient {
|
|||||||
*/
|
*/
|
||||||
#request(fn_name, fn_args = {}) {
|
#request(fn_name, fn_args = {}) {
|
||||||
return new Promise((resolve, reject) => {
|
return new Promise((resolve, reject) => {
|
||||||
this.socket.emit('cqi_client.api', {fn_name: fn_name, fn_args: fn_args}, (response) => {
|
this.socket.timeout(this.timeout).emit('cqi', {fn_name: fn_name, fn_args: fn_args}, (timeoutError, response) => {
|
||||||
|
if (timeoutError) {
|
||||||
|
reject(timeoutError);
|
||||||
|
}
|
||||||
if (response.code === 200) {
|
if (response.code === 200) {
|
||||||
resolve(response.payload);
|
resolve(response.payload);
|
||||||
}
|
}
|
||||||
@ -595,4 +605,87 @@ cqi.api.APIClient = class APIClient {
|
|||||||
const fn_args = {subcorpus: subcorpus, cutoff: cutoff, field1: field1, attribute1: attribute1, field2: field2, attribute2: attribute2};
|
const fn_args = {subcorpus: subcorpus, cutoff: cutoff, field1: field1, attribute1: attribute1, field2: field2, attribute2: attribute2};
|
||||||
return await this.#request(fn_name, fn_args);
|
return await this.#request(fn_name, fn_args);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/**************************************************************************
|
||||||
|
* NOTE: The following is not included in the CQi specification. *
|
||||||
|
**************************************************************************/
|
||||||
|
/**************************************************************************
|
||||||
|
* Custom additions for nopaque *
|
||||||
|
**************************************************************************/
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @param {string} corpus
|
||||||
|
* @returns {Promise<cqi.status.StatusOk>}
|
||||||
|
*/
|
||||||
|
async corpus_update_db(corpus) {
|
||||||
|
const fn_name = 'nopaque_corpus_update_db';
|
||||||
|
const fn_args = {corpus: corpus};
|
||||||
|
let payload = await this.#request(fn_name, fn_args);
|
||||||
|
return new cqi.status.lookup[payload.code]();
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @param {string} corpus
|
||||||
|
* @returns {Promise<object>}
|
||||||
|
*/
|
||||||
|
async corpus_static_data(corpus) {
|
||||||
|
const fn_name = 'nopaque_corpus_static_data';
|
||||||
|
const fn_args = {corpus: corpus};
|
||||||
|
return await this.#request(fn_name, fn_args);
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @param {string} corpus
|
||||||
|
* @param {number=} page
|
||||||
|
* @param {number=} per_page
|
||||||
|
* @returns {Promise<object>}
|
||||||
|
*/
|
||||||
|
async corpus_paginate_corpus(corpus, page, per_page) {
|
||||||
|
const fn_name = 'nopaque_corpus_paginate_corpus';
|
||||||
|
const fn_args = {corpus: corpus}
|
||||||
|
if (page !== undefined) {fn_args.page = page;}
|
||||||
|
if (per_page !== undefined) {fn_args.per_page = per_page;}
|
||||||
|
return await this.#request(fn_name, fn_args);
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @param {string} subcorpus
|
||||||
|
* @param {number=} context
|
||||||
|
* @param {number=} page
|
||||||
|
* @param {number=} per_page
|
||||||
|
* @returns {Promise<object>}
|
||||||
|
*/
|
||||||
|
async cqp_paginate_subcorpus(subcorpus, context, page, per_page) {
|
||||||
|
const fn_name = 'nopaque_cqp_paginate_subcorpus';
|
||||||
|
const fn_args = {subcorpus: subcorpus}
|
||||||
|
if (context !== undefined) {fn_args.context = context;}
|
||||||
|
if (page !== undefined) {fn_args.page = page;}
|
||||||
|
if (per_page !== undefined) {fn_args.per_page = per_page;}
|
||||||
|
return await this.#request(fn_name, fn_args);
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @param {string} subcorpus
|
||||||
|
* @param {number[]} match_id_list
|
||||||
|
* @param {number=} context
|
||||||
|
* @returns {Promise<object>}
|
||||||
|
*/
|
||||||
|
async cqp_partial_export_subcorpus(subcorpus, match_id_list, context) {
|
||||||
|
const fn_name = 'nopaque_cqp_partial_export_subcorpus';
|
||||||
|
const fn_args = {subcorpus: subcorpus, match_id_list: match_id_list};
|
||||||
|
if (context !== undefined) {fn_args.context = context;}
|
||||||
|
return await this.#request(fn_name, fn_args);
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @param {string} subcorpus
|
||||||
|
* @param {number=} context
|
||||||
|
* @returns {Promise<object>}
|
||||||
|
*/
|
||||||
|
async cqp_export_subcorpus(subcorpus, context) {
|
||||||
|
const fn_name = 'nopaque_cqp_export_subcorpus';
|
||||||
|
const fn_args = {subcorpus: subcorpus};
|
||||||
|
if (context !== undefined) {fn_args.context = context;}
|
||||||
|
return await this.#request(fn_name, fn_args);
|
||||||
|
}
|
||||||
};
|
};
|
||||||
|
@ -2,11 +2,12 @@ cqi.CQiClient = class CQiClient {
|
|||||||
/**
|
/**
|
||||||
* @param {string} host
|
* @param {string} host
|
||||||
* @param {string} corpusId
|
* @param {string} corpusId
|
||||||
|
* @param {number} [timeout=60] timeout
|
||||||
* @param {string} [version=0.1] version
|
* @param {string} [version=0.1] version
|
||||||
*/
|
*/
|
||||||
constructor(host, corpusId, version = '0.1') {
|
constructor(host, corpusId, timeout = 60, version = '0.1') {
|
||||||
/** @type {cqi.api.APIClient} */
|
/** @type {cqi.api.APIClient} */
|
||||||
this.api = new cqi.api.APIClient(host, corpusId, version);
|
this.api = new cqi.api.APIClient(host, corpusId, timeout, version);
|
||||||
}
|
}
|
||||||
|
|
||||||
/**
|
/**
|
||||||
|
@ -80,6 +80,36 @@ cqi.models.corpora.Corpus = class Corpus extends cqi.models.resource.Model {
|
|||||||
async query(subcorpusName, query) {
|
async query(subcorpusName, query) {
|
||||||
return await this.client.api.cqp_query(this.apiName, subcorpusName, query);
|
return await this.client.api.cqp_query(this.apiName, subcorpusName, query);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/**************************************************************************
|
||||||
|
* NOTE: The following is not included in the CQi specification. *
|
||||||
|
**************************************************************************/
|
||||||
|
/**************************************************************************
|
||||||
|
* Custom additions for nopaque *
|
||||||
|
**************************************************************************/
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @returns {string}
|
||||||
|
*/
|
||||||
|
get staticData() {
|
||||||
|
return this.attrs.static_data;
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @returns {cqi.status.StatusOk}
|
||||||
|
*/
|
||||||
|
async updateDb() {
|
||||||
|
return await this.client.api.corpus_update_db(this.apiName);
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @param {number=} page
|
||||||
|
* @param {number=} per_page
|
||||||
|
* @returns {Promise<object>}
|
||||||
|
*/
|
||||||
|
async paginate(page, per_page) {
|
||||||
|
return await this.client.api.corpus_paginate_corpus(this.apiName, page, per_page);
|
||||||
|
}
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|
||||||
@ -95,11 +125,12 @@ cqi.models.corpora.CorpusCollection = class CorpusCollection extends cqi.models.
|
|||||||
return {
|
return {
|
||||||
api_name: corpusName,
|
api_name: corpusName,
|
||||||
charset: await this.client.api.corpus_charset(corpusName),
|
charset: await this.client.api.corpus_charset(corpusName),
|
||||||
// full_name: await this.client.api.corpus_full_name(api_name),
|
// full_name: await this.client.api.corpus_full_name(corpusName),
|
||||||
// info: await this.client.api.corpus_info(api_name),
|
// info: await this.client.api.corpus_info(corpusName),
|
||||||
name: corpusName,
|
name: corpusName,
|
||||||
properties: await this.client.api.corpus_properties(corpusName),
|
properties: await this.client.api.corpus_properties(corpusName),
|
||||||
size: await this.client.api.cl_attribute_size(`${corpusName}.word`)
|
size: await this.client.api.cl_attribute_size(`${corpusName}.word`),
|
||||||
|
static_data: await this.client.api.corpus_static_data(corpusName),
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -85,6 +85,40 @@ cqi.models.subcorpora.Subcorpus = class Subcorpus extends cqi.models.resource.Mo
|
|||||||
attribute2.apiName
|
attribute2.apiName
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/**************************************************************************
|
||||||
|
* NOTE: The following is not included in the CQi specification. *
|
||||||
|
**************************************************************************/
|
||||||
|
/**************************************************************************
|
||||||
|
* Custom additions for nopaque *
|
||||||
|
**************************************************************************/
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @param {number=} context
|
||||||
|
* @param {number=} page
|
||||||
|
* @param {number=} perPage
|
||||||
|
* @returns {Promise<object>}
|
||||||
|
*/
|
||||||
|
async paginate(context, page, perPage) {
|
||||||
|
return await this.client.api.cqp_paginate_subcorpus(this.apiName, context, page, perPage);
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @param {number[]} matchIdList
|
||||||
|
* @param {number=} context
|
||||||
|
* @returns {Promise<object>}
|
||||||
|
*/
|
||||||
|
async partialExport(matchIdList, context) {
|
||||||
|
return await this.client.api.cqp_partial_export_subcorpus(this.apiName, matchIdList, context);
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* @param {number=} context
|
||||||
|
* @returns {Promise<object>}
|
||||||
|
*/
|
||||||
|
async export(context) {
|
||||||
|
return await this.client.api.cqp_export_subcorpus(this.apiName, context);
|
||||||
|
}
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|
||||||
|
@ -25,7 +25,6 @@
|
|||||||
output='gen/app.%(version)s.js',
|
output='gen/app.%(version)s.js',
|
||||||
'js/App.js',
|
'js/App.js',
|
||||||
'js/Utils.js',
|
'js/Utils.js',
|
||||||
'js/CorpusAnalysis/CQiClient.js',
|
|
||||||
'js/CorpusAnalysis/CorpusAnalysisApp.js',
|
'js/CorpusAnalysis/CorpusAnalysisApp.js',
|
||||||
'js/CorpusAnalysis/CorpusAnalysisConcordance.js',
|
'js/CorpusAnalysis/CorpusAnalysisConcordance.js',
|
||||||
'js/CorpusAnalysis/CorpusAnalysisReader.js',
|
'js/CorpusAnalysis/CorpusAnalysisReader.js',
|
||||||
|
Loading…
x
Reference in New Issue
Block a user