2020-04-15 14:30:41 +02:00
|
|
|
from flask import (abort, current_app, flash, make_response, redirect, request,
|
2020-04-06 14:12:22 +02:00
|
|
|
render_template, url_for, send_from_directory)
|
|
|
|
from flask_login import current_user, login_required
|
2020-03-28 19:29:19 +01:00
|
|
|
from . import corpora
|
2020-04-21 18:34:21 +02:00
|
|
|
from . import tasks
|
2020-04-06 14:12:22 +02:00
|
|
|
from .forms import (AddCorpusFileForm, AddCorpusForm, EditCorpusFileForm,
|
2020-04-14 15:51:26 +02:00
|
|
|
QueryDownloadForm, QueryForm, DisplayOptionsForm,
|
|
|
|
InspectDisplayOptionsForm)
|
2020-03-28 19:29:19 +01:00
|
|
|
from .. import db
|
2020-04-06 14:12:22 +02:00
|
|
|
from ..models import Corpus, CorpusFile
|
|
|
|
import os
|
|
|
|
|
|
|
|
|
|
|
|
@corpora.route('/add', methods=['GET', 'POST'])
|
|
|
|
@login_required
|
|
|
|
def add_corpus():
|
|
|
|
add_corpus_form = AddCorpusForm()
|
|
|
|
if add_corpus_form.validate_on_submit():
|
|
|
|
corpus = Corpus(creator=current_user,
|
|
|
|
description=add_corpus_form.description.data,
|
|
|
|
status='unprepared', title=add_corpus_form.title.data)
|
|
|
|
db.session.add(corpus)
|
|
|
|
db.session.commit()
|
|
|
|
dir = os.path.join(current_app.config['NOPAQUE_STORAGE'],
|
|
|
|
str(corpus.user_id), 'corpora', str(corpus.id))
|
|
|
|
try:
|
|
|
|
os.makedirs(dir)
|
|
|
|
except OSError:
|
2020-04-27 15:22:20 +02:00
|
|
|
flash('[ERROR]: Could not add corpus!', 'corpus')
|
2020-04-06 14:12:22 +02:00
|
|
|
corpus.delete()
|
|
|
|
else:
|
2020-04-27 15:22:20 +02:00
|
|
|
url = url_for('corpora.corpus', corpus_id=corpus.id)
|
|
|
|
flash('[<a href="{}">{}</a>] added'.format(url, corpus.title),
|
|
|
|
'corpus')
|
2020-04-06 14:12:22 +02:00
|
|
|
return redirect(url_for('corpora.corpus', corpus_id=corpus.id))
|
|
|
|
return render_template('corpora/add_corpus.html.j2',
|
|
|
|
add_corpus_form=add_corpus_form,
|
|
|
|
title='Add corpus')
|
|
|
|
|
|
|
|
|
|
|
|
@corpora.route('/<int:corpus_id>')
|
|
|
|
@login_required
|
|
|
|
def corpus(corpus_id):
|
|
|
|
corpus = Corpus.query.get_or_404(corpus_id)
|
|
|
|
if not (corpus.creator == current_user or current_user.is_administrator()):
|
|
|
|
abort(403)
|
2020-07-08 15:24:18 +02:00
|
|
|
corpus_files = [dict(filename=corpus_file.filename,
|
|
|
|
author=corpus_file.author,
|
|
|
|
title=corpus_file.title,
|
|
|
|
publishing_year=corpus_file.publishing_year,
|
|
|
|
corpus_id=corpus.id,
|
|
|
|
id=corpus_file.id
|
|
|
|
)
|
|
|
|
for corpus_file in corpus.files]
|
|
|
|
return render_template('corpora/corpus.html.j2',
|
|
|
|
corpus=corpus,
|
|
|
|
corpus_files=corpus_files,
|
2020-04-06 14:12:22 +02:00
|
|
|
title='Corpus')
|
2020-03-28 19:29:19 +01:00
|
|
|
|
|
|
|
|
2020-04-06 14:27:14 +02:00
|
|
|
@corpora.route('/<int:corpus_id>/analyse')
|
2020-03-28 19:29:19 +01:00
|
|
|
@login_required
|
2020-04-06 14:27:14 +02:00
|
|
|
def analyse_corpus(corpus_id):
|
2020-03-28 19:29:19 +01:00
|
|
|
corpus = Corpus.query.get_or_404(corpus_id)
|
|
|
|
if corpus.status == 'prepared':
|
|
|
|
corpus.status = 'start analysis'
|
|
|
|
db.session.commit()
|
2020-04-06 14:09:41 +02:00
|
|
|
display_options_form = DisplayOptionsForm(
|
2020-03-28 19:29:19 +01:00
|
|
|
prefix='display-options-form',
|
|
|
|
result_context=request.args.get('context', 20),
|
|
|
|
results_per_page=request.args.get('results_per_page', 30))
|
2020-04-06 14:09:41 +02:00
|
|
|
query_form = QueryForm(prefix='query-form',
|
2020-04-06 14:12:22 +02:00
|
|
|
query=request.args.get('query'))
|
2020-04-20 13:48:40 +02:00
|
|
|
query_download_form = QueryDownloadForm(prefix='query-download-form')
|
2020-04-23 07:56:23 +02:00
|
|
|
inspect_display_options_form = InspectDisplayOptionsForm(
|
|
|
|
prefix='inspect-display-options-form')
|
|
|
|
return render_template(
|
|
|
|
'corpora/analyse_corpus.html.j2',
|
2020-07-16 16:00:38 +02:00
|
|
|
corpus=corpus,
|
2020-04-23 07:56:23 +02:00
|
|
|
corpus_id=corpus_id,
|
|
|
|
display_options_form=display_options_form,
|
|
|
|
query_form=query_form,
|
|
|
|
query_download_form=query_download_form,
|
|
|
|
inspect_display_options_form=inspect_display_options_form,
|
|
|
|
title='Corpus analysis')
|
2020-04-06 14:12:22 +02:00
|
|
|
|
|
|
|
|
|
|
|
@corpora.route('/<int:corpus_id>/delete')
|
|
|
|
@login_required
|
|
|
|
def delete_corpus(corpus_id):
|
|
|
|
corpus = Corpus.query.get_or_404(corpus_id)
|
|
|
|
if not (corpus.creator == current_user or current_user.is_administrator()):
|
|
|
|
abort(403)
|
2020-04-21 18:34:21 +02:00
|
|
|
tasks.delete_corpus(corpus_id)
|
2020-04-27 15:22:20 +02:00
|
|
|
flash('Corpus deleted!', 'corpus')
|
2020-04-06 14:12:22 +02:00
|
|
|
return redirect(url_for('main.dashboard'))
|
|
|
|
|
|
|
|
|
|
|
|
@corpora.route('/<int:corpus_id>/files/add', methods=['GET', 'POST'])
|
|
|
|
@login_required
|
|
|
|
def add_corpus_file(corpus_id):
|
|
|
|
corpus = Corpus.query.get_or_404(corpus_id)
|
|
|
|
if not (corpus.creator == current_user or current_user.is_administrator()):
|
|
|
|
abort(403)
|
2020-04-16 09:40:38 +02:00
|
|
|
add_corpus_file_form = AddCorpusFileForm(corpus,
|
|
|
|
prefix='add-corpus-file-form')
|
2020-04-15 14:57:17 +02:00
|
|
|
if add_corpus_file_form.is_submitted():
|
|
|
|
if not add_corpus_file_form.validate():
|
|
|
|
return make_response(add_corpus_file_form.errors, 400)
|
2020-04-06 14:12:22 +02:00
|
|
|
# Save the file
|
|
|
|
dir = os.path.join(str(corpus.user_id), 'corpora', str(corpus.id))
|
2020-04-16 09:40:38 +02:00
|
|
|
add_corpus_file_form.file.data.save(
|
|
|
|
os.path.join(current_app.config['NOPAQUE_STORAGE'], dir,
|
|
|
|
add_corpus_file_form.file.data.filename))
|
|
|
|
corpus_file = CorpusFile(
|
|
|
|
address=add_corpus_file_form.address.data,
|
|
|
|
author=add_corpus_file_form.author.data,
|
|
|
|
booktitle=add_corpus_file_form.booktitle.data,
|
|
|
|
chapter=add_corpus_file_form.chapter.data,
|
|
|
|
corpus=corpus,
|
|
|
|
dir=dir,
|
|
|
|
editor=add_corpus_file_form.editor.data,
|
|
|
|
filename=add_corpus_file_form.file.data.filename,
|
|
|
|
institution=add_corpus_file_form.institution.data,
|
|
|
|
journal=add_corpus_file_form.journal.data,
|
|
|
|
pages=add_corpus_file_form.pages.data,
|
|
|
|
publisher=add_corpus_file_form.publisher.data,
|
|
|
|
publishing_year=add_corpus_file_form.publishing_year.data,
|
|
|
|
school=add_corpus_file_form.school.data,
|
|
|
|
title=add_corpus_file_form.title.data)
|
2020-04-06 14:12:22 +02:00
|
|
|
db.session.add(corpus_file)
|
2020-04-23 07:56:23 +02:00
|
|
|
corpus.status = 'unprepared'
|
2020-04-06 14:12:22 +02:00
|
|
|
db.session.commit()
|
2020-04-27 15:22:20 +02:00
|
|
|
flash('Corpus file added!', 'corpus')
|
2020-04-15 14:30:41 +02:00
|
|
|
return make_response(
|
|
|
|
{'redirect_url': url_for('corpora.corpus', corpus_id=corpus.id)},
|
|
|
|
201)
|
2020-04-06 14:12:22 +02:00
|
|
|
return render_template('corpora/add_corpus_file.html.j2',
|
2020-04-17 11:04:09 +02:00
|
|
|
corpus=corpus,
|
2020-04-06 14:12:22 +02:00
|
|
|
add_corpus_file_form=add_corpus_file_form,
|
2020-04-17 11:04:09 +02:00
|
|
|
title='Add corpus file')
|
2020-04-06 14:12:22 +02:00
|
|
|
|
|
|
|
|
|
|
|
@corpora.route('/<int:corpus_id>/files/<int:corpus_file_id>/delete')
|
|
|
|
@login_required
|
|
|
|
def delete_corpus_file(corpus_id, corpus_file_id):
|
|
|
|
corpus_file = CorpusFile.query.get_or_404(corpus_file_id)
|
|
|
|
if not corpus_file.corpus_id == corpus_id:
|
|
|
|
abort(404)
|
|
|
|
if not (corpus_file.corpus.creator == current_user
|
|
|
|
or current_user.is_administrator()):
|
|
|
|
abort(403)
|
2020-04-21 18:34:21 +02:00
|
|
|
tasks.delete_corpus_file(corpus_file_id)
|
2020-04-27 15:22:20 +02:00
|
|
|
flash('Corpus file deleted!', 'corpus')
|
2020-04-06 14:12:22 +02:00
|
|
|
return redirect(url_for('corpora.corpus', corpus_id=corpus_id))
|
|
|
|
|
|
|
|
|
|
|
|
@corpora.route('/<int:corpus_id>/files/<int:corpus_file_id>/download')
|
|
|
|
@login_required
|
|
|
|
def download_corpus_file(corpus_id, corpus_file_id):
|
|
|
|
corpus_file = CorpusFile.query.get_or_404(corpus_file_id)
|
|
|
|
if not corpus_file.corpus_id == corpus_id:
|
|
|
|
abort(404)
|
|
|
|
if not (corpus_file.corpus.creator == current_user
|
|
|
|
or current_user.is_administrator()):
|
|
|
|
abort(403)
|
|
|
|
dir = os.path.join(current_app.config['NOPAQUE_STORAGE'],
|
|
|
|
corpus_file.dir)
|
|
|
|
return send_from_directory(as_attachment=True, directory=dir,
|
|
|
|
filename=corpus_file.filename)
|
|
|
|
|
|
|
|
|
|
|
|
@corpora.route('/<int:corpus_id>/files/<int:corpus_file_id>/edit',
|
|
|
|
methods=['GET', 'POST'])
|
|
|
|
@login_required
|
|
|
|
def edit_corpus_file(corpus_id, corpus_file_id):
|
2020-04-17 11:04:09 +02:00
|
|
|
corpus = Corpus.query.get_or_404(corpus_id)
|
2020-04-06 14:12:22 +02:00
|
|
|
corpus_file = CorpusFile.query.get_or_404(corpus_file_id)
|
|
|
|
if not corpus_file.corpus_id == corpus_id:
|
|
|
|
abort(404)
|
|
|
|
if not (corpus_file.corpus.creator == current_user
|
|
|
|
or current_user.is_administrator()):
|
|
|
|
abort(403)
|
2020-04-17 11:04:09 +02:00
|
|
|
edit_corpus_file_form = EditCorpusFileForm(prefix='edit-corpus-file-form')
|
2020-04-06 14:12:22 +02:00
|
|
|
if edit_corpus_file_form.validate_on_submit():
|
2020-04-17 11:04:09 +02:00
|
|
|
corpus_file.address = edit_corpus_file_form.address.data
|
|
|
|
corpus_file.author = edit_corpus_file_form.author.data
|
|
|
|
corpus_file.booktitle = edit_corpus_file_form.booktitle.data
|
|
|
|
corpus_file.chapter = edit_corpus_file_form.chapter.data
|
|
|
|
corpus_file.editor = edit_corpus_file_form.editor.data
|
|
|
|
corpus_file.institution = edit_corpus_file_form.institution.data
|
|
|
|
corpus_file.journal = edit_corpus_file_form.journal.data
|
|
|
|
corpus_file.pages = edit_corpus_file_form.pages.data
|
|
|
|
corpus_file.publisher = edit_corpus_file_form.publisher.data
|
|
|
|
corpus_file.publishing_year = \
|
|
|
|
edit_corpus_file_form.publishing_year.data
|
|
|
|
corpus_file.school = edit_corpus_file_form.school.data
|
|
|
|
corpus_file.title = edit_corpus_file_form.title.data
|
2020-04-23 07:56:23 +02:00
|
|
|
corpus.status = 'unprepared'
|
2020-04-06 14:12:22 +02:00
|
|
|
db.session.commit()
|
2020-04-27 15:22:20 +02:00
|
|
|
flash('Corpus file edited!', 'corpus')
|
2020-04-06 14:12:22 +02:00
|
|
|
return redirect(url_for('corpora.corpus', corpus_id=corpus_id))
|
2020-04-17 11:04:09 +02:00
|
|
|
# If no form is submitted or valid, fill out fields with current values
|
|
|
|
edit_corpus_file_form.address.data = corpus_file.address
|
|
|
|
edit_corpus_file_form.author.data = corpus_file.author
|
|
|
|
edit_corpus_file_form.booktitle.data = corpus_file.booktitle
|
|
|
|
edit_corpus_file_form.chapter.data = corpus_file.chapter
|
|
|
|
edit_corpus_file_form.editor.data = corpus_file.editor
|
|
|
|
edit_corpus_file_form.institution.data = corpus_file.institution
|
|
|
|
edit_corpus_file_form.journal.data = corpus_file.journal
|
|
|
|
edit_corpus_file_form.pages.data = corpus_file.pages
|
|
|
|
edit_corpus_file_form.publisher.data = corpus_file.publisher
|
|
|
|
edit_corpus_file_form.publishing_year.data = corpus_file.publishing_year
|
|
|
|
edit_corpus_file_form.school.data = corpus_file.school
|
|
|
|
edit_corpus_file_form.title.data = corpus_file.title
|
2020-04-06 14:12:22 +02:00
|
|
|
return render_template('corpora/edit_corpus_file.html.j2',
|
2020-04-17 11:04:09 +02:00
|
|
|
corpus_file=corpus_file, corpus=corpus,
|
2020-04-06 14:12:22 +02:00
|
|
|
edit_corpus_file_form=edit_corpus_file_form,
|
2020-04-17 11:04:09 +02:00
|
|
|
title='Edit corpus file')
|
2020-04-06 14:12:22 +02:00
|
|
|
|
|
|
|
|
|
|
|
@corpora.route('/<int:corpus_id>/prepare')
|
|
|
|
@login_required
|
|
|
|
def prepare_corpus(corpus_id):
|
|
|
|
corpus = Corpus.query.get_or_404(corpus_id)
|
|
|
|
if not (corpus.creator == current_user or current_user.is_administrator()):
|
|
|
|
abort(403)
|
2020-04-17 11:04:09 +02:00
|
|
|
if corpus.files.all():
|
2020-04-23 07:56:23 +02:00
|
|
|
tasks.build_corpus(corpus_id)
|
2020-07-08 15:24:18 +02:00
|
|
|
flash('Building Corpus...', 'corpus')
|
2020-04-06 14:12:22 +02:00
|
|
|
else:
|
2020-04-27 15:22:20 +02:00
|
|
|
flash('Can not build corpus, please add corpus file(s).', 'corpus')
|
2020-04-06 14:12:22 +02:00
|
|
|
return redirect(url_for('corpora.corpus', corpus_id=corpus_id))
|