2022-02-08 11:26:20 +00:00
|
|
|
from flask import (
|
|
|
|
abort,
|
|
|
|
current_app,
|
|
|
|
flash,
|
2022-09-02 11:07:30 +00:00
|
|
|
Markup,
|
2022-02-08 11:26:20 +00:00
|
|
|
redirect,
|
|
|
|
render_template,
|
|
|
|
send_from_directory
|
|
|
|
)
|
2020-04-06 12:12:22 +00:00
|
|
|
from flask_login import current_user, login_required
|
2022-09-02 11:07:30 +00:00
|
|
|
from threading import Thread
|
2020-04-06 12:12:22 +00:00
|
|
|
import os
|
2022-09-02 11:07:30 +00:00
|
|
|
from app import db
|
|
|
|
from app.models import Corpus, CorpusFile, CorpusStatus
|
|
|
|
from . import bp
|
2022-11-29 14:28:10 +00:00
|
|
|
from .forms import CreateCorpusFileForm, CreateCorpusForm, UpdateCorpusFileForm
|
|
|
|
|
|
|
|
|
|
|
|
def user_can_read_corpus(user, corpus):
    """Tell whether *user* may view *corpus*.

    Access is granted to the corpus owner, to administrators and, failing
    both, according to the corpus' ``is_public`` flag. The checks are
    evaluated in that order and stop at the first one that succeeds.
    """
    is_owner = corpus.user == user
    if is_owner:
        return is_owner
    is_admin = user.is_administrator()
    if is_admin:
        return is_admin
    return corpus.is_public
|
|
|
|
|
|
|
|
|
|
|
|
def user_can_update_corpus(user, corpus):
    """Tell whether *user* may modify *corpus*.

    Only the corpus owner and administrators qualify; the administrator
    check is skipped when the user already is the owner.
    """
    is_owner = corpus.user == user
    return is_owner if is_owner else user.is_administrator()
|
|
|
|
|
|
|
|
|
|
|
|
def user_can_delete_corpus(user, corpus):
    """Tell whether *user* may delete *corpus*.

    Deleting requires exactly the same rights as updating, so the decision
    is delegated to ``user_can_update_corpus``.
    """
    may_update = user_can_update_corpus(user, corpus)
    return may_update
|
|
|
|
|
|
|
|
|
|
|
|
@bp.route('')
@login_required
def corpora():
    """Render the corpus overview page.

    Lists every corpus that is owned by the current user or flagged as
    public.
    """
    # Each comparison needs its own parentheses: ``|`` binds tighter than
    # ``==``, so the unparenthesised form is parsed as a chained comparison
    # around ``current_user.id | Corpus.is_public`` instead of an OR of two
    # conditions.
    visible_to_user = (
        (Corpus.user_id == current_user.id)
        | (Corpus.is_public == True)  # noqa: E712 - SQL expression, not a bool
    )
    visible_corpora = Corpus.query.filter(visible_to_user).all()
    # NOTE(review): every other template in this module ends in '.html.j2';
    # confirm that 'corpora/corpora.html' is the intended template name.
    return render_template('corpora/corpora.html', corpora=visible_corpora)
|
2020-04-06 12:12:22 +00:00
|
|
|
|
|
|
|
|
2022-09-02 11:07:30 +00:00
|
|
|
@bp.route('/create', methods=['GET', 'POST'])
@login_required
def create_corpus():
    """Show the "create corpus" form and handle its submission.

    On a valid submission a corpus owned by the current user is created and
    committed, a confirmation is flashed and the client is redirected to the
    new corpus. Otherwise the form is rendered. An ``OSError`` raised by
    ``Corpus.create`` aborts the request with status 500.
    """
    form = CreateCorpusForm(prefix='create-corpus-form')
    if form.validate_on_submit():
        try:
            corpus = Corpus.create(
                title=form.title.data,
                description=form.description.data,
                user=current_user
            )
        except OSError:
            abort(500)
        db.session.commit()
        # The title is user input. Markup.format() escapes its arguments,
        # whereas an f-string would be interpolated *before* the result is
        # marked as safe and would let HTML in the title through unescaped.
        message = Markup(
            'Corpus "<a href="{url}">{title}</a>" created'
        ).format(url=corpus.url, title=corpus.title)
        flash(message, 'corpus')
        return redirect(corpus.url)
    return render_template(
        'corpora/create_corpus.html.j2',
        form=form,
        title='Create corpus'
    )
|
2020-10-29 14:20:30 +00:00
|
|
|
|
|
|
|
|
2021-11-30 15:22:16 +00:00
|
|
|
@bp.route('/<hashid:corpus_id>')
@login_required
def corpus(corpus_id):
    """Render the detail page of one corpus.

    Looks the corpus up with ``get_or_404`` and aborts with 403 when the
    current user fails ``user_can_read_corpus``.
    """
    requested_corpus = Corpus.query.get_or_404(corpus_id)
    if user_can_read_corpus(current_user, requested_corpus):
        return render_template(
            'corpora/corpus.html.j2',
            corpus=requested_corpus,
            title='Corpus'
        )
    abort(403)
|
2020-03-28 18:29:19 +00:00
|
|
|
|
|
|
|
|
2022-11-29 14:28:10 +00:00
|
|
|
# @bp.route('/<hashid:corpus_id>/update')
|
|
|
|
# @login_required
|
|
|
|
# def update_corpus(corpus_id):
|
|
|
|
# corpus = Corpus.query.get_or_404(corpus_id)
|
|
|
|
# if not user_can_update_corpus(current_user, corpus):
|
|
|
|
# abort(403)
|
|
|
|
# return render_template(
|
|
|
|
# 'corpora/update_corpus.html.j2',
|
|
|
|
# corpus=corpus,
|
|
|
|
# title='Corpus'
|
|
|
|
# )
|
|
|
|
|
|
|
|
|
2022-09-02 11:07:30 +00:00
|
|
|
@bp.route('/<hashid:corpus_id>', methods=['DELETE'])
@login_required
def delete_corpus(corpus_id):
    """Start the deletion of a corpus and answer with 202.

    The lookup (``get_or_404``) and the permission check (403 on failure)
    happen in the request; the deletion itself is handed to a thread, so
    the response is sent without waiting for it.
    """
    def _delete_corpus(app, corpus_id):
        # The thread runs outside the request, hence the explicit
        # application context and the fresh lookup by id.
        with app.app_context():
            doomed_corpus = Corpus.query.get(corpus_id)
            doomed_corpus.delete()
            db.session.commit()

    target_corpus = Corpus.query.get_or_404(corpus_id)
    allowed = user_can_delete_corpus(current_user, target_corpus)
    if not allowed:
        abort(403)
    # Pass the real application object rather than the ``current_app`` proxy.
    app = current_app._get_current_object()
    Thread(target=_delete_corpus, args=(app, corpus_id)).start()
    return {}, 202
|
|
|
|
|
|
|
|
|
2021-11-30 15:22:16 +00:00
|
|
|
@bp.route('/<hashid:corpus_id>/analyse')
@login_required
def analyse_corpus(corpus_id):
    """Render the analysis page of one corpus.

    Responds via ``get_or_404`` when the corpus is unknown and with 403
    when the current user fails ``user_can_read_corpus``.
    """
    requested_corpus = Corpus.query.get_or_404(corpus_id)
    if user_can_read_corpus(current_user, requested_corpus):
        page_title = f'Analyse Corpus {requested_corpus.title}'
        return render_template(
            'corpora/analyse_corpus.html.j2',
            corpus=requested_corpus,
            title=page_title
        )
    abort(403)
|
|
|
|
|
|
|
|
|
2022-09-02 11:07:30 +00:00
|
|
|
@bp.route('/<hashid:corpus_id>/build', methods=['POST'])
@login_required
def build_corpus(corpus_id):
    """Start building a corpus and answer with 202.

    Aborts with 403 when the current user fails ``user_can_update_corpus``
    and answers 409 with an error payload when the corpus has no files.
    The build itself runs in a thread.
    """
    def _build_corpus(app, corpus_id):
        # Runs outside the request: needs its own application context and
        # loads the corpus again by id.
        with app.app_context():
            corpus_to_build = Corpus.query.get(corpus_id)
            corpus_to_build.build()
            db.session.commit()

    target_corpus = Corpus.query.get_or_404(corpus_id)
    if not user_can_update_corpus(current_user, target_corpus):
        abort(403)
    # A corpus without corpus files cannot be built
    corpus_files = target_corpus.files.all()
    if not corpus_files:
        return {'errors': {'message': 'Corpus file(s) required'}}, 409
    # Pass the real application object rather than the ``current_app`` proxy.
    app = current_app._get_current_object()
    Thread(target=_build_corpus, args=(app, corpus_id)).start()
    return {}, 202
|
2020-04-06 12:12:22 +00:00
|
|
|
|
|
|
|
|
2022-09-02 11:07:30 +00:00
|
|
|
@bp.route('/<hashid:corpus_id>/files/create', methods=['GET', 'POST'])
@login_required
def create_corpus_file(corpus_id):
    """Show the "add corpus file" form and handle its submission.

    Aborts with 403 when the current user fails ``user_can_update_corpus``.
    A submitted but invalid form yields a 400 response carrying the form
    errors. A valid one creates the corpus file, sets the corpus status to
    ``CorpusStatus.UNPREPARED``, commits, flashes a confirmation and answers
    201 with a ``Location`` header pointing at the corpus. An
    ``AttributeError`` or ``OSError`` raised by ``CorpusFile.create`` aborts
    the request with status 500.
    """
    corpus = Corpus.query.get_or_404(corpus_id)
    if not user_can_update_corpus(current_user, corpus):
        abort(403)
    form = CreateCorpusFileForm(prefix='create-corpus-file-form')
    if form.is_submitted():
        if not form.validate():
            response = {'errors': form.errors}
            return response, 400
        try:
            corpus_file = CorpusFile.create(
                form.vrt.data,
                address=form.address.data,
                author=form.author.data,
                booktitle=form.booktitle.data,
                chapter=form.chapter.data,
                editor=form.editor.data,
                institution=form.institution.data,
                journal=form.journal.data,
                pages=form.pages.data,
                publisher=form.publisher.data,
                publishing_year=form.publishing_year.data,
                school=form.school.data,
                title=form.title.data,
                mimetype='application/vrt+xml',
                corpus=corpus
            )
        except (AttributeError, OSError):
            abort(500)
        corpus.status = CorpusStatus.UNPREPARED
        db.session.commit()
        # Two fixes in one literal: the former adjacent string literals were
        # joined without a space ('Corpus file"<a ...'), and the filename is
        # now escaped by Markup.format() instead of being interpolated by an
        # f-string before the text is marked as safe.
        message = Markup(
            'Corpus file "<a href="{url}">{filename}</a>" added'
        ).format(url=corpus_file.url, filename=corpus_file.filename)
        flash(message, category='corpus')
        return {}, 201, {'Location': corpus.url}
    return render_template(
        'corpora/create_corpus_file.html.j2',
        corpus=corpus,
        form=form,
        title='Add corpus file'
    )
|
|
|
|
|
|
|
|
|
2022-11-29 14:28:10 +00:00
|
|
|
@bp.route('/<hashid:corpus_id>/files/<hashid:corpus_file_id>', methods=['GET', 'POST'])
@login_required
def corpus_file(corpus_id, corpus_file_id):
    """Show the "edit corpus file" form and handle its submission.

    The file is looked up by corpus id and file id together (404 when no
    such pair exists). Only users that pass ``user_can_update_corpus`` for
    the owning corpus get through; everyone else receives 403. On a valid
    submission the form data is copied onto the corpus file; if that changed
    it, the corpus status is set to ``CorpusStatus.UNPREPARED``. The session
    is committed, a confirmation is flashed and the client is redirected to
    the corpus.
    """
    corpus_file = CorpusFile.query.filter_by(
        corpus_id=corpus_id,
        id=corpus_file_id
    ).first_or_404()
    # Same rule as the former inline owner-or-administrator check, expressed
    # through the shared helper used by the other routes.
    if not user_can_update_corpus(current_user, corpus_file.corpus):
        abort(403)
    form = UpdateCorpusFileForm(
        data=corpus_file.to_json_serializeable(),
        prefix='edit-corpus-file-form'
    )
    if form.validate_on_submit():
        form.populate_obj(corpus_file)
        if db.session.is_modified(corpus_file):
            corpus_file.corpus.status = CorpusStatus.UNPREPARED
        db.session.commit()
        # Markup.format() escapes its arguments; an f-string would put the
        # filename into the message before it is marked as safe HTML.
        message = Markup(
            'Corpus file "<a href="{url}">{filename}</a>" updated'
        ).format(url=corpus_file.url, filename=corpus_file.filename)
        flash(message, category='corpus')
        return redirect(corpus_file.corpus.url)
    return render_template(
        'corpora/corpus_file.html.j2',
        corpus=corpus_file.corpus,
        corpus_file=corpus_file,
        form=form,
        title='Edit corpus file'
    )
|
|
|
|
|
|
|
|
|
2022-09-02 11:07:30 +00:00
|
|
|
@bp.route('/<hashid:corpus_id>/files/<hashid:corpus_file_id>', methods=['DELETE'])
@login_required
def delete_corpus_file(corpus_id, corpus_file_id):
    """Start the deletion of a corpus file and answer with 202.

    The file is looked up by corpus id and file id together (404 when no
    such pair exists); anyone who is neither the corpus owner nor an
    administrator receives 403. The deletion itself runs in a thread.
    """
    def _delete_corpus_file(app, corpus_file_id):
        # Runs outside the request: needs its own application context and
        # loads the corpus file again by id.
        with app.app_context():
            doomed_file = CorpusFile.query.get(corpus_file_id)
            doomed_file.delete()
            db.session.commit()

    lookup = CorpusFile.query.filter_by(corpus_id=corpus_id, id=corpus_file_id)
    target_file = lookup.first_or_404()
    is_owner = target_file.corpus.user == current_user
    if not (is_owner or current_user.is_administrator()):
        abort(403)
    # Pass the real application object rather than the ``current_app`` proxy.
    app = current_app._get_current_object()
    Thread(target=_delete_corpus_file, args=(app, corpus_file_id)).start()
    return {}, 202
|
2020-04-06 12:12:22 +00:00
|
|
|
|
|
|
|
|
2021-11-30 15:22:16 +00:00
|
|
|
@bp.route('/<hashid:corpus_id>/files/<hashid:corpus_file_id>/download')
@login_required
def download_corpus_file(corpus_id, corpus_file_id):
    """Send a corpus file to the client as an attachment.

    The file is looked up by corpus id and file id together (404 when no
    such pair exists); anyone who is neither the corpus owner nor an
    administrator receives 403. The attachment carries the corpus file's
    ``filename`` and ``mimetype``.
    """
    lookup = CorpusFile.query.filter_by(corpus_id=corpus_id, id=corpus_file_id)
    requested_file = lookup.first_or_404()
    is_owner = requested_file.corpus.user == current_user
    if not (is_owner or current_user.is_administrator()):
        abort(403)
    # Split the stored path into the directory to serve from and the name
    # of the file inside it.
    directory, stored_name = os.path.split(requested_file.path)
    # NOTE(review): newer Flask releases call this keyword ``download_name``
    # instead of ``attachment_filename`` - confirm against the Flask version
    # this project pins before upgrading.
    return send_from_directory(
        directory,
        stored_name,
        as_attachment=True,
        attachment_filename=requested_file.filename,
        mimetype=requested_file.mimetype
    )
|
2022-09-02 11:07:30 +00:00
|
|
|
|
|
|
|
|
|
|
|
@bp.route('/import', methods=['GET', 'POST'])
@login_required
def import_corpus():
    """Placeholder for the corpus import: always aborts with status 503."""
    abort(503)
|
|
|
|
|
|
|
|
|
|
|
|
@bp.route('/<hashid:corpus_id>/export')
@login_required
def export_corpus(corpus_id):
    """Placeholder for the corpus export: always aborts with status 503.

    ``corpus_id`` is accepted from the URL but not used.
    """
    abort(503)
|