2019-11-12 12:36:22 +00:00
|
|
|
from app import db, logger
|
2019-11-05 15:22:36 +00:00
|
|
|
from app.models import Corpus, CorpusFile
|
2019-10-31 09:25:48 +00:00
|
|
|
from flask import (abort, current_app, flash, redirect, request,
|
2019-10-31 14:29:02 +00:00
|
|
|
render_template, url_for, send_from_directory)
|
2019-10-31 09:25:48 +00:00
|
|
|
from flask_login import current_user, login_required
|
2019-11-05 15:22:36 +00:00
|
|
|
from werkzeug.utils import secure_filename
|
2019-10-31 09:25:48 +00:00
|
|
|
from . import corpora
|
2019-11-14 08:48:30 +00:00
|
|
|
from .background_functions import (delete_corpus_, delete_corpus_file_,
|
2019-11-06 09:07:34 +00:00
|
|
|
edit_corpus_file_)
|
2019-11-04 08:54:30 +00:00
|
|
|
from .forms import (AddCorpusFileForm, AddCorpusForm, EditCorpusFileForm,
|
|
|
|
QueryDownloadForm, QueryForm)
|
2019-10-31 09:25:48 +00:00
|
|
|
import os
|
|
|
|
import threading
|
|
|
|
|
|
|
|
|
2019-10-31 14:29:02 +00:00
|
|
|
@corpora.route('/add', methods=['GET', 'POST'])
@login_required
def add_corpus():
    """Show the "add corpus" form and create a corpus on valid submission.

    On a valid submission a Corpus row owned by the current user is
    committed and its storage directory is created below
    OPAQUE_STORAGE_DIRECTORY. If the directory cannot be created, an error
    is flashed, ``corpus.delete()`` is called and the form is rendered
    again; otherwise the user is redirected to the new corpus page.
    """
    add_corpus_form = AddCorpusForm()
    if add_corpus_form.validate_on_submit():
        corpus = Corpus(
            creator=current_user,
            description=add_corpus_form.description.data,
            status='unprepared',
            title=add_corpus_form.title.data,
        )
        db.session.add(corpus)
        # Commit first: the directory path below is built from the ids of
        # the stored row.
        db.session.commit()
        storage_root = current_app.config['OPAQUE_STORAGE_DIRECTORY']
        corpus_dir = os.path.join(storage_root, str(corpus.user_id),
                                  'corpora', str(corpus.id))
        try:
            os.makedirs(corpus_dir)
        except OSError:
            flash('[ERROR]: Could not add corpus!')
            corpus.delete()
        else:
            flash('Corpus added!')
            corpus_url = url_for('corpora.corpus', corpus_id=corpus.id)
            return redirect(corpus_url)
    return render_template(
        'corpora/add_corpus.html.j2',
        add_corpus_form=add_corpus_form,
        title='Add corpus',
    )
|
2019-10-31 09:25:48 +00:00
|
|
|
|
|
|
|
|
|
|
|
@corpora.route('/<int:corpus_id>')
@login_required
def corpus(corpus_id):
    """Render the detail page of one corpus.

    Responds with 404 if no corpus with ``corpus_id`` exists and with 403
    if the current user is neither its creator nor an administrator.
    """
    requested_corpus = Corpus.query.get_or_404(corpus_id)
    is_owner = requested_corpus.creator == current_user
    if not is_owner and not current_user.is_administrator():
        abort(403)
    return render_template(
        'corpora/corpus.html.j2',
        corpus=requested_corpus,
        title='Corpus',
    )
|
2019-10-31 09:25:48 +00:00
|
|
|
|
|
|
|
|
|
|
|
@corpora.route('/<int:corpus_id>/analysis', methods=['GET', 'POST'])
@login_required
def corpus_analysis(corpus_id):
    """Render the analysis page of a corpus and handle query submissions.

    Responds with 404 if the corpus does not exist and with 403 if the
    current user is neither its creator nor an administrator (the same
    rule every other corpus view in this module applies).

    A corpus whose status is 'prepared' is switched to 'start analysis'.
    Query parameters (``query``, ``hits_per_page``, ``context``) are read
    from the URL and used to pre-fill the query form. A valid form
    submission redirects back to this view with the submitted values as
    URL parameters.
    """
    corpus = Corpus.query.get_or_404(corpus_id)
    # Access control: without this check any logged-in user could open the
    # analysis of (and change the status of) someone else's corpus.
    if not (corpus.creator == current_user or current_user.is_administrator()):
        abort(403)
    if corpus.status == 'prepared':
        corpus.status = 'start analysis'
        db.session.commit()
    query = request.args.get('query')
    logger.warning('Query first: {}'.format(query))
    hits_per_page = request.args.get('hits_per_page', 30)
    context = request.args.get('context', 10)
    dl_form = QueryDownloadForm()
    form = QueryForm(hits_per_page=hits_per_page, context=context, query=query)
    if form.validate_on_submit():
        flash('Query has been sent!')
        # Post/Redirect/Get: carry the submitted values in the URL so the
        # page can be reloaded without re-submitting the form.
        return redirect(url_for('corpora.corpus_analysis',
                                corpus_id=corpus_id,
                                query=form.query.data,
                                hits_per_page=form.hits_per_page.data,
                                context=form.context.data))
    return render_template('corpora/corpus_analysis.html.j2',
                           corpus_id=corpus_id,
                           form=form, dl_form=dl_form,
                           title='Corpus: {}'.format(corpus.title))
|
|
|
|
|
|
|
|
|
|
|
|
@corpora.route('/<int:corpus_id>/delete')
@login_required
def delete_corpus(corpus_id):
    """Start deletion of a corpus and redirect to the dashboard.

    Responds with 404 if the corpus does not exist and with 403 if the
    current user is neither its creator nor an administrator. The deletion
    itself is handed to ``delete_corpus_`` in a separate thread; the
    success message is flashed right after the thread has been started.
    """
    target = Corpus.query.get_or_404(corpus_id)
    is_owner = target.creator == current_user
    if not is_owner and not current_user.is_administrator():
        abort(403)
    # Pass the real application object (not the context-bound proxy) to
    # the worker thread.
    app = current_app._get_current_object()
    worker = threading.Thread(target=delete_corpus_, args=(app, target.id))
    worker.start()
    flash('Corpus deleted!')
    return redirect(url_for('main.dashboard'))
|
|
|
|
|
|
|
|
|
2019-10-31 14:29:02 +00:00
|
|
|
@corpora.route('/<int:corpus_id>/files/add', methods=['GET', 'POST'])
@login_required
def add_corpus_file(corpus_id):
    """Show the "add corpus file" form and store an uploaded file.

    Responds with 404 if the corpus does not exist and with 403 if the
    current user is neither its creator nor an administrator.

    On a valid submission the upload is rejected if its sanitized filename
    is empty or already registered to this corpus. Otherwise the file is
    saved into the corpus directory below OPAQUE_STORAGE_DIRECTORY, a
    CorpusFile row is committed and ``edit_corpus_file_`` is started in a
    separate thread for the new file.
    """
    corpus = Corpus.query.get_or_404(corpus_id)
    if not (corpus.creator == current_user or current_user.is_administrator()):
        abort(403)
    add_corpus_file_form = AddCorpusFileForm()
    if add_corpus_file_form.validate_on_submit():
        file = add_corpus_file_form.file.data
        filename = secure_filename(file.filename)
        # secure_filename() may strip a name down to the empty string;
        # saving would then target the corpus directory itself.
        if not filename:
            flash('Invalid filename.')
            return redirect(url_for('corpora.add_corpus_file',
                                    corpus_id=corpus_id))
        if any(filename == corpus_file.filename
               for corpus_file in corpus.files):
            flash('File already registered to this corpus.')
            return redirect(url_for('corpora.corpus', corpus_id=corpus_id))
        # Save the file. The directory is stored relative to the storage
        # root in the database row.
        relative_dir = os.path.join(str(corpus.user_id), 'corpora',
                                    str(corpus.id))
        file.save(os.path.join(current_app.config['OPAQUE_STORAGE_DIRECTORY'],
                               relative_dir, filename))
        corpus_file = CorpusFile(
            author=add_corpus_file_form.author.data,
            corpus=corpus,
            dir=relative_dir,
            filename=filename,
            publishing_year=add_corpus_file_form.publishing_year.data,
            title=add_corpus_file_form.title.data)
        db.session.add(corpus_file)
        db.session.commit()
        # Pass the real application object (not the context-bound proxy)
        # to the worker thread.
        thread = threading.Thread(target=edit_corpus_file_,
                                  args=(current_app._get_current_object(),
                                        corpus_file.id))
        thread.start()
        flash('Corpus file added!')
        return redirect(url_for('corpora.corpus', corpus_id=corpus_id))
    return render_template('corpora/add_corpus_file.html.j2',
                           add_corpus_file_form=add_corpus_file_form,
                           corpus=corpus, title='Add corpus file')
|
2019-10-31 09:25:48 +00:00
|
|
|
|
|
|
|
|
|
|
|
@corpora.route('/<int:corpus_id>/files/<int:corpus_file_id>/delete')
@login_required
def delete_corpus_file(corpus_id, corpus_file_id):
    """Start deletion of a corpus file and redirect to its corpus page.

    Responds with 404 if the file does not exist or does not belong to the
    corpus named in the URL, and with 403 if the current user is neither
    the corpus creator nor an administrator. The deletion itself is handed
    to ``delete_corpus_file_`` in a separate thread.
    """
    target = CorpusFile.query.get_or_404(corpus_file_id)
    if target.corpus_id != corpus_id:
        abort(404)
    is_owner = target.corpus.creator == current_user
    if not is_owner and not current_user.is_administrator():
        abort(403)
    # Pass the real application object (not the context-bound proxy) to
    # the worker thread.
    app = current_app._get_current_object()
    worker = threading.Thread(target=delete_corpus_file_,
                              args=(app, target.id))
    worker.start()
    flash('Corpus file deleted!')
    return redirect(url_for('corpora.corpus', corpus_id=corpus_id))
|
|
|
|
|
|
|
|
|
|
|
|
@corpora.route('/<int:corpus_id>/files/<int:corpus_file_id>/download')
@login_required
def download_corpus_file(corpus_id, corpus_file_id):
    """Send a stored corpus file to the client as an attachment.

    Responds with 404 if the file does not exist or does not belong to the
    corpus named in the URL, and with 403 if the current user is neither
    the corpus creator nor an administrator.
    """
    requested_file = CorpusFile.query.get_or_404(corpus_file_id)
    if requested_file.corpus_id != corpus_id:
        abort(404)
    is_owner = requested_file.corpus.creator == current_user
    if not is_owner and not current_user.is_administrator():
        abort(403)
    # The directory stored on the row is joined onto the storage root.
    storage_root = current_app.config['OPAQUE_STORAGE_DIRECTORY']
    absolute_dir = os.path.join(storage_root, requested_file.dir)
    return send_from_directory(
        as_attachment=True,
        directory=absolute_dir,
        filename=requested_file.filename,
    )
|
2019-11-04 08:54:30 +00:00
|
|
|
|
|
|
|
|
2019-11-12 13:02:01 +00:00
|
|
|
@corpora.route('/<int:corpus_id>/files/<int:corpus_file_id>/edit',
               methods=['GET', 'POST'])
@login_required
def edit_corpus_file(corpus_id, corpus_file_id):
    """Show the "edit corpus file" form and apply submitted changes.

    Responds with 404 if the file does not exist or does not belong to the
    corpus named in the URL, and with 403 if the current user is neither
    the corpus creator nor an administrator. On a valid submission the
    author, publishing year and title are updated and committed, and
    ``edit_corpus_file_`` is started in a separate thread for the file.
    """
    corpus_file = CorpusFile.query.get_or_404(corpus_file_id)
    if corpus_file.corpus_id != corpus_id:
        abort(404)
    is_owner = corpus_file.corpus.creator == current_user
    if not is_owner and not current_user.is_administrator():
        abort(403)
    edit_corpus_file_form = EditCorpusFileForm()
    if not edit_corpus_file_form.validate_on_submit():
        # Initial GET or invalid submission: (re-)render the form.
        return render_template(
            'corpora/edit_corpus_file.html.j2',
            edit_corpus_file_form=edit_corpus_file_form,
            corpus_file=corpus_file,
            title='Edit corpus file',
        )
    corpus_file.author = edit_corpus_file_form.author.data
    corpus_file.publishing_year = edit_corpus_file_form.publishing_year.data
    corpus_file.title = edit_corpus_file_form.title.data
    db.session.commit()
    # Pass the real application object (not the context-bound proxy) to
    # the worker thread.
    app = current_app._get_current_object()
    worker = threading.Thread(target=edit_corpus_file_,
                              args=(app, corpus_file.id))
    worker.start()
    flash('Corpus file edited!')
    return redirect(url_for('corpora.corpus', corpus_id=corpus_id))
|
2019-11-06 09:07:34 +00:00
|
|
|
|
|
|
|
|
|
|
|
@corpora.route('/<int:corpus_id>/prepare')
@login_required
def prepare_corpus(corpus_id):
    """Mark a corpus as 'preparable' if it has at least one file.

    Responds with 404 if the corpus does not exist and with 403 if the
    current user is neither its creator nor an administrator. In either
    outcome (marked, or no files present) a message is flashed and the
    user is redirected to the corpus page.
    """
    target = Corpus.query.get_or_404(corpus_id)
    is_owner = target.creator == current_user
    if not is_owner and not current_user.is_administrator():
        abort(403)
    has_files = len(target.files.all()) > 0
    if not has_files:
        flash('Can not prepare corpus, please add corpus file(s).')
    else:
        target.status = 'preparable'
        db.session.commit()
        flash('Corpus marked for preparation!')
    return redirect(url_for('corpora.corpus', corpus_id=corpus_id))
|