2019-11-18 14:23:53 +01:00
|
|
|
from flask import (abort, current_app, flash, make_response, render_template,
|
2019-11-25 10:12:39 +01:00
|
|
|
url_for)
|
2019-07-19 13:28:17 +02:00
|
|
|
from flask_login import current_user, login_required
|
2019-10-16 16:52:05 +02:00
|
|
|
from werkzeug.utils import secure_filename
|
|
|
|
from . import services
|
2020-03-27 12:06:11 +01:00
|
|
|
from .. import db
|
2020-04-03 18:49:45 +02:00
|
|
|
from ..jobs.forms import AddFileSetupJobForm, AddNLPJobForm, AddOCRJobForm
|
2020-07-07 15:08:15 +02:00
|
|
|
from ..models import Job, JobInput
|
2019-08-06 14:27:41 +02:00
|
|
|
import json
|
2019-08-09 11:48:43 +02:00
|
|
|
import os
|
2019-07-19 13:28:17 +02:00
|
|
|
|
|
|
|
|
2020-02-07 15:21:59 +01:00
|
|
|
SERVICES = {'corpus_analysis': {'name': 'Corpus analysis'},
|
2020-04-09 09:53:56 +02:00
|
|
|
'file-setup': {'name': 'File setup',
|
2020-04-03 18:49:45 +02:00
|
|
|
'resources': {'mem_mb': 4096, 'n_cores': 4},
|
|
|
|
'add_job_form': AddFileSetupJobForm},
|
2020-01-07 13:03:42 +01:00
|
|
|
'nlp': {'name': 'Natural Language Processing',
|
2019-09-27 13:56:52 +02:00
|
|
|
'resources': {'mem_mb': 4096, 'n_cores': 2},
|
2019-11-08 12:21:59 +01:00
|
|
|
'add_job_form': AddNLPJobForm},
|
2019-09-27 13:56:52 +02:00
|
|
|
'ocr': {'name': 'Optical Character Recognition',
|
|
|
|
'resources': {'mem_mb': 8192, 'n_cores': 4},
|
2020-04-03 18:49:45 +02:00
|
|
|
'add_job_form': AddOCRJobForm}}
|
2019-08-06 14:27:41 +02:00
|
|
|
|
2019-08-01 08:22:17 +02:00
|
|
|
|
2019-11-08 12:21:59 +01:00
|
|
|
@services.route('/<service>', methods=['GET', 'POST'])
|
2019-08-05 15:35:18 +02:00
|
|
|
@login_required
|
2019-11-08 12:21:59 +01:00
|
|
|
def service(service):
|
|
|
|
if service not in SERVICES:
|
2019-09-24 16:55:24 +02:00
|
|
|
abort(404)
|
2020-02-07 15:21:59 +01:00
|
|
|
if service == 'corpus_analysis':
|
|
|
|
return render_template('services/{}.html.j2'.format(service),
|
|
|
|
title=SERVICES[service]['name'])
|
2020-02-18 12:01:36 +01:00
|
|
|
add_job_form = SERVICES[service]['add_job_form'](prefix='add-job-form')
|
2019-11-18 14:23:53 +01:00
|
|
|
if add_job_form.is_submitted():
|
|
|
|
if not add_job_form.validate():
|
|
|
|
return make_response(add_job_form.errors, 400)
|
2019-11-08 12:21:59 +01:00
|
|
|
service_args = []
|
|
|
|
if service == 'nlp':
|
|
|
|
service_args.append('-l {}'.format(add_job_form.language.data))
|
2020-02-13 14:41:02 +01:00
|
|
|
if add_job_form.check_encoding.data:
|
|
|
|
service_args.append('--check-encoding')
|
2019-11-08 12:21:59 +01:00
|
|
|
if service == 'ocr':
|
|
|
|
service_args.append('-l {}'.format(add_job_form.language.data))
|
2020-04-03 17:36:38 +02:00
|
|
|
if add_job_form.binarization.data:
|
|
|
|
service_args.append('--binarize')
|
2019-11-08 12:21:59 +01:00
|
|
|
job = Job(creator=current_user,
|
|
|
|
description=add_job_form.description.data,
|
|
|
|
mem_mb=SERVICES[service]['resources']['mem_mb'],
|
|
|
|
n_cores=SERVICES[service]['resources']['n_cores'],
|
|
|
|
service=service, service_args=json.dumps(service_args),
|
|
|
|
service_version=add_job_form.version.data,
|
|
|
|
status='preparing', title=add_job_form.title.data)
|
2020-02-17 14:57:24 +01:00
|
|
|
if job.service != 'corpus_analysis':
|
|
|
|
job.create_secure_filename()
|
2019-09-24 16:55:24 +02:00
|
|
|
db.session.add(job)
|
2019-08-06 14:27:41 +02:00
|
|
|
db.session.commit()
|
2019-11-08 12:21:59 +01:00
|
|
|
relative_dir = os.path.join(str(job.user_id), 'jobs', str(job.id))
|
2020-02-13 15:08:15 +01:00
|
|
|
absolut_dir = os.path.join(current_app.config['NOPAQUE_STORAGE'],
|
|
|
|
relative_dir)
|
2019-08-05 15:35:18 +02:00
|
|
|
try:
|
2019-11-08 12:21:59 +01:00
|
|
|
os.makedirs(absolut_dir)
|
2019-08-05 15:35:18 +02:00
|
|
|
except OSError:
|
2019-11-14 09:48:30 +01:00
|
|
|
job.delete()
|
2020-04-27 15:22:20 +02:00
|
|
|
flash('Internal Server Error', 'job')
|
2020-02-13 15:08:15 +01:00
|
|
|
return make_response({'redirect_url': url_for('services.service',
|
|
|
|
service=service)},
|
|
|
|
500)
|
2019-08-05 15:35:18 +02:00
|
|
|
else:
|
2019-11-08 12:21:59 +01:00
|
|
|
for file in add_job_form.files.data:
|
2019-10-16 16:52:05 +02:00
|
|
|
filename = secure_filename(file.filename)
|
2019-11-08 12:21:59 +01:00
|
|
|
file.save(os.path.join(absolut_dir, filename))
|
|
|
|
job_input = JobInput(dir=relative_dir, filename=filename,
|
|
|
|
job=job)
|
2019-10-16 16:52:05 +02:00
|
|
|
db.session.add(job_input)
|
2019-09-24 16:55:24 +02:00
|
|
|
job.status = 'submitted'
|
2019-08-12 17:03:12 +02:00
|
|
|
db.session.commit()
|
2020-04-27 15:22:20 +02:00
|
|
|
url = url_for('jobs.job', job_id=job.id)
|
|
|
|
flash('[<a href="{}">{}</a>] added'.format(url, job.title), 'job')
|
2019-11-18 14:23:53 +01:00
|
|
|
return make_response(
|
|
|
|
{'redirect_url': url_for('jobs.job', job_id=job.id)}, 201)
|
2019-11-08 12:21:59 +01:00
|
|
|
return render_template('services/{}.html.j2'.format(service),
|
|
|
|
title=SERVICES[service]['name'],
|
|
|
|
add_job_form=add_job_form)
|