2019-08-01 08:33:05 +00:00
|
|
|
from flask import current_app, flash, redirect, render_template, url_for
|
2019-07-19 11:28:17 +00:00
|
|
|
from . import services
|
|
|
|
from flask_login import current_user, login_required
|
2019-08-05 13:35:18 +00:00
|
|
|
from .forms import NewOCRJobForm, NewNLPJobForm
|
2019-08-06 12:27:41 +00:00
|
|
|
from ..models import Job
|
2019-07-19 11:28:17 +00:00
|
|
|
from ..import swarm
|
2019-08-06 12:27:41 +00:00
|
|
|
from .. import db
|
2019-07-19 11:28:17 +00:00
|
|
|
from threading import Thread
|
2019-08-01 06:22:17 +00:00
|
|
|
import os
|
2019-08-06 12:27:41 +00:00
|
|
|
import json
|
2019-07-19 11:28:17 +00:00
|
|
|
|
|
|
|
|
|
|
|
@services.route('/ocr', methods=['GET', 'POST'])
|
|
|
|
@login_required
|
|
|
|
def ocr():
|
2019-08-05 06:36:29 +00:00
|
|
|
new_ocr_job_form = NewOCRJobForm()
|
|
|
|
if new_ocr_job_form.validate_on_submit():
|
2019-08-01 06:22:17 +00:00
|
|
|
app = current_app._get_current_object()
|
2019-08-06 15:04:38 +00:00
|
|
|
ocr_job = Job(creator=current_user._get_current_object(),
|
|
|
|
description=new_ocr_job_form.description.data,
|
|
|
|
service="ocr",
|
|
|
|
ressources=json.dumps({"n_cores": 2,
|
|
|
|
"mem_mb": 4096}),
|
|
|
|
service_args=json.dumps({"args": ["--keep-intermediates",
|
|
|
|
"--skip-binarisation"],
|
|
|
|
"lang": new_ocr_job_form.language.data,
|
|
|
|
"version": new_ocr_job_form.version.data}),
|
2019-08-07 13:01:37 +00:00
|
|
|
status="pending",
|
2019-08-06 15:04:38 +00:00
|
|
|
title=new_ocr_job_form.title.data)
|
2019-08-06 12:27:41 +00:00
|
|
|
db.session.add(ocr_job)
|
|
|
|
db.session.commit()
|
|
|
|
|
2019-08-06 12:54:00 +00:00
|
|
|
dir = os.path.join(app.config['OPAQUE_STORAGE'],
|
|
|
|
str(ocr_job.user_id),
|
|
|
|
'jobs',
|
|
|
|
str(ocr_job.id))
|
2019-08-01 06:22:17 +00:00
|
|
|
|
|
|
|
try:
|
2019-08-01 09:47:14 +00:00
|
|
|
os.makedirs(dir)
|
|
|
|
except OSError:
|
|
|
|
flash('OSError!')
|
2019-08-01 06:22:17 +00:00
|
|
|
else:
|
2019-08-05 06:36:29 +00:00
|
|
|
for file in new_ocr_job_form.files.data:
|
2019-08-01 10:16:31 +00:00
|
|
|
file.save(os.path.join(dir, file.filename))
|
2019-08-01 06:22:17 +00:00
|
|
|
'''
|
|
|
|
' TODO: Let the scheduler run this job in the background.
|
|
|
|
'
|
|
|
|
' NOTE: Using self created threads is just for testing purpose as
|
|
|
|
' there is no scheduler available.
|
|
|
|
'''
|
2019-08-06 12:27:41 +00:00
|
|
|
thread = Thread(target=swarm.run, args=(ocr_job,))
|
2019-08-01 06:22:17 +00:00
|
|
|
thread.start()
|
2019-08-01 09:47:14 +00:00
|
|
|
flash('Job created!')
|
2019-07-19 11:28:17 +00:00
|
|
|
return redirect(url_for('services.ocr'))
|
|
|
|
|
|
|
|
return render_template(
|
|
|
|
'services/ocr.html.j2',
|
|
|
|
title='Optical Character Recognition',
|
2019-08-05 06:36:29 +00:00
|
|
|
new_ocr_job_form=new_ocr_job_form
|
2019-07-19 11:28:17 +00:00
|
|
|
)
|
2019-08-05 13:35:18 +00:00
|
|
|
|
|
|
|
|
|
|
|
@services.route('/nlp', methods=['GET', 'POST'])
|
|
|
|
@login_required
|
|
|
|
def nlp():
|
|
|
|
new_nlp_job_form = NewNLPJobForm()
|
|
|
|
if new_nlp_job_form.validate_on_submit():
|
|
|
|
app = current_app._get_current_object()
|
2019-08-06 15:04:38 +00:00
|
|
|
nlp_job = Job(creator=current_user._get_current_object(),
|
|
|
|
description=new_nlp_job_form.description.data,
|
|
|
|
service="nlp",
|
|
|
|
ressources=json.dumps({"n_cores": 1,
|
|
|
|
"mem_mb": 2048}),
|
|
|
|
service_args=json.dumps({"args": [],
|
|
|
|
"lang": new_nlp_job_form.language.data,
|
|
|
|
"version": new_nlp_job_form.version.data}),
|
2019-08-07 13:01:37 +00:00
|
|
|
status="pending",
|
2019-08-06 15:04:38 +00:00
|
|
|
title=new_nlp_job_form.title.data)
|
2019-08-06 12:27:41 +00:00
|
|
|
db.session.add(nlp_job)
|
|
|
|
db.session.commit()
|
2019-08-06 12:54:00 +00:00
|
|
|
|
|
|
|
dir = os.path.join(app.config['OPAQUE_STORAGE'],
|
|
|
|
str(nlp_job.user_id),
|
|
|
|
'jobs',
|
|
|
|
str(nlp_job.id))
|
2019-08-05 13:35:18 +00:00
|
|
|
|
|
|
|
try:
|
|
|
|
os.makedirs(dir)
|
|
|
|
except OSError:
|
|
|
|
flash('OSError!')
|
|
|
|
else:
|
|
|
|
for file in new_nlp_job_form.files.data:
|
|
|
|
file.save(os.path.join(dir, file.filename))
|
|
|
|
'''
|
|
|
|
' TODO: Let the scheduler run this job in the background.
|
|
|
|
'
|
|
|
|
' NOTE: Using self created threads is just for testing purpose as
|
|
|
|
' there is no scheduler available.
|
|
|
|
'''
|
2019-08-06 12:27:41 +00:00
|
|
|
thread = Thread(target=swarm.run, args=(nlp_job,))
|
2019-08-05 13:35:18 +00:00
|
|
|
thread.start()
|
|
|
|
flash('Job created!')
|
|
|
|
return redirect(url_for('services.nlp'))
|
|
|
|
|
|
|
|
return render_template(
|
|
|
|
'services/nlp.html.j2',
|
|
|
|
title='Natrual Language Processing',
|
|
|
|
new_nlp_job_form=new_nlp_job_form
|
|
|
|
)
|