From 9da08508c0a7195aab6ebcaff4e5d0dfdbefc61e Mon Sep 17 00:00:00 2001
From: Patrick Jentsch <pjentsch@sfb1288inf-Laptop.fritz.box>
Date: Fri, 3 Apr 2020 17:36:38 +0200
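Subject: [PATCH] Add changes for new OCR and NLP Pipelines

NLP job form: replace the duplicated '2.2.0' version choices with a single
'latest' choice.
OCR job form and template: accept only .pdf uploads (.tif/.tiff removed).
OCR service view: pass '--binarize' when binarization is selected, instead
of passing '--skip-binarisation' when it is not.
The version fields of the OCR and setup-files forms are only reformatted.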

---
 app/jobs/forms.py                  | 14 +++++---------
 app/services/views.py              |  4 ++--
 app/templates/services/ocr.html.j2 |  2 +-
 3 files changed, 8 insertions(+), 12 deletions(-)

diff --git a/app/jobs/forms.py b/app/jobs/forms.py
index d47e9403..2b569a7f 100644
--- a/app/jobs/forms.py
+++ b/app/jobs/forms.py
@@ -21,9 +21,7 @@ class AddNLPJobForm(FlaskForm):
                            validators=[DataRequired()])
     submit = SubmitField()
     title = StringField('Title', validators=[DataRequired(), Length(1, 32)])
-    version = SelectField('Version',
-                          choices=[('2.2.0', 'Latest (2.2.0)'),
-                                   ('2.2.0', '2.2.0')],
+    version = SelectField('Version', choices=[('latest', 'Latest')],
                           validators=[DataRequired()])
     check_encoding = BooleanField('Check encoding')
 
@@ -54,15 +52,14 @@ class AddOCRJobForm(FlaskForm):
     split = BooleanField('Split')
     submit = SubmitField()
     title = StringField('Title', validators=[DataRequired(), Length(1, 32)])
-    version = SelectField('Version',
-                          choices=[('latest', 'Latest')],
+    version = SelectField('Version', choices=[('latest', 'Latest')],
                           validators=[DataRequired()])
 
     def validate_files(form, field):
         for file in field.data:
-            if not file.filename.lower().endswith(('.pdf', '.tif', '.tiff')):
+            if not file.filename.lower().endswith('.pdf'):
                 raise ValidationError('File does not have an approved '
-                                      'extension: .pdf | .tif | .tiff')
+                                      'extension: .pdf')
 
 
 class AddSetupFilesJobForm(FlaskForm):
@@ -71,8 +68,7 @@ class AddSetupFilesJobForm(FlaskForm):
     submit = SubmitField()
     title = StringField('Title', validators=[DataRequired(), Length(1, 32)])
     files = MultipleFileField('Files', validators=[DataRequired()])
-    version = SelectField('Version',
-                          choices=[('latest', 'Latest')],
+    version = SelectField('Version', choices=[('latest', 'Latest')],
                           validators=[DataRequired()])
 
     def validate_files(form, field):
diff --git a/app/services/views.py b/app/services/views.py
index 2339260b..c906acef 100644
--- a/app/services/views.py
+++ b/app/services/views.py
@@ -41,8 +41,8 @@ def service(service):
                 service_args.append('--check-encoding')
         if service == 'ocr':
             service_args.append('-l {}'.format(add_job_form.language.data))
-            if not add_job_form.binarization.data:
-                service_args.append('--skip-binarisation')
+            if add_job_form.binarization.data:
+                service_args.append('--binarize')
         job = Job(creator=current_user,
                   description=add_job_form.description.data,
                   mem_mb=SERVICES[service]['resources']['mem_mb'],
diff --git a/app/templates/services/ocr.html.j2 b/app/templates/services/ocr.html.j2
index 76cfac6b..6986f7f7 100644
--- a/app/templates/services/ocr.html.j2
+++ b/app/templates/services/ocr.html.j2
@@ -53,7 +53,7 @@
             <div class="file-field input-field">
               <div class="btn">
                 <span>{{ add_job_form.files.label.text }}</span>
-                {{ add_job_form.files(accept='application/pdf, image/tiff') }}
+                {{ add_job_form.files(accept='application/pdf') }}
               </div>
               <div class="file-path-wrapper">
                 <input class="file-path validate" type="text">
-- 
GitLab