-
Notifications
You must be signed in to change notification settings - Fork 10
/
config.py
29 lines (21 loc) · 1.13 KB
/
config.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
# Settings for the fulltext extraction pipeline. Every value below is a plain
# module-level constant.

# --- Logging ----------------------------------------------------------------
LOGGING_LEVEL = "DEBUG"

# --- Celery: this pipeline --------------------------------------------------
CELERY_INCLUDE = ["adsft.tasks"]
# NOTE(review): this URL carries only a user name, while OUTPUT_CELERY_BROKER
# below carries user:password -- confirm the difference is intentional.
CELERY_BROKER = "pyamqp://guest@localhost:6672/fulltext_pipeline"

# --- PDF extraction ---------------------------------------------------------
PDF_EXTRACTOR = "org.adslabs.adsfulltext.PDFExtractList"

# GROBID is disabled while this is None. Example endpoint, kept for reference:
#GROBID_SERVICE = 'http://localhost:8080/processFulltextDocument'
GROBID_SERVICE = None

# Script used for PDF extraction. Alternative script, kept for reference:
#EXTRACT_PDF_SCRIPT = '/scripts/extract_pdf_with_pdfbox.sh'
EXTRACT_PDF_SCRIPT = "/scripts/extract_pdf_with_pdftotext.sh"

# --- Celery: output ---------------------------------------------------------
OUTPUT_CELERY_BROKER = "pyamqp://guest:guest@localhost:6672/master_pipeline"
OUTPUT_TASKNAME = "adsmp.tasks.task_update_record"

# --- XML parsing ------------------------------------------------------------
# Presumably listed in order of preference -- verify against the consumer.
PREFERRED_XML_PARSER_NAMES = (
    "html5lib",
    "html.parser",
    "lxml-html",
    "direct-lxml-html",
    "lxml-xml",
    "direct-lxml-xml",
)

# --- Output location --------------------------------------------------------
FULLTEXT_EXTRACT_PATH = "./live"

# --- Facility NER models ----------------------------------------------------
# One model path per text source; "ACK"/"FT" presumably stand for
# acknowledgements / fulltext -- TODO confirm.
NER_FACILITY_MODEL_ACK = "/app/ner_models/ner_facility_ack/ner_model_facility/"
NER_FACILITY_MODEL_FT = "/app/ner_models/ner_facility_ft/ner_model_facility/"
RUN_NER_FACILITIES_AFTER_EXTRACTION = False
### Testing:
# When the settings below are uncommented (set to True), all asynchronous
# calls are executed synchronously instead. RabbitMQ is then not needed,
# nothing is forwarded to master, and debuggers can be run if needed:
#CELERY_ALWAYS_EAGER = True
#CELERY_EAGER_PROPAGATES_EXCEPTIONS = True