forked from adsabs/ADSfulltext
-
Notifications
You must be signed in to change notification settings - Fork 0
/
config.py
24 lines (17 loc) · 916 Bytes
/
config.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
LOGGING_LEVEL = 'DEBUG'
CELERY_BROKER = 'pyamqp://guest@localhost:6672/fulltext_pipeline'
PDF_EXTRACTOR = 'org.adslabs.adsfulltext.PDFExtractList'
#GROBID_SERVICE = 'http://localhost:8080/processFulltextDocument'
GROBID_SERVICE = None # Disable
EXTRACT_PDF_SCRIPT = '/scripts/extract_pdf_with_pdftotext.sh'
#EXTRACT_PDF_SCRIPT = '/scripts/extract_pdf_with_pdfbox.sh'
OUTPUT_CELERY_BROKER = 'pyamqp://guest:guest@localhost:6672/master_pipeline'
OUTPUT_TASKNAME = 'adsmp.tasks.task_update_record'
PREFERRED_XML_PARSER_NAMES = ("html5lib", "html.parser", "lxml-html", "direct-lxml-html", "lxml-xml", "direct-lxml-xml",)
FULLTEXT_EXTRACT_PATH = './live'
### Testing:
# When 'True', it converts all the asynchronous calls into synchronous,
# thus no need for rabbitmq, it does not forward to master
# and it allows debuggers to run if needed:
#CELERY_ALWAYS_EAGER = True
#CELERY_EAGER_PROPAGATES_EXCEPTIONS = True