Lucas ARRIESSE committed on
Commit
f461b05
·
1 Parent(s): 2f60010

Enable Table Extraction

Browse files
Files changed (2) hide show
  1. api/docs.py +1 -1
  2. requirements.txt +1 -1
api/docs.py CHANGED
@@ -36,7 +36,7 @@ NSMAP = {
36
  # ================================== Converting of files to .txt ====================================
37
 
38
  KREUZBERG_CONFIG: ExtractionConfig = ExtractionConfig(
39
- force_ocr=False, ocr_backend=None)
40
 
41
  # Unfortunately needs to be kept to 1, as libreoffice isn't built to support parallel instances
42
  LO_CONVERSION_MUTEX = asyncio.Semaphore(1)
 
36
  # ================================== Converting of files to .txt ====================================
37
 
38
  KREUZBERG_CONFIG: ExtractionConfig = ExtractionConfig(
39
+ force_ocr=False, ocr_backend=None, extract_tables=True)
40
 
41
  # Unfortunately needs to be kept to 1, as libreoffice isn't built to support parallel instances
42
  LO_CONVERSION_MUTEX = asyncio.Semaphore(1)
requirements.txt CHANGED
@@ -11,4 +11,4 @@ beautifulsoup4
11
  aiolimiter
12
  httpx
13
  Jinja2
14
- kreuzberg
 
11
  aiolimiter
12
  httpx
13
  Jinja2
14
+ kreuzberg[gmft]