From 025119e9ce3648dee3e570425cff6abd3e7aa6b0 Mon Sep 17 00:00:00 2001 From: mlbonhomme <bonhomme@teklia.com> Date: Tue, 17 Dec 2024 15:29:20 +0100 Subject: [PATCH] Add DOCX export worker and feature --- arkindex/process/models.py | 5 ++++- arkindex/system_workers.yml | 3 +++ 2 files changed, 7 insertions(+), 1 deletion(-) diff --git a/arkindex/process/models.py b/arkindex/process/models.py index b618b6c530..ba7788bf38 100644 --- a/arkindex/process/models.py +++ b/arkindex/process/models.py @@ -70,6 +70,7 @@ class ProcessMode(Enum): class ExportFormat(Enum): PDF = "pdf" PageXML = "page_xml" + DOCX = "docx" class Process(IndexableModel): @@ -703,6 +704,7 @@ class ArkindexFeature(Enum): # FEATURE_FORMAT_MAP dictionary which maps export formats to arkindex features ExportPDF = "pdf_export" ExportPageXML = "pagexml_export" + ExportDOCX = "docx_export" class WorkerVersion(models.Model): @@ -1222,5 +1224,6 @@ class CorpusWorkerVersion(models.Model): # A mapping of export formats with their corresponding arkindex feature FEATURE_FORMAT_MAP = { ExportFormat.PDF: ArkindexFeature.ExportPDF, - ExportFormat.PageXML: ArkindexFeature.ExportPageXML + ExportFormat.PageXML: ArkindexFeature.ExportPageXML, + ExportFormat.DOCX: ArkindexFeature.ExportDOCX } diff --git a/arkindex/system_workers.yml b/arkindex/system_workers.yml index 3a94f9635b..c5f659f14a 100644 --- a/arkindex/system_workers.yml +++ b/arkindex/system_workers.yml @@ -17,3 +17,6 @@ features: pagexml_export: image: registry.gitlab.teklia.com/arkindex/workers/export:0.2.0 command: worker-export-pagexml + docx_export: + image: registry.gitlab.teklia.com/arkindex/workers/export:0.2.0 + command: worker-export-docx -- GitLab