From 025119e9ce3648dee3e570425cff6abd3e7aa6b0 Mon Sep 17 00:00:00 2001
From: mlbonhomme <bonhomme@teklia.com>
Date: Tue, 17 Dec 2024 15:29:20 +0100
Subject: [PATCH] Add DOCX export worker and feature

---
 arkindex/process/models.py  | 5 ++++-
 arkindex/system_workers.yml | 3 +++
 2 files changed, 7 insertions(+), 1 deletion(-)

diff --git a/arkindex/process/models.py b/arkindex/process/models.py
index b618b6c530..ba7788bf38 100644
--- a/arkindex/process/models.py
+++ b/arkindex/process/models.py
@@ -70,6 +70,7 @@ class ProcessMode(Enum):
 class ExportFormat(Enum):
     PDF = "pdf"
     PageXML = "page_xml"
+    DOCX = "docx"
 
 
 class Process(IndexableModel):
@@ -703,6 +704,7 @@ class ArkindexFeature(Enum):
     # FEATURE_FORMAT_MAP dictionary which maps export formats to arkindex features
     ExportPDF = "pdf_export"
     ExportPageXML = "pagexml_export"
+    ExportDOCX = "docx_export"
 
 
 class WorkerVersion(models.Model):
@@ -1222,5 +1224,6 @@ class CorpusWorkerVersion(models.Model):
 # A mapping of export formats with their corresponding arkindex feature
 FEATURE_FORMAT_MAP = {
     ExportFormat.PDF: ArkindexFeature.ExportPDF,
-    ExportFormat.PageXML: ArkindexFeature.ExportPageXML
+    ExportFormat.PageXML: ArkindexFeature.ExportPageXML,
+    ExportFormat.DOCX: ArkindexFeature.ExportDOCX,
 }
diff --git a/arkindex/system_workers.yml b/arkindex/system_workers.yml
index 3a94f9635b..c5f659f14a 100644
--- a/arkindex/system_workers.yml
+++ b/arkindex/system_workers.yml
@@ -17,3 +17,6 @@ features:
     pagexml_export:
         image: registry.gitlab.teklia.com/arkindex/workers/export:0.2.0
         command: worker-export-pagexml
+    docx_export:
+        image: registry.gitlab.teklia.com/arkindex/workers/export:0.2.0
+        command: worker-export-docx
-- 
GitLab