diff --git a/arkindex/process/models.py b/arkindex/process/models.py
index 920823bb691604338faf99f26ea0af8734f2fdd3..f9fa1efaa52ee049f8c82503e88e40d61f8fcf21 100644
--- a/arkindex/process/models.py
+++ b/arkindex/process/models.py
@@ -723,6 +723,7 @@ class ArkindexFeature(Enum):
     InitElements = "init_elements"
     FileImport = "file_import"
     S3Ingest = "s3_ingest"
+    DatasetExtractor = "dataset_extractor"
     # When adding a new export worker, don't forget to also update the ExportFormat enum and the
     # FEATURE_FORMAT_MAP dictionary which maps export formats to arkindex features
     ExportPDF = "pdf_export"
diff --git a/arkindex/system_workers.yml b/arkindex/system_workers.yml
index 8e87093bab7c4f157e09ba9da6a8c1c68d4307ca..e8f59083a393b9e94608d36fc2bd70e01091b45d 100644
--- a/arkindex/system_workers.yml
+++ b/arkindex/system_workers.yml
@@ -31,3 +31,8 @@ features:
             name: arkindex/workers/export
             version: 0.2.1
             slug: csv-export
+    dataset_extractor:
+        teklia_worker:
+            name: arkindex/workers/generic-training-dataset
+            version: 0.3.0
+            slug: generic-training-dataset