From 2ed4bde20f648d8cc8ff302b2d16ae7a70984f8b Mon Sep 17 00:00:00 2001 From: NolanB <nboukachab@teklia.com> Date: Mon, 15 May 2023 16:58:53 +0200 Subject: [PATCH] remove new_tokens --- dan/manager/ocr.py | 5 ----- 1 file changed, 5 deletions(-) diff --git a/dan/manager/ocr.py b/dan/manager/ocr.py index 50389b87..bd464073 100644 --- a/dan/manager/ocr.py +++ b/dan/manager/ocr.py @@ -42,11 +42,6 @@ class OCRDatasetManager(DatasetManager): ): self.synthetic_data = self.params["config"]["synthetic_data"] - if "new_tokens" in params: - self.charset = sorted( - list(set(self.charset).union(set(params["new_tokens"]))) - ) - self.tokens = { "pad": params["config"]["padding_token"], } -- GitLab