diff --git a/dan/manager/ocr.py b/dan/manager/ocr.py index 50389b87d9a40193532833702d18281d4ab875f4..bd4640731aafa905b05b596233e917e1971a7209 100644 --- a/dan/manager/ocr.py +++ b/dan/manager/ocr.py @@ -42,11 +42,6 @@ class OCRDatasetManager(DatasetManager): ): self.synthetic_data = self.params["config"]["synthetic_data"] - if "new_tokens" in params: - self.charset = sorted( - list(set(self.charset).union(set(params["new_tokens"]))) - ) - self.tokens = { "pad": params["config"]["padding_token"], }