From c3d2f8fea08f0a99fc428faaeff2d97ead87ac7f Mon Sep 17 00:00:00 2001
From: Nolan <nboukachab@teklia.com>
Date: Tue, 16 May 2023 08:42:37 +0000
Subject: [PATCH] Remove get_valid_fonts function

---
 dan/manager/ocr.py | 31 -------------------------------
 1 file changed, 31 deletions(-)

diff --git a/dan/manager/ocr.py b/dan/manager/ocr.py
index 6d72ca06..50389b87 100644
--- a/dan/manager/ocr.py
+++ b/dan/manager/ocr.py
@@ -9,7 +9,6 @@ import torch
 from fontTools.ttLib import TTFont
 from PIL import Image, ImageDraw, ImageFont
 
-from dan import logger
 from dan.manager.dataset import DatasetManager, GenericDataset, apply_preprocessing
 from dan.ocr.utils import LM_str_to_ind
 from dan.utils import (
@@ -42,8 +41,6 @@ class OCRDatasetManager(DatasetManager):
             and self.params["config"]["synthetic_data"]
         ):
             self.synthetic_data = self.params["config"]["synthetic_data"]
-            if "config" in self.synthetic_data:
-                self.synthetic_data["config"]["valid_fonts"] = self.get_valid_fonts()
 
         if "new_tokens" in params:
             self.charset = sorted(
@@ -104,34 +101,6 @@ class OCRDatasetManager(DatasetManager):
                 [s["img"].shape[1] for s in self.train_dataset.samples]
             )
 
-    def get_valid_fonts(self):
-        """
-        Select fonts that are compatible with the alphabet
-        """
-        font_path = self.synthetic_data["font_path"]
-        alphabet = self.charset.copy()
-        special_chars = ["\n"]
-        alphabet = [char for char in alphabet if char not in special_chars]
-        valid_fonts = list()
-        for fold_detail in os.walk(font_path):
-            if fold_detail[2]:
-                for font_name in fold_detail[2]:
-                    if ".ttf" not in font_name:
-                        continue
-                    font_path = os.path.join(fold_detail[0], font_name)
-                    to_add = True
-                    if alphabet is not None:
-                        for char in alphabet:
-                            if not char_in_font(char, font_path):
-                                to_add = False
-                                break
-                        if to_add:
-                            valid_fonts.append(font_path)
-                    else:
-                        valid_fonts.append(font_path)
-        logger.info(f"Found {len(valid_fonts)} fonts.")
-        return valid_fonts
-
 
 class OCRDataset(GenericDataset):
     """
-- 
GitLab