diff --git a/kaldi_data_generator/main.py b/kaldi_data_generator/main.py index 1a6bf9afbab81966ff9bca0d16aab84bb7b49764..a9706ba3b2cf6a7f1ea44d5d4fceffee93e2b254 100644 --- a/kaldi_data_generator/main.py +++ b/kaldi_data_generator/main.py @@ -184,7 +184,6 @@ class HTRDataGenerator: def get_accepted_zones(self, page_id: str): try: - skip_count = 0 accepted_zones = [] for elt in self.api_client.cached_paginate( "ListElementChildren", id=page_id, with_classes=True @@ -223,14 +222,9 @@ class HTRDataGenerator: found_class = list(style_counts.keys())[0] found_class = Style(found_class) else: - logger.info( - f"Multiple style classes on the same element! Skipping {elt['id']} - {elem_classes}" + raise ValueError( + f"Multiple style classes on the same element! {elt['id']} - {elem_classes}" ) - skip_count += 1 - continue - # raise ValueError( - # f"Multiple style classes on the same element! {elt['id']} - {elem_classes}" - # ) if found_class == self.style: accepted_zones.append(elt["zone"]["id"]) @@ -238,8 +232,8 @@ class HTRDataGenerator: accepted_zones.append(elt["zone"]["id"]) logger.info( - "Number of accepted zone for page {} : {} ; skipped {}".format( - page_id, len(accepted_zones), skip_count + "Number of accepted zone for page {} : {}".format( + page_id, len(accepted_zones) ) ) return accepted_zones