Skip to content
Snippets Groups Projects
Commit f48d9f49 authored by Martin
Browse files

skip instead of fail

parent 0a628757
No related branches found
No related tags found
1 merge request: !22 Add style filter (handwritten, typewritten); support ignored_classes
Pipeline #74329 passed
...@@ -180,6 +180,7 @@ class HTRDataGenerator: ...@@ -180,6 +180,7 @@ class HTRDataGenerator:
def get_accepted_zones(self, page_id: str): def get_accepted_zones(self, page_id: str):
try: try:
skip_count = 0
accepted_zones = [] accepted_zones = []
for elt in self.api_client.cached_paginate( for elt in self.api_client.cached_paginate(
"ListElementChildren", id=page_id, with_classes=True "ListElementChildren", id=page_id, with_classes=True
...@@ -215,9 +216,14 @@ class HTRDataGenerator: ...@@ -215,9 +216,14 @@ class HTRDataGenerator:
found_class = list(style_counts.keys())[0] found_class = list(style_counts.keys())[0]
found_class = Style(found_class) found_class = Style(found_class)
else: else:
raise ValueError( logger.info(
f"Multiple style classes on the same element! {elt['id']} - {elem_classes}" f"Multiple style classes on the same element! Skipping {elt['id']} - {elem_classes}"
) )
skip_count += 1
continue
# raise ValueError(
# f"Multiple style classes on the same element! {elt['id']} - {elem_classes}"
# )
if found_class == self.style: if found_class == self.style:
accepted_zones.append(elt["zone"]["id"]) accepted_zones.append(elt["zone"]["id"])
...@@ -225,8 +231,8 @@ class HTRDataGenerator: ...@@ -225,8 +231,8 @@ class HTRDataGenerator:
accepted_zones.append(elt["zone"]["id"]) accepted_zones.append(elt["zone"]["id"])
logger.info( logger.info(
"Number of accepted zone for page {} : {}".format( "Number of accepted zone for page {} : {} ; skipped {}".format(
page_id, len(accepted_zones) page_id, len(accepted_zones), skip_count
) )
) )
return accepted_zones return accepted_zones
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment