diff --git a/kaldi_data_generator/main.py b/kaldi_data_generator/main.py index a9706ba3b2cf6a7f1ea44d5d4fceffee93e2b254..02def12dbf7143a1dd057ddce88c2bc116166b73 100644 --- a/kaldi_data_generator/main.py +++ b/kaldi_data_generator/main.py @@ -312,6 +312,10 @@ class HTRDataGenerator: if not text or not text.strip(): continue + if "\n" in text.strip(): + elem_id = res["element"]["id"] + raise ValueError(f"Newlines are not allowed in line transcriptions - {page_id} - {elem_id} - {text}") + if "zone" in res: polygon = res["zone"]["polygon"] elif "element" in res: