Skip to content
Snippets Groups Projects

Support subword and word language models

Merged Solene Tarride requested to merge subword-and-word-lm into main
Compare and Show latest version
50 files
+ 944
448
Compare changes
  • Side-by-side
  • Inline
Files
50
+ 28
0
# -*- coding: utf-8 -*-
"""
Extract entities from Arkindex using a corpus export.
"""
from pathlib import Path
from dan.datasets.entities.extract import run
def add_entities_parser(subcommands) -> None:
    """
    Register the `entities` subcommand and its command-line arguments.

    The created parser accepts a positional `database` path and an optional
    `--output-file` path, and stores `run` as its `func` default.

    :param subcommands: Object exposing `add_parser`; presumably the value
        returned by `argparse.ArgumentParser.add_subparsers()` (confirm
        against the caller).
    """
    # The module docstring is reused verbatim as both description and help.
    entities_parser = subcommands.add_parser(
        "entities", description=__doc__, help=__doc__
    )

    # Positional argument, converted to a `Path`.
    entities_parser.add_argument(
        "database",
        type=Path,
        help="Path where the data were exported from Arkindex.",
    )

    # Optional argument; falls back to `entities.yml` when not provided.
    output_file_settings = {
        "type": Path,
        "default": Path("entities.yml"),
        "required": False,
        "help": "Path to a YAML file to save the extracted entities.",
    }
    entities_parser.add_argument("--output-file", **output_file_settings)

    # Expose the callable to run for this subcommand as `args.func`.
    entities_parser.set_defaults(func=run)
Loading