architxt.cli#

Functions

corpus_stats([corpus_path, language, ...])

Display overall corpus statistics.

largest_tree([corpus_path, language, ...])

Display the largest tree in the corpus along with its sentence and structure.

mlflow_setup()

simplify([files, tau, epoch, min_support, ...])

ui(ctx)

Launch the web-based UI using Streamlit.

architxt.cli.corpus_stats(corpus_path=typer.Argument(..., exists=True, readable=True, help='Path to the input corpus.'), language=typer.Option(['French'], help='Language of the input corpus.'), *, corenlp_url=typer.Option('http://localhost:9000', help='URL of the CoreNLP server.'), cache=typer.Option(True, help='Enable caching of the analyzed corpus to prevent re-parsing.'))[source]#

Display overall corpus statistics.

Return type:

None

architxt.cli.largest_tree(corpus_path=typer.Argument(..., exists=True, readable=True, help='Path to the input corpus.'), language=typer.Option(['French'], help='Language of the input corpus.'), *, corenlp_url=typer.Option('http://localhost:9000', help='URL of the CoreNLP server.'), cache=typer.Option(True, help='Enable caching of the analyzed corpus to prevent re-parsing.'))[source]#

Display the largest tree in the corpus along with its sentence and structure.

Return type:

None

architxt.cli.mlflow_setup()[source]#
Return type:

None

architxt.cli.simplify(files=typer.Argument(..., exists=True, readable=True, help='Path of the data files to load.'), *, tau=typer.Option(0.7, help='The similarity threshold.', min=0, max=1), epoch=typer.Option(100, help='Number of iterations for tree rewriting.', min=1), min_support=typer.Option(20, help='Minimum support for tree patterns.', min=1), sample=typer.Option(None, help='Number of trees to use for the simplification.', min=1), workers=typer.Option(None, help='Number of parallel worker processes to use. Defaults to the number of available CPU cores.', min=1), output=typer.Option(None, help='Path to save the result.'), shuffle=typer.Option(False, help='Shuffle the data before processing to introduce randomness.'), debug=typer.Option(False, help='Enable debug mode for more verbose output.'), metrics=typer.Option(False, help='Show metrics of the simplification.'), log=typer.Option(False, help='Enable logging to MLFlow.'))[source]#
Return type:

None

architxt.cli.ui(ctx)[source]#

Launch the web-based UI using Streamlit.

Return type:

None

Modules