diff --git a/arlas/cli/index.py b/arlas/cli/index.py index b9de496..0251ef6 100644 --- a/arlas/cli/index.py +++ b/arlas/cli/index.py @@ -98,8 +98,8 @@ def create( @indices.command(help="Index data") def data( index: str = typer.Argument(help="index's name"), - files: list[str] = typer.Argument(help="List of pathes to the file conaining the data. Format: NDJSON"), - bulk: int = typer.Option(default=100, help="Bulk size for indexing data") + files: list[str] = typer.Argument(help="List of paths to the file(s) containing the data. Format: NDJSON"), + bulk: int = typer.Option(default=5000, help="Bulk size for indexing data") ): config = variables["arlas"] i = 1 @@ -115,9 +115,9 @@ def data( @indices.command(help="Generate the mapping based on the data") def mapping( - file: str = typer.Argument(help="Path to the file conaining the data. Format: NDJSON"), + file: str = typer.Argument(help="Path to the file containing the data. Format: NDJSON"), nb_lines: int = typer.Option(default=2, help="Number of line to consider for generating the mapping. Avoid going over 10."), - field_mapping: list[str] = typer.Option(default=[], help="Overide the mapping with the provided field path/type. Example: fragment.location:geo_point. Important: the full field path must be provided."), + field_mapping: list[str] = typer.Option(default=[], help="Override the mapping with the provided field path/type. Example: fragment.location:geo_point. Important: the full field path must be provided."), no_fulltext: list[str] = typer.Option(default=[], help="List of keyword or text fields that should not be in the fulltext search. Important: the field name only must be provided."), push_on: str = typer.Option(default=None, help="Push the generated mapping for the provided index name"), ): diff --git a/arlas/cli/service.py b/arlas/cli/service.py index 7f95594..f72565f 100644 --- a/arlas/cli/service.py +++ b/arlas/cli/service.py @@ -384,7 +384,7 @@ def __index_bulk__(arlas: str, index: str, bulk: []): if result["errors"] is True: print("ERROR: " + json.dumps(result)) - def index_hits(arlas: str, index: str, file_path: str, bulk_size: int = 100, count: int = -1) -> dict[str, int]: + def index_hits(arlas: str, index: str, file_path: str, bulk_size: int = 5000, count: int = -1) -> dict[str, int]: line_number = 0 line_in_bulk = 0 bulk = []