From 402d3ce28df3cceaa21476c0a5f1b97ff68abb7c Mon Sep 17 00:00:00 2001
From: Jeffrey Quesnelle
Date: Fri, 5 Jul 2024 09:34:01 -0400
Subject: [PATCH] Update tools/preprocess_data.py

Co-authored-by: Antoni-Joan Solergibert <74564958+TJ-Solergibert@users.noreply.github.com>
---
 tools/preprocess_data.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tools/preprocess_data.py b/tools/preprocess_data.py
index 24586bdd..c668aa58 100644
--- a/tools/preprocess_data.py
+++ b/tools/preprocess_data.py
@@ -77,7 +77,7 @@ def get_args():
         "--dataset",
         type=str,
         required=True,
-        help="Path to a .paquet file or hf:// path",
+        help="Path to a .parquet file or a folder containing multiple .parquet files",
     )
     p3.add_argument("--column", type=str, default="text", help="Column to preprocess from the Dataset. Default: text")
     p3.add_argument(