From 984ca2dcc521f0a96bb6aa90663c280171dd43d6 Mon Sep 17 00:00:00 2001
From: Avinash Sooriyarachchi
Date: Thu, 15 Aug 2024 00:29:55 -0700
Subject: [PATCH 1/2] Updated WPS and params_config for large and nemo

---
 utils/validate_data.py | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/utils/validate_data.py b/utils/validate_data.py
index 402e724..60407a9 100644
--- a/utils/validate_data.py
+++ b/utils/validate_data.py
@@ -34,6 +34,8 @@
     "open-mistral-7b": 5720,
     "open-mixtral-8x7b": 2966,
     "open-mixtral-8x22b": 1007,
+    "mistral-large-latest": 326,
+    'open-mistral-nemo': 3337,
 }
 
 MIN_NUM_JSONL_LINES = 10
@@ -104,7 +106,11 @@ def get_train_stats(
             model_id = "open-mixtral-8x7b"
         elif params_config["dim"] == 6144:
             model_id = "open-mixtral-8x22b"
-        else:
+        elif params_config["dim"] == 12288:
+            model_id = "mistral-large-latest"
+        elif params_config["dim"] == 5120:
+            model_id = "open-mistral-nemo"
+        else:
             raise ValueError("Provided model folder seems incorrect.")
     else:
         model_id = train_args.model_id_or_path

From 79730dc79b51417e2ec86f4e17b5460d47ff0e11 Mon Sep 17 00:00:00 2001
From: Avinash Sooriyarachchi <39173418+AviSoori1x@users.noreply.github.com>
Date: Thu, 15 Aug 2024 01:25:11 -0700
Subject: [PATCH 2/2] Apply suggestions from code review

Co-authored-by: Patrick von Platen
---
 utils/validate_data.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/utils/validate_data.py b/utils/validate_data.py
index 60407a9..2632eaf 100644
--- a/utils/validate_data.py
+++ b/utils/validate_data.py
@@ -34,7 +34,7 @@
     "open-mistral-7b": 5720,
     "open-mixtral-8x7b": 2966,
     "open-mixtral-8x22b": 1007,
-    "mistral-large-latest": 326,
+    "mistral-large-latest": 567,
     'open-mistral-nemo': 3337,
 }
 