From 5addcd9de862d163e1a85ea7a63cc2c619aa4721 Mon Sep 17 00:00:00 2001 From: Vensenmu Date: Thu, 5 Jun 2025 13:07:07 +0800 Subject: [PATCH] fix: Correctly define choices as tuple for reward-model arg Fixes #941 Signed-off-by: Vensenmu --- applications/DeepSpeed-Chat/e2e_rlhf.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/applications/DeepSpeed-Chat/e2e_rlhf.py b/applications/DeepSpeed-Chat/e2e_rlhf.py index 51616ad6d..5abae153f 100644 --- a/applications/DeepSpeed-Chat/e2e_rlhf.py +++ b/applications/DeepSpeed-Chat/e2e_rlhf.py @@ -65,7 +65,7 @@ def parse_args(): "--reward-model", type=lambda x: x.replace("facebook/opt-", ""), default="350m", - choices=("350m"), + choices=("350m", ), help="Which facebook/opt-* model to use for Reward (step 2)", ) parser.add_argument(