From 5addcd9de862d163e1a85ea7a63cc2c619aa4721 Mon Sep 17 00:00:00 2001
From: Vensenmu <vensenmu@gmail.com>
Date: Thu, 5 Jun 2025 13:07:07 +0800
Subject: [PATCH] fix: Correctly define choices as tuple for reward-model
 arg (Fixes #941)

Signed-off-by: Vensenmu <vensenmu@gmail.com>
---
 applications/DeepSpeed-Chat/e2e_rlhf.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/applications/DeepSpeed-Chat/e2e_rlhf.py b/applications/DeepSpeed-Chat/e2e_rlhf.py
index 51616ad6d..5abae153f 100644
--- a/applications/DeepSpeed-Chat/e2e_rlhf.py
+++ b/applications/DeepSpeed-Chat/e2e_rlhf.py
@@ -65,7 +65,7 @@ def parse_args():
         "--reward-model",
         type=lambda x: x.replace("facebook/opt-", ""),
         default="350m",
-        choices=("350m"),
+        choices=("350m", ),
         help="Which facebook/opt-* model to use for Reward (step 2)",
     )
     parser.add_argument(