Kick off RFT in one command

benjibc · benjibc · commit 97b5dc53a8e0 · 2025-10-13T15:36:46.000-07:00
diff --git a/eval_protocol/cli.py b/eval_protocol/cli.py
@@ -358,8 +358,7 @@ def parse_args(args=None):
     )
     rft_parser.add_argument(
         "--evaluator-id",
-        required=True,
-        help="Evaluator ID used during upload; resolves evaluator resource via local trace",
+        help="Evaluator ID used during upload; if omitted, derive from local traces or a single discovered test",
     )
     # Dataset options
     rft_parser.add_argument(
diff --git a/eval_protocol/cli_commands/create_rft.py b/eval_protocol/cli_commands/create_rft.py
@@ -19,6 +19,7 @@
     load_evaluator_trace,
     materialize_dataset_via_builder,
 )
+from .upload import _discover_tests, _normalize_evaluator_id, _resolve_entry_to_qual_and_source
 
 
 def _ensure_account_id() -> Optional[str]:
@@ -48,8 +49,26 @@ def _print_links(evaluator_id: str, dataset_id: str, job_name: Optional[str]) ->
             pass
 
 
+def _auto_select_evaluator_id(cwd: str) -> Optional[str]:
+    # Try local traces
+    traces_dir = os.path.join(cwd, ".eval_protocol", "evaluators")
+    if os.path.isdir(traces_dir):
+        candidates = [f[:-5] for f in os.listdir(traces_dir) if f.endswith(".json")]
+        if len(candidates) == 1:
+            return candidates[0]
+    # Fall back to discovering a single evaluation_test
+    tests = _discover_tests(cwd)
+    if len(tests) == 1:
+        qualname, source_file_path = tests[0].qualname, tests[0].file_path
+        test_func_name = qualname.split(".")[-1]
+        source_file_name = os.path.splitext(os.path.basename(source_file_path))[0]
+        evaluator_id = _normalize_evaluator_id(f"{source_file_name}-{test_func_name}")
+        return evaluator_id
+    return None
+
+
 def create_rft_command(args) -> int:
-    evaluator_id: str = getattr(args, "evaluator_id")
+    evaluator_id: Optional[str] = getattr(args, "evaluator_id", None)
     non_interactive: bool = bool(getattr(args, "yes", False))
     dry_run: bool = bool(getattr(args, "dry_run", False))
 
@@ -65,8 +84,15 @@ def create_rft_command(args) -> int:
 
     api_base = get_fireworks_api_base()
 
-    # Resolve evaluator resource name via local trace
+    # Resolve evaluator id if omitted
     project_root = os.getcwd()
+    if not evaluator_id:
+        evaluator_id = _auto_select_evaluator_id(project_root)
+        if not evaluator_id:
+            print("Error: Could not infer evaluator id. Provide --evaluator-id or run 'eval-protocol upload' first.")
+            return 1
+
+    # Resolve evaluator resource name via local trace
     trace = load_evaluator_trace(project_root, evaluator_id)
     if not trace or not isinstance(trace, dict):
         print(

Original file line number	Diff line number	Diff line change
`@@ -358,8 +358,7 @@ def parse_args(args=None):`
`358`	`358`	`)`
`359`	`359`	`rft_parser.add_argument(`
`360`	`360`	`"--evaluator-id",`
`361`		`- required=True,`
`362`		`- help="Evaluator ID used during upload; resolves evaluator resource via local trace",`
	`361`	`+ help="Evaluator ID used during upload; if omitted, derive from local traces or a single discovered test",`
`363`	`362`	`)`
`364`	`363`	`# Dataset options`
`365`	`364`	`rft_parser.add_argument(`