diff --git a/training/api-reference.mdx b/training/api-reference.mdx index 83ba064418..c2a4a9a3f1 100644 --- a/training/api-reference.mdx +++ b/training/api-reference.mdx @@ -41,8 +41,8 @@ https://api.training.wandb.ai/v1 ### training-jobs -- **[POST /v1/preview/sft-training-jobs](https://docs.wandb.ai/training/api-reference/training-jobs/create-sft-training-job)** - Create SFT Training Job -- **[POST /v1/preview/training-jobs](https://docs.wandb.ai/training/api-reference/training-jobs/create-rl-training-job)** - Create RL Training Job +- **[POST /v1/preview/sft-training-jobs](https://docs.wandb.ai/training/api-reference/training-jobs/create-sft-training-job)** - Create Sft Training Job +- **[POST /v1/preview/training-jobs](https://docs.wandb.ai/training/api-reference/training-jobs/create-rl-training-job)** - Create Rl Training Job - **[GET /v1/preview/training-jobs/{training_job_id}](https://docs.wandb.ai/training/api-reference/training-jobs/get-training-job)** - Get Training Job - **[GET /v1/preview/training-jobs/{training_job_id}/events](https://docs.wandb.ai/training/api-reference/training-jobs/get-training-job-events)** - Get Training Job Events diff --git a/training/api-reference/openapi.json b/training/api-reference/openapi.json index b1175206ef..104a44f28a 100644 --- a/training/api-reference/openapi.json +++ b/training/api-reference/openapi.json @@ -399,8 +399,9 @@ "tags": [ "training-jobs" ], - "summary": "Create RL Training Job", - "operationId": "create_training_job_v1_preview_training_jobs_post", + "summary": "Create Rl Training Job", + "description": "Create a new RL (Reinforcement Learning) training job.", + "operationId": "Create_RL_Training_Job_v1_preview_training_jobs_post", "requestBody": { "content": { "application/json": { @@ -445,9 +446,9 @@ "tags": [ "training-jobs" ], - "summary": "Create SFT Training Job", + "summary": "Create Sft Training Job", "description": "Create a new SFT (Supervised Fine-Tuning) training job.", - "operationId": "create_sft_training_job_v1_preview_sft_training_jobs_post", + "operationId": "Create_SFT_Training_Job_v1_preview_sft_training_jobs_post", "requestBody": { "content": { "application/json": { @@ -1886,6 +1887,7 @@ "anyOf": [ { "type": "integer", + "maximum": 9.223372036854776e+18, "minimum": -1.0 }, { @@ -4335,7 +4337,8 @@ ] }, "type": "array", - "title": "Messages And Choices" + "title": "Messages And Choices", + "default": [] }, "tools": { "anyOf": [ @@ -4361,7 +4364,8 @@ }, "reward": { "type": "number", - "title": "Reward" + "title": "Reward", + "default": 0.0 }, "initial_policy_version": { "anyOf": [ @@ -4403,24 +4407,6 @@ "title": "Metrics", "default": {} }, - "auto_metrics": { - "additionalProperties": { - "anyOf": [ - { - "type": "number" - }, - { - "type": "integer" - }, - { - "type": "boolean" - } - ] - }, - "type": "object", - "title": "Auto Metrics", - "default": {} - }, "metadata": { "additionalProperties": { "anyOf": [ @@ -4460,10 +4446,6 @@ } }, "type": "object", - "required": [ - "messages_and_choices", - "reward" - ], "title": "Trajectory" }, "TrajectoryGroup": { @@ -4610,4 +4592,4 @@ } } } -} \ No newline at end of file +}