Amazon Bedrock Update: Adding support in Amazon Bedrock to customize models with reinforcement fine-tuning (RFT) and support for updating the existing Custom Model Deployments.

AWS · AWS · commit 6a5e9fc0de2a · 2025-12-03T16:28:50.000Z
diff --git a/.changes/next-release/feature-AmazonBedrock-46abd56.json b/.changes/next-release/feature-AmazonBedrock-46abd56.json
@@ -0,0 +1,6 @@
+{
+    "type": "feature",
+    "category": "Amazon Bedrock",
+    "contributor": "",
+    "description": "Adding support in Amazon Bedrock to customize models with reinforcement fine-tuning (RFT) and support for updating the existing Custom Model Deployments."
+}
diff --git a/services/bedrock/src/main/resources/codegen-resources/service-2.json b/services/bedrock/src/main/resources/codegen-resources/service-2.json
@@ -1836,6 +1836,25 @@
       "documentation":"<p>Updates an existing Automated Reasoning policy test. You can modify the content, query, expected result, and confidence threshold.</p>",
       "idempotent":true
     },
+    "UpdateCustomModelDeployment":{
+      "name":"UpdateCustomModelDeployment",
+      "http":{
+        "method":"PATCH",
+        "requestUri":"/model-customization/custom-model-deployments/{customModelDeploymentIdentifier}",
+        "responseCode":202
+      },
+      "input":{"shape":"UpdateCustomModelDeploymentRequest"},
+      "output":{"shape":"UpdateCustomModelDeploymentResponse"},
+      "errors":[
+        {"shape":"ResourceNotFoundException"},
+        {"shape":"AccessDeniedException"},
+        {"shape":"ValidationException"},
+        {"shape":"InternalServerException"},
+        {"shape":"ThrottlingException"}
+      ],
+      "documentation":"<p> Updates a custom model deployment with a new custom model. This allows you to deploy updated models without creating new deployment endpoints. </p>",
+      "idempotent":true
+    },
     "UpdateGuardrail":{
       "name":"UpdateGuardrail",
       "http":{
@@ -5189,6 +5208,32 @@
       "type":"list",
       "member":{"shape":"CustomModelDeploymentSummary"}
     },
+    "CustomModelDeploymentUpdateDetails":{
+      "type":"structure",
+      "required":[
+        "modelArn",
+        "updateStatus"
+      ],
+      "members":{
+        "modelArn":{
+          "shape":"ModelArn",
+          "documentation":"<p> ARN of the new custom model being deployed as part of the update. </p>"
+        },
+        "updateStatus":{
+          "shape":"CustomModelDeploymentUpdateStatus",
+          "documentation":"<p> Current status of the deployment update. </p>"
+        }
+      },
+      "documentation":"<p> Details about an update to a custom model deployment, including the new custom model resource ARN and current update status. </p>"
+    },
+    "CustomModelDeploymentUpdateStatus":{
+      "type":"string",
+      "enum":[
+        "Updating",
+        "UpdateCompleted",
+        "UpdateFailed"
+      ]
+    },
     "CustomModelName":{
       "type":"string",
       "max":63,
@@ -5268,6 +5313,10 @@
         "distillationConfig":{
           "shape":"DistillationConfig",
           "documentation":"<p>The Distillation configuration for the custom model.</p>"
+        },
+        "rftConfig":{
+          "shape":"RFTConfig",
+          "documentation":"<p> Configuration settings for reinforcement fine-tuning (RFT) model customization, including grader configuration and hyperparameters. </p>"
         }
       },
       "documentation":"<p>A model customization configuration</p>",
@@ -5279,6 +5328,7 @@
         "FINE_TUNING",
         "CONTINUED_PRE_TRAINING",
         "DISTILLATION",
+        "REINFORCEMENT_FINE_TUNING",
         "IMPORTED"
       ]
     },
@@ -5630,6 +5680,12 @@
         "NOT_AVAILABLE"
       ]
     },
+    "EpochCount":{
+      "type":"integer",
+      "box":true,
+      "max":50,
+      "min":1
+    },
     "ErrorMessage":{
       "type":"string",
       "max":2048,
@@ -6821,6 +6877,10 @@
           "shape":"CustomModelDeploymentDescription",
           "documentation":"<p>The description of the custom model deployment.</p>"
         },
+        "updateDetails":{
+          "shape":"CustomModelDeploymentUpdateDetails",
+          "documentation":"<p> Details about any pending or completed updates to the custom model deployment, including the new model ARN and update status. </p>"
+        },
         "failureMessage":{
           "shape":"ErrorMessage",
           "documentation":"<p>If the deployment status is <code>FAILED</code>, this field contains a message describing the failure reason.</p>"
@@ -7846,6 +7906,17 @@
         }
       }
     },
+    "GraderConfig":{
+      "type":"structure",
+      "members":{
+        "lambdaGrader":{
+          "shape":"LambdaGraderConfig",
+          "documentation":"<p> Configuration for using an AWS Lambda function as the grader for evaluating model responses and providing reward signals in reinforcement fine-tuning. </p>"
+        }
+      },
+      "documentation":"<p> Configuration for the grader used in reinforcement fine-tuning to evaluate model responses and provide reward signals. </p>",
+      "union":true
+    },
     "GuardrailArn":{
       "type":"string",
       "max":2048,
@@ -9563,6 +9634,23 @@
       "max":100,
       "min":1
     },
+    "LambdaArn":{
+      "type":"string",
+      "max":512,
+      "min":1,
+      "pattern":"arn:(aws[a-zA-Z-]*)?:lambda:[a-z]{2}(-gov)?-[a-z]+-\\d{1}:\\d{12}:function:[a-zA-Z0-9-_\\.]+(:(\\$LATEST|[a-zA-Z0-9-_]+))?"
+    },
+    "LambdaGraderConfig":{
+      "type":"structure",
+      "required":["lambdaArn"],
+      "members":{
+        "lambdaArn":{
+          "shape":"LambdaArn",
+          "documentation":"<p> ARN of the AWS Lambda function that will evaluate model responses and return reward scores for RFT training. </p>"
+        }
+      },
+      "documentation":"<p> Configuration for using an AWS Lambda function to grade model responses during reinforcement fine-tuning training. </p>"
+    },
     "LegalTerm":{
       "type":"structure",
       "members":{
@@ -11761,6 +11849,90 @@
       "max":1000,
       "min":1
     },
+    "RFTBatchSize":{
+      "type":"integer",
+      "box":true,
+      "max":512,
+      "min":16
+    },
+    "RFTConfig":{
+      "type":"structure",
+      "members":{
+        "graderConfig":{
+          "shape":"GraderConfig",
+          "documentation":"<p> Configuration for the grader that evaluates model responses and provides reward signals during RFT training. </p>"
+        },
+        "hyperParameters":{
+          "shape":"RFTHyperParameters",
+          "documentation":"<p> Hyperparameters that control the reinforcement fine-tuning training process, including learning rate, batch size, and epoch count. </p>"
+        }
+      },
+      "documentation":"<p> Configuration settings for reinforcement fine-tuning (RFT), including grader configuration and training hyperparameters. </p>"
+    },
+    "RFTEvalInterval":{
+      "type":"integer",
+      "box":true,
+      "max":100,
+      "min":1
+    },
+    "RFTHyperParameters":{
+      "type":"structure",
+      "members":{
+        "epochCount":{
+          "shape":"EpochCount",
+          "documentation":"<p> Number of training epochs to run during reinforcement fine-tuning. Higher values may improve performance but increase training time. </p>"
+        },
+        "batchSize":{
+          "shape":"RFTBatchSize",
+          "documentation":"<p> Number of training samples processed in each batch during reinforcement fine-tuning (RFT) training. Larger batches may improve training stability. </p>"
+        },
+        "learningRate":{
+          "shape":"RFTLearningRate",
+          "documentation":"<p> Learning rate for reinforcement fine-tuning. Controls how quickly the model adapts to reward signals. </p>"
+        },
+        "maxPromptLength":{
+          "shape":"RFTMaxPromptLength",
+          "documentation":"<p> Maximum length of input prompts during RFT training, measured in tokens. Longer prompts allow more context but increase memory usage and training time. </p>"
+        },
+        "trainingSamplePerPrompt":{
+          "shape":"RFTTrainingSamplePerPrompt",
+          "documentation":"<p> Number of response samples generated per prompt during RFT training. More samples provide better reward signal estimation. </p>"
+        },
+        "inferenceMaxTokens":{
+          "shape":"RFTInferenceMaxTokens",
+          "documentation":"<p> Maximum number of tokens the model can generate in response to each prompt during RFT training. </p>"
+        },
+        "reasoningEffort":{
+          "shape":"ReasoningEffort",
+          "documentation":"<p> Level of reasoning effort applied during RFT training. Higher values may improve response quality but increase training time. </p>"
+        },
+        "evalInterval":{
+          "shape":"RFTEvalInterval",
+          "documentation":"<p> Interval between evaluation runs during RFT training, measured in training steps. More frequent evaluation provides better monitoring. </p>"
+        }
+      },
+      "documentation":"<p> Hyperparameters for controlling the reinforcement fine-tuning training process, including learning settings and evaluation intervals. </p>"
+    },
+    "RFTInferenceMaxTokens":{
+      "type":"integer",
+      "box":true
+    },
+    "RFTLearningRate":{
+      "type":"float",
+      "box":true,
+      "max":0.001,
+      "min":0.0000001
+    },
+    "RFTMaxPromptLength":{
+      "type":"integer",
+      "box":true
+    },
+    "RFTTrainingSamplePerPrompt":{
+      "type":"integer",
+      "box":true,
+      "max":16,
+      "min":2
+    },
     "RagConfigs":{
       "type":"list",
       "member":{"shape":"RAGConfig"},
@@ -11820,6 +11992,14 @@
       "max":100,
       "min":1
     },
+    "ReasoningEffort":{
+      "type":"string",
+      "enum":[
+        "low",
+        "medium",
+        "high"
+      ]
+    },
     "RegionAvailability":{
       "type":"string",
       "enum":[
@@ -12853,6 +13033,35 @@
         }
       }
     },
+    "UpdateCustomModelDeploymentRequest":{
+      "type":"structure",
+      "required":[
+        "modelArn",
+        "customModelDeploymentIdentifier"
+      ],
+      "members":{
+        "modelArn":{
+          "shape":"CustomModelArn",
+          "documentation":"<p> ARN of the new custom model to deploy. This replaces the currently deployed model. </p>"
+        },
+        "customModelDeploymentIdentifier":{
+          "shape":"CustomModelDeploymentIdentifier",
+          "documentation":"<p> Identifier of the custom model deployment to update with the new custom model. </p>",
+          "location":"uri",
+          "locationName":"customModelDeploymentIdentifier"
+        }
+      }
+    },
+    "UpdateCustomModelDeploymentResponse":{
+      "type":"structure",
+      "required":["customModelDeploymentArn"],
+      "members":{
+        "customModelDeploymentArn":{
+          "shape":"CustomModelDeploymentArn",
+          "documentation":"<p> ARN of the custom model deployment being updated. </p>"
+        }
+      }
+    },
     "UpdateGuardrailRequest":{
       "type":"structure",
       "required":[