|
1836 | 1836 | "documentation":"<p>Updates an existing Automated Reasoning policy test. You can modify the content, query, expected result, and confidence threshold.</p>", |
1837 | 1837 | "idempotent":true |
1838 | 1838 | }, |
| 1839 | + "UpdateCustomModelDeployment":{ |
| 1840 | + "name":"UpdateCustomModelDeployment", |
| 1841 | + "http":{ |
| 1842 | + "method":"PATCH", |
| 1843 | + "requestUri":"/model-customization/custom-model-deployments/{customModelDeploymentIdentifier}", |
| 1844 | + "responseCode":202 |
| 1845 | + }, |
| 1846 | + "input":{"shape":"UpdateCustomModelDeploymentRequest"}, |
| 1847 | + "output":{"shape":"UpdateCustomModelDeploymentResponse"}, |
| 1848 | + "errors":[ |
| 1849 | + {"shape":"ResourceNotFoundException"}, |
| 1850 | + {"shape":"AccessDeniedException"}, |
| 1851 | + {"shape":"ValidationException"}, |
| 1852 | + {"shape":"InternalServerException"}, |
| 1853 | + {"shape":"ThrottlingException"} |
| 1854 | + ], |
| 1855 | + "documentation":"<p> Updates a custom model deployment with a new custom model. This allows you to deploy updated models without creating new deployment endpoints. </p>", |
| 1856 | + "idempotent":true |
| 1857 | + }, |
1839 | 1858 | "UpdateGuardrail":{ |
1840 | 1859 | "name":"UpdateGuardrail", |
1841 | 1860 | "http":{ |
|
5189 | 5208 | "type":"list", |
5190 | 5209 | "member":{"shape":"CustomModelDeploymentSummary"} |
5191 | 5210 | }, |
| 5211 | + "CustomModelDeploymentUpdateDetails":{ |
| 5212 | + "type":"structure", |
| 5213 | + "required":[ |
| 5214 | + "modelArn", |
| 5215 | + "updateStatus" |
| 5216 | + ], |
| 5217 | + "members":{ |
| 5218 | + "modelArn":{ |
| 5219 | + "shape":"ModelArn", |
| 5220 | + "documentation":"<p> ARN of the new custom model being deployed as part of the update. </p>" |
| 5221 | + }, |
| 5222 | + "updateStatus":{ |
| 5223 | + "shape":"CustomModelDeploymentUpdateStatus", |
| 5224 | + "documentation":"<p> Current status of the deployment update. </p>" |
| 5225 | + } |
| 5226 | + }, |
| 5227 | + "documentation":"<p> Details about an update to a custom model deployment, including the new custom model resource ARN and current update status. </p>" |
| 5228 | + }, |
| 5229 | + "CustomModelDeploymentUpdateStatus":{ |
| 5230 | + "type":"string", |
| 5231 | + "enum":[ |
| 5232 | + "Updating", |
| 5233 | + "UpdateCompleted", |
| 5234 | + "UpdateFailed" |
| 5235 | + ] |
| 5236 | + }, |
5192 | 5237 | "CustomModelName":{ |
5193 | 5238 | "type":"string", |
5194 | 5239 | "max":63, |
|
5268 | 5313 | "distillationConfig":{ |
5269 | 5314 | "shape":"DistillationConfig", |
5270 | 5315 | "documentation":"<p>The Distillation configuration for the custom model.</p>" |
| 5316 | + }, |
| 5317 | + "rftConfig":{ |
| 5318 | + "shape":"RFTConfig", |
| 5319 | + "documentation":"<p> Configuration settings for reinforcement fine-tuning (RFT) model customization, including grader configuration and hyperparameters. </p>" |
5271 | 5320 | } |
5272 | 5321 | }, |
5273 | 5322 | "documentation":"<p>A model customization configuration</p>", |
|
5279 | 5328 | "FINE_TUNING", |
5280 | 5329 | "CONTINUED_PRE_TRAINING", |
5281 | 5330 | "DISTILLATION", |
| 5331 | + "REINFORCEMENT_FINE_TUNING", |
5282 | 5332 | "IMPORTED" |
5283 | 5333 | ] |
5284 | 5334 | }, |
|
5630 | 5680 | "NOT_AVAILABLE" |
5631 | 5681 | ] |
5632 | 5682 | }, |
| 5683 | + "EpochCount":{ |
| 5684 | + "type":"integer", |
| 5685 | + "box":true, |
| 5686 | + "max":50, |
| 5687 | + "min":1 |
| 5688 | + }, |
5633 | 5689 | "ErrorMessage":{ |
5634 | 5690 | "type":"string", |
5635 | 5691 | "max":2048, |
|
6821 | 6877 | "shape":"CustomModelDeploymentDescription", |
6822 | 6878 | "documentation":"<p>The description of the custom model deployment.</p>" |
6823 | 6879 | }, |
| 6880 | + "updateDetails":{ |
| 6881 | + "shape":"CustomModelDeploymentUpdateDetails", |
| 6882 | + "documentation":"<p> Details about any pending or completed updates to the custom model deployment, including the new model ARN and update status. </p>" |
| 6883 | + }, |
6824 | 6884 | "failureMessage":{ |
6825 | 6885 | "shape":"ErrorMessage", |
6826 | 6886 | "documentation":"<p>If the deployment status is <code>FAILED</code>, this field contains a message describing the failure reason.</p>" |
|
7846 | 7906 | } |
7847 | 7907 | } |
7848 | 7908 | }, |
| 7909 | + "GraderConfig":{ |
| 7910 | + "type":"structure", |
| 7911 | + "members":{ |
| 7912 | + "lambdaGrader":{ |
| 7913 | + "shape":"LambdaGraderConfig", |
| 7914 | + "documentation":"<p> Configuration for using an AWS Lambda function as the grader for evaluating model responses and providing reward signals in reinforcement fine-tuning. </p>" |
| 7915 | + } |
| 7916 | + }, |
| 7917 | + "documentation":"<p> Configuration for the grader used in reinforcement fine-tuning to evaluate model responses and provide reward signals. </p>", |
| 7918 | + "union":true |
| 7919 | + }, |
7849 | 7920 | "GuardrailArn":{ |
7850 | 7921 | "type":"string", |
7851 | 7922 | "max":2048, |
|
9563 | 9634 | "max":100, |
9564 | 9635 | "min":1 |
9565 | 9636 | }, |
| 9637 | + "LambdaArn":{ |
| 9638 | + "type":"string", |
| 9639 | + "max":512, |
| 9640 | + "min":1, |
| 9641 | + "pattern":"arn:(aws[a-zA-Z-]*)?:lambda:[a-z]{2}(-gov)?-[a-z]+-\\d{1}:\\d{12}:function:[a-zA-Z0-9-_\\.]+(:(\\$LATEST|[a-zA-Z0-9-_]+))?" |
| 9642 | + }, |
| 9643 | + "LambdaGraderConfig":{ |
| 9644 | + "type":"structure", |
| 9645 | + "required":["lambdaArn"], |
| 9646 | + "members":{ |
| 9647 | + "lambdaArn":{ |
| 9648 | + "shape":"LambdaArn", |
| 9649 | + "documentation":"<p> ARN of the AWS Lambda function that will evaluate model responses and return reward scores for RFT training. </p>" |
| 9650 | + } |
| 9651 | + }, |
| 9652 | + "documentation":"<p> Configuration for using an AWS Lambda function to grade model responses during reinforcement fine-tuning training. </p>" |
| 9653 | + }, |
9566 | 9654 | "LegalTerm":{ |
9567 | 9655 | "type":"structure", |
9568 | 9656 | "members":{ |
|
11761 | 11849 | "max":1000, |
11762 | 11850 | "min":1 |
11763 | 11851 | }, |
| 11852 | + "RFTBatchSize":{ |
| 11853 | + "type":"integer", |
| 11854 | + "box":true, |
| 11855 | + "max":512, |
| 11856 | + "min":16 |
| 11857 | + }, |
| 11858 | + "RFTConfig":{ |
| 11859 | + "type":"structure", |
| 11860 | + "members":{ |
| 11861 | + "graderConfig":{ |
| 11862 | + "shape":"GraderConfig", |
| 11863 | + "documentation":"<p> Configuration for the grader that evaluates model responses and provides reward signals during RFT training. </p>" |
| 11864 | + }, |
| 11865 | + "hyperParameters":{ |
| 11866 | + "shape":"RFTHyperParameters", |
| 11867 | + "documentation":"<p> Hyperparameters that control the reinforcement fine-tuning training process, including learning rate, batch size, and epoch count. </p>" |
| 11868 | + } |
| 11869 | + }, |
| 11870 | + "documentation":"<p> Configuration settings for reinforcement fine-tuning (RFT), including grader configuration and training hyperparameters. </p>" |
| 11871 | + }, |
| 11872 | + "RFTEvalInterval":{ |
| 11873 | + "type":"integer", |
| 11874 | + "box":true, |
| 11875 | + "max":100, |
| 11876 | + "min":1 |
| 11877 | + }, |
| 11878 | + "RFTHyperParameters":{ |
| 11879 | + "type":"structure", |
| 11880 | + "members":{ |
| 11881 | + "epochCount":{ |
| 11882 | + "shape":"EpochCount", |
| 11883 | + "documentation":"<p> Number of training epochs to run during reinforcement fine-tuning. Higher values may improve performance but increase training time. </p>" |
| 11884 | + }, |
| 11885 | + "batchSize":{ |
| 11886 | + "shape":"RFTBatchSize", |
| 11887 | + "documentation":"<p> Number of training samples processed in each batch during reinforcement fine-tuning (RFT) training. Larger batches may improve training stability. </p>" |
| 11888 | + }, |
| 11889 | + "learningRate":{ |
| 11890 | + "shape":"RFTLearningRate", |
| 11891 | + "documentation":"<p> Learning rate for reinforcement fine-tuning. Controls how quickly the model adapts to reward signals. </p>" |
| 11892 | + }, |
| 11893 | + "maxPromptLength":{ |
| 11894 | + "shape":"RFTMaxPromptLength", |
| 11895 | + "documentation":"<p> Maximum length of input prompts during RFT training, measured in tokens. Longer prompts allow more context but increase memory usage and training time. </p>" |
| 11896 | + }, |
| 11897 | + "trainingSamplePerPrompt":{ |
| 11898 | + "shape":"RFTTrainingSamplePerPrompt", |
| 11899 | + "documentation":"<p> Number of response samples generated per prompt during RFT training. More samples provide better reward signal estimation. </p>" |
| 11900 | + }, |
| 11901 | + "inferenceMaxTokens":{ |
| 11902 | + "shape":"RFTInferenceMaxTokens", |
| 11903 | + "documentation":"<p> Maximum number of tokens the model can generate in response to each prompt during RFT training. </p>" |
| 11904 | + }, |
| 11905 | + "reasoningEffort":{ |
| 11906 | + "shape":"ReasoningEffort", |
| 11907 | + "documentation":"<p> Level of reasoning effort applied during RFT training. Higher values may improve response quality but increase training time. </p>" |
| 11908 | + }, |
| 11909 | + "evalInterval":{ |
| 11910 | + "shape":"RFTEvalInterval", |
| 11911 | + "documentation":"<p> Interval between evaluation runs during RFT training, measured in training steps. More frequent evaluation provides better monitoring. </p>" |
| 11912 | + } |
| 11913 | + }, |
| 11914 | + "documentation":"<p> Hyperparameters for controlling the reinforcement fine-tuning training process, including learning settings and evaluation intervals. </p>" |
| 11915 | + }, |
| 11916 | + "RFTInferenceMaxTokens":{ |
| 11917 | + "type":"integer", |
| 11918 | + "box":true |
| 11919 | + }, |
| 11920 | + "RFTLearningRate":{ |
| 11921 | + "type":"float", |
| 11922 | + "box":true, |
| 11923 | + "max":0.001, |
| 11924 | + "min":0.0000001 |
| 11925 | + }, |
| 11926 | + "RFTMaxPromptLength":{ |
| 11927 | + "type":"integer", |
| 11928 | + "box":true |
| 11929 | + }, |
| 11930 | + "RFTTrainingSamplePerPrompt":{ |
| 11931 | + "type":"integer", |
| 11932 | + "box":true, |
| 11933 | + "max":16, |
| 11934 | + "min":2 |
| 11935 | + }, |
11764 | 11936 | "RagConfigs":{ |
11765 | 11937 | "type":"list", |
11766 | 11938 | "member":{"shape":"RAGConfig"}, |
|
11820 | 11992 | "max":100, |
11821 | 11993 | "min":1 |
11822 | 11994 | }, |
| 11995 | + "ReasoningEffort":{ |
| 11996 | + "type":"string", |
| 11997 | + "enum":[ |
| 11998 | + "low", |
| 11999 | + "medium", |
| 12000 | + "high" |
| 12001 | + ] |
| 12002 | + }, |
11823 | 12003 | "RegionAvailability":{ |
11824 | 12004 | "type":"string", |
11825 | 12005 | "enum":[ |
|
12853 | 13033 | } |
12854 | 13034 | } |
12855 | 13035 | }, |
| 13036 | + "UpdateCustomModelDeploymentRequest":{ |
| 13037 | + "type":"structure", |
| 13038 | + "required":[ |
| 13039 | + "modelArn", |
| 13040 | + "customModelDeploymentIdentifier" |
| 13041 | + ], |
| 13042 | + "members":{ |
| 13043 | + "modelArn":{ |
| 13044 | + "shape":"CustomModelArn", |
| 13045 | + "documentation":"<p> ARN of the new custom model to deploy. This replaces the currently deployed model. </p>" |
| 13046 | + }, |
| 13047 | + "customModelDeploymentIdentifier":{ |
| 13048 | + "shape":"CustomModelDeploymentIdentifier", |
| 13049 | + "documentation":"<p> Identifier of the custom model deployment to update with the new custom model. </p>", |
| 13050 | + "location":"uri", |
| 13051 | + "locationName":"customModelDeploymentIdentifier" |
| 13052 | + } |
| 13053 | + } |
| 13054 | + }, |
| 13055 | + "UpdateCustomModelDeploymentResponse":{ |
| 13056 | + "type":"structure", |
| 13057 | + "required":["customModelDeploymentArn"], |
| 13058 | + "members":{ |
| 13059 | + "customModelDeploymentArn":{ |
| 13060 | + "shape":"CustomModelDeploymentArn", |
| 13061 | + "documentation":"<p> ARN of the custom model deployment being updated. </p>" |
| 13062 | + } |
| 13063 | + } |
| 13064 | + }, |
12856 | 13065 | "UpdateGuardrailRequest":{ |
12857 | 13066 | "type":"structure", |
12858 | 13067 | "required":[ |
|
0 commit comments