|
219 | 219 | "documentation":"<p>Creates a batch inference job to invoke a model on multiple prompts. Format your data according to <a href=\"https://docs.aws.amazon.com/bedrock/latest/userguide/batch-inference-data\">Format your inference data</a> and upload it to an Amazon S3 bucket. For more information, see <a href=\"https://docs.aws.amazon.com/bedrock/latest/userguide/batch-inference.html\">Process multiple prompts with batch inference</a>.</p> <p>The response returns a <code>jobArn</code> that you can use to stop or get details about the job.</p>",
|
220 | 220 | "idempotent":true
|
221 | 221 | },
|
| 222 | + "CreatePromptRouter":{ |
| 223 | + "name":"CreatePromptRouter", |
| 224 | + "http":{ |
| 225 | + "method":"POST", |
| 226 | + "requestUri":"/prompt-routers", |
| 227 | + "responseCode":200 |
| 228 | + }, |
| 229 | + "input":{"shape":"CreatePromptRouterRequest"}, |
| 230 | + "output":{"shape":"CreatePromptRouterResponse"}, |
| 231 | + "errors":[ |
| 232 | + {"shape":"ResourceNotFoundException"}, |
| 233 | + {"shape":"AccessDeniedException"}, |
| 234 | + {"shape":"ValidationException"}, |
| 235 | + {"shape":"ConflictException"}, |
| 236 | + {"shape":"InternalServerException"}, |
| 237 | + {"shape":"TooManyTagsException"}, |
| 238 | + {"shape":"ServiceQuotaExceededException"}, |
| 239 | + {"shape":"ThrottlingException"} |
| 240 | + ], |
| 241 | + "documentation":"<p>Creates a prompt router that manages the routing of requests between multiple foundation models based on the routing criteria.</p>", |
| 242 | + "idempotent":true |
| 243 | + }, |
222 | 244 | "CreateProvisionedModelThroughput":{
|
223 | 245 | "name":"CreateProvisionedModelThroughput",
|
224 | 246 | "http":{
|
|
356 | 378 | "documentation":"<p>Delete the invocation logging.</p>",
|
357 | 379 | "idempotent":true
|
358 | 380 | },
|
| 381 | + "DeletePromptRouter":{ |
| 382 | + "name":"DeletePromptRouter", |
| 383 | + "http":{ |
| 384 | + "method":"DELETE", |
| 385 | + "requestUri":"/prompt-routers/{promptRouterArn}", |
| 386 | + "responseCode":200 |
| 387 | + }, |
| 388 | + "input":{"shape":"DeletePromptRouterRequest"}, |
| 389 | + "output":{"shape":"DeletePromptRouterResponse"}, |
| 390 | + "errors":[ |
| 391 | + {"shape":"ResourceNotFoundException"}, |
| 392 | + {"shape":"AccessDeniedException"}, |
| 393 | + {"shape":"ValidationException"}, |
| 394 | + {"shape":"InternalServerException"}, |
| 395 | + {"shape":"ThrottlingException"} |
| 396 | + ], |
| 397 | + "documentation":"<p>Deletes a specified prompt router. This action cannot be undone.</p>", |
| 398 | + "idempotent":true |
| 399 | + }, |
359 | 400 | "DeleteProvisionedModelThroughput":{
|
360 | 401 | "name":"DeleteProvisionedModelThroughput",
|
361 | 402 | "http":{
|
|
1858 | 1899 | }
|
1859 | 1900 | }
|
1860 | 1901 | },
|
| 1902 | + "CreatePromptRouterRequest":{ |
| 1903 | + "type":"structure", |
| 1904 | + "required":[ |
| 1905 | + "promptRouterName", |
| 1906 | + "models", |
| 1907 | + "routingCriteria", |
| 1908 | + "fallbackModel" |
| 1909 | + ], |
| 1910 | + "members":{ |
| 1911 | + "clientRequestToken":{ |
| 1912 | + "shape":"IdempotencyToken", |
| 1913 | + "documentation":"<p>A unique, case-sensitive identifier that you provide to ensure idempotency of your requests. If not specified, the Amazon Web Services SDK automatically generates one for you.</p>", |
| 1914 | + "idempotencyToken":true |
| 1915 | + }, |
| 1916 | + "promptRouterName":{ |
| 1917 | + "shape":"PromptRouterName", |
| 1918 | + "documentation":"<p>The name of the prompt router. The name must be unique within your Amazon Web Services account in the current region.</p>" |
| 1919 | + }, |
| 1920 | + "models":{ |
| 1921 | + "shape":"PromptRouterTargetModels", |
| 1922 | + "documentation":"<p>A list of foundation models that the prompt router can route requests to. At least one model must be specified.</p>" |
| 1923 | + }, |
| 1924 | + "description":{ |
| 1925 | + "shape":"PromptRouterDescription", |
| 1926 | + "documentation":"<p>An optional description of the prompt router to help identify its purpose.</p>" |
| 1927 | + }, |
| 1928 | + "routingCriteria":{ |
| 1929 | + "shape":"RoutingCriteria", |
| 1930 | + "documentation":"<p>The criteria, which is the response quality difference, used to determine how incoming requests are routed to different models.</p>" |
| 1931 | + }, |
| 1932 | + "fallbackModel":{ |
| 1933 | + "shape":"PromptRouterTargetModel", |
| 1934 | + "documentation":"<p>The default model to use when the routing criteria is not met.</p>" |
| 1935 | + }, |
| 1936 | + "tags":{ |
| 1937 | + "shape":"TagList", |
| 1938 | + "documentation":"<p>An array of key-value pairs to apply to this resource as tags. You can use tags to categorize and manage your Amazon Web Services resources.</p>" |
| 1939 | + } |
| 1940 | + } |
| 1941 | + }, |
| 1942 | + "CreatePromptRouterResponse":{ |
| 1943 | + "type":"structure", |
| 1944 | + "members":{ |
| 1945 | + "promptRouterArn":{ |
| 1946 | + "shape":"PromptRouterArn", |
| 1947 | + "documentation":"<p>The Amazon Resource Name (ARN) that uniquely identifies the prompt router.</p>" |
| 1948 | + } |
| 1949 | + } |
| 1950 | + }, |
1861 | 1951 | "CreateProvisionedModelThroughputRequest":{
|
1862 | 1952 | "type":"structure",
|
1863 | 1953 | "required":[
|
|
2080 | 2170 | "members":{
|
2081 | 2171 | }
|
2082 | 2172 | },
|
| 2173 | + "DeletePromptRouterRequest":{ |
| 2174 | + "type":"structure", |
| 2175 | + "required":["promptRouterArn"], |
| 2176 | + "members":{ |
| 2177 | + "promptRouterArn":{ |
| 2178 | + "shape":"PromptRouterArn", |
| 2179 | + "documentation":"<p>The Amazon Resource Name (ARN) of the prompt router to delete.</p>", |
| 2180 | + "location":"uri", |
| 2181 | + "locationName":"promptRouterArn" |
| 2182 | + } |
| 2183 | + } |
| 2184 | + }, |
| 2185 | + "DeletePromptRouterResponse":{ |
| 2186 | + "type":"structure", |
| 2187 | + "members":{ |
| 2188 | + } |
| 2189 | + }, |
2083 | 2190 | "DeleteProvisionedModelThroughputRequest":{
|
2084 | 2191 | "type":"structure",
|
2085 | 2192 | "required":["provisionedModelId"],
|
|
5596 | 5703 | "documentation":"<p>Specify the pagination token from a previous request to retrieve the next page of results.</p>",
|
5597 | 5704 | "location":"querystring",
|
5598 | 5705 | "locationName":"nextToken"
|
| 5706 | + }, |
| 5707 | + "type":{ |
| 5708 | + "shape":"PromptRouterType", |
| 5709 | + "documentation":"<p>The type of prompt router, such as default or custom.</p>", |
| 5710 | + "location":"querystring", |
| 5711 | + "locationName":"type" |
5599 | 5712 | }
|
5600 | 5713 | }
|
5601 | 5714 | },
|
|
6468 | 6581 | },
|
6469 | 6582 | "PromptRouterTargetModel":{
|
6470 | 6583 | "type":"structure",
|
| 6584 | + "required":["modelArn"], |
6471 | 6585 | "members":{
|
6472 | 6586 | "modelArn":{
|
6473 | 6587 | "shape":"PromptRouterTargetModelArn",
|
|
6480 | 6594 | "type":"string",
|
6481 | 6595 | "max":2048,
|
6482 | 6596 | "min":1,
|
6483 |
| - "pattern":".*(^arn:aws(-[^:]+)?:bedrock:[a-z0-9-]{1,20}::foundation-model/[a-z0-9-]{1,63}[.]{1}([a-z0-9-]{1,63}[.]){0,2}[a-z0-9-]{1,63}([:][a-z0-9-]{1,63}){0,2})|(^arn:aws(|-us-gov|-cn|-iso|-iso-b):bedrock:(|[0-9a-z-]{0,20}):(|[0-9]{12}):inference-profile/[a-zA-Z0-9-:.]+)" |
| 6597 | + "pattern":".*(^arn:aws(-[^:]+)?:bedrock:[a-z0-9-]{1,20}::foundation-model/[a-z0-9-]{1,63}[.]{1}([a-z0-9-]{1,63}[.]){0,2}[a-z0-9-]{1,63}([:][a-z0-9-]{1,63}){0,2})|(^arn:aws(|-us-gov|-cn|-iso|-iso-b):bedrock:(|[0-9a-z-]{0,20}):(|[0-9]{12}):(inference-profile|application-inference-profile)/[a-zA-Z0-9-:.]+)" |
6484 | 6598 | },
|
6485 | 6599 | "PromptRouterTargetModels":{
|
6486 | 6600 | "type":"list",
|
|
6898 | 7012 | "RoutingCriteriaResponseQualityDifferenceDouble":{
|
6899 | 7013 | "type":"double",
|
6900 | 7014 | "box":true,
|
6901 |
| - "max":1, |
| 7015 | + "max":100, |
6902 | 7016 | "min":0
|
6903 | 7017 | },
|
6904 | 7018 | "S3Config":{
|
|
7184 | 7298 | "type":"string",
|
7185 | 7299 | "max":1011,
|
7186 | 7300 | "min":20,
|
7187 |
| - "pattern":".*(^[a-zA-Z0-9][a-zA-Z0-9\\-]*$)|(^arn:aws(-[^:]+)?:bedrock:[a-z0-9-]{1,20}:([0-9]{12}|)((:(fine-tuning-job|model-customization-job|custom-model)/[a-z0-9-]{1,63}[.]{1}[a-z0-9-]{1,63}([a-z0-9-]{1,63}[.]){0,2}[a-z0-9-]{1,63}([:][a-z0-9-]{1,63}){0,2}(/[a-z0-9]{12})$)|(:guardrail/[a-z0-9]+$)|(:(inference-profile|application-inference-profile)/[a-zA-Z0-9-:.]+$)|(:(provisioned-model|model-invocation-job|model-evaluation-job|evaluation-job|model-import-job|imported-model|async-invoke)/[a-z0-9]{12}$))).*" |
| 7301 | + "pattern":".*(^[a-zA-Z0-9][a-zA-Z0-9\\-]*$)|(^arn:aws(-[^:]+)?:bedrock:[a-z0-9-]{1,20}:([0-9]{12}|)((:(fine-tuning-job|model-customization-job|custom-model)/[a-z0-9-]{1,63}[.]{1}[a-z0-9-]{1,63}([a-z0-9-]{1,63}[.]){0,2}[a-z0-9-]{1,63}([:][a-z0-9-]{1,63}){0,2}(/[a-z0-9]{12})$)|(:guardrail/[a-z0-9]+$)|(:automated-reasoning-policy/[a-zA-Z0-9]+(:[a-zA-Z0-9]+)?$)|(:(inference-profile|application-inference-profile)/[a-zA-Z0-9-:.]+$)|(:(provisioned-model|model-invocation-job|model-evaluation-job|evaluation-job|model-import-job|imported-model|async-invoke|provisioned-model-v2|provisioned-model-reservation|prompt-router)/[a-z0-9]{12}$))).*" |
7188 | 7302 | },
|
7189 | 7303 | "TeacherModelConfig":{
|
7190 | 7304 | "type":"structure",
|
|
0 commit comments