@@ -1363,6 +1363,7 @@ def deploy(
13631363 deploy_request_timeout : Optional [float ] = None ,
13641364 autoscaling_target_cpu_utilization : Optional [int ] = None ,
13651365 autoscaling_target_accelerator_duty_cycle : Optional [int ] = None ,
1366+ autoscaling_target_request_count_per_minute : Optional [int ] = None ,
13661367 enable_access_logging = False ,
13671368 disable_container_logging : bool = False ,
13681369 deployment_resource_pool : Optional [DeploymentResourcePool ] = None ,
@@ -1456,6 +1457,9 @@ def deploy(
14561457 Target Accelerator Duty Cycle.
14571458 Must also set accelerator_type and accelerator_count if specified.
14581459 A default value of 60 will be used if not specified.
1460+ autoscaling_target_request_count_per_minute (int):
1461+ Optional. The target number of requests per minute for autoscaling.
1462+ If set, the model will be scaled based on the number of requests it receives.
14591463 enable_access_logging (bool):
14601464 Whether to enable endpoint access logging. Defaults to False.
14611465 disable_container_logging (bool):
@@ -1536,6 +1540,7 @@ def deploy(
15361540 deploy_request_timeout = deploy_request_timeout ,
15371541 autoscaling_target_cpu_utilization = autoscaling_target_cpu_utilization ,
15381542 autoscaling_target_accelerator_duty_cycle = autoscaling_target_accelerator_duty_cycle ,
1543+ autoscaling_target_request_count_per_minute = autoscaling_target_request_count_per_minute ,
15391544 spot = spot ,
15401545 enable_access_logging = enable_access_logging ,
15411546 disable_container_logging = disable_container_logging ,
@@ -1568,6 +1573,7 @@ def _deploy(
15681573 deploy_request_timeout : Optional [float ] = None ,
15691574 autoscaling_target_cpu_utilization : Optional [int ] = None ,
15701575 autoscaling_target_accelerator_duty_cycle : Optional [int ] = None ,
1576+ autoscaling_target_request_count_per_minute : Optional [int ] = None ,
15711577 spot : bool = False ,
15721578 enable_access_logging = False ,
15731579 disable_container_logging : bool = False ,
@@ -1664,6 +1670,9 @@ def _deploy(
16641670 Target Accelerator Duty Cycle.
16651671 Must also set accelerator_type and accelerator_count if specified.
16661672 A default value of 60 will be used if not specified.
1673+ autoscaling_target_request_count_per_minute (int):
1674+ Optional. The target number of requests per minute for autoscaling.
1675+ If set, the model will be scaled based on the number of requests it receives.
16671676 spot (bool):
16681677 Optional. Whether to schedule the deployment workload on spot VMs.
16691678 enable_access_logging (bool):
@@ -1721,6 +1730,7 @@ def _deploy(
17211730 deploy_request_timeout = deploy_request_timeout ,
17221731 autoscaling_target_cpu_utilization = autoscaling_target_cpu_utilization ,
17231732 autoscaling_target_accelerator_duty_cycle = autoscaling_target_accelerator_duty_cycle ,
1733+ autoscaling_target_request_count_per_minute = autoscaling_target_request_count_per_minute ,
17241734 spot = spot ,
17251735 enable_access_logging = enable_access_logging ,
17261736 disable_container_logging = disable_container_logging ,
@@ -5339,6 +5349,7 @@ def deploy(
53395349 deploy_request_timeout : Optional [float ] = None ,
53405350 autoscaling_target_cpu_utilization : Optional [int ] = None ,
53415351 autoscaling_target_accelerator_duty_cycle : Optional [int ] = None ,
5352+ autoscaling_target_request_count_per_minute : Optional [int ] = None ,
53425353 enable_access_logging = False ,
53435354 disable_container_logging : bool = False ,
53445355 private_service_connect_config : Optional [
@@ -5454,6 +5465,9 @@ def deploy(
54545465 Optional. Target Accelerator Duty Cycle.
54555466 Must also set accelerator_type and accelerator_count if specified.
54565467 A default value of 60 will be used if not specified.
5468+ autoscaling_target_request_count_per_minute (int):
5469+ Optional. The target number of requests per minute for autoscaling.
5470+ If set, the model will be scaled based on the number of requests it receives.
54575471 enable_access_logging (bool):
54585472 Whether to enable endpoint access logging. Defaults to False.
54595473 disable_container_logging (bool):
@@ -5561,6 +5575,7 @@ def deploy(
55615575 deploy_request_timeout = deploy_request_timeout ,
55625576 autoscaling_target_cpu_utilization = autoscaling_target_cpu_utilization ,
55635577 autoscaling_target_accelerator_duty_cycle = autoscaling_target_accelerator_duty_cycle ,
5578+ autoscaling_target_request_count_per_minute = autoscaling_target_request_count_per_minute ,
55645579 spot = spot ,
55655580 enable_access_logging = enable_access_logging ,
55665581 disable_container_logging = disable_container_logging ,
@@ -5603,6 +5618,7 @@ def _deploy(
56035618 deploy_request_timeout : Optional [float ] = None ,
56045619 autoscaling_target_cpu_utilization : Optional [int ] = None ,
56055620 autoscaling_target_accelerator_duty_cycle : Optional [int ] = None ,
5621+ autoscaling_target_request_count_per_minute : Optional [int ] = None ,
56065622 spot : bool = False ,
56075623 enable_access_logging = False ,
56085624 disable_container_logging : bool = False ,
@@ -5720,6 +5736,9 @@ def _deploy(
57205736 Optional. Target Accelerator Duty Cycle.
57215737 Must also set accelerator_type and accelerator_count if specified.
57225738 A default value of 60 will be used if not specified.
5739+ autoscaling_target_request_count_per_minute (int):
5740+ Optional. The target number of requests per minute for autoscaling.
5741+ If set, the model will be scaled based on the number of requests it receives.
57235742 spot (bool):
57245743 Optional. Whether to schedule the deployment workload on spot VMs.
57255744 enable_access_logging (bool):
@@ -5808,6 +5827,7 @@ def _deploy(
58085827 deploy_request_timeout = deploy_request_timeout ,
58095828 autoscaling_target_cpu_utilization = autoscaling_target_cpu_utilization ,
58105829 autoscaling_target_accelerator_duty_cycle = autoscaling_target_accelerator_duty_cycle ,
5830+ autoscaling_target_request_count_per_minute = autoscaling_target_request_count_per_minute ,
58115831 spot = spot ,
58125832 enable_access_logging = enable_access_logging ,
58135833 disable_container_logging = disable_container_logging ,
0 commit comments