@@ -1294,6 +1294,7 @@ def deploy(
1294
1294
accelerator_type : Optional [str ] = None ,
1295
1295
accelerator_count : Optional [int ] = None ,
1296
1296
tpu_topology : Optional [str ] = None ,
1297
+ multihost_gpu_node_count : Optional [int ] = None ,
1297
1298
service_account : Optional [str ] = None ,
1298
1299
explanation_metadata : Optional [aiplatform .explain .ExplanationMetadata ] = None ,
1299
1300
explanation_parameters : Optional [
@@ -1365,6 +1366,9 @@ def deploy(
1365
1366
tpu_topology (str):
1366
1367
Optional. The TPU topology to use for the DeployedModel.
1367
1368
Required for CloudTPU multihost deployments.
1369
+ multihost_gpu_node_count (int):
1370
+ Optional. The number of nodes per replica for multihost GPU DeployedModel.
1371
+ Required for multihost GPU deployments.
1368
1372
service_account (str):
1369
1373
The service account that the DeployedModel's container runs as. Specify the
1370
1374
email address of the service account. If this service account is not
@@ -1457,6 +1461,7 @@ def deploy(
1457
1461
accelerator_type = accelerator_type ,
1458
1462
accelerator_count = accelerator_count ,
1459
1463
tpu_topology = tpu_topology ,
1464
+ multihost_gpu_node_count = multihost_gpu_node_count ,
1460
1465
reservation_affinity_type = reservation_affinity_type ,
1461
1466
reservation_affinity_key = reservation_affinity_key ,
1462
1467
reservation_affinity_values = reservation_affinity_values ,
@@ -1488,6 +1493,7 @@ def _deploy(
1488
1493
accelerator_type : Optional [str ] = None ,
1489
1494
accelerator_count : Optional [int ] = None ,
1490
1495
tpu_topology : Optional [str ] = None ,
1496
+ multihost_gpu_node_count : Optional [int ] = None ,
1491
1497
reservation_affinity_type : Optional [str ] = None ,
1492
1498
reservation_affinity_key : Optional [str ] = None ,
1493
1499
reservation_affinity_values : Optional [List [str ]] = None ,
@@ -1556,6 +1562,9 @@ def _deploy(
1556
1562
tpu_topology (str):
1557
1563
Optional. The TPU topology to use for the DeployedModel.
1558
1564
Required for CloudTPU multihost deployments.
1565
+ multihost_gpu_node_count (int):
1566
+ Optional. The number of nodes per replica for multihost GPU DeployedModel.
1567
+ Required for multihost GPU deployments.
1559
1568
reservation_affinity_type (str):
1560
1569
Optional. The type of reservation affinity.
1561
1570
One of NO_RESERVATION, ANY_RESERVATION, SPECIFIC_RESERVATION,
@@ -1633,6 +1642,7 @@ def _deploy(
1633
1642
accelerator_type = accelerator_type ,
1634
1643
accelerator_count = accelerator_count ,
1635
1644
tpu_topology = tpu_topology ,
1645
+ multihost_gpu_node_count = multihost_gpu_node_count ,
1636
1646
reservation_affinity_type = reservation_affinity_type ,
1637
1647
reservation_affinity_key = reservation_affinity_key ,
1638
1648
reservation_affinity_values = reservation_affinity_values ,
@@ -1671,6 +1681,7 @@ def _deploy_call(
1671
1681
accelerator_type : Optional [str ] = None ,
1672
1682
accelerator_count : Optional [int ] = None ,
1673
1683
tpu_topology : Optional [str ] = None ,
1684
+ multihost_gpu_node_count : Optional [int ] = None ,
1674
1685
reservation_affinity_type : Optional [str ] = None ,
1675
1686
reservation_affinity_key : Optional [str ] = None ,
1676
1687
reservation_affinity_values : Optional [List [str ]] = None ,
@@ -1748,6 +1759,9 @@ def _deploy_call(
1748
1759
tpu_topology (str):
1749
1760
Optional. The TPU topology to use for the DeployedModel.
1750
1761
Required for CloudTPU multihost deployments.
1762
+ multihost_gpu_node_count (int):
1763
+ Optional. The number of nodes per replica for multihost GPU DeployedModel.
1764
+ Required for multihost GPU deployments.
1751
1765
reservation_affinity_type (str):
1752
1766
Optional. The type of reservation affinity.
1753
1767
One of NO_RESERVATION, ANY_RESERVATION, SPECIFIC_RESERVATION,
@@ -1966,6 +1980,9 @@ def _deploy_call(
1966
1980
if tpu_topology is not None :
1967
1981
machine_spec .tpu_topology = tpu_topology
1968
1982
1983
+ if multihost_gpu_node_count is not None :
1984
+ machine_spec .multihost_gpu_node_count = multihost_gpu_node_count
1985
+
1969
1986
dedicated_resources .machine_spec = machine_spec
1970
1987
deployed_model .dedicated_resources = dedicated_resources
1971
1988
if fast_tryout_enabled :
@@ -3948,6 +3965,7 @@ def deploy(
3948
3965
accelerator_type : Optional [str ] = None ,
3949
3966
accelerator_count : Optional [int ] = None ,
3950
3967
tpu_topology : Optional [str ] = None ,
3968
+ multihost_gpu_node_count : Optional [int ] = None ,
3951
3969
service_account : Optional [str ] = None ,
3952
3970
explanation_metadata : Optional [aiplatform .explain .ExplanationMetadata ] = None ,
3953
3971
explanation_parameters : Optional [
@@ -4024,6 +4042,9 @@ def deploy(
4024
4042
tpu_topology (str):
4025
4043
Optional. The TPU topology to use for the DeployedModel.
4026
4044
Required for CloudTPU multihost deployments.
4045
+ multihost_gpu_node_count (int):
4046
+ Optional. The number of nodes per replica for multihost GPU DeployedModel.
4047
+ Required for multihost GPU deployments.
4027
4048
service_account (str):
4028
4049
The service account that the DeployedModel's container runs as. Specify the
4029
4050
email address of the service account. If this service account is not
@@ -4116,6 +4137,7 @@ def deploy(
4116
4137
accelerator_type = accelerator_type ,
4117
4138
accelerator_count = accelerator_count ,
4118
4139
tpu_topology = tpu_topology ,
4140
+ multihost_gpu_node_count = multihost_gpu_node_count ,
4119
4141
reservation_affinity_type = reservation_affinity_type ,
4120
4142
reservation_affinity_key = reservation_affinity_key ,
4121
4143
reservation_affinity_values = reservation_affinity_values ,
@@ -5166,6 +5188,7 @@ def deploy(
5166
5188
accelerator_type : Optional [str ] = None ,
5167
5189
accelerator_count : Optional [int ] = None ,
5168
5190
tpu_topology : Optional [str ] = None ,
5191
+ multihost_gpu_node_count : Optional [int ] = None ,
5169
5192
service_account : Optional [str ] = None ,
5170
5193
explanation_metadata : Optional [aiplatform .explain .ExplanationMetadata ] = None ,
5171
5194
explanation_parameters : Optional [
@@ -5242,6 +5265,9 @@ def deploy(
5242
5265
tpu_topology (str):
5243
5266
Optional. The TPU topology to use for the DeployedModel.
5244
5267
Required for CloudTPU multihost deployments.
5268
+ multihost_gpu_node_count (int):
5269
+ Optional. The number of nodes per replica for multihost GPU DeployedModel.
5270
+ Required for multihost GPU deployments.
5245
5271
service_account (str):
5246
5272
The service account that the DeployedModel's container runs as. Specify the
5247
5273
email address of the service account. If this service account is not
@@ -5377,6 +5403,7 @@ def deploy(
5377
5403
accelerator_type = accelerator_type ,
5378
5404
accelerator_count = accelerator_count ,
5379
5405
tpu_topology = tpu_topology ,
5406
+ multihost_gpu_node_count = multihost_gpu_node_count ,
5380
5407
reservation_affinity_type = reservation_affinity_type ,
5381
5408
reservation_affinity_key = reservation_affinity_key ,
5382
5409
reservation_affinity_values = reservation_affinity_values ,
@@ -5419,6 +5446,7 @@ def _deploy(
5419
5446
accelerator_type : Optional [str ] = None ,
5420
5447
accelerator_count : Optional [int ] = None ,
5421
5448
tpu_topology : Optional [str ] = None ,
5449
+ multihost_gpu_node_count : Optional [int ] = None ,
5422
5450
reservation_affinity_type : Optional [str ] = None ,
5423
5451
reservation_affinity_key : Optional [str ] = None ,
5424
5452
reservation_affinity_values : Optional [List [str ]] = None ,
@@ -5492,6 +5520,9 @@ def _deploy(
5492
5520
tpu_topology (str):
5493
5521
Optional. The TPU topology to use for the DeployedModel.
5494
5522
Required for CloudTPU multihost deployments.
5523
+ multihost_gpu_node_count (int):
5524
+ Optional. The number of nodes per replica for multihost GPU DeployedModel.
5525
+ Required for multihost GPU deployments.
5495
5526
reservation_affinity_type (str):
5496
5527
Optional. The type of reservation affinity.
5497
5528
One of NO_RESERVATION, ANY_RESERVATION, SPECIFIC_RESERVATION,
@@ -5618,6 +5649,7 @@ def _deploy(
5618
5649
accelerator_type = accelerator_type ,
5619
5650
accelerator_count = accelerator_count ,
5620
5651
tpu_topology = tpu_topology ,
5652
+ multihost_gpu_node_count = multihost_gpu_node_count ,
5621
5653
reservation_affinity_type = reservation_affinity_type ,
5622
5654
reservation_affinity_key = reservation_affinity_key ,
5623
5655
reservation_affinity_values = reservation_affinity_values ,
0 commit comments