Skip to content

Commit 7a7f0d4

Browse files
feat: add dedicated_resources to DeployedIndex in aiplatform v1beta1 index_endpoint.proto feat: add Scaling to OnlineServingConfig in aiplatform v1beta1 featurestore.proto chore: sort imports (#991)
* feat: add dedicated_resources to DeployedIndex in aiplatform v1beta1 index_endpoint.proto feat: add Scaling to OnlineServingConfig in aiplatform v1beta1 featurestore.proto chore: sort imports PiperOrigin-RevId: 425395202 Source-Link: googleapis/googleapis@e3bcc1e Source-Link: googleapis/googleapis-gen@62beef7 Copy-Tag: eyJwIjoiLmdpdGh1Yi8uT3dsQm90LnlhbWwiLCJoIjoiNjJiZWVmNzg1NTljOGJhYjQ3ZWNkMzZlZWQxYWE2YjY3OGRiNjA4OCJ9 * 🦉 Updates from OwlBot See https://github.com/googleapis/repo-automation-bots/blob/main/packages/owl-bot/README.md Co-authored-by: Owl Bot <gcf-owl-bot[bot]@users.noreply.github.com> Co-authored-by: Yu-Han Liu <[email protected]>
1 parent a814923 commit 7a7f0d4

File tree

9 files changed

+53
-25
lines changed

9 files changed

+53
-25
lines changed

google/cloud/aiplatform_v1beta1/services/vizier_service/async_client.py

Lines changed: 0 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -255,9 +255,7 @@ async def create_study(
255255
256256
Returns:
257257
google.cloud.aiplatform_v1beta1.types.Study:
258-
LINT.IfChange
259258
A message representing a Study.
260-
261259
"""
262260
# Create or coerce a protobuf request object.
263261
# Quick check: If we got a request object, we should *not* have
@@ -328,9 +326,7 @@ async def get_study(
328326
329327
Returns:
330328
google.cloud.aiplatform_v1beta1.types.Study:
331-
LINT.IfChange
332329
A message representing a Study.
333-
334330
"""
335331
# Create or coerce a protobuf request object.
336332
# Quick check: If we got a request object, we should *not* have
@@ -548,9 +544,7 @@ async def lookup_study(
548544
549545
Returns:
550546
google.cloud.aiplatform_v1beta1.types.Study:
551-
LINT.IfChange
552547
A message representing a Study.
553-
554548
"""
555549
# Create or coerce a protobuf request object.
556550
# Quick check: If we got a request object, we should *not* have

google/cloud/aiplatform_v1beta1/services/vizier_service/client.py

Lines changed: 0 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -478,9 +478,7 @@ def create_study(
478478
479479
Returns:
480480
google.cloud.aiplatform_v1beta1.types.Study:
481-
LINT.IfChange
482481
A message representing a Study.
483-
484482
"""
485483
# Create or coerce a protobuf request object.
486484
# Quick check: If we got a request object, we should *not* have
@@ -551,9 +549,7 @@ def get_study(
551549
552550
Returns:
553551
google.cloud.aiplatform_v1beta1.types.Study:
554-
LINT.IfChange
555552
A message representing a Study.
556-
557553
"""
558554
# Create or coerce a protobuf request object.
559555
# Quick check: If we got a request object, we should *not* have
@@ -771,9 +767,7 @@ def lookup_study(
771767
772768
Returns:
773769
google.cloud.aiplatform_v1beta1.types.Study:
774-
LINT.IfChange
775770
A message representing a Study.
776-
777771
"""
778772
# Create or coerce a protobuf request object.
779773
# Quick check: If we got a request object, we should *not* have

google/cloud/aiplatform_v1beta1/types/custom_job.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -120,6 +120,7 @@ class CustomJob(proto.Message):
120120

121121
class CustomJobSpec(proto.Message):
122122
r"""Represents the spec of a CustomJob.
123+
Next Id: 14
123124
124125
Attributes:
125126
worker_pool_specs (Sequence[google.cloud.aiplatform_v1beta1.types.WorkerPoolSpec]):

google/cloud/aiplatform_v1beta1/types/featurestore.py

Lines changed: 30 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -81,13 +81,39 @@ class OnlineServingConfig(proto.Message):
8181
8282
Attributes:
8383
fixed_node_count (int):
84-
The number of nodes for each cluster. The
85-
number of nodes will not scale automatically but
86-
can be scaled manually by providing different
87-
values when updating.
84+
The number of nodes for each cluster. The number of nodes
85+
will not scale automatically but can be scaled manually by
86+
providing different values when updating. Only one of
87+
``fixed_node_count`` and ``scaling`` can be set. Setting one
88+
will reset the other.
89+
scaling (google.cloud.aiplatform_v1beta1.types.Featurestore.OnlineServingConfig.Scaling):
90+
Online serving scaling configuration. Only one of
91+
``fixed_node_count`` and ``scaling`` can be set. Setting one
92+
will reset the other.
8893
"""
8994

95+
class Scaling(proto.Message):
96+
r"""Online serving scaling configuration. If min_node_count and
97+
max_node_count are set to the same value, the cluster will be
98+
configured with the fixed number of node (no auto-scaling).
99+
100+
Attributes:
101+
min_node_count (int):
102+
Required. The minimum number of nodes to
103+
scale down to. Must be greater than or equal to
104+
1.
105+
max_node_count (int):
106+
The maximum number of nodes to scale up to. Must be greater
107+
or equal to min_node_count.
108+
"""
109+
110+
min_node_count = proto.Field(proto.INT32, number=1,)
111+
max_node_count = proto.Field(proto.INT32, number=2,)
112+
90113
fixed_node_count = proto.Field(proto.INT32, number=2,)
114+
scaling = proto.Field(
115+
proto.MESSAGE, number=4, message="Featurestore.OnlineServingConfig.Scaling",
116+
)
91117

92118
name = proto.Field(proto.STRING, number=1,)
93119
create_time = proto.Field(proto.MESSAGE, number=3, message=timestamp_pb2.Timestamp,)

google/cloud/aiplatform_v1beta1/types/index_endpoint.py

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -171,6 +171,15 @@ class DeployedIndex(proto.Message):
171171
don't provide SLA when min_replica_count=1). If
172172
max_replica_count is not set, the default value is
173173
min_replica_count. The max allowed replica count is 1000.
174+
dedicated_resources (google.cloud.aiplatform_v1beta1.types.DedicatedResources):
175+
Optional. A description of resources that are dedicated to
176+
the DeployedIndex, and that need a higher degree of manual
177+
configuration. If min_replica_count is not set, the default
178+
value is 2 (we don't provide SLA when min_replica_count=1).
179+
If max_replica_count is not set, the default value is
180+
min_replica_count. The max allowed replica count is 1000.
181+
182+
Available machine types: n1-standard-16 n1-standard-32
174183
enable_access_logging (bool):
175184
Optional. If true, private endpoint's access
176185
logs are sent to StackDriver Logging.
@@ -227,6 +236,9 @@ class DeployedIndex(proto.Message):
227236
automatic_resources = proto.Field(
228237
proto.MESSAGE, number=7, message=machine_resources.AutomaticResources,
229238
)
239+
dedicated_resources = proto.Field(
240+
proto.MESSAGE, number=16, message=machine_resources.DedicatedResources,
241+
)
230242
enable_access_logging = proto.Field(proto.BOOL, number=8,)
231243
deployed_index_auth_config = proto.Field(
232244
proto.MESSAGE, number=9, message="DeployedIndexAuthConfig",

google/cloud/aiplatform_v1beta1/types/model.py

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -397,7 +397,7 @@ class ModelContainerSpec(proto.Message):
397397
r"""Specification of a container for serving predictions. Some fields in
398398
this message correspond to fields in the `Kubernetes Container v1
399399
core
400-
specification <https://v1-18.docs.kubernetes.io/docs/reference/generated/kubernetes-api/v1.18/#container-v1-core>`__.
400+
specification <https://kubernetes.io/docs/reference/generated/kubernetes-api/v1.23/#container-v1-core>`__.
401401
402402
Attributes:
403403
image_uri (str):
@@ -463,7 +463,7 @@ class ModelContainerSpec(proto.Message):
463463
this syntax with ``$$``; for example: $$(VARIABLE_NAME) This
464464
field corresponds to the ``command`` field of the Kubernetes
465465
Containers `v1 core
466-
API <https://v1-18.docs.kubernetes.io/docs/reference/generated/kubernetes-api/v1.18/#container-v1-core>`__.
466+
API <https://kubernetes.io/docs/reference/generated/kubernetes-api/v1.23/#container-v1-core>`__.
467467
args (Sequence[str]):
468468
Immutable. Specifies arguments for the command that runs
469469
when the container starts. This overrides the container's
@@ -502,7 +502,7 @@ class ModelContainerSpec(proto.Message):
502502
this syntax with ``$$``; for example: $$(VARIABLE_NAME) This
503503
field corresponds to the ``args`` field of the Kubernetes
504504
Containers `v1 core
505-
API <https://v1-18.docs.kubernetes.io/docs/reference/generated/kubernetes-api/v1.18/#container-v1-core>`__.
505+
API <https://kubernetes.io/docs/reference/generated/kubernetes-api/v1.23/#container-v1-core>`__.
506506
env (Sequence[google.cloud.aiplatform_v1beta1.types.EnvVar]):
507507
Immutable. List of environment variables to set in the
508508
container. After the container starts running, code running
@@ -535,7 +535,7 @@ class ModelContainerSpec(proto.Message):
535535
536536
This field corresponds to the ``env`` field of the
537537
Kubernetes Containers `v1 core
538-
API <https://v1-18.docs.kubernetes.io/docs/reference/generated/kubernetes-api/v1.18/#container-v1-core>`__.
538+
API <https://kubernetes.io/docs/reference/generated/kubernetes-api/v1.23/#container-v1-core>`__.
539539
ports (Sequence[google.cloud.aiplatform_v1beta1.types.Port]):
540540
Immutable. List of ports to expose from the container.
541541
Vertex AI sends any prediction requests that it receives to
@@ -558,7 +558,7 @@ class ModelContainerSpec(proto.Message):
558558
Vertex AI does not use ports other than the first one
559559
listed. This field corresponds to the ``ports`` field of the
560560
Kubernetes Containers `v1 core
561-
API <https://v1-18.docs.kubernetes.io/docs/reference/generated/kubernetes-api/v1.18/#container-v1-core>`__.
561+
API <https://kubernetes.io/docs/reference/generated/kubernetes-api/v1.23/#container-v1-core>`__.
562562
predict_route (str):
563563
Immutable. HTTP path on the container to send prediction
564564
requests to. Vertex AI forwards requests sent using

google/cloud/aiplatform_v1beta1/types/model_deployment_monitoring_job.py

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -284,9 +284,10 @@ class ModelDeploymentMonitoringScheduleConfig(proto.Message):
284284
285285
Attributes:
286286
monitor_interval (google.protobuf.duration_pb2.Duration):
287-
Required. The model monitoring job running
287+
Required. The model monitoring job scheduling
288288
interval. It will be rounded up to next full
289-
hour.
289+
hour. This defines how often the monitoring jobs
290+
are triggered.
290291
"""
291292

292293
monitor_interval = proto.Field(

google/cloud/aiplatform_v1beta1/types/study.py

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -27,8 +27,7 @@
2727

2828

2929
class Study(proto.Message):
30-
r"""LINT.IfChange
31-
A message representing a Study.
30+
r"""A message representing a Study.
3231
3332
Attributes:
3433
name (str):

tests/unit/gapic/aiplatform_v1beta1/test_index_endpoint_service.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -43,6 +43,7 @@
4343
)
4444
from google.cloud.aiplatform_v1beta1.services.index_endpoint_service import pagers
4545
from google.cloud.aiplatform_v1beta1.services.index_endpoint_service import transports
46+
from google.cloud.aiplatform_v1beta1.types import accelerator_type
4647
from google.cloud.aiplatform_v1beta1.types import index_endpoint
4748
from google.cloud.aiplatform_v1beta1.types import index_endpoint as gca_index_endpoint
4849
from google.cloud.aiplatform_v1beta1.types import index_endpoint_service

0 commit comments

Comments
 (0)