diff --git a/google-cloud-ai_platform-v1/lib/google/cloud/aiplatform/v1/endpoint_pb.rb b/google-cloud-ai_platform-v1/lib/google/cloud/aiplatform/v1/endpoint_pb.rb index d8fddc28741e..08c1c8c57d37 100644 --- a/google-cloud-ai_platform-v1/lib/google/cloud/aiplatform/v1/endpoint_pb.rb +++ b/google-cloud-ai_platform-v1/lib/google/cloud/aiplatform/v1/endpoint_pb.rb @@ -15,7 +15,7 @@ require 'google/protobuf/timestamp_pb' -descriptor_data = "\n)google/cloud/aiplatform/v1/endpoint.proto\x12\x1agoogle.cloud.aiplatform.v1\x1a\x1fgoogle/api/field_behavior.proto\x1a\x19google/api/resource.proto\x1a\x30google/cloud/aiplatform/v1/encryption_spec.proto\x1a,google/cloud/aiplatform/v1/explanation.proto\x1a#google/cloud/aiplatform/v1/io.proto\x1a\x32google/cloud/aiplatform/v1/machine_resources.proto\x1a\x33google/cloud/aiplatform/v1/service_networking.proto\x1a\x1egoogle/protobuf/duration.proto\x1a\x1fgoogle/protobuf/timestamp.proto\"\xff\n\n\x08\x45ndpoint\x12\x11\n\x04name\x18\x01 \x01(\tB\x03\xe0\x41\x03\x12\x19\n\x0c\x64isplay_name\x18\x02 \x01(\tB\x03\xe0\x41\x02\x12\x13\n\x0b\x64\x65scription\x18\x03 \x01(\t\x12G\n\x0f\x64\x65ployed_models\x18\x04 \x03(\x0b\x32).google.cloud.aiplatform.v1.DeployedModelB\x03\xe0\x41\x03\x12M\n\rtraffic_split\x18\x05 \x03(\x0b\x32\x36.google.cloud.aiplatform.v1.Endpoint.TrafficSplitEntry\x12\x0c\n\x04\x65tag\x18\x06 \x01(\t\x12@\n\x06labels\x18\x07 \x03(\x0b\x32\x30.google.cloud.aiplatform.v1.Endpoint.LabelsEntry\x12\x34\n\x0b\x63reate_time\x18\x08 \x01(\x0b\x32\x1a.google.protobuf.TimestampB\x03\xe0\x41\x03\x12\x34\n\x0bupdate_time\x18\t \x01(\x0b\x32\x1a.google.protobuf.TimestampB\x03\xe0\x41\x03\x12\x43\n\x0f\x65ncryption_spec\x18\n \x01(\x0b\x32*.google.cloud.aiplatform.v1.EncryptionSpec\x12\x37\n\x07network\x18\r \x01(\tB&\xe0\x41\x01\xfa\x41 \n\x1e\x63ompute.googleapis.com/Network\x12*\n\x1e\x65nable_private_service_connect\x18\x11 \x01(\x08\x42\x02\x18\x01\x12\x64\n\x1eprivate_service_connect_config\x18\x15 \x01(\x0b\x32\x37.google.cloud.aiplatform.v1.PrivateServiceConnectConfigB\x03\xe0\x41\x01\x12g\n\x1fmodel_deployment_monitoring_job\x18\x0e \x01(\tB>\xe0\x41\x03\xfa\x41\x38\n6aiplatform.googleapis.com/ModelDeploymentMonitoringJob\x12p\n\'predict_request_response_logging_config\x18\x12 \x01(\x0b\x32?.google.cloud.aiplatform.v1.PredictRequestResponseLoggingConfig\x12\"\n\x1a\x64\x65\x64icated_endpoint_enabled\x18\x18 \x01(\x08\x12#\n\x16\x64\x65\x64icated_endpoint_dns\x18\x19 \x01(\tB\x03\xe0\x41\x03\x12T\n\x18\x63lient_connection_config\x18\x17 \x01(\x0b\x32\x32.google.cloud.aiplatform.v1.ClientConnectionConfig\x12\x1a\n\rsatisfies_pzs\x18\x1b \x01(\x08\x42\x03\xe0\x41\x03\x12\x1a\n\rsatisfies_pzi\x18\x1c \x01(\x08\x42\x03\xe0\x41\x03\x1a\x33\n\x11TrafficSplitEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\x05:\x02\x38\x01\x1a-\n\x0bLabelsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01:\xb5\x01\xea\x41\xb1\x01\n\"aiplatform.googleapis.com/Endpoint\x12cloud.google.com/go/aiplatform/apiv1/aiplatformpb;aiplatformpb\xaa\x02\x1aGoogle.Cloud.AIPlatform.V1\xca\x02\x1aGoogle\\Cloud\\AIPlatform\\V1\xea\x02\x1dGoogle::Cloud::AIPlatform::V1b\x06proto3" +descriptor_data = "\n)google/cloud/aiplatform/v1/endpoint.proto\x12\x1agoogle.cloud.aiplatform.v1\x1a\x1fgoogle/api/field_behavior.proto\x1a\x19google/api/resource.proto\x1a\x30google/cloud/aiplatform/v1/encryption_spec.proto\x1a,google/cloud/aiplatform/v1/explanation.proto\x1a#google/cloud/aiplatform/v1/io.proto\x1a\x32google/cloud/aiplatform/v1/machine_resources.proto\x1a\x33google/cloud/aiplatform/v1/service_networking.proto\x1a\x1egoogle/protobuf/duration.proto\x1a\x1fgoogle/protobuf/timestamp.proto\"\xff\n\n\x08\x45ndpoint\x12\x11\n\x04name\x18\x01 \x01(\tB\x03\xe0\x41\x03\x12\x19\n\x0c\x64isplay_name\x18\x02 \x01(\tB\x03\xe0\x41\x02\x12\x13\n\x0b\x64\x65scription\x18\x03 \x01(\t\x12G\n\x0f\x64\x65ployed_models\x18\x04 \x03(\x0b\x32).google.cloud.aiplatform.v1.DeployedModelB\x03\xe0\x41\x03\x12M\n\rtraffic_split\x18\x05 \x03(\x0b\x32\x36.google.cloud.aiplatform.v1.Endpoint.TrafficSplitEntry\x12\x0c\n\x04\x65tag\x18\x06 \x01(\t\x12@\n\x06labels\x18\x07 \x03(\x0b\x32\x30.google.cloud.aiplatform.v1.Endpoint.LabelsEntry\x12\x34\n\x0b\x63reate_time\x18\x08 \x01(\x0b\x32\x1a.google.protobuf.TimestampB\x03\xe0\x41\x03\x12\x34\n\x0bupdate_time\x18\t \x01(\x0b\x32\x1a.google.protobuf.TimestampB\x03\xe0\x41\x03\x12\x43\n\x0f\x65ncryption_spec\x18\n \x01(\x0b\x32*.google.cloud.aiplatform.v1.EncryptionSpec\x12\x37\n\x07network\x18\r \x01(\tB&\xe0\x41\x01\xfa\x41 \n\x1e\x63ompute.googleapis.com/Network\x12*\n\x1e\x65nable_private_service_connect\x18\x11 \x01(\x08\x42\x02\x18\x01\x12\x64\n\x1eprivate_service_connect_config\x18\x15 \x01(\x0b\x32\x37.google.cloud.aiplatform.v1.PrivateServiceConnectConfigB\x03\xe0\x41\x01\x12g\n\x1fmodel_deployment_monitoring_job\x18\x0e \x01(\tB>\xe0\x41\x03\xfa\x41\x38\n6aiplatform.googleapis.com/ModelDeploymentMonitoringJob\x12p\n\'predict_request_response_logging_config\x18\x12 \x01(\x0b\x32?.google.cloud.aiplatform.v1.PredictRequestResponseLoggingConfig\x12\"\n\x1a\x64\x65\x64icated_endpoint_enabled\x18\x18 \x01(\x08\x12#\n\x16\x64\x65\x64icated_endpoint_dns\x18\x19 \x01(\tB\x03\xe0\x41\x03\x12T\n\x18\x63lient_connection_config\x18\x17 \x01(\x0b\x32\x32.google.cloud.aiplatform.v1.ClientConnectionConfig\x12\x1a\n\rsatisfies_pzs\x18\x1b \x01(\x08\x42\x03\xe0\x41\x03\x12\x1a\n\rsatisfies_pzi\x18\x1c \x01(\x08\x42\x03\xe0\x41\x03\x1a\x33\n\x11TrafficSplitEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\x05:\x02\x38\x01\x1a-\n\x0bLabelsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01:\xb5\x01\xea\x41\xb1\x01\n\"aiplatform.googleapis.com/Endpoint\x12cloud.google.com/go/aiplatform/apiv1/aiplatformpb;aiplatformpb\xaa\x02\x1aGoogle.Cloud.AIPlatform.V1\xca\x02\x1aGoogle\\Cloud\\AIPlatform\\V1\xea\x02\x1dGoogle::Cloud::AIPlatform::V1b\x06proto3" pool = Google::Protobuf::DescriptorPool.generated_pool @@ -54,6 +54,7 @@ module AIPlatform module V1 Endpoint = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.Endpoint").msgclass DeployedModel = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DeployedModel").msgclass + DeployedModel::Status = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.DeployedModel.Status").msgclass PrivateEndpoints = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.PrivateEndpoints").msgclass PredictRequestResponseLoggingConfig = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.PredictRequestResponseLoggingConfig").msgclass FasterDeploymentConfig = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.aiplatform.v1.FasterDeploymentConfig").msgclass diff --git a/google-cloud-ai_platform-v1/lib/google/cloud/aiplatform/v1/machine_resources_pb.rb b/google-cloud-ai_platform-v1/lib/google/cloud/aiplatform/v1/machine_resources_pb.rb index 85aaa96f5fb5..29ff11970f22 100644 --- a/google-cloud-ai_platform-v1/lib/google/cloud/aiplatform/v1/machine_resources_pb.rb +++ b/google-cloud-ai_platform-v1/lib/google/cloud/aiplatform/v1/machine_resources_pb.rb @@ -9,7 +9,7 @@ require 'google/cloud/aiplatform/v1/reservation_affinity_pb' -descriptor_data = "\n2google/cloud/aiplatform/v1/machine_resources.proto\x12\x1agoogle.cloud.aiplatform.v1\x1a\x1fgoogle/api/field_behavior.proto\x1a\x31google/cloud/aiplatform/v1/accelerator_type.proto\x1a\x35google/cloud/aiplatform/v1/reservation_affinity.proto\"\x81\x02\n\x0bMachineSpec\x12\x19\n\x0cmachine_type\x18\x01 \x01(\tB\x03\xe0\x41\x05\x12J\n\x10\x61\x63\x63\x65lerator_type\x18\x02 \x01(\x0e\x32+.google.cloud.aiplatform.v1.AcceleratorTypeB\x03\xe0\x41\x05\x12\x19\n\x11\x61\x63\x63\x65lerator_count\x18\x03 \x01(\x05\x12\x19\n\x0ctpu_topology\x18\x04 \x01(\tB\x03\xe0\x41\x05\x12U\n\x14reservation_affinity\x18\x05 \x01(\x0b\x32/.google.cloud.aiplatform.v1.ReservationAffinityB\x06\xe0\x41\x05\xe0\x41\x01\"\x8b\x02\n\x12\x44\x65\x64icatedResources\x12\x45\n\x0cmachine_spec\x18\x01 \x01(\x0b\x32\'.google.cloud.aiplatform.v1.MachineSpecB\x06\xe0\x41\x02\xe0\x41\x05\x12!\n\x11min_replica_count\x18\x02 \x01(\x05\x42\x06\xe0\x41\x02\xe0\x41\x05\x12\x1e\n\x11max_replica_count\x18\x03 \x01(\x05\x42\x03\xe0\x41\x05\x12X\n\x18\x61utoscaling_metric_specs\x18\x04 \x03(\x0b\x32\x31.google.cloud.aiplatform.v1.AutoscalingMetricSpecB\x03\xe0\x41\x05\x12\x11\n\x04spot\x18\x05 \x01(\x08\x42\x03\xe0\x41\x01\"T\n\x12\x41utomaticResources\x12\x1e\n\x11min_replica_count\x18\x01 \x01(\x05\x42\x03\xe0\x41\x05\x12\x1e\n\x11max_replica_count\x18\x02 \x01(\x05\x42\x03\xe0\x41\x05\"\xa5\x01\n\x17\x42\x61tchDedicatedResources\x12\x45\n\x0cmachine_spec\x18\x01 \x01(\x0b\x32\'.google.cloud.aiplatform.v1.MachineSpecB\x06\xe0\x41\x02\xe0\x41\x05\x12#\n\x16starting_replica_count\x18\x02 \x01(\x05\x42\x03\xe0\x41\x05\x12\x1e\n\x11max_replica_count\x18\x03 \x01(\x05\x42\x03\xe0\x41\x05\"/\n\x11ResourcesConsumed\x12\x1a\n\rreplica_hours\x18\x01 \x01(\x01\x42\x03\xe0\x41\x03\"=\n\x08\x44iskSpec\x12\x16\n\x0e\x62oot_disk_type\x18\x01 \x01(\t\x12\x19\n\x11\x62oot_disk_size_gb\x18\x02 \x01(\x05\"=\n\x12PersistentDiskSpec\x12\x11\n\tdisk_type\x18\x01 \x01(\t\x12\x14\n\x0c\x64isk_size_gb\x18\x02 \x01(\x03\"L\n\x08NfsMount\x12\x13\n\x06server\x18\x01 \x01(\tB\x03\xe0\x41\x02\x12\x11\n\x04path\x18\x02 \x01(\tB\x03\xe0\x41\x02\x12\x18\n\x0bmount_point\x18\x03 \x01(\tB\x03\xe0\x41\x02\"A\n\x15\x41utoscalingMetricSpec\x12\x18\n\x0bmetric_name\x18\x01 \x01(\tB\x03\xe0\x41\x02\x12\x0e\n\x06target\x18\x02 \x01(\x05\".\n\x10ShieldedVmConfig\x12\x1a\n\x12\x65nable_secure_boot\x18\x01 \x01(\x08\x42\xd3\x01\n\x1e\x63om.google.cloud.aiplatform.v1B\x15MachineResourcesProtoP\x01Z>cloud.google.com/go/aiplatform/apiv1/aiplatformpb;aiplatformpb\xaa\x02\x1aGoogle.Cloud.AIPlatform.V1\xca\x02\x1aGoogle\\Cloud\\AIPlatform\\V1\xea\x02\x1dGoogle::Cloud::AIPlatform::V1b\x06proto3" +descriptor_data = "\n2google/cloud/aiplatform/v1/machine_resources.proto\x12\x1agoogle.cloud.aiplatform.v1\x1a\x1fgoogle/api/field_behavior.proto\x1a\x31google/cloud/aiplatform/v1/accelerator_type.proto\x1a\x35google/cloud/aiplatform/v1/reservation_affinity.proto\"\x81\x02\n\x0bMachineSpec\x12\x19\n\x0cmachine_type\x18\x01 \x01(\tB\x03\xe0\x41\x05\x12J\n\x10\x61\x63\x63\x65lerator_type\x18\x02 \x01(\x0e\x32+.google.cloud.aiplatform.v1.AcceleratorTypeB\x03\xe0\x41\x05\x12\x19\n\x11\x61\x63\x63\x65lerator_count\x18\x03 \x01(\x05\x12\x19\n\x0ctpu_topology\x18\x04 \x01(\tB\x03\xe0\x41\x05\x12U\n\x14reservation_affinity\x18\x05 \x01(\x0b\x32/.google.cloud.aiplatform.v1.ReservationAffinityB\x06\xe0\x41\x05\xe0\x41\x01\"\xb0\x02\n\x12\x44\x65\x64icatedResources\x12\x45\n\x0cmachine_spec\x18\x01 \x01(\x0b\x32\'.google.cloud.aiplatform.v1.MachineSpecB\x06\xe0\x41\x02\xe0\x41\x05\x12!\n\x11min_replica_count\x18\x02 \x01(\x05\x42\x06\xe0\x41\x02\xe0\x41\x05\x12\x1e\n\x11max_replica_count\x18\x03 \x01(\x05\x42\x03\xe0\x41\x05\x12#\n\x16required_replica_count\x18\t \x01(\x05\x42\x03\xe0\x41\x01\x12X\n\x18\x61utoscaling_metric_specs\x18\x04 \x03(\x0b\x32\x31.google.cloud.aiplatform.v1.AutoscalingMetricSpecB\x03\xe0\x41\x05\x12\x11\n\x04spot\x18\x05 \x01(\x08\x42\x03\xe0\x41\x01\"T\n\x12\x41utomaticResources\x12\x1e\n\x11min_replica_count\x18\x01 \x01(\x05\x42\x03\xe0\x41\x05\x12\x1e\n\x11max_replica_count\x18\x02 \x01(\x05\x42\x03\xe0\x41\x05\"\xa5\x01\n\x17\x42\x61tchDedicatedResources\x12\x45\n\x0cmachine_spec\x18\x01 \x01(\x0b\x32\'.google.cloud.aiplatform.v1.MachineSpecB\x06\xe0\x41\x02\xe0\x41\x05\x12#\n\x16starting_replica_count\x18\x02 \x01(\x05\x42\x03\xe0\x41\x05\x12\x1e\n\x11max_replica_count\x18\x03 \x01(\x05\x42\x03\xe0\x41\x05\"/\n\x11ResourcesConsumed\x12\x1a\n\rreplica_hours\x18\x01 \x01(\x01\x42\x03\xe0\x41\x03\"=\n\x08\x44iskSpec\x12\x16\n\x0e\x62oot_disk_type\x18\x01 \x01(\t\x12\x19\n\x11\x62oot_disk_size_gb\x18\x02 \x01(\x05\"=\n\x12PersistentDiskSpec\x12\x11\n\tdisk_type\x18\x01 \x01(\t\x12\x14\n\x0c\x64isk_size_gb\x18\x02 \x01(\x03\"L\n\x08NfsMount\x12\x13\n\x06server\x18\x01 \x01(\tB\x03\xe0\x41\x02\x12\x11\n\x04path\x18\x02 \x01(\tB\x03\xe0\x41\x02\x12\x18\n\x0bmount_point\x18\x03 \x01(\tB\x03\xe0\x41\x02\"A\n\x15\x41utoscalingMetricSpec\x12\x18\n\x0bmetric_name\x18\x01 \x01(\tB\x03\xe0\x41\x02\x12\x0e\n\x06target\x18\x02 \x01(\x05\".\n\x10ShieldedVmConfig\x12\x1a\n\x12\x65nable_secure_boot\x18\x01 \x01(\x08\x42\xd3\x01\n\x1e\x63om.google.cloud.aiplatform.v1B\x15MachineResourcesProtoP\x01Z>cloud.google.com/go/aiplatform/apiv1/aiplatformpb;aiplatformpb\xaa\x02\x1aGoogle.Cloud.AIPlatform.V1\xca\x02\x1aGoogle\\Cloud\\AIPlatform\\V1\xea\x02\x1dGoogle::Cloud::AIPlatform::V1b\x06proto3" pool = Google::Protobuf::DescriptorPool.generated_pool diff --git a/google-cloud-ai_platform-v1/proto_docs/google/cloud/aiplatform/v1/endpoint.rb b/google-cloud-ai_platform-v1/proto_docs/google/cloud/aiplatform/v1/endpoint.rb index 525216f9415f..a50782c419eb 100644 --- a/google-cloud-ai_platform-v1/proto_docs/google/cloud/aiplatform/v1/endpoint.rb +++ b/google-cloud-ai_platform-v1/proto_docs/google/cloud/aiplatform/v1/endpoint.rb @@ -272,6 +272,9 @@ class LabelsEntry # @!attribute [rw] faster_deployment_config # @return [::Google::Cloud::AIPlatform::V1::FasterDeploymentConfig] # Configuration for faster model deployment. + # @!attribute [r] status + # @return [::Google::Cloud::AIPlatform::V1::DeployedModel::Status] + # Output only. Runtime status of the deployed model. # @!attribute [rw] system_labels # @return [::Google::Protobuf::Map{::String => ::String}] # System labels to apply to Model Garden deployments. @@ -280,6 +283,21 @@ class DeployedModel include ::Google::Protobuf::MessageExts extend ::Google::Protobuf::MessageExts::ClassMethods + # Runtime status of the deployed model. + # @!attribute [r] message + # @return [::String] + # Output only. The latest deployed model's status message (if any). + # @!attribute [r] last_update_time + # @return [::Google::Protobuf::Timestamp] + # Output only. The time at which the status was last updated. + # @!attribute [r] available_replica_count + # @return [::Integer] + # Output only. The number of available replicas of the deployed model. + class Status + include ::Google::Protobuf::MessageExts + extend ::Google::Protobuf::MessageExts::ClassMethods + end + # @!attribute [rw] key # @return [::String] # @!attribute [rw] value diff --git a/google-cloud-ai_platform-v1/proto_docs/google/cloud/aiplatform/v1/machine_resources.rb b/google-cloud-ai_platform-v1/proto_docs/google/cloud/aiplatform/v1/machine_resources.rb index 05f6fb7ca2a2..b11d494de3bc 100644 --- a/google-cloud-ai_platform-v1/proto_docs/google/cloud/aiplatform/v1/machine_resources.rb +++ b/google-cloud-ai_platform-v1/proto_docs/google/cloud/aiplatform/v1/machine_resources.rb @@ -89,6 +89,14 @@ class MachineSpec # quotas. Specifically, you will be charged for (max_replica_count * # number of cores in the selected machine type) and (max_replica_count * # number of GPUs per replica in the selected machine type). + # @!attribute [rw] required_replica_count + # @return [::Integer] + # Optional. Number of required available replicas for the deployment to + # succeed. This field is only needed when partial model deployment/mutation + # is desired. If set, the model deploy/mutate operation will succeed once + # available_replica_count reaches required_replica_count, and the rest of + # the replicas will be retried. If not set, the default + # required_replica_count will be min_replica_count. # @!attribute [rw] autoscaling_metric_specs # @return [::Array<::Google::Cloud::AIPlatform::V1::AutoscalingMetricSpec>] # Immutable. The metric specifications that overrides a resource