Skip to content

Commit cec22ab

Browse files
feat: add partner_model_tuning_spec to TuningJob (#5721)
* feat: add a dynamic retrieval API PiperOrigin-RevId: 680475495 Source-Link: googleapis/googleapis@a6a6956 Source-Link: googleapis/googleapis-gen@c9ef9e0 Copy-Tag: eyJwIjoicGFja2FnZXMvZ29vZ2xlLWNsb3VkLWFpcGxhdGZvcm0vLk93bEJvdC55YW1sIiwiaCI6ImM5ZWY5ZTAwZjkwYWUyYzU3NGY4MDBiNjY2ZmU3NDg2MjIwYjliZjIifQ== * feat: add psc_automation_configs to DeployIndex v1 PiperOrigin-RevId: 680742448 Source-Link: googleapis/googleapis@ce31830 Source-Link: googleapis/googleapis-gen@5254135 Copy-Tag: eyJwIjoicGFja2FnZXMvZ29vZ2xlLWNsb3VkLWFpcGxhdGZvcm0vLk93bEJvdC55YW1sIiwiaCI6IjUyNTQxMzVjZDkwODlmMzVjOWY1MzdhYmE1NjdkZDI5YWNjZTU0MTMifQ== * feat: add new `PscInterfaceConfig` field to `pipeline_job.proto` PiperOrigin-RevId: 680823763 Source-Link: googleapis/googleapis@8f00dab Source-Link: googleapis/googleapis-gen@e58485b Copy-Tag: eyJwIjoicGFja2FnZXMvZ29vZ2xlLWNsb3VkLWFpcGxhdGZvcm0vLk93bEJvdC55YW1sIiwiaCI6ImU1ODQ4NWI2NzA1NTBiNmI3ODM1MWVkZTQ5NmFkM2NlZDE1MDk1MzQifQ== * 🦉 Updates from OwlBot post-processor See https://github.com/googleapis/repo-automation-bots/blob/main/packages/owl-bot/README.md * feat: add enable_secure_private_service_connect in service attachment PiperOrigin-RevId: 681172589 Source-Link: googleapis/googleapis@16a1580 Source-Link: googleapis/googleapis-gen@87fb5dc Copy-Tag: eyJwIjoicGFja2FnZXMvZ29vZ2xlLWNsb3VkLWFpcGxhdGZvcm0vLk93bEJvdC55YW1sIiwiaCI6Ijg3ZmI1ZGM3MzhhZGZhNWQzMTNhNTgzNjgxZTQ3NmUzNDcwZDY5ZTUifQ== * feat: add continuous sync option in feature_view.proto PiperOrigin-RevId: 681665991 Source-Link: googleapis/googleapis@8d17595 Source-Link: googleapis/googleapis-gen@ceb528d Copy-Tag: eyJwIjoicGFja2FnZXMvZ29vZ2xlLWNsb3VkLWFpcGxhdGZvcm0vLk93bEJvdC55YW1sIiwiaCI6ImNlYjUyOGQzNzk1MDAxM2UxZTEyZWRkNGIwZTk5YjJkMjIwN2M3ZjkifQ== * feat: add a dynamic retrieval API PiperOrigin-RevId: 681780557 Source-Link: googleapis/googleapis@475669f Source-Link: googleapis/googleapis-gen@bbbb240 Copy-Tag: 
eyJwIjoicGFja2FnZXMvZ29vZ2xlLWNsb3VkLWFpcGxhdGZvcm0vLk93bEJvdC55YW1sIiwiaCI6ImJiYmIyNDBhMzhiNGE0NDU3NDUxZjYzYTNlZmFjYmI4MDY4YTY3ZWQifQ== * feat: add partner_model_tuning_spec to TuningJob PiperOrigin-RevId: 683655446 Source-Link: googleapis/googleapis@4be7103 Source-Link: googleapis/googleapis-gen@2f7b2ea Copy-Tag: eyJwIjoicGFja2FnZXMvZ29vZ2xlLWNsb3VkLWFpcGxhdGZvcm0vLk93bEJvdC55YW1sIiwiaCI6IjJmN2IyZWE2NDMyMGNlYTFjYWVhYzMwMTYzNWY1MzEzODUwYzk5ZDgifQ== * chore: run post-processor * 🦉 Updates from OwlBot post-processor See https://github.com/googleapis/repo-automation-bots/blob/main/packages/owl-bot/README.md --------- Co-authored-by: Owl Bot <gcf-owl-bot[bot]@users.noreply.github.com> Co-authored-by: sofisl <55454395+sofisl@users.noreply.github.com> Co-authored-by: Sofia Leon <sofialeon@google.com>
1 parent 683839a commit cec22ab

File tree

15 files changed

+2837
-18
lines changed

15 files changed

+2837
-18
lines changed

packages/google-cloud-aiplatform/protos/google/cloud/aiplatform/v1/content.proto

Lines changed: 17 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -560,6 +560,12 @@ message GroundingMetadata {
560560
// Optional. List of grounding support.
561561
repeated GroundingSupport grounding_supports = 6
562562
[(google.api.field_behavior) = OPTIONAL];
563+
564+
// Optional. Output only. Retrieval metadata.
565+
optional RetrievalMetadata retrieval_metadata = 7 [
566+
(google.api.field_behavior) = OPTIONAL,
567+
(google.api.field_behavior) = OUTPUT_ONLY
568+
];
563569
}
564570

565571
// Google search entry point.
@@ -572,3 +578,14 @@ message SearchEntryPoint {
572578
// url> tuple.
573579
bytes sdk_blob = 2 [(google.api.field_behavior) = OPTIONAL];
574580
}
581+
582+
// Metadata related to retrieval in the grounding flow.
583+
message RetrievalMetadata {
584+
// Optional. Score indicating how likely information from Google Search could
585+
// help answer the prompt. The score is in the range `[0, 1]`, where 0 is the
586+
// least likely and 1 is the most likely. This score is only populated when
587+
// Google Search grounding and dynamic retrieval are enabled. It will be
588+
// compared to the threshold to determine whether to trigger Google Search.
589+
float google_search_dynamic_retrieval_score = 2
590+
[(google.api.field_behavior) = OPTIONAL];
591+
}

packages/google-cloud-aiplatform/protos/google/cloud/aiplatform/v1/feature_view.proto

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -55,6 +55,10 @@ message FeatureView {
5555
// database. For example, "CRON_TZ=America/New_York 1 * * * *", or
5656
// "TZ=America/New_York 1 * * * *".
5757
string cron = 1;
58+
59+
// Optional. If true, syncs the FeatureView in a continuous manner to Online
60+
// Store.
61+
bool continuous = 2 [(google.api.field_behavior) = OPTIONAL];
5862
}
5963

6064
// Configuration for vector indexing.

packages/google-cloud-aiplatform/protos/google/cloud/aiplatform/v1/index_endpoint.proto

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -260,6 +260,12 @@ message DeployedIndex {
260260
//
261261
// Note: we only support up to 5 deployment groups(not including 'default').
262262
string deployment_group = 11 [(google.api.field_behavior) = OPTIONAL];
263+
264+
// Optional. If set for PSC deployed index, PSC connection will be
265+
// automatically created after deployment is done and the endpoint information
266+
// is populated in private_endpoints.psc_automated_endpoints.
267+
repeated PSCAutomationConfig psc_automation_configs = 19
268+
[(google.api.field_behavior) = OPTIONAL];
263269
}
264270

265271
// Used to set up the auth on the DeployedIndex's private endpoint.

packages/google-cloud-aiplatform/protos/google/cloud/aiplatform/v1/service_networking.proto

Lines changed: 15 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -31,6 +31,21 @@ option (google.api.resource_definition) = {
3131
pattern: "projects/{project}/regions/{region}/networkAttachments/{networkattachment}"
3232
};
3333

34+
// PSC config that is used to automatically create a forwarding rule via
35+
// ServiceConnectionMap.
36+
message PSCAutomationConfig {
37+
// Required. Project ID used to create the forwarding rule.
38+
string project_id = 1 [(google.api.field_behavior) = REQUIRED];
39+
40+
// Required. The full name of the Google Compute Engine
41+
// [network](https://cloud.google.com/compute/docs/networks-and-firewalls#networks).
42+
// [Format](https://cloud.google.com/compute/docs/reference/rest/v1/networks/insert):
43+
// `projects/{project}/global/networks/{network}`,
44+
// where `{project}` is a project number, as in `12345`, and `{network}` is
45+
// the network name.
46+
string network = 2 [(google.api.field_behavior) = REQUIRED];
47+
}
48+
3449
// Represents configuration for private service connect.
3550
message PrivateServiceConnectConfig {
3651
// Required. If true, expose the IndexEndpoint via private service connect.

packages/google-cloud-aiplatform/protos/google/cloud/aiplatform/v1/tool.proto

Lines changed: 23 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -142,7 +142,29 @@ message VertexAISearch {
142142
}
143143

144144
// Tool to retrieve public web data for grounding, powered by Google.
145-
message GoogleSearchRetrieval {}
145+
message GoogleSearchRetrieval {
146+
// Specifies the dynamic retrieval configuration for the given source.
// See `DynamicRetrievalConfig` for the retrieval mode and threshold options.
147+
DynamicRetrievalConfig dynamic_retrieval_config = 2;
148+
}
149+
150+
// Describes the options to customize dynamic retrieval.
151+
message DynamicRetrievalConfig {
152+
// The mode of the predictor to be used in dynamic retrieval.
153+
enum Mode {
154+
// Always trigger retrieval. Because this is the enum's zero value, it is
// also the mode in effect when `mode` is left unset.
155+
MODE_UNSPECIFIED = 0;
156+
157+
// Run retrieval only when the system decides it is necessary.
158+
MODE_DYNAMIC = 1;
159+
}
160+
161+
// The mode of the predictor to be used in dynamic retrieval.
162+
Mode mode = 1;
163+
164+
// Optional. The threshold to be used in dynamic retrieval.
165+
// If not set, a system default value is used. The field is declared
// `optional`, so an unset threshold is distinguishable from an explicit 0.
166+
optional float dynamic_threshold = 2 [(google.api.field_behavior) = OPTIONAL];
167+
}
146168

147169
// Tool config. This config is shared for all tools provided in the request.
148170
message ToolConfig {

packages/google-cloud-aiplatform/protos/google/cloud/aiplatform/v1beta1/content.proto

Lines changed: 17 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -561,6 +561,12 @@ message GroundingMetadata {
561561
// Optional. List of grounding support.
562562
repeated GroundingSupport grounding_supports = 6
563563
[(google.api.field_behavior) = OPTIONAL];
564+
565+
// Optional. Output only. Retrieval metadata.
566+
optional RetrievalMetadata retrieval_metadata = 7 [
567+
(google.api.field_behavior) = OPTIONAL,
568+
(google.api.field_behavior) = OUTPUT_ONLY
569+
];
564570
}
565571

566572
// Google search entry point.
@@ -573,3 +579,14 @@ message SearchEntryPoint {
573579
// url> tuple.
574580
bytes sdk_blob = 2 [(google.api.field_behavior) = OPTIONAL];
575581
}
582+
583+
// Metadata related to retrieval in the grounding flow.
584+
message RetrievalMetadata {
585+
// Optional. Score indicating how likely information from Google Search could
586+
// help answer the prompt. The score is in the range `[0, 1]`, where 0 is the
587+
// least likely and 1 is the most likely. This score is only populated when
588+
// Google Search grounding and dynamic retrieval are enabled. It will be
589+
// compared to the threshold to determine whether to trigger Google Search.
590+
float google_search_dynamic_retrieval_score = 2
591+
[(google.api.field_behavior) = OPTIONAL];
592+
}

packages/google-cloud-aiplatform/protos/google/cloud/aiplatform/v1beta1/pipeline_job.proto

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,6 +24,7 @@ import "google/cloud/aiplatform/v1beta1/encryption_spec.proto";
2424
import "google/cloud/aiplatform/v1beta1/execution.proto";
2525
import "google/cloud/aiplatform/v1beta1/pipeline_failure_policy.proto";
2626
import "google/cloud/aiplatform/v1beta1/pipeline_state.proto";
27+
import "google/cloud/aiplatform/v1beta1/service_networking.proto";
2728
import "google/cloud/aiplatform/v1beta1/ui_pipeline_spec.proto";
2829
import "google/cloud/aiplatform/v1beta1/value.proto";
2930
import "google/protobuf/struct.proto";
@@ -198,6 +199,10 @@ message PipelineJob {
198199
// Example: ['vertex-ai-ip-range'].
199200
repeated string reserved_ip_ranges = 25;
200201

202+
// Optional. Configuration for PSC-I for PipelineJob.
203+
PscInterfaceConfig psc_interface_config = 31
204+
[(google.api.field_behavior) = OPTIONAL];
205+
201206
// A template uri from where the
202207
// [PipelineJob.pipeline_spec][google.cloud.aiplatform.v1beta1.PipelineJob.pipeline_spec],
203208
// if empty, will be downloaded. Currently, only uri from Vertex Template

packages/google-cloud-aiplatform/protos/google/cloud/aiplatform/v1beta1/service_networking.proto

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -56,6 +56,13 @@ message PrivateServiceConnectConfig {
5656
// attachment.
5757
repeated string project_allowlist = 2;
5858

59+
// Optional. If set to true, enable secure private service connect with IAM
60+
// authorization. Otherwise, private service connect will be done without
61+
// authorization. Note latency will be slightly increased if authorization is
62+
// enabled.
63+
bool enable_secure_private_service_connect = 4
64+
[(google.api.field_behavior) = OPTIONAL];
65+
5966
// Output only. The name of the generated service attachment resource.
6067
// This is only populated if the endpoint is deployed with
6168
// PrivateServiceConnect.

packages/google-cloud-aiplatform/protos/google/cloud/aiplatform/v1beta1/tool.proto

Lines changed: 23 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -233,7 +233,29 @@ message VertexAISearch {
233233
}
234234

235235
// Tool to retrieve public web data for grounding, powered by Google.
236-
message GoogleSearchRetrieval {}
236+
message GoogleSearchRetrieval {
237+
// Specifies the dynamic retrieval configuration for the given source.
// See `DynamicRetrievalConfig` for the retrieval mode and threshold options.
238+
DynamicRetrievalConfig dynamic_retrieval_config = 2;
239+
}
240+
241+
// Describes the options to customize dynamic retrieval.
242+
message DynamicRetrievalConfig {
243+
// The mode of the predictor to be used in dynamic retrieval.
244+
enum Mode {
245+
// Always trigger retrieval. Because this is the enum's zero value, it is
// also the mode in effect when `mode` is left unset.
246+
MODE_UNSPECIFIED = 0;
247+
248+
// Run retrieval only when the system decides it is necessary.
249+
MODE_DYNAMIC = 1;
250+
}
251+
252+
// The mode of the predictor to be used in dynamic retrieval.
253+
Mode mode = 1;
254+
255+
// Optional. The threshold to be used in dynamic retrieval.
256+
// If not set, a system default value is used. The field is declared
// `optional`, so an unset threshold is distinguishable from an explicit 0.
257+
optional float dynamic_threshold = 2 [(google.api.field_behavior) = OPTIONAL];
258+
}
237259

238260
// Tool config. This config is shared for all tools provided in the request.
239261
message ToolConfig {

packages/google-cloud-aiplatform/protos/google/cloud/aiplatform/v1beta1/tuning_job.proto

Lines changed: 19 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -21,6 +21,7 @@ import "google/api/resource.proto";
2121
import "google/cloud/aiplatform/v1beta1/content.proto";
2222
import "google/cloud/aiplatform/v1beta1/encryption_spec.proto";
2323
import "google/cloud/aiplatform/v1beta1/job_state.proto";
24+
import "google/protobuf/struct.proto";
2425
import "google/protobuf/timestamp.proto";
2526
import "google/rpc/status.proto";
2627

@@ -52,6 +53,9 @@ message TuningJob {
5253

5354
// Tuning Spec for Distillation.
5455
DistillationSpec distillation_spec = 17;
56+
57+
// Tuning Spec for open sourced and third party Partner models.
58+
PartnerModelTuningSpec partner_model_tuning_spec = 21;
5559
}
5660

5761
// Output only. Identifier. Resource name of a TuningJob. Format:
@@ -451,6 +455,21 @@ message DistillationHyperParameters {
451455
[(google.api.field_behavior) = OPTIONAL];
452456
}
453457

458+
// Tuning spec for open-source and third-party Partner models.
459+
message PartnerModelTuningSpec {
460+
// Required. Cloud Storage path to the file containing the training dataset
461+
// for tuning. The dataset must be formatted as a JSONL file.
462+
string training_dataset_uri = 1 [(google.api.field_behavior) = REQUIRED];
463+
464+
// Optional. Cloud Storage path to the file containing the validation dataset
465+
// for tuning. The dataset must be formatted as a JSONL file.
466+
string validation_dataset_uri = 2 [(google.api.field_behavior) = OPTIONAL];
467+
468+
// Hyperparameters for tuning, as a map from string keys to
// `google.protobuf.Value` values. The accepted hyper_parameters and their
469+
// valid range of values will differ depending on the base model.
470+
map<string, google.protobuf.Value> hyper_parameters = 3;
471+
}
472+
454473
// TunedModel Reference for legacy model migration.
455474
message TunedModelRef {
456475
// The Tuned Model Reference for the model.

0 commit comments

Comments
 (0)