diff --git a/.github/workflows/mypy.yml b/.github/workflows/mypy.yml new file mode 100644 index 0000000000..63c87b07da --- /dev/null +++ b/.github/workflows/mypy.yml @@ -0,0 +1,37 @@ +# This workflow runs mypy for static type checking on the vertexai/_genai submodule. +# See https://mypy.readthedocs.io/en/stable/index.html for more information. +# +# You can adjust the behavior by modifying this file. +name: Run mypy + +on: + pull_request: + branches: + - main + paths: + - 'vertexai/_genai/**' + +jobs: + genai-mypy: + runs-on: ubuntu-latest + strategy: + matrix: + python-version: ['3.9', '3.10', '3.11', '3.12'] + + steps: + - name: Checkout code + uses: actions/checkout@v4 + + - name: Set up Python ${{ matrix.python-version }} + uses: actions/setup-python@v5 + with: + python-version: ${{ matrix.python-version }} + + - name: Install dependencies + run: | + python -m pip install --upgrade pip + pip install mypy + pip install google-cloud-aiplatform + + - name: Run mypy ${{ matrix.python-version }} + run: mypy vertexai/_genai/ --strict --config-file=mypy.ini diff --git a/.release-please-manifest.json b/.release-please-manifest.json index 2c8891eb3a..123331f608 100644 --- a/.release-please-manifest.json +++ b/.release-please-manifest.json @@ -1,3 +1,3 @@ { - ".": "1.100.0" + ".": "1.101.0" } diff --git a/CHANGELOG.md b/CHANGELOG.md index bac427a2f0..9497e2b185 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,5 +1,18 @@ # Changelog +## [1.101.0](https://github.com/googleapis/python-aiplatform/compare/v1.100.0...v1.101.0) (2025-07-01) + + +### Features + +* **Allow installation scripts in AgentEngine.** ([9296d4d](https://github.com/googleapis/python-aiplatform/commit/9296d4d9fc7cb40116f7adbce0e08f0c41a15413)) +* Add `invoke` method. It supports both streaming and non-streaming cases. ([e686932](https://github.com/googleapis/python-aiplatform/commit/e68693270a4f00aed51d78692a4c6bb78e7f3374)) +* Add computer use support to tools ([f56c42e](https://github.com/googleapis/python-aiplatform/commit/f56c42e1d52b052fac6003e6b523ee9f536b72a0)) +* Add computer use support to tools ([f56c42e](https://github.com/googleapis/python-aiplatform/commit/f56c42e1d52b052fac6003e6b523ee9f536b72a0)) +* Allow users to pass project_number for custom job service account when service_account is not provided. ([5b59030](https://github.com/googleapis/python-aiplatform/commit/5b59030d5ae98d6e4ff1a6d2e4e55dbe5b53fcf5)) +* Expose task_unique_name in pipeline task details for pipeline rerun ([f56c42e](https://github.com/googleapis/python-aiplatform/commit/f56c42e1d52b052fac6003e6b523ee9f536b72a0)) +* Support creating an invoke enabled model in Python SDK ([71a8d7b](https://github.com/googleapis/python-aiplatform/commit/71a8d7b375e5058de47901331071ccda9e2c41f6)) + ## [1.100.0](https://github.com/googleapis/python-aiplatform/compare/v1.99.0...v1.100.0) (2025-06-26) diff --git a/google/cloud/aiplatform/gapic_version.py b/google/cloud/aiplatform/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform/gapic_version.py +++ b/google/cloud/aiplatform/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform/models.py b/google/cloud/aiplatform/models.py index 9e3cb73e29..4b8fb72e8f 100644 --- a/google/cloud/aiplatform/models.py +++ b/google/cloud/aiplatform/models.py @@ -3161,6 +3161,152 @@ async def explain_async( explanations=explain_response.explanations, ) + def invoke( + self, + request_path: str, + body: bytes, + headers: Dict[str, str], + deployed_model_id: Optional[str] = None, + stream: bool = False, + timeout: Optional[float] = None, + ) -> Union[requests.models.Response, Iterator[requests.models.Response]]: + """Makes a prediction request for arbitrary paths. + + Example usage: + my_endpoint = aiplatform.Endpoint(ENDPOINT_ID) + # Unary request + body = { + "model": "", + "messages": [ + { + "role": "user", + "content": "Hello!", + } + ], + "stream": "true", + } + + response = my_endpoint.invoke( + request_path="/v1/chat/completions", + body = json.dumps(body).encode("utf-8"), + headers = {'Content-Type':'application/json'}, + ) + status_code = response.status_code + results = json.dumps(response.text) + + # Streaming request + body = { + "model": "", + "messages": [ + { + "role": "user", + "content": "Hello!", + } + ], + "stream": "true", + } + + for chunk in my_endpoint.invoke( + request_path="/v1/chat/completions", + body = json.dumps(body).encode("utf-8"), + headers = {'Content-Type':'application/json'}, + stream=True, + ): + chunk_text = chunk.decode('utf-8') + + Args: + request_path (str): + The request url to the model server. The request path must be + a string that starts with a forward slash. Root can't be + accessed. + + body (bytes): + The body of the prediction request in bytes. This must not exceed 1.5 mb per request. + + headers (Dict[str, str]): + The header of the request as a dictionary. There are no restrictions on the header. + + deployed_model_id (str): + Optional. If specified, this InvokeRequest will be served by the + chosen DeployedModel, overriding this Endpoint's traffic split. + + stream (bool): If set to True, streaming will be enabled. + + timeout (float): Optional. The timeout for this request in seconds. + + Returns: + By default, a requests.models.Response object containing the status code and prediction results is returned. + For stream=True, the response will be of type Iterator[requests.models.Response]. + + Raises: + ImportError: If there is an issue importing the `TCPKeepAliveAdapter` package. + """ + if not self.authorized_session: + self.credentials._scopes = constants.base.DEFAULT_AUTHED_SCOPES + self.authorized_session = google_auth_requests.AuthorizedSession( + self.credentials + ) + if not self.dedicated_endpoint_enabled: + raise ValueError( + "Invoke method is only supported on dedicated endpoints. Please" + "make sure endpoint and model are correctly configured." + ) + if self.dedicated_endpoint_dns is None: + raise ValueError( + "Dedicated endpoint DNS is empty. Please make sure endpoint" + "and model are ready before making a prediction." + ) + if len(request_path) < 0 or request_path[0] != "/": + raise ValueError( + "container path must be a string that starts with a forward slash." + ) + url = f"https://{self.dedicated_endpoint_dns}/v1/%7Bself.resource_name%7D" + + if deployed_model_id: + deployed_model_ids = set() + if hasattr(self._gca_resource, "deployed_models"): + for deployed_model in self._gca_resource.deployed_models: + deployed_model_ids.add(deployed_model.id) + if deployed_model_id not in deployed_model_ids: + raise ValueError( + f"Deployed model {deployed_model_id} not found in endpoint" + f" {self.name}." + ) + url += f"/deployedModels/{deployed_model_id}" + url += "/invoke" + request_path + if timeout is not None and timeout > google_auth_requests._DEFAULT_TIMEOUT: + try: + from requests_toolbelt.adapters.socket_options import ( + TCPKeepAliveAdapter, + ) + except ImportError: + raise ImportError( + "Cannot import the requests-toolbelt library." + "Please install requests-toolbelt." + ) + # count * interval need to be larger than 1 hr (3600s) + keep_alive = TCPKeepAliveAdapter(idle=120, count=100, interval=100) + self.authorized_session.mount("https://", keep_alive) + + def invoke_stream_response(): + with self.authorized_session.post( + url=url, + data=body, + headers=headers, + timeout=timeout, + stream=True, + ) as resp: + for line in resp.iter_lines(): + yield line + + if stream: + # This wrapping allows a Response object is returned for + # non-streaming requests. + return invoke_stream_response() + return self.authorized_session.post( + url=url, data=body, headers=headers, timeout=timeout + ) + @classmethod def list( cls, @@ -4006,6 +4152,132 @@ def explain(self): f"{self.__class__.__name__} class does not support 'explain' as of now." ) + def invoke( + self, + request_path: str, + body: bytes, + headers: Dict[str, str], + deployed_model_id: Optional[str] = None, + stream: bool = False, + timeout: Optional[float] = None, + endpoint_override: Optional[str] = None, + ) -> Iterator[bytes]: + """Makes a prediction request for arbitrary paths. + + Example usage: + my_endpoint = aiplatform.PrivateEndpoint(ENDPOINT_ID) + response = my_endpoint.invoke( + request_path="/v1/chat/completions", + body = json.dumps(DATA).encode("utf-8"), + headers = {'Content-Type':'application/json'}, + endpoint_override="10.128.0.3", + ) + status_code = response.status_code + results = json.dumps(response.text) + + for stream_response in my_endpoint.invoke( + request_path="/v1/chat/completions", + body = json.dumps(DATA).encode("utf-8"), + headers = {'Content-Type':'application/json'}, + stream=True, + endpoint_override="10.128.0.3", + ): + stream_response_text = stream_response.decode('utf-8') + + Args: + request_path (str): + The request url to the model server. The request path must be + a string that starts with a forward slash. Root can't be + accessed. + + body (bytes): + The body of the prediction request in bytes. This must not exceed 1.5 mb per request. + + headers (Dict[str, str]): + The header of the request as a dictionary. There are no restrictions on the header. + + deployed_model_id (str): + Optional. If specified, this InvokeRequest will be served by the + chosen DeployedModel, overriding this Endpoint's traffic split. + + stream (bool): If set to True, streaming will be enabled. + + timeout (float): Optional. The timeout for this request in seconds. + + endpoint_override (Optional[str]): + The Private Service Connect endpoint's IP address or DNS that + points to the endpoint's service attachment. + + Returns: + By default, a requests.models.Response object containing the status code and prediction results is returned. + For stream=True, the response will be of type Iterator[requests.models.Response]. + + Raises: + ValueError: If a endpoint override is not provided for PSC based + endpoint. + ValueError: If a endpoint override is invalid for PSC based endpoint. + """ + self.wait() + if self.network or not self.private_service_connect_config: + raise ValueError("PSA based private endpoint does not support invoke.") + + if self.private_service_connect_config: + if not endpoint_override: + raise ValueError( + "Cannot make an invoke request because endpoint override is" + "not provided. Please ensure an endpoint override is" + "provided." + ) + if not self._validate_endpoint_override(endpoint_override): + raise ValueError( + "Invalid endpoint override provided. Please only use IP" + "address or DNS." + ) + + if not self._authorized_session: + self.credentials._scopes = constants.base.DEFAULT_AUTHED_SCOPES + self._authorized_session = google_auth_requests.AuthorizedSession( + self.credentials, + ) + self._authorized_session.verify = False + if len(request_path) < 0 or request_path[0] != "/": + raise ValueError( + "container path must be a string that starts with a forward slash." + ) + + url = f"https://{endpoint_override}/v1/projects/%7Bself.project%7D/locations/%7Bself.location%7D/endpoints/%7Bself.name%7D" + if deployed_model_id: + deployed_model_ids = set() + if hasattr(self._gca_resource, "deployed_models"): + for deployed_model in self._gca_resource.deployed_models: + deployed_model_ids.add(deployed_model.id) + if deployed_model_id not in deployed_model_ids: + raise ValueError( + f"Deployed model {deployed_model_id} not found in endpoint" + f" {self.name}." + ) + url += f"/deployedModels/{deployed_model_id}" + url += "/invoke" + request_path + + def invoke_stream_response(): + with self._authorized_session.post( + url=url, + data=body, + headers=headers, + timeout=timeout, + stream=True, + ) as resp: + for line in resp.iter_lines(): + yield line + + if stream: + # This wrapping allows a Response object is returned for + # non-streaming requests. + return invoke_stream_response() + return self._authorized_session.post( + url=url, data=body, headers=headers, timeout=timeout + ) + def health_check(self) -> bool: """ Makes a request to this PrivateEndpoint's health check URI. Must be within network @@ -4862,6 +5134,7 @@ def upload( version_description: Optional[str] = None, serving_container_predict_route: Optional[str] = None, serving_container_health_route: Optional[str] = None, + serving_container_invoke_route_prefix: Optional[str] = None, description: Optional[str] = None, serving_container_command: Optional[Sequence[str]] = None, serving_container_args: Optional[Sequence[str]] = None, @@ -4948,6 +5221,12 @@ def upload( Optional. An HTTP path to send health check requests to the container, and which must be supported by it. If not specified a standard HTTP path will be used by Vertex AI. + serving_container_invoke_route_prefix (str): + Optional. Invoke route prefix for the custom container. "/*" is the only + supported value right now. By setting this field, any non-root route on + this model will be accessible with invoke http call + eg: "/invoke/foo/bar", however the [PredictionService.Invoke] RPC is not + supported yet. description (str): The description of the model. serving_container_command: Optional[Sequence[str]]=None, @@ -5212,6 +5491,7 @@ def upload( grpc_ports=grpc_ports, predict_route=serving_container_predict_route, health_route=serving_container_health_route, + invoke_route_prefix=serving_container_invoke_route_prefix, deployment_timeout=deployment_timeout, shared_memory_size_mb=serving_container_shared_memory_size_mb, startup_probe=startup_probe, diff --git a/google/cloud/aiplatform/v1/schema/predict/instance/gapic_version.py b/google/cloud/aiplatform/v1/schema/predict/instance/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform/v1/schema/predict/instance/gapic_version.py +++ b/google/cloud/aiplatform/v1/schema/predict/instance/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform/v1/schema/predict/instance_v1/gapic_version.py b/google/cloud/aiplatform/v1/schema/predict/instance_v1/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform/v1/schema/predict/instance_v1/gapic_version.py +++ b/google/cloud/aiplatform/v1/schema/predict/instance_v1/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform/v1/schema/predict/params/gapic_version.py b/google/cloud/aiplatform/v1/schema/predict/params/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform/v1/schema/predict/params/gapic_version.py +++ b/google/cloud/aiplatform/v1/schema/predict/params/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform/v1/schema/predict/params_v1/gapic_version.py b/google/cloud/aiplatform/v1/schema/predict/params_v1/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform/v1/schema/predict/params_v1/gapic_version.py +++ b/google/cloud/aiplatform/v1/schema/predict/params_v1/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform/v1/schema/predict/prediction/gapic_version.py b/google/cloud/aiplatform/v1/schema/predict/prediction/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform/v1/schema/predict/prediction/gapic_version.py +++ b/google/cloud/aiplatform/v1/schema/predict/prediction/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform/v1/schema/predict/prediction_v1/gapic_version.py b/google/cloud/aiplatform/v1/schema/predict/prediction_v1/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform/v1/schema/predict/prediction_v1/gapic_version.py +++ b/google/cloud/aiplatform/v1/schema/predict/prediction_v1/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform/v1/schema/trainingjob/definition/gapic_version.py b/google/cloud/aiplatform/v1/schema/trainingjob/definition/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform/v1/schema/trainingjob/definition/gapic_version.py +++ b/google/cloud/aiplatform/v1/schema/trainingjob/definition/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform/v1/schema/trainingjob/definition_v1/gapic_version.py b/google/cloud/aiplatform/v1/schema/trainingjob/definition_v1/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform/v1/schema/trainingjob/definition_v1/gapic_version.py +++ b/google/cloud/aiplatform/v1/schema/trainingjob/definition_v1/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform/v1beta1/schema/predict/instance/gapic_version.py b/google/cloud/aiplatform/v1beta1/schema/predict/instance/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform/v1beta1/schema/predict/instance/gapic_version.py +++ b/google/cloud/aiplatform/v1beta1/schema/predict/instance/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform/v1beta1/schema/predict/instance_v1beta1/gapic_version.py b/google/cloud/aiplatform/v1beta1/schema/predict/instance_v1beta1/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform/v1beta1/schema/predict/instance_v1beta1/gapic_version.py +++ b/google/cloud/aiplatform/v1beta1/schema/predict/instance_v1beta1/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform/v1beta1/schema/predict/params/gapic_version.py b/google/cloud/aiplatform/v1beta1/schema/predict/params/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform/v1beta1/schema/predict/params/gapic_version.py +++ b/google/cloud/aiplatform/v1beta1/schema/predict/params/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform/v1beta1/schema/predict/params_v1beta1/gapic_version.py b/google/cloud/aiplatform/v1beta1/schema/predict/params_v1beta1/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform/v1beta1/schema/predict/params_v1beta1/gapic_version.py +++ b/google/cloud/aiplatform/v1beta1/schema/predict/params_v1beta1/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform/v1beta1/schema/predict/prediction/gapic_version.py b/google/cloud/aiplatform/v1beta1/schema/predict/prediction/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform/v1beta1/schema/predict/prediction/gapic_version.py +++ b/google/cloud/aiplatform/v1beta1/schema/predict/prediction/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform/v1beta1/schema/predict/prediction_v1beta1/gapic_version.py b/google/cloud/aiplatform/v1beta1/schema/predict/prediction_v1beta1/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform/v1beta1/schema/predict/prediction_v1beta1/gapic_version.py +++ b/google/cloud/aiplatform/v1beta1/schema/predict/prediction_v1beta1/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform/v1beta1/schema/trainingjob/definition/gapic_version.py b/google/cloud/aiplatform/v1beta1/schema/trainingjob/definition/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform/v1beta1/schema/trainingjob/definition/gapic_version.py +++ b/google/cloud/aiplatform/v1beta1/schema/trainingjob/definition/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform/v1beta1/schema/trainingjob/definition_v1beta1/gapic_version.py b/google/cloud/aiplatform/v1beta1/schema/trainingjob/definition_v1beta1/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform/v1beta1/schema/trainingjob/definition_v1beta1/gapic_version.py +++ b/google/cloud/aiplatform/v1beta1/schema/trainingjob/definition_v1beta1/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform/version.py b/google/cloud/aiplatform/version.py index de9792a57a..e9537ff529 100644 --- a/google/cloud/aiplatform/version.py +++ b/google/cloud/aiplatform/version.py @@ -15,4 +15,4 @@ # limitations under the License. # -__version__ = "1.100.0" +__version__ = "1.101.0" diff --git a/google/cloud/aiplatform_v1/gapic_version.py b/google/cloud/aiplatform_v1/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform_v1/gapic_version.py +++ b/google/cloud/aiplatform_v1/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform_v1/services/migration_service/client.py b/google/cloud/aiplatform_v1/services/migration_service/client.py index 735b4d1655..bdf0d9ec72 100644 --- a/google/cloud/aiplatform_v1/services/migration_service/client.py +++ b/google/cloud/aiplatform_v1/services/migration_service/client.py @@ -243,40 +243,40 @@ def parse_annotated_dataset_path(path: str) -> Dict[str, str]: @staticmethod def dataset_path( project: str, - location: str, dataset: str, ) -> str: """Returns a fully-qualified dataset string.""" - return "projects/{project}/locations/{location}/datasets/{dataset}".format( + return "projects/{project}/datasets/{dataset}".format( project=project, - location=location, dataset=dataset, ) @staticmethod def parse_dataset_path(path: str) -> Dict[str, str]: """Parses a dataset path into its component segments.""" - m = re.match( - r"^projects/(?P.+?)/locations/(?P.+?)/datasets/(?P.+?)$", - path, - ) + m = re.match(r"^projects/(?P.+?)/datasets/(?P.+?)$", path) return m.groupdict() if m else {} @staticmethod def dataset_path( project: str, + location: str, dataset: str, ) -> str: """Returns a fully-qualified dataset string.""" - return "projects/{project}/datasets/{dataset}".format( + return "projects/{project}/locations/{location}/datasets/{dataset}".format( project=project, + location=location, dataset=dataset, ) @staticmethod def parse_dataset_path(path: str) -> Dict[str, str]: """Parses a dataset path into its component segments.""" - m = re.match(r"^projects/(?P.+?)/datasets/(?P.+?)$", path) + m = re.match( + r"^projects/(?P.+?)/locations/(?P.+?)/datasets/(?P.+?)$", + path, + ) return m.groupdict() if m else {} @staticmethod diff --git a/google/cloud/aiplatform_v1/types/tool.py b/google/cloud/aiplatform_v1/types/tool.py index e5b5ff04b5..d272a278a9 100644 --- a/google/cloud/aiplatform_v1/types/tool.py +++ b/google/cloud/aiplatform_v1/types/tool.py @@ -95,6 +95,11 @@ class Tool(proto.Message): url_context (google.cloud.aiplatform_v1.types.UrlContext): Optional. Tool to support URL context retrieval. + computer_use (google.cloud.aiplatform_v1.types.Tool.ComputerUse): + Optional. Tool to support the model + interacting directly with the computer. If + enabled, it automatically populates computer-use + specific Function Declarations. """ class GoogleSearch(proto.Message): @@ -112,6 +117,33 @@ class CodeExecution(proto.Message): """ + class ComputerUse(proto.Message): + r"""Tool to support computer use. + + Attributes: + environment (google.cloud.aiplatform_v1.types.Tool.ComputerUse.Environment): + Required. The environment being operated. + """ + + class Environment(proto.Enum): + r"""Represents the environment being operated, such as a web + browser. + + Values: + ENVIRONMENT_UNSPECIFIED (0): + Defaults to browser. + ENVIRONMENT_BROWSER (1): + Operates in a web browser. + """ + ENVIRONMENT_UNSPECIFIED = 0 + ENVIRONMENT_BROWSER = 1 + + environment: "Tool.ComputerUse.Environment" = proto.Field( + proto.ENUM, + number=1, + enum="Tool.ComputerUse.Environment", + ) + function_declarations: MutableSequence["FunctionDeclaration"] = proto.RepeatedField( proto.MESSAGE, number=1, @@ -147,6 +179,11 @@ class CodeExecution(proto.Message): number=8, message="UrlContext", ) + computer_use: ComputerUse = proto.Field( + proto.MESSAGE, + number=11, + message=ComputerUse, + ) class UrlContext(proto.Message): diff --git a/google/cloud/aiplatform_v1beta1/gapic_version.py b/google/cloud/aiplatform_v1beta1/gapic_version.py index 2141e7c037..20decc178e 100644 --- a/google/cloud/aiplatform_v1beta1/gapic_version.py +++ b/google/cloud/aiplatform_v1beta1/gapic_version.py @@ -13,4 +13,4 @@ # See the License for the specific language governing permissions and # limitations under the License. # -__version__ = "1.100.0" # {x-release-please-version} +__version__ = "1.101.0" # {x-release-please-version} diff --git a/google/cloud/aiplatform_v1beta1/services/migration_service/client.py b/google/cloud/aiplatform_v1beta1/services/migration_service/client.py index 800fb62ce3..786e8ef90f 100644 --- a/google/cloud/aiplatform_v1beta1/services/migration_service/client.py +++ b/google/cloud/aiplatform_v1beta1/services/migration_service/client.py @@ -265,40 +265,40 @@ def parse_dataset_path(path: str) -> Dict[str, str]: @staticmethod def dataset_path( project: str, - location: str, dataset: str, ) -> str: """Returns a fully-qualified dataset string.""" - return "projects/{project}/locations/{location}/datasets/{dataset}".format( + return "projects/{project}/datasets/{dataset}".format( project=project, - location=location, dataset=dataset, ) @staticmethod def parse_dataset_path(path: str) -> Dict[str, str]: """Parses a dataset path into its component segments.""" - m = re.match( - r"^projects/(?P.+?)/locations/(?P.+?)/datasets/(?P.+?)$", - path, - ) + m = re.match(r"^projects/(?P.+?)/datasets/(?P.+?)$", path) return m.groupdict() if m else {} @staticmethod def dataset_path( project: str, + location: str, dataset: str, ) -> str: """Returns a fully-qualified dataset string.""" - return "projects/{project}/datasets/{dataset}".format( + return "projects/{project}/locations/{location}/datasets/{dataset}".format( project=project, + location=location, dataset=dataset, ) @staticmethod def parse_dataset_path(path: str) -> Dict[str, str]: """Parses a dataset path into its component segments.""" - m = re.match(r"^projects/(?P.+?)/datasets/(?P.+?)$", path) + m = re.match( + r"^projects/(?P.+?)/locations/(?P.+?)/datasets/(?P.+?)$", + path, + ) return m.groupdict() if m else {} @staticmethod diff --git a/google/cloud/aiplatform_v1beta1/types/pipeline_job.py b/google/cloud/aiplatform_v1beta1/types/pipeline_job.py index fe794259d0..c43d2d93b2 100644 --- a/google/cloud/aiplatform_v1beta1/types/pipeline_job.py +++ b/google/cloud/aiplatform_v1beta1/types/pipeline_job.py @@ -573,6 +573,16 @@ class PipelineTaskDetail(proto.Message): outputs (MutableMapping[str, google.cloud.aiplatform_v1beta1.types.PipelineTaskDetail.ArtifactList]): Output only. The runtime output artifacts of the task. + task_unique_name (str): + Output only. The unique name of a task. This field is used + by pipeline job reruns. Console UI and Vertex AI SDK will + support triggering pipeline job reruns. The name is + constructed by concatenating all the parent tasks' names + with the task name. For example, if a task named + "child_task" has a parent task named "parent_task_1" and + parent task 1 has a parent task named "parent_task_2", the + task unique name will be + "parent_task_2.parent_task_1.child_task". """ class State(proto.Enum): @@ -726,6 +736,10 @@ class ArtifactList(proto.Message): number=11, message=ArtifactList, ) + task_unique_name: str = proto.Field( + proto.STRING, + number=14, + ) class PipelineTaskExecutorDetail(proto.Message): diff --git a/google/cloud/aiplatform_v1beta1/types/tool.py b/google/cloud/aiplatform_v1beta1/types/tool.py index e61d783102..c6678904ce 100644 --- a/google/cloud/aiplatform_v1beta1/types/tool.py +++ b/google/cloud/aiplatform_v1beta1/types/tool.py @@ -96,6 +96,11 @@ class Tool(proto.Message): url_context (google.cloud.aiplatform_v1beta1.types.UrlContext): Optional. Tool to support URL context retrieval. + computer_use (google.cloud.aiplatform_v1beta1.types.Tool.ComputerUse): + Optional. Tool to support the model + interacting directly with the computer. If + enabled, it automatically populates computer-use + specific Function Declarations. """ class GoogleSearch(proto.Message): @@ -113,6 +118,33 @@ class CodeExecution(proto.Message): """ + class ComputerUse(proto.Message): + r"""Tool to support computer use. + + Attributes: + environment (google.cloud.aiplatform_v1beta1.types.Tool.ComputerUse.Environment): + Required. The environment being operated. + """ + + class Environment(proto.Enum): + r"""Represents the environment being operated, such as a web + browser. + + Values: + ENVIRONMENT_UNSPECIFIED (0): + Defaults to browser. + ENVIRONMENT_BROWSER (1): + Operates in a web browser. + """ + ENVIRONMENT_UNSPECIFIED = 0 + ENVIRONMENT_BROWSER = 1 + + environment: "Tool.ComputerUse.Environment" = proto.Field( + proto.ENUM, + number=1, + enum="Tool.ComputerUse.Environment", + ) + function_declarations: MutableSequence["FunctionDeclaration"] = proto.RepeatedField( proto.MESSAGE, number=1, @@ -148,6 +180,11 @@ class CodeExecution(proto.Message): number=8, message="UrlContext", ) + computer_use: ComputerUse = proto.Field( + proto.MESSAGE, + number=11, + message=ComputerUse, + ) class UrlContext(proto.Message): diff --git a/mypy.ini b/mypy.ini index 574c5aed39..e392baeb3c 100644 --- a/mypy.ini +++ b/mypy.ini @@ -1,3 +1,22 @@ [mypy] -python_version = 3.7 -namespace_packages = True +# TODO(b/422425982): Fix arg-type errors +disable_error_code = import-not-found, import-untyped, arg-type + +# We only want to run mypy on _genai dir, ignore dependent modules +[mypy-vertexai.agent_engines.*] +ignore_errors = True + +[mypy-vertexai.preview.*] +ignore_errors = True + +[mypy-vertexai.generative_models.*] +ignore_errors = True + +[mypy-vertexai.prompts.*] +ignore_errors = True + +[mypy-vertexai.tuning.*] +ignore_errors = True + +[mypy-vertexai.caching.*] +ignore_errors = True diff --git a/pypi/_vertex_ai_placeholder/version.py b/pypi/_vertex_ai_placeholder/version.py index 6e958580b7..2004102482 100644 --- a/pypi/_vertex_ai_placeholder/version.py +++ b/pypi/_vertex_ai_placeholder/version.py @@ -15,4 +15,4 @@ # limitations under the License. # -__version__ = "1.100.0" +__version__ = "1.101.0" diff --git a/samples/generated_samples/snippet_metadata_google.cloud.aiplatform.v1.json b/samples/generated_samples/snippet_metadata_google.cloud.aiplatform.v1.json index 25150480be..d1664cee13 100644 --- a/samples/generated_samples/snippet_metadata_google.cloud.aiplatform.v1.json +++ b/samples/generated_samples/snippet_metadata_google.cloud.aiplatform.v1.json @@ -8,7 +8,7 @@ ], "language": "PYTHON", "name": "google-cloud-aiplatform", - "version": "1.100.0" + "version": "1.101.0" }, "snippets": [ { diff --git a/samples/generated_samples/snippet_metadata_google.cloud.aiplatform.v1beta1.json b/samples/generated_samples/snippet_metadata_google.cloud.aiplatform.v1beta1.json index ae1878e46c..3174d937ee 100644 --- a/samples/generated_samples/snippet_metadata_google.cloud.aiplatform.v1beta1.json +++ b/samples/generated_samples/snippet_metadata_google.cloud.aiplatform.v1beta1.json @@ -8,7 +8,7 @@ ], "language": "PYTHON", "name": "google-cloud-aiplatform", - "version": "1.100.0" + "version": "1.101.0" }, "snippets": [ { diff --git a/samples/model-builder/create_custom_job_psci_sample.py b/samples/model-builder/create_custom_job_psci_sample.py index 1a44496e05..de6498a536 100644 --- a/samples/model-builder/create_custom_job_psci_sample.py +++ b/samples/model-builder/create_custom_job_psci_sample.py @@ -14,7 +14,6 @@ # [START aiplatform_sdk_create_custom_job_psci_sample] from google.cloud import aiplatform -from google.cloud import aiplatform_v1beta1 def create_custom_job_psci_sample( @@ -26,40 +25,40 @@ def create_custom_job_psci_sample( replica_count: int, image_uri: str, network_attachment: str, + domain: str, + target_project: str, + target_network: str, ): - """Custom training job sample with PSC-I through aiplatform_v1beta1.""" + """Custom training job sample with PSC Interface Config.""" aiplatform.init(project=project, location=location, staging_bucket=bucket) - client_options = {"api_endpoint": f"{location}-aiplatform.googleapis.com"} - - client = aiplatform_v1beta1.JobServiceClient(client_options=client_options) - - request = aiplatform_v1beta1.CreateCustomJobRequest( - parent=f"projects/{project}/locations/{location}", - custom_job=aiplatform_v1beta1.CustomJob( - display_name=display_name, - job_spec=aiplatform_v1beta1.CustomJobSpec( - worker_pool_specs=[ - aiplatform_v1beta1.WorkerPoolSpec( - machine_spec=aiplatform_v1beta1.MachineSpec( - machine_type=machine_type, - ), - replica_count=replica_count, - container_spec=aiplatform_v1beta1.ContainerSpec( - image_uri=image_uri, - ), - ) - ], - psc_interface_config=aiplatform_v1beta1.PscInterfaceConfig( - network_attachment=network_attachment, - ), - ), - ), + worker_pool_specs = [{ + "machine_spec": { + "machine_type": machine_type, + }, + "replica_count": replica_count, + "container_spec": { + "image_uri": image_uri, + "command": [], + "args": [], + }, + }] + psc_interface_config = { + "network_attachment": network_attachment, + "dns_peering_configs": [ + { + "domain": domain, + "target_project": target_project, + "target_network": target_network, + }, + ], + } + job = aiplatform.CustomJob( + display_name=display_name, + worker_pool_specs=worker_pool_specs, ) - response = client.create_custom_job(request=request) - - return response + job.run(psc_interface_config=psc_interface_config) # [END aiplatform_sdk_create_custom_job_psci_sample] diff --git a/samples/model-builder/create_custom_job_psci_sample_test.py b/samples/model-builder/create_custom_job_psci_sample_test.py index b891789db3..de95fe879a 100644 --- a/samples/model-builder/create_custom_job_psci_sample_test.py +++ b/samples/model-builder/create_custom_job_psci_sample_test.py @@ -13,15 +13,13 @@ # limitations under the License. import create_custom_job_psci_sample -from google.cloud import aiplatform_v1beta1 import test_constants as constants def test_create_custom_job_psci_sample( mock_sdk_init, - mock_get_job_service_client_v1beta1, - mock_get_create_custom_job_request_v1beta1, - mock_create_custom_job_v1beta1, + mock_get_custom_job, + mock_run_custom_job, ): """Custom training job sample with PSC-I through aiplatform_v1beta1.""" create_custom_job_psci_sample.create_custom_job_psci_sample( @@ -31,8 +29,11 @@ def test_create_custom_job_psci_sample( display_name=constants.DISPLAY_NAME, machine_type=constants.MACHINE_TYPE, replica_count=1, - image_uri=constants.TRAIN_IMAGE, + image_uri=constants.CONTAINER_URI, network_attachment=constants.NETWORK_ATTACHMENT_NAME, + domain=constants.DOMAIN, + target_project=constants.TARGET_PROJECT, + target_network=constants.TARGET_NETWORK, ) mock_sdk_init.assert_called_once_with( @@ -41,37 +42,11 @@ def test_create_custom_job_psci_sample( staging_bucket=constants.STAGING_BUCKET, ) - mock_get_job_service_client_v1beta1.assert_called_once_with( - client_options={ - "api_endpoint": f"{constants.LOCATION}-aiplatform.googleapis.com" - } - ) - - mock_get_create_custom_job_request_v1beta1.assert_called_once_with( - parent=f"projects/{constants.PROJECT}/locations/{constants.LOCATION}", - custom_job=aiplatform_v1beta1.CustomJob( - display_name=constants.DISPLAY_NAME, - job_spec=aiplatform_v1beta1.CustomJobSpec( - worker_pool_specs=[ - aiplatform_v1beta1.WorkerPoolSpec( - machine_spec=aiplatform_v1beta1.MachineSpec( - machine_type=constants.MACHINE_TYPE, - ), - replica_count=constants.REPLICA_COUNT, - container_spec=aiplatform_v1beta1.ContainerSpec( - image_uri=constants.TRAIN_IMAGE, - ), - ) - ], - psc_interface_config=aiplatform_v1beta1.PscInterfaceConfig( - network_attachment=constants.NETWORK_ATTACHMENT_NAME, - ), - ), - ), + mock_get_custom_job.assert_called_once_with( + display_name=constants.DISPLAY_NAME, + worker_pool_specs=constants.CUSTOM_JOB_WORKER_POOL_SPECS_WITHOUT_ACCELERATOR, ) - request = aiplatform_v1beta1.CreateCustomJobRequest( - mock_get_create_custom_job_request_v1beta1.return_value + mock_run_custom_job.assert_called_once_with( + psc_interface_config=constants.PSC_INTERFACE_CONFIG, ) - - mock_create_custom_job_v1beta1.assert_called_once_with(request=request) diff --git a/samples/model-builder/test_constants.py b/samples/model-builder/test_constants.py index 69fbecd912..9d38605267 100644 --- a/samples/model-builder/test_constants.py +++ b/samples/model-builder/test_constants.py @@ -116,6 +116,19 @@ ACCELERATOR_TYPE = "ACCELERATOR_TYPE_UNSPECIFIED" ACCELERATOR_COUNT = 0 NETWORK_ATTACHMENT_NAME = "network-attachment-name" +DOMAIN = "test.com" +TARGET_PROJECT = "target-project" +TARGET_NETWORK = "target-network" +PSC_INTERFACE_CONFIG = { + "network_attachment": NETWORK_ATTACHMENT_NAME, + "dns_peering_configs": [ + { + "domain": DOMAIN, + "target_project": TARGET_PROJECT, + "target_network": TARGET_NETWORK, + }, + ], +} # Model constants MODEL_RESOURCE_NAME = f"{PARENT}/models/1234" @@ -387,6 +400,20 @@ } ] +CUSTOM_JOB_WORKER_POOL_SPECS_WITHOUT_ACCELERATOR = [ + { + "machine_spec": { + "machine_type": "n1-standard-4", + }, + "replica_count": 1, + "container_spec": { + "image_uri": CONTAINER_URI, + "command": [], + "args": [], + }, + } +] + VERSION_ID = "test-version" IS_DEFAULT_VERSION = False VERSION_ALIASES = ["test-version-alias"] diff --git a/tests/unit/aiplatform/test_endpoints.py b/tests/unit/aiplatform/test_endpoints.py index 567b5225db..610892b141 100644 --- a/tests/unit/aiplatform/test_endpoints.py +++ b/tests/unit/aiplatform/test_endpoints.py @@ -357,6 +357,7 @@ def get_dedicated_endpoint_mock(): get_endpoint_mock.return_value = gca_endpoint.Endpoint( display_name=_TEST_DISPLAY_NAME, name=_TEST_ENDPOINT_NAME, + deployed_models=_TEST_DEPLOYED_MODELS, encryption_spec=_TEST_ENCRYPTION_SPEC, dedicated_endpoint_enabled=True, dedicated_endpoint_dns=_TEST_DEDICATED_ENDPOINT_DNS, @@ -752,6 +753,69 @@ def predict_async_client_explain_mock(): yield explain_mock +@pytest.fixture +def invoke_public_dedicated_endpoint_http_mock(): + resp = requests.Response() + resp.status_code = 200 + resp._content = json.dumps( + { + "predictions": _TEST_PREDICTION, + "metadata": _TEST_METADATA, + "deployedModelId": _TEST_DEPLOYED_MODELS[0].id, + "model": _TEST_MODEL_NAME, + "modelVersionId": "1", + } + ).encode("utf-8") + with mock.patch.object( + google_auth_requests.AuthorizedSession, "post" + ) as predict_mock: + predict_mock.return_value = resp + yield predict_mock + + +@pytest.fixture +def invoke_public_dedicated_endpoint_http_mock_streaming(): + with mock.patch.object( + google_auth_requests.AuthorizedSession, "post" + ) as invoke_streaming_mock: + # Create a mock response object + mock_response = mock.Mock(spec=requests.Response) + + # Configure the mock to be used as a context manager + invoke_streaming_mock.return_value.__enter__.return_value = mock_response + + # Set the status code to 200 (OK) + mock_response.status_code = 200 + + # Simulate streaming data with iter_lines + mock_response.iter_lines = mock.Mock( + return_value=iter( + [ + json.dumps( + { + "predictions": [1.0, 2.0, 3.0], + "metadata": {"key": "value"}, + "deployedModelId": "model-id-123", + "model": "model-name", + "modelVersionId": "1", + } + ).encode("utf-8"), + json.dumps( + { + "predictions": [4.0, 5.0, 6.0], + "metadata": {"key": "value"}, + "deployedModelId": "model-id-123", + "model": "model-name", + "modelVersionId": "1", + } + ).encode("utf-8"), + ] + ) + ) + + yield invoke_streaming_mock + + @pytest.fixture def preview_get_drp_mock(): with mock.patch.object( @@ -988,6 +1052,69 @@ def stream_raw_predict_private_endpoint_mock(): yield stream_raw_predict_mock +@pytest.fixture +def invoke_private_dedicated_endpoint_http_mock(): + resp = requests.Response() + resp.status_code = 200 + resp._content = json.dumps( + { + "predictions": _TEST_PREDICTION, + "metadata": _TEST_METADATA, + "deployedModelId": _TEST_LONG_DEPLOYED_MODELS[0].id, + "model": _TEST_MODEL_NAME, + "modelVersionId": "1", + } + ).encode("utf-8") + with mock.patch.object( + google_auth_requests.AuthorizedSession, "post" + ) as predict_mock: + predict_mock.return_value = resp + yield predict_mock + + +@pytest.fixture +def invoke_private_dedicated_endpoint_http_mock_streaming(): + with mock.patch.object( + google_auth_requests.AuthorizedSession, "post" + ) as invoke_streaming_mock: + # Create a mock response object + mock_response = mock.Mock(spec=requests.Response) + + # Configure the mock to be used as a context manager + invoke_streaming_mock.return_value.__enter__.return_value = mock_response + + # Set the status code to 200 (OK) + mock_response.status_code = 200 + + # Simulate streaming data with iter_lines + mock_response.iter_lines = mock.Mock( + return_value=iter( + [ + json.dumps( + { + "predictions": [1.0, 2.0, 3.0], + "metadata": {"key": "value"}, + "deployedModelId": _TEST_LONG_DEPLOYED_MODELS[0].id, + "model": "model-name", + "modelVersionId": "1", + } + ).encode("utf-8"), + json.dumps( + { + "predictions": [4.0, 5.0, 6.0], + "metadata": {"key": "value"}, + "deployedModelId": _TEST_LONG_DEPLOYED_MODELS[0].id, + "model": "model-name", + "modelVersionId": "1", + } + ).encode("utf-8"), + ] + ) + ) + + yield invoke_streaming_mock + + @pytest.fixture def health_check_private_endpoint_mock(): with mock.patch.object(urllib3.PoolManager, "request") as health_check_mock: @@ -2890,6 +3017,135 @@ def test_raw_predict_use_dedicated_endpoint_for_regular_endpoint( timeout=None, ) + @pytest.mark.usefixtures("get_dedicated_endpoint_mock") + def test_invoke_dedicated_endpoint_default( + self, invoke_public_dedicated_endpoint_http_mock + ): + test_endpoint = models.Endpoint(_TEST_ENDPOINT_NAME) + test_prediction_response = test_endpoint.invoke( + request_path="/arbitrary/path", + body=_TEST_RAW_INPUTS, + headers={"Content-Type": "application/json"}, + ) + + expected_prediction_response = requests.Response() + expected_prediction_response.status_code = 200 + expected_prediction_response._content = json.dumps( + { + "predictions": _TEST_PREDICTION, + "metadata": _TEST_METADATA, + "deployedModelId": _TEST_DEPLOYED_MODELS[0].id, + "model": _TEST_MODEL_NAME, + "modelVersionId": "1", + } + ).encode("utf-8") + + assert ( + test_prediction_response.status_code + == expected_prediction_response.status_code + ) + assert test_prediction_response.text == expected_prediction_response.text + invoke_public_dedicated_endpoint_http_mock.assert_called_once_with( + url=f"https://{_test_dedicated_endpoint_dns}/v1/projects/%7B_TEST_PROJECT%7D/locations/%7B_TEST_LOCATION%7D/endpoints/%7B_TEST_ID%7D/invoke/arbitrary/path", + data=_TEST_RAW_INPUTS, + headers={"Content-Type": "application/json"}, + timeout=None, + ) + + @pytest.mark.usefixtures("get_dedicated_endpoint_mock") + def test_invoke_dedicated_endpoint_stream_true( + self, invoke_public_dedicated_endpoint_http_mock_streaming + ): + test_endpoint = models.Endpoint(_TEST_ENDPOINT_NAME) + + test_prediction_iterator = test_endpoint.invoke( + request_path="/arbitrary/path", + body=_TEST_RAW_INPUTS, + headers={"Content-Type": "application/json"}, + stream=True, + ) + + test_streaming_predction_result = list(test_prediction_iterator) + expected_streaming_prediction_result = [ + json.dumps( + { + "predictions": [1.0, 2.0, 3.0], + "metadata": {"key": "value"}, + "deployedModelId": "model-id-123", + "model": "model-name", + "modelVersionId": "1", + } + ).encode("utf-8"), + json.dumps( + { + "predictions": [4.0, 5.0, 6.0], + "metadata": {"key": "value"}, + "deployedModelId": "model-id-123", + "model": "model-name", + "modelVersionId": "1", + } + ).encode("utf-8"), + ] + assert test_streaming_predction_result == expected_streaming_prediction_result + invoke_public_dedicated_endpoint_http_mock_streaming.assert_called_once_with( + url=f"https://{_test_dedicated_endpoint_dns}/v1/projects/%7B_TEST_PROJECT%7D/locations/%7B_TEST_LOCATION%7D/endpoints/%7B_TEST_ID%7D/invoke/arbitrary/path", + data=_TEST_RAW_INPUTS, + headers={"Content-Type": "application/json"}, + timeout=None, + stream=True, + ) + + @pytest.mark.usefixtures("get_dedicated_endpoint_mock") + def test_invoke_with_deployed_model_id( + self, invoke_public_dedicated_endpoint_http_mock + ): + test_endpoint = models.Endpoint(_TEST_ENDPOINT_NAME) + test_prediction_response = test_endpoint.invoke( + request_path="/arbitrary/path", + body=_TEST_RAW_INPUTS, + headers={"Content-Type": "application/json"}, + deployed_model_id=_TEST_DEPLOYED_MODELS[0].id, + ) + + expected_prediction_response = requests.Response() + expected_prediction_response.status_code = 200 + expected_prediction_response._content = json.dumps( + { + "predictions": _TEST_PREDICTION, + "metadata": _TEST_METADATA, + "deployedModelId": _TEST_DEPLOYED_MODELS[0].id, + "model": _TEST_MODEL_NAME, + "modelVersionId": "1", + } + ).encode("utf-8") + + assert ( + test_prediction_response.status_code + == expected_prediction_response.status_code + ) + assert test_prediction_response.text == expected_prediction_response.text + invoke_public_dedicated_endpoint_http_mock.assert_called_once_with( + url=f"https://{_test_dedicated_endpoint_dns}/v1/projects/%7B_TEST_PROJECT%7D/locations/%7B_TEST_LOCATION%7D/endpoints/%7B_TEST_ID%7D/deployedModels/%7B_TEST_DEPLOYED_MODELS[0].id%7D/invoke/arbitrary/path", + data=_TEST_RAW_INPUTS, + headers={"Content-Type": "application/json"}, + timeout=None, + ) + + @pytest.mark.usefixtures("get_dedicated_endpoint_mock") + def test_invoke_with_non_existent_deployed_model_id_raises_error(self): + test_endpoint = models.Endpoint(_TEST_ENDPOINT_NAME) + with pytest.raises(ValueError) as e: + _ = test_endpoint.invoke( + request_path="/arbitrary/path", + body=_TEST_RAW_INPUTS, + headers={"Content-Type": "application/json"}, + deployed_model_id="non-existent-deployed-model-id", + ) + + assert e.match( + f"Deployed model non-existent-deployed-model-id not found in endpoint {_TEST_ID}." + ) + @pytest.mark.asyncio @pytest.mark.usefixtures("get_endpoint_mock") async def test_predict_async(self, predict_async_client_predict_mock): @@ -3909,6 +4165,148 @@ def test_psc_predict_with_invalid_endpoint_override(self): "address or DNS." ) + @pytest.mark.usefixtures("get_psc_private_endpoint_with_many_model_mock") + def test_psc_invoke_default(self, invoke_private_dedicated_endpoint_http_mock): + test_endpoint = models.PrivateEndpoint( + project=_TEST_PROJECT, location=_TEST_LOCATION, endpoint_name=_TEST_ID + ) + + test_prediction_response = test_endpoint.invoke( + request_path="/arbitrary/path", + body=_TEST_RAW_INPUTS, + headers={ + "Content-Type": "application/json", + }, + endpoint_override=_TEST_ENDPOINT_OVERRIDE, + ) + + expected_prediction_response = requests.Response() + expected_prediction_response.status_code = 200 + expected_prediction_response._content = json.dumps( + { + "predictions": _TEST_PREDICTION, + "metadata": _TEST_METADATA, + "deployedModelId": _TEST_LONG_DEPLOYED_MODELS[0].id, + "model": _TEST_MODEL_NAME, + "modelVersionId": "1", + } + ).encode("utf-8") + + assert ( + test_prediction_response.status_code + == expected_prediction_response.status_code + ) + assert test_prediction_response.text == expected_prediction_response.text + invoke_private_dedicated_endpoint_http_mock.assert_called_once_with( + url=f"https://{_test_endpoint_override}/v1/projects/%7B_TEST_PROJECT%7D/locations/%7B_TEST_LOCATION%7D/endpoints/%7B_TEST_ID%7D/invoke/arbitrary/path", + data=_TEST_RAW_INPUTS, + headers={"Content-Type": "application/json"}, + timeout=None, + ) + + @pytest.mark.usefixtures("get_psc_private_endpoint_with_many_model_mock") + def test_psc_invoke_dedicated_endpoint_stream_true( + self, invoke_private_dedicated_endpoint_http_mock_streaming + ): + test_endpoint = models.PrivateEndpoint( + project=_TEST_PROJECT, location=_TEST_LOCATION, endpoint_name=_TEST_ID + ) + + test_prediction_iterator = test_endpoint.invoke( + request_path="/arbitrary/path", + body=_TEST_RAW_INPUTS, + headers={"Content-Type": "application/json"}, + stream=True, + endpoint_override=_TEST_ENDPOINT_OVERRIDE, + ) + + test_streaming_predction_result = list(test_prediction_iterator) + expected_streaming_prediction_result = [ + json.dumps( + { + "predictions": [1.0, 2.0, 3.0], + "metadata": {"key": "value"}, + "deployedModelId": _TEST_LONG_DEPLOYED_MODELS[0].id, + "model": "model-name", + "modelVersionId": "1", + } + ).encode("utf-8"), + json.dumps( + { + "predictions": [4.0, 5.0, 6.0], + "metadata": {"key": "value"}, + "deployedModelId": _TEST_LONG_DEPLOYED_MODELS[0].id, + "model": "model-name", + "modelVersionId": "1", + } + ).encode("utf-8"), + ] + assert test_streaming_predction_result == expected_streaming_prediction_result + invoke_private_dedicated_endpoint_http_mock_streaming.assert_called_once_with( + url=f"https://{_test_endpoint_override}/v1/projects/%7B_TEST_PROJECT%7D/locations/%7B_TEST_LOCATION%7D/endpoints/%7B_TEST_ID%7D/invoke/arbitrary/path", + data=_TEST_RAW_INPUTS, + headers={"Content-Type": "application/json"}, + timeout=None, + stream=True, + ) + + @pytest.mark.usefixtures("get_psc_private_endpoint_with_many_model_mock") + def test_psc_invoke_with_deployed_model_id( + self, invoke_private_dedicated_endpoint_http_mock + ): + test_endpoint = models.PrivateEndpoint( + project=_TEST_PROJECT, location=_TEST_LOCATION, endpoint_name=_TEST_ID + ) + test_prediction_response = test_endpoint.invoke( + request_path="/arbitrary/path", + body=_TEST_RAW_INPUTS, + headers={"Content-Type": "application/json"}, + deployed_model_id=_TEST_LONG_DEPLOYED_MODELS[0].id, + endpoint_override=_TEST_ENDPOINT_OVERRIDE, + ) + + expected_prediction_response = requests.Response() + expected_prediction_response.status_code = 200 + expected_prediction_response._content = json.dumps( + { + "predictions": _TEST_PREDICTION, + "metadata": _TEST_METADATA, + "deployedModelId": _TEST_LONG_DEPLOYED_MODELS[0].id, + "model": _TEST_MODEL_NAME, + "modelVersionId": "1", + } + ).encode("utf-8") + + assert ( + test_prediction_response.status_code + == expected_prediction_response.status_code + ) + assert test_prediction_response.text == expected_prediction_response.text + invoke_private_dedicated_endpoint_http_mock.assert_called_once_with( + url=f"https://{_test_endpoint_override}/v1/projects/%7B_TEST_PROJECT%7D/locations/%7B_TEST_LOCATION%7D/endpoints/%7B_TEST_ID%7D/deployedModels/%7B_TEST_LONG_DEPLOYED_MODELS[0].id%7D/invoke/arbitrary/path", + data=_TEST_RAW_INPUTS, + headers={"Content-Type": "application/json"}, + timeout=None, + ) + + @pytest.mark.usefixtures("get_psc_private_endpoint_with_many_model_mock") + def test_psc_invoke_with_non_existent_deployed_model_id_raises_error(self): + test_endpoint = models.PrivateEndpoint( + project=_TEST_PROJECT, location=_TEST_LOCATION, endpoint_name=_TEST_ID + ) + with pytest.raises(ValueError) as e: + _ = test_endpoint.invoke( + request_path="/arbitrary/path", + body=_TEST_RAW_INPUTS, + headers={"Content-Type": "application/json"}, + deployed_model_id="non-existent-deployed-model-id", + endpoint_override=_TEST_ENDPOINT_OVERRIDE, + ) + + assert e.match( + f"Deployed model non-existent-deployed-model-id not found in endpoint {_TEST_ID}." + ) + @pytest.mark.usefixtures("get_psa_private_endpoint_with_model_mock") def test_psa_health_check(self, health_check_private_endpoint_mock): test_endpoint = models.PrivateEndpoint(_TEST_ID) diff --git a/tests/unit/aiplatform/test_models.py b/tests/unit/aiplatform/test_models.py index ba95f42717..ee2233d0d8 100644 --- a/tests/unit/aiplatform/test_models.py +++ b/tests/unit/aiplatform/test_models.py @@ -102,12 +102,15 @@ _TEST_MODEL_PARENT_ALT = ( f"projects/{_TEST_PROJECT}/locations/{_TEST_LOCATION}/models/{_TEST_MODEL_NAME_ALT}" ) +_TEST_INVOKE_MODEL_NAME = "invoke-model" +_TEST_INVOKE_MODEL_PARENT = f"projects/{_TEST_PROJECT}/locations/{_TEST_LOCATION}/models/{_TEST_INVOKE_MODEL_NAME}" _TEST_ARTIFACT_URI = "gs://test/artifact/uri" _TEST_SERVING_CONTAINER_IMAGE = ( test_constants.ModelConstants._TEST_SERVING_CONTAINER_IMAGE ) _TEST_SERVING_CONTAINER_PREDICTION_ROUTE = "predict" _TEST_SERVING_CONTAINER_HEALTH_ROUTE = "metadata" +_TEST_SERVING_CONTAINER_INVOKE_ROUTE_PREFIX = "/*" _TEST_DESCRIPTION = "test description" _TEST_SERVING_CONTAINER_COMMAND = ["python3", "run_my_model.py"] _TEST_SERVING_CONTAINER_ARGS = ["--test", "arg"] @@ -258,6 +261,9 @@ ) _TEST_MODEL_RESOURCE_NAME = test_constants.ModelConstants._TEST_MODEL_RESOURCE_NAME +_TEST_INVOKE_MODEL_RESOURCE_NAME = model_service_client.ModelServiceClient.model_path( + _TEST_PROJECT, _TEST_LOCATION, _TEST_ID +) _TEST_MODEL_RESOURCE_NAME_CUSTOM_PROJECT = ( model_service_client.ModelServiceClient.model_path( _TEST_PROJECT_2, _TEST_LOCATION, _TEST_ID @@ -486,6 +492,15 @@ version_aliases=["default"], version_description=_TEST_MODEL_VERSION_DESCRIPTION_1, ), + gca_model.Model( + version_id="1", + create_time=timestamp_pb2.Timestamp(), + update_time=timestamp_pb2.Timestamp(), + display_name=_TEST_INVOKE_MODEL_NAME, + name=_TEST_INVOKE_MODEL_PARENT, + version_aliases=["default"], + version_description=_TEST_MODEL_VERSION_DESCRIPTION_1, + ), ] _TEST_MODEL_OBJ_WITH_VERSION = ( @@ -1356,6 +1371,47 @@ def test_upload_uploads_and_gets_model( name=_TEST_MODEL_RESOURCE_NAME, retry=base._DEFAULT_RETRY ) + @pytest.mark.parametrize("sync", [True, False]) + def test_upload_uploads_and_gets_invoke_model( + self, upload_model_mock, get_model_mock, sync + ): + + my_model = models.Model.upload( + display_name=_TEST_INVOKE_MODEL_NAME, + serving_container_image_uri=_TEST_SERVING_CONTAINER_IMAGE, + serving_container_invoke_route_prefix=_TEST_SERVING_CONTAINER_INVOKE_ROUTE_PREFIX, + serving_container_health_route=_TEST_SERVING_CONTAINER_HEALTH_ROUTE, + sync=sync, + upload_request_timeout=None, + ) + + container_spec = gca_model.ModelContainerSpec( + image_uri=_TEST_SERVING_CONTAINER_IMAGE, + invoke_route_prefix=_TEST_SERVING_CONTAINER_INVOKE_ROUTE_PREFIX, + health_route=_TEST_SERVING_CONTAINER_HEALTH_ROUTE, + ) + + managed_model = gca_model.Model( + display_name=_TEST_INVOKE_MODEL_NAME, + container_spec=container_spec, + version_aliases=["default"], + ) + + if not sync: + my_model.wait() + + upload_model_mock.assert_called_once_with( + request=gca_model_service.UploadModelRequest( + parent=initializer.global_config.common_location_path(), + model=managed_model, + ), + timeout=None, + ) + + get_model_mock.assert_called_once_with( + name=_TEST_INVOKE_MODEL_RESOURCE_NAME, retry=base._DEFAULT_RETRY + ) + def test_upload_without_serving_container_image_uri_throw_error( self, upload_model_mock, get_model_mock ): diff --git a/tests/unit/gapic/aiplatform_v1/test_gen_ai_cache_service.py b/tests/unit/gapic/aiplatform_v1/test_gen_ai_cache_service.py index c9dcbc6092..513b55219e 100644 --- a/tests/unit/gapic/aiplatform_v1/test_gen_ai_cache_service.py +++ b/tests/unit/gapic/aiplatform_v1/test_gen_ai_cache_service.py @@ -4721,6 +4721,7 @@ def test_create_cached_content_rest_call_success(request_type): "enterprise_web_search": {}, "code_execution": {}, "url_context": {}, + "computer_use": {"environment": 1}, } ], "tool_config": { @@ -5214,6 +5215,7 @@ def test_update_cached_content_rest_call_success(request_type): "enterprise_web_search": {}, "code_execution": {}, "url_context": {}, + "computer_use": {"environment": 1}, } ], "tool_config": { @@ -6569,6 +6571,7 @@ async def test_create_cached_content_rest_asyncio_call_success(request_type): "enterprise_web_search": {}, "code_execution": {}, "url_context": {}, + "computer_use": {"environment": 1}, } ], "tool_config": { @@ -7094,6 +7097,7 @@ async def test_update_cached_content_rest_asyncio_call_success(request_type): "enterprise_web_search": {}, "code_execution": {}, "url_context": {}, + "computer_use": {"environment": 1}, } ], "tool_config": { diff --git a/tests/unit/gapic/aiplatform_v1/test_migration_service.py b/tests/unit/gapic/aiplatform_v1/test_migration_service.py index 9e8dced432..b7ffa7bfc4 100644 --- a/tests/unit/gapic/aiplatform_v1/test_migration_service.py +++ b/tests/unit/gapic/aiplatform_v1/test_migration_service.py @@ -5398,22 +5398,19 @@ def test_parse_annotated_dataset_path(): def test_dataset_path(): project = "cuttlefish" - location = "mussel" - dataset = "winkle" - expected = "projects/{project}/locations/{location}/datasets/{dataset}".format( + dataset = "mussel" + expected = "projects/{project}/datasets/{dataset}".format( project=project, - location=location, dataset=dataset, ) - actual = MigrationServiceClient.dataset_path(project, location, dataset) + actual = MigrationServiceClient.dataset_path(project, dataset) assert expected == actual def test_parse_dataset_path(): expected = { - "project": "nautilus", - "location": "scallop", - "dataset": "abalone", + "project": "winkle", + "dataset": "nautilus", } path = MigrationServiceClient.dataset_path(**expected) @@ -5423,19 +5420,22 @@ def test_parse_dataset_path(): def test_dataset_path(): - project = "squid" - dataset = "clam" - expected = "projects/{project}/datasets/{dataset}".format( + project = "scallop" + location = "abalone" + dataset = "squid" + expected = "projects/{project}/locations/{location}/datasets/{dataset}".format( project=project, + location=location, dataset=dataset, ) - actual = MigrationServiceClient.dataset_path(project, dataset) + actual = MigrationServiceClient.dataset_path(project, location, dataset) assert expected == actual def test_parse_dataset_path(): expected = { - "project": "whelk", + "project": "clam", + "location": "whelk", "dataset": "octopus", } path = MigrationServiceClient.dataset_path(**expected) diff --git a/tests/unit/gapic/aiplatform_v1beta1/test_gen_ai_cache_service.py b/tests/unit/gapic/aiplatform_v1beta1/test_gen_ai_cache_service.py index d04776455e..a8c827a6a8 100644 --- a/tests/unit/gapic/aiplatform_v1beta1/test_gen_ai_cache_service.py +++ b/tests/unit/gapic/aiplatform_v1beta1/test_gen_ai_cache_service.py @@ -4732,6 +4732,7 @@ def test_create_cached_content_rest_call_success(request_type): "enterprise_web_search": {}, "code_execution": {}, "url_context": {}, + "computer_use": {"environment": 1}, } ], "tool_config": { @@ -5236,6 +5237,7 @@ def test_update_cached_content_rest_call_success(request_type): "enterprise_web_search": {}, "code_execution": {}, "url_context": {}, + "computer_use": {"environment": 1}, } ], "tool_config": { @@ -6602,6 +6604,7 @@ async def test_create_cached_content_rest_asyncio_call_success(request_type): "enterprise_web_search": {}, "code_execution": {}, "url_context": {}, + "computer_use": {"environment": 1}, } ], "tool_config": { @@ -7138,6 +7141,7 @@ async def test_update_cached_content_rest_asyncio_call_success(request_type): "enterprise_web_search": {}, "code_execution": {}, "url_context": {}, + "computer_use": {"environment": 1}, } ], "tool_config": { diff --git a/tests/unit/gapic/aiplatform_v1beta1/test_migration_service.py b/tests/unit/gapic/aiplatform_v1beta1/test_migration_service.py index 574ddbdf19..1069dbb2b0 100644 --- a/tests/unit/gapic/aiplatform_v1beta1/test_migration_service.py +++ b/tests/unit/gapic/aiplatform_v1beta1/test_migration_service.py @@ -5426,22 +5426,19 @@ def test_parse_dataset_path(): def test_dataset_path(): project = "squid" - location = "clam" - dataset = "whelk" - expected = "projects/{project}/locations/{location}/datasets/{dataset}".format( + dataset = "clam" + expected = "projects/{project}/datasets/{dataset}".format( project=project, - location=location, dataset=dataset, ) - actual = MigrationServiceClient.dataset_path(project, location, dataset) + actual = MigrationServiceClient.dataset_path(project, dataset) assert expected == actual def test_parse_dataset_path(): expected = { - "project": "octopus", - "location": "oyster", - "dataset": "nudibranch", + "project": "whelk", + "dataset": "octopus", } path = MigrationServiceClient.dataset_path(**expected) @@ -5451,19 +5448,22 @@ def test_parse_dataset_path(): def test_dataset_path(): - project = "cuttlefish" - dataset = "mussel" - expected = "projects/{project}/datasets/{dataset}".format( + project = "oyster" + location = "nudibranch" + dataset = "cuttlefish" + expected = "projects/{project}/locations/{location}/datasets/{dataset}".format( project=project, + location=location, dataset=dataset, ) - actual = MigrationServiceClient.dataset_path(project, dataset) + actual = MigrationServiceClient.dataset_path(project, location, dataset) assert expected == actual def test_parse_dataset_path(): expected = { - "project": "winkle", + "project": "mussel", + "location": "winkle", "dataset": "nautilus", } path = MigrationServiceClient.dataset_path(**expected) diff --git a/tests/unit/gapic/aiplatform_v1beta1/test_pipeline_service.py b/tests/unit/gapic/aiplatform_v1beta1/test_pipeline_service.py index c96e0d9885..4f85883cac 100644 --- a/tests/unit/gapic/aiplatform_v1beta1/test_pipeline_service.py +++ b/tests/unit/gapic/aiplatform_v1beta1/test_pipeline_service.py @@ -10088,6 +10088,7 @@ def test_create_pipeline_job_rest_call_success(request_type): ], "inputs": {}, "outputs": {}, + "task_unique_name": "task_unique_name_value", } ], }, @@ -13140,6 +13141,7 @@ async def test_create_pipeline_job_rest_asyncio_call_success(request_type): ], "inputs": {}, "outputs": {}, + "task_unique_name": "task_unique_name_value", } ], }, diff --git a/tests/unit/gapic/aiplatform_v1beta1/test_schedule_service.py b/tests/unit/gapic/aiplatform_v1beta1/test_schedule_service.py index d2c850a57d..358d8b97e5 100644 --- a/tests/unit/gapic/aiplatform_v1beta1/test_schedule_service.py +++ b/tests/unit/gapic/aiplatform_v1beta1/test_schedule_service.py @@ -5696,6 +5696,7 @@ def test_create_schedule_rest_call_success(request_type): ], "inputs": {}, "outputs": {}, + "task_unique_name": "task_unique_name_value", } ], }, @@ -6883,6 +6884,7 @@ def test_update_schedule_rest_call_success(request_type): ], "inputs": {}, "outputs": {}, + "task_unique_name": "task_unique_name_value", } ], }, @@ -8260,6 +8262,7 @@ async def test_create_schedule_rest_asyncio_call_success(request_type): ], "inputs": {}, "outputs": {}, + "task_unique_name": "task_unique_name_value", } ], }, @@ -9547,6 +9550,7 @@ async def test_update_schedule_rest_asyncio_call_success(request_type): ], "inputs": {}, "outputs": {}, + "task_unique_name": "task_unique_name_value", } ], }, diff --git a/tests/unit/vertex_langchain/test_agent_engines.py b/tests/unit/vertex_langchain/test_agent_engines.py index ec2e554aec..12c342ac3c 100644 --- a/tests/unit/vertex_langchain/test_agent_engines.py +++ b/tests/unit/vertex_langchain/test_agent_engines.py @@ -584,6 +584,10 @@ def register_operations(self) -> Dict[str, List[str]]: "pydantic": ["pydantic"], } +_TEST_BUILD_OPTIONS_INSTALLATION = _agent_engines._BUILD_OPTIONS_INSTALLATION +_TEST_INSTALLATION_SUBDIR = _utils._INSTALLATION_SUBDIR +_TEST_INSTALLATION_SCRIPT_PATH = f"{_TEST_INSTALLATION_SUBDIR}/install_package.sh" + def _create_empty_fake_package(package_name: str) -> str: """Creates a temporary directory structure representing an empty fake Python package. @@ -1146,6 +1150,47 @@ def test_create_agent_engine_with_env_vars_list( retry=_TEST_RETRY, ) + def test_create_agent_engine_with_build_options( + self, + create_agent_engine_mock, + cloud_storage_create_bucket_mock, + tarfile_open_mock, + cloudpickle_dump_mock, + cloudpickle_load_mock, + importlib_metadata_version_mock, + get_agent_engine_mock, + get_gca_resource_mock, + ): + + with mock.patch("os.path.exists", return_value=True): + agent_engines.create( + self.test_agent, + display_name=_TEST_AGENT_ENGINE_DISPLAY_NAME, + extra_packages=[ + _TEST_INSTALLATION_SCRIPT_PATH, + ], + build_options={ + _TEST_BUILD_OPTIONS_INSTALLATION: [_TEST_INSTALLATION_SCRIPT_PATH] + }, + ) + test_spec = types.ReasoningEngineSpec( + package_spec=_TEST_AGENT_ENGINE_PACKAGE_SPEC, + agent_framework=_agent_engines._DEFAULT_AGENT_FRAMEWORK, + ) + test_spec.class_methods.append(_TEST_AGENT_ENGINE_QUERY_SCHEMA) + create_agent_engine_mock.assert_called_with( + parent=_TEST_PARENT, + reasoning_engine=types.ReasoningEngine( + display_name=_TEST_AGENT_ENGINE_DISPLAY_NAME, + spec=test_spec, + ), + ) + + get_agent_engine_mock.assert_called_with( + name=_TEST_AGENT_ENGINE_RESOURCE_NAME, + retry=_TEST_RETRY, + ) + @pytest.mark.parametrize( "test_case_name, test_engine_instance, expected_framework", [ @@ -2788,8 +2833,8 @@ def test_update_agent_engine_with_no_updates( ValueError, match=( "At least one of `agent_engine`, `requirements`, " - "`extra_packages`, `display_name`, `description`, or `env_vars` " - "must be specified." + "`extra_packages`, `display_name`, `description`, " + "`env_vars`, or `build_options` must be specified." ), ): test_agent_engine = _generate_agent_engine_to_update() @@ -3228,3 +3273,114 @@ def test_scan_with_explicit_ignore_modules(self): "cloudpickle": "3.0.0", "pydantic": "1.11.1", } + + +class TestValidateInstallationScripts: + # pytest does not allow absl.testing.parameterized.named_parameters. + @pytest.mark.parametrize( + "name, script_paths, extra_packages", + [ + ( + "valid_script_in_subdir_and_extra_packages", + [f"{_utils._INSTALLATION_SUBDIR}/script.sh"], + [f"{_utils._INSTALLATION_SUBDIR}/script.sh"], + ), + ( + "multiple_valid_scripts", + [ + f"{_utils._INSTALLATION_SUBDIR}/script1.sh", + f"{_utils._INSTALLATION_SUBDIR}/script2.sh", + ], + [ + f"{_utils._INSTALLATION_SUBDIR}/script1.sh", + f"{_utils._INSTALLATION_SUBDIR}/script2.sh", + ], + ), + ("empty_script_paths_and_extra_packages", [], []), + ], + ) + def test_validate_installation_scripts(self, name, script_paths, extra_packages): + _utils.validate_installation_scripts_or_raise( + script_paths=script_paths, extra_packages=extra_packages + ) + + @pytest.mark.parametrize( + "name, script_paths, extra_packages, error_message", + [ + ( + "script_not_in_subdir", + ["script.sh"], + ["script.sh"], + ( + f"Required installation script 'script.sh' is not under" + f" '{_utils._INSTALLATION_SUBDIR}'" + ), + ), + ( + "script_not_in_extra_packages", + [f"{_utils._INSTALLATION_SUBDIR}/script.sh"], + [], + ( + "User-defined installation script " + f"'{_utils._INSTALLATION_SUBDIR}/script.sh'" + " does not exist in `extra_packages`" + ), + ), + ( + "extra_package_in_subdir_but_not_script", + [], + [f"{_utils._INSTALLATION_SUBDIR}/script.sh"], + ( + f"Extra package '{_utils._INSTALLATION_SUBDIR}/script.sh' " + "is in the installation scripts subdirectory, but is not " + "specified as an installation script." + ), + ), + ( + "one_valid_one_invalid_script_not_in_subdir", + [f"{_utils._INSTALLATION_SUBDIR}/script1.sh", "script2.sh"], + [f"{_utils._INSTALLATION_SUBDIR}/script1.sh", "script2.sh"], + ( + f"Required installation script 'script2.sh' is not under" + f" '{_utils._INSTALLATION_SUBDIR}'" + ), + ), + ( + "one_valid_one_invalid_script_not_in_extra_packages", + [ + f"{_utils._INSTALLATION_SUBDIR}/script1.sh", + f"{_utils._INSTALLATION_SUBDIR}/script2.sh", + ], + [f"{_utils._INSTALLATION_SUBDIR}/script1.sh"], + ( + "User-defined installation script " + f"'{_utils._INSTALLATION_SUBDIR}/script2.sh' " + "does not exist in `extra_packages`" + ), + ), + ( + "one_valid_one_invalid_extra_package_in_subdir", + [f"{_utils._INSTALLATION_SUBDIR}/script1.sh"], + [ + f"{_utils._INSTALLATION_SUBDIR}/script1.sh", + f"{_utils._INSTALLATION_SUBDIR}/script2.sh", + ], + ( + f"Extra package '{_utils._INSTALLATION_SUBDIR}/script2.sh' " + "is in the installation scripts subdirectory, but is not " + "specified as an installation script." + ), + ), + ], + ) + def test_validate_installation_scripts_raises_error( + self, + name, + script_paths, + extra_packages, + error_message, + ): + with pytest.raises(ValueError, match=error_message): + _utils.validate_installation_scripts_or_raise( + script_paths=script_paths, extra_packages=extra_packages + ) diff --git a/tests/unit/vertexai/genai/test_agent_engines.py b/tests/unit/vertexai/genai/test_agent_engines.py index 0f7c42c9c7..c99747bfe4 100644 --- a/tests/unit/vertexai/genai/test_agent_engines.py +++ b/tests/unit/vertexai/genai/test_agent_engines.py @@ -983,6 +983,10 @@ def test_create_agent_engine(self, mock_await_operation, mock_prepare): env_vars=_TEST_AGENT_ENGINE_ENV_VARS_INPUT, ), ) + mock_await_operation.assert_called_once_with( + operation_name=None, + poll_interval_seconds=10, + ) request_mock.assert_called_with( "post", "reasoningEngines", @@ -1023,6 +1027,10 @@ def test_create_agent_engine_lightweight( description=_TEST_AGENT_ENGINE_DESCRIPTION, ) ) + mock_await_operation.assert_called_once_with( + operation_name=None, + poll_interval_seconds=1, + ) request_mock.assert_called_with( "post", "reasoningEngines", diff --git a/vertexai/__init__.py b/vertexai/__init__.py index 1444612f49..4a7c313a84 100644 --- a/vertexai/__init__.py +++ b/vertexai/__init__.py @@ -27,7 +27,7 @@ _genai_types = None -def __getattr__(name): +def __getattr__(name): # type: ignore[no-untyped-def] # Lazy importing the preview submodule # See https://peps.python.org/pep-0562/ if name == "preview": diff --git a/vertexai/_genai/__init__.py b/vertexai/_genai/__init__.py index 2c5aa504f5..1b3e013c55 100644 --- a/vertexai/_genai/__init__.py +++ b/vertexai/_genai/__init__.py @@ -16,12 +16,12 @@ import importlib -from .client import Client +from .client import Client # type: ignore[attr-defined] _evals = None -def __getattr__(name): +def __getattr__(name): # type: ignore[no-untyped-def] if name == "evals": global _evals if _evals is None: diff --git a/vertexai/_genai/_agent_engines_utils.py b/vertexai/_genai/_agent_engines_utils.py index a6b8657311..485a1c50be 100644 --- a/vertexai/_genai/_agent_engines_utils.py +++ b/vertexai/_genai/_agent_engines_utils.py @@ -34,7 +34,7 @@ def _wrap_query_operation(*, method_name: str) -> Callable[..., Any]: the `query` API. """ - def _method(self: types.AgentEngine, **kwargs): + def _method(self: types.AgentEngine, **kwargs) -> Any: if not self.api_client: raise ValueError("api_client is not initialized.") if not self.api_resource: @@ -52,7 +52,9 @@ def _method(self: types.AgentEngine, **kwargs): return _method -def _wrap_async_query_operation(*, method_name: str) -> Callable[..., Coroutine]: +def _wrap_async_query_operation( + *, method_name: str +) -> Callable[..., Coroutine[Any, Any, Any]]: """Wraps an Agent Engine method, creating an async callable for `query` API. This function creates a callable object that executes the specified @@ -122,7 +124,7 @@ def _method(self: types.AgentEngine, **kwargs) -> Iterator[Any]: def _wrap_async_stream_query_operation( *, method_name: str -) -> Callable[..., AsyncIterator]: +) -> Callable[..., AsyncIterator[Any]]: """Wraps an Agent Engine method, creating an async callable for `stream_query` API. This function creates a callable object that executes the specified diff --git a/vertexai/_genai/_evals_common.py b/vertexai/_genai/_evals_common.py index 7a86e8003d..07c1cab463 100644 --- a/vertexai/_genai/_evals_common.py +++ b/vertexai/_genai/_evals_common.py @@ -253,7 +253,7 @@ def _execute_inference_concurrently( e, ) responses[index] = {"error": f"Inference task failed: {e}"} - return responses + return responses # type: ignore[return-value] def _run_gemini_inference( @@ -337,14 +337,14 @@ def _call_litellm_completion(model: str, messages: list[dict[str, Any]]) -> dict def _run_litellm_inference( model: str, prompt_dataset: pd.DataFrame -) -> list[dict[str, Any]]: +) -> list[Optional[dict[str, Any]]]: """Runs inference using LiteLLM with concurrency.""" logger.info( "Generating responses for %d prompts using LiteLLM for third party model: %s", len(prompt_dataset), model, ) - responses = [None] * len(prompt_dataset) + responses: list[Optional[dict[str, Any]]] = [None] * len(prompt_dataset) tasks = [] with tqdm(total=len(prompt_dataset), desc=f"LiteLLM Inference ({model})") as pbar: @@ -714,7 +714,7 @@ def _resolve_dataset_inputs( loaded_raw_datasets.append(current_loaded_data) if dataset_schema: - current_schema = _evals_data_converters.EvalDatasetSchema[dataset_schema] + current_schema = _evals_data_converters.EvalDatasetSchema(dataset_schema) else: current_schema = _evals_data_converters.auto_detect_dataset_schema( current_loaded_data @@ -826,11 +826,13 @@ def _execute_evaluation( " EvaluationDataset or a list of EvaluationDataset." ) original_candidate_names = [ - ds.candidate_name or f"candidate_{i+1}" for i, ds in enumerate(dataset_list) + ds.candidate_name or f"candidate_{i + 1}" for i, ds in enumerate(dataset_list) ] name_counts = collections.Counter(original_candidate_names) deduped_candidate_names = [] - current_name_counts = collections.defaultdict(int) + current_name_counts: collections.defaultdict[Any, int] = collections.defaultdict( + int + ) for name in original_candidate_names: if name_counts[name] > 1: diff --git a/vertexai/_genai/_evals_data_converters.py b/vertexai/_genai/_evals_data_converters.py index cb814e032f..e53a7c3bb2 100644 --- a/vertexai/_genai/_evals_data_converters.py +++ b/vertexai/_genai/_evals_data_converters.py @@ -15,8 +15,9 @@ """Dataset converters for evals.""" import abc +import json import logging -from typing import Any, Optional +from typing import Any, Optional, Union from google.genai import _common from google.genai import types as genai_types @@ -102,12 +103,20 @@ def _parse_request( last_message.content.role if last_message.content else "user" ) if last_message_role in ["user", None]: - prompt = last_message.content + prompt = ( + last_message.content + if last_message.content + else genai_types.Content() + ) elif last_message_role == "model": reference = types.ResponseCandidate(response=last_message.content) if conversation_history: second_to_last_message = conversation_history.pop() - prompt = second_to_last_message.content + prompt = ( + second_to_last_message.content + if second_to_last_message.content + else genai_types.Content() + ) else: prompt = genai_types.Content() @@ -355,7 +364,29 @@ def convert(self, raw_data: list[dict[str, Any]]) -> types.EvaluationDataset: continue request_data = item.get("request", {}) - response_data = item.get("response", {}) + response_data_raw = item.get("response", {}) + + response_data = {} + if isinstance(response_data_raw, str): + try: + loaded_json = json.loads(response_data_raw) + if isinstance(loaded_json, dict): + response_data = loaded_json + else: + logger.warning( + "Decoded response JSON is not a dictionary for case" + " %s. Type: %s", + i, + type(loaded_json), + ) + except json.JSONDecodeError: + logger.warning( + "Could not decode response JSON string for case %s." + " Treating as empty response.", + i, + ) + elif isinstance(response_data_raw, dict): + response_data = response_data_raw messages = request_data.get("messages", []) choices = response_data.get("choices", []) @@ -413,7 +444,7 @@ def convert(self, raw_data: list[dict[str, Any]]) -> types.EvaluationDataset: def auto_detect_dataset_schema( raw_dataset: list[dict[str, Any]], -) -> EvalDatasetSchema: +) -> Union[EvalDatasetSchema, str]: """Detects the schema of a raw dataset.""" if not raw_dataset: return EvalDatasetSchema.UNKNOWN @@ -499,7 +530,7 @@ def _validate_case_consistency( current_case: types.EvalCase, case_idx: int, dataset_idx: int, -): +) -> None: """Logs warnings if prompt or reference mismatches occur.""" if base_case.prompt != current_case.prompt: base_prompt_text_preview = _get_first_part_text(base_case.prompt)[:50] @@ -586,7 +617,11 @@ def merge_response_datasets_into_canonical_format( base_parsed_dataset = parsed_evaluation_datasets[0] for case_idx in range(num_expected_cases): - base_eval_case: types.EvalCase = base_parsed_dataset.eval_cases[case_idx] + base_eval_case: types.EvalCase = ( + base_parsed_dataset.eval_cases[case_idx] + if base_parsed_dataset.eval_cases + else types.EvalCase() + ) candidate_responses: list[types.ResponseCandidate] = [] if base_eval_case.responses: @@ -617,9 +652,11 @@ def merge_response_datasets_into_canonical_format( for dataset_idx_offset, current_parsed_ds in enumerate( parsed_evaluation_datasets[1:], start=1 ): - current_ds_eval_case: types.EvalCase = current_parsed_ds.eval_cases[ - case_idx - ] + current_ds_eval_case: types.EvalCase = ( + current_parsed_ds.eval_cases[case_idx] + if current_parsed_ds.eval_cases + else types.EvalCase() + ) _validate_case_consistency( base_eval_case, current_ds_eval_case, case_idx, dataset_idx_offset diff --git a/vertexai/_genai/_evals_metric_handlers.py b/vertexai/_genai/_evals_metric_handlers.py index 693e0ef939..d8f2d09553 100644 --- a/vertexai/_genai/_evals_metric_handlers.py +++ b/vertexai/_genai/_evals_metric_handlers.py @@ -20,7 +20,7 @@ import json import logging import statistics -from typing import Any, Callable, Optional, TypeVar +from typing import Any, Callable, Optional, TypeVar, Union from google.genai import _common from google.genai import types as genai_types @@ -178,6 +178,10 @@ def _build_request_payload( f"response_index {response_index} out of bounds for eval_case with" f" {len(eval_case.responses)} responses." ) + if eval_case.responses is None: + raise ValueError( + f"No responses found for eval_case with ID {eval_case.eval_case_id}." + ) current_response_candidate = eval_case.responses[response_index] if _extract_text_from_content(current_response_candidate.response) is None: raise ValueError( @@ -308,6 +312,10 @@ def _build_request_payload( f" {len(eval_case.responses)} responses." ) + if eval_case.responses is None: + raise ValueError( + f"No responses found for eval_case with ID {eval_case.eval_case_id}." + ) current_response_candidate = eval_case.responses[response_index] if _extract_text_from_content(current_response_candidate.response) is None: raise ValueError( @@ -442,6 +450,10 @@ def _build_request_payload( f"response_index {response_index} out of bounds for eval_case with" f" {len(eval_case.responses)} responses." ) + if eval_case.responses is None: + raise ValueError( + f"No responses found for eval_case with ID {eval_case.eval_case_id}." + ) current_response_candidate = eval_case.responses[response_index] prompt_text = _extract_text_from_content(eval_case.prompt) @@ -475,13 +487,15 @@ def _build_request_payload( original_attr_value = getattr(eval_case, var_name, None) if isinstance(original_attr_value, genai_types.Content): - instance_data_for_json[var_name] = _extract_text_from_content( - original_attr_value - ) + extracted_text = _extract_text_from_content(original_attr_value) + if extracted_text is not None: + instance_data_for_json[var_name] = extracted_text elif isinstance(original_attr_value, types.ResponseCandidate): - instance_data_for_json[var_name] = _extract_text_from_content( + extracted_text = _extract_text_from_content( original_attr_value.response ) + if extracted_text is not None: + instance_data_for_json[var_name] = extracted_text elif ( isinstance(original_attr_value, list) and original_attr_value @@ -510,11 +524,11 @@ def _build_request_payload( } metric_spec_payload = request_payload["pointwise_metric_input"]["metric_spec"] if self.metric.return_raw_output is not None: - metric_spec_payload["custom_output_format_config"] = { + metric_spec_payload["custom_output_format_config"] = { # type: ignore[index] "return_raw_output": self.metric.return_raw_output, } if self.metric.judge_model_system_instruction is not None: - metric_spec_payload[ + metric_spec_payload[ # type: ignore[index] "system_instruction" ] = self.metric.judge_model_system_instruction @@ -524,9 +538,9 @@ def _build_request_payload( if self.metric.judge_model_sampling_count is not None: autorater_config_payload[ "sampling_count" - ] = self.metric.judge_model_sampling_count + ] = self.metric.judge_model_sampling_count # type: ignore[assignment] if autorater_config_payload: - request_payload["autorater_config"] = autorater_config_payload + request_payload["autorater_config"] = autorater_config_payload # type: ignore[assignment] logger.debug("request_payload: %s", request_payload) @@ -650,6 +664,9 @@ def process( ), ) + if not eval_case.responses: + raise ValueError(f"EvalCase {eval_case.eval_case_id} has no responses.") + current_response_candidate = eval_case.responses[response_index] instance_for_custom_fn = eval_case.model_dump( @@ -663,29 +680,33 @@ def process( score = None explanation = None try: - custom_function_result = self.metric.custom_function(instance_for_custom_fn) - - if isinstance(custom_function_result, types.EvalCaseMetricResult): - return custom_function_result - elif ( - isinstance(custom_function_result, dict) - and "score" in custom_function_result - ): - score = custom_function_result["score"] - explanation = custom_function_result.get("explanation", None) - elif isinstance(custom_function_result, (float, int)): - score = custom_function_result - explanation = None - else: - error_msg = ( - f"CustomFunctionError({self.metric.custom_function}): Returned" - f" unexpected type {type(custom_function_result)}" + if self.metric.custom_function: + custom_function_result = self.metric.custom_function( + instance_for_custom_fn ) + if isinstance(custom_function_result, types.EvalCaseMetricResult): + return custom_function_result + elif ( + isinstance(custom_function_result, dict) + and "score" in custom_function_result + ): + score = custom_function_result["score"] + explanation = custom_function_result.get("explanation", None) + elif isinstance(custom_function_result, (float, int)): + score = custom_function_result + explanation = None + else: + error_msg = ( + f"CustomFunctionError({self.metric.custom_function}): Returned" + f" unexpected type {type(custom_function_result)}" + ) + except Exception as e: custom_function_name = ( self.metric.custom_function.__name__ - if hasattr(self.metric.custom_function, "__name__") + if self.metric.custom_function + and hasattr(self.metric.custom_function, "__name__") else "unknown_custom_function" ) error_msg = f"CustomFunctionError({custom_function_name}): {e}" @@ -735,10 +756,10 @@ def aggregate( def get_handler_for_metric( module: "evals.Evals", metric: types.Metric -) -> MetricHandlerType: +) -> Union[MetricHandlerType, Any]: """Returns a metric handler for the given metric.""" for condition, handler_class in _METRIC_HANDLER_MAPPING: - if condition(metric): + if condition(metric): # type: ignore[no-untyped-call] return handler_class(module=module, metric=metric) raise ValueError(f"Unsupported metric: {metric.name}") @@ -803,11 +824,16 @@ def _aggregate_metric_results( metric_name = handler.metric.name results_for_this_metric: list[types.EvalCaseMetricResult] = [] for case_result in eval_case_results: - for response_candidate_res in case_result.response_candidate_results: - if metric_name in response_candidate_res.metric_results: - results_for_this_metric.append( - response_candidate_res.metric_results[metric_name] - ) + if case_result.response_candidate_results: + for response_candidate_res in case_result.response_candidate_results: + if ( + response_candidate_res.metric_results + and metric_name in response_candidate_res.metric_results + and isinstance(metric_name, str) + ): + results_for_this_metric.append( + response_candidate_res.metric_results[metric_name] + ) if not results_for_this_metric: logger.warning( "No results found for metric '%s' to aggregate.", metric_name @@ -865,9 +891,9 @@ def compute_metrics_and_aggregate( """Computes metrics and aggregates them for a given evaluation run config.""" metric_handlers = [] all_futures = [] - results_by_case_response_metric = collections.defaultdict( - lambda: collections.defaultdict(dict) - ) + results_by_case_response_metric: collections.defaultdict[ + Any, collections.defaultdict[Any, dict[Any, Any]] + ] = collections.defaultdict(lambda: collections.defaultdict(dict)) submission_errors = [] execution_errors = [] case_indices_with_errors = set() diff --git a/vertexai/_genai/_evals_utils.py b/vertexai/_genai/_evals_utils.py index f415f040c1..573b7fd773 100644 --- a/vertexai/_genai/_evals_utils.py +++ b/vertexai/_genai/_evals_utils.py @@ -45,7 +45,7 @@ class GcsUtils: def __init__(self, api_client: BaseApiClient): self.api_client = api_client - self.storage_client = storage.Client( + self.storage_client = storage.Client( # type: ignore[attr-defined] project=self.api_client.project, credentials=self.api_client._credentials, ) @@ -65,7 +65,7 @@ def parse_gcs_path(self, gcs_path: str) -> tuple[str, str]: def upload_file_to_gcs(self, upload_gcs_path: str, filename: str) -> None: """Uploads the provided file to a Google Cloud Storage location.""" - storage.Blob.from_string( + storage.Blob.from_string( # type: ignore[attr-defined] uri=upload_gcs_path, client=self.storage_client ).upload_from_filename(filename) @@ -171,7 +171,7 @@ def upload_json_to_prefix( self.upload_json(data, full_gcs_path) return full_gcs_path - def read_file_contents(self, gcs_filepath: str) -> str: + def read_file_contents(self, gcs_filepath: str) -> Union[str, Any]: """Reads the contents of a file from Google Cloud Storage.""" bucket_name, blob_path = self.parse_gcs_path(gcs_filepath) @@ -236,7 +236,9 @@ def __init__(self, api_client: BaseApiClient): self.gcs_utils = GcsUtils(self.api_client) self.bigquery_utils = BigQueryUtils(self.api_client) - def _load_file(self, filepath: str, file_type: str) -> list[dict[str, Any]]: + def _load_file( + self, filepath: str, file_type: str + ) -> Union[list[dict[str, Any]], Any]: """Loads data from a file into a list of dictionaries.""" if filepath.startswith(GCS_PREFIX): df = self.gcs_utils.read_gcs_file_to_dataframe(filepath, file_type) @@ -254,7 +256,9 @@ def _load_file(self, filepath: str, file_type: str) -> list[dict[str, Any]]: " 'csv'." ) - def load(self, source: Union[str, "pd.DataFrame"]) -> list[dict[str, Any]]: + def load( + self, source: Union[str, "pd.DataFrame"] + ) -> Union[list[dict[str, Any]], Any]: """Loads dataset from various sources into a list of dictionaries.""" if isinstance(source, pd.DataFrame): return source.to_dict(orient="records") diff --git a/vertexai/_genai/_evals_visualization.py b/vertexai/_genai/_evals_visualization.py index d87bad6273..ab0a7c35ec 100644 --- a/vertexai/_genai/_evals_visualization.py +++ b/vertexai/_genai/_evals_visualization.py @@ -435,16 +435,17 @@ def display_evaluation_result( ): base_df = _preprocess_df_for_json(input_dataset_list[0].eval_dataset_df) processed_rows = [] - for _, row in base_df.iterrows(): - prompt_key = "request" if "request" in row else "prompt" - prompt_info = _extract_text_and_raw_json(row.get(prompt_key)) - processed_row = { - "prompt_display_text": prompt_info["display_text"], - "prompt_raw_json": prompt_info["raw_json"], - "reference": row.get("reference", ""), - } - processed_rows.append(processed_row) - metadata_payload["dataset"] = processed_rows + if base_df is not None: + for _, row in base_df.iterrows(): + prompt_key = "request" if "request" in row else "prompt" + prompt_info = _extract_text_and_raw_json(row.get(prompt_key)) + processed_row = { + "prompt_display_text": prompt_info["display_text"], + "prompt_raw_json": prompt_info["raw_json"], + "reference": row.get("reference", ""), + } + processed_rows.append(processed_row) + metadata_payload["dataset"] = processed_rows if "eval_case_results" in result_dump: for case_res in result_dump["eval_case_results"]: @@ -453,6 +454,7 @@ def display_evaluation_result( ): if ( resp_idx < len(input_dataset_list) + and input_dataset_list is not None and input_dataset_list[resp_idx].eval_dataset_df is not None ): df = _preprocess_df_for_json( @@ -486,18 +488,19 @@ def display_evaluation_result( and single_dataset.eval_dataset_df is not None ): processed_df = _preprocess_df_for_json(single_dataset.eval_dataset_df) - for _, row in processed_df.iterrows(): - prompt_key = "request" if "request" in row else "prompt" - prompt_info = _extract_text_and_raw_json(row.get(prompt_key)) - response_info = _extract_text_and_raw_json(row.get("response")) - processed_row = { - "prompt_display_text": prompt_info["display_text"], - "prompt_raw_json": prompt_info["raw_json"], - "reference": row.get("reference", ""), - "response_display_text": response_info["display_text"], - "response_raw_json": response_info["raw_json"], - } - processed_rows.append(processed_row) + if processed_df is not None: + for _, row in processed_df.iterrows(): + prompt_key = "request" if "request" in row else "prompt" + prompt_info = _extract_text_and_raw_json(row.get(prompt_key)) + response_info = _extract_text_and_raw_json(row.get("response")) + processed_row = { + "prompt_display_text": prompt_info["display_text"], + "prompt_raw_json": prompt_info["raw_json"], + "reference": row.get("reference", ""), + "response_display_text": response_info["display_text"], + "response_raw_json": response_info["raw_json"], + } + processed_rows.append(processed_row) metadata_payload["dataset"] = processed_rows if "eval_case_results" in result_dump and processed_rows: diff --git a/vertexai/_genai/agent_engines.py b/vertexai/_genai/agent_engines.py index e884eec5d5..61023f26bb 100644 --- a/vertexai/_genai/agent_engines.py +++ b/vertexai/_genai/agent_engines.py @@ -948,7 +948,7 @@ def _create( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -1008,7 +1008,7 @@ def _create_memory( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -1079,7 +1079,7 @@ def delete( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -1143,7 +1143,7 @@ def delete_memory( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -1209,7 +1209,7 @@ def _generate_memories( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -1265,7 +1265,7 @@ def _get( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -1327,7 +1327,7 @@ def get_memory( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -1377,7 +1377,7 @@ def _list( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -1433,7 +1433,7 @@ def _list_memories( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -1487,7 +1487,7 @@ def _get_agent_operation( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -1541,7 +1541,7 @@ def _get_memory_operation( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -1595,7 +1595,7 @@ def _get_generate_memories_operation( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -1651,7 +1651,7 @@ def _query( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -1717,7 +1717,7 @@ def _retrieve_memories( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -1773,7 +1773,7 @@ def _update( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -1833,7 +1833,7 @@ def _update_memory( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -1988,7 +1988,15 @@ def create( env_vars=config.env_vars, ) operation = self._create(config=api_config) - operation = self._await_operation(operation_name=operation.name) + if agent_engine is None: + poll_interval_seconds = 1 # Lightweight agent engine resource creation. + else: + poll_interval_seconds = 10 + operation = self._await_operation( + operation_name=operation.name, + poll_interval_seconds=poll_interval_seconds, + ) + agent = types.AgentEngine( api_client=self, api_async_client=AsyncAgentEngines(api_client_=self._api_client), @@ -2110,7 +2118,7 @@ def _generate_deployment_spec_or_raise( *, env_vars: Optional[dict[str, Union[str, Any]]] = None, ): - deployment_spec = {} + deployment_spec: dict[str, Any] = {} update_masks = [] if env_vars: deployment_spec["env"] = [] @@ -2380,6 +2388,8 @@ def create_memory( ) # We need to make a call to get the memory because the operation # response might not contain the relevant fields. + if not operation.response: + raise ValueError("Error retrieving memory.") operation.response = self.get_memory(name=operation.response.name) return operation @@ -2543,7 +2553,7 @@ async def _create( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -2605,7 +2615,7 @@ async def _create_memory( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -2678,7 +2688,7 @@ async def delete( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -2744,7 +2754,7 @@ async def delete_memory( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -2812,7 +2822,7 @@ async def _generate_memories( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -2870,7 +2880,7 @@ async def _get( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -2934,7 +2944,7 @@ async def get_memory( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -2986,7 +2996,7 @@ async def _list( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -3044,7 +3054,7 @@ async def _list_memories( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -3100,7 +3110,7 @@ async def _get_agent_operation( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -3156,7 +3166,7 @@ async def _get_memory_operation( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -3212,7 +3222,7 @@ async def _get_generate_memories_operation( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -3270,7 +3280,7 @@ async def _query( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -3338,7 +3348,7 @@ async def _retrieve_memories( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -3396,7 +3406,7 @@ async def _update( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -3458,7 +3468,7 @@ async def _update_memory( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None diff --git a/vertexai/_genai/client.py b/vertexai/_genai/client.py index 2d6ca147d4..eb70b677b1 100644 --- a/vertexai/_genai/client.py +++ b/vertexai/_genai/client.py @@ -1,3 +1,5 @@ +# type: ignore + # Copyright 2025 Google LLC # # Licensed under the Apache License, Version 2.0 (the "License"); diff --git a/vertexai/_genai/evals.py b/vertexai/_genai/evals.py index e14742cb3d..1913d7fb71 100644 --- a/vertexai/_genai/evals.py +++ b/vertexai/_genai/evals.py @@ -845,7 +845,7 @@ def _evaluate_instances( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -925,7 +925,7 @@ def run_inference( config = types.EvalRunInferenceConfig() if isinstance(config, dict): config = types.EvalRunInferenceConfig.model_validate(config) - return _evals_common._execute_inference( + return _evals_common._execute_inference( # type: ignore[no-any-return] api_client=self._api_client, model=model, src=src, @@ -964,11 +964,9 @@ def evaluate( config = types.EvaluateMethodConfig.model_validate(config) if isinstance(dataset, list): dataset = [ - ( - types.EvaluationDataset.model_validate(ds_item) - if isinstance(ds_item, dict) - else ds_item - ) + types.EvaluationDataset.model_validate(ds_item) + if isinstance(ds_item, dict) + else ds_item for ds_item in dataset ] else: @@ -1109,7 +1107,7 @@ async def _evaluate_instances( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None diff --git a/vertexai/_genai/prompt_optimizer.py b/vertexai/_genai/prompt_optimizer.py index 022a28c997..c1ec2e83f3 100644 --- a/vertexai/_genai/prompt_optimizer.py +++ b/vertexai/_genai/prompt_optimizer.py @@ -24,7 +24,6 @@ from google.genai import _api_module from google.genai import _common -from google.genai import types as genai_types from google.genai._common import get_value_by_path as getv from google.genai._common import set_value_by_path as setv @@ -409,7 +408,7 @@ def _optimize_dummy( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -429,8 +428,8 @@ def _optimize_dummy( return_value = types.OptimizeResponse._from_response( response=response_dict, kwargs=parameter_model.model_dump() ) - self._api_client._verify_response(return_value) + self._api_client._verify_response(return_value) return return_value def _create_custom_job_resource( @@ -463,7 +462,7 @@ def _create_custom_job_resource( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -483,8 +482,8 @@ def _create_custom_job_resource( return_value = types.CustomJob._from_response( response=response_dict, kwargs=parameter_model.model_dump() ) - self._api_client._verify_response(return_value) + self._api_client._verify_response(return_value) return return_value def _get_custom_job( @@ -514,7 +513,7 @@ def _get_custom_job( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -534,8 +533,8 @@ def _get_custom_job( return_value = types.CustomJob._from_response( response=response_dict, kwargs=parameter_model.model_dump() ) - self._api_client._verify_response(return_value) + self._api_client._verify_response(return_value) return return_value """Prompt Optimizer PO-Data.""" @@ -587,9 +586,15 @@ def optimize( method: The method for optimizing multiple prompts. config: The config to use. Config consists of the following fields: - config_path: The gcs path to the config file, e.g. - gs://bucket/config.json. - service_account: The service account to - use for the job. - wait_for_completion: Optional. Whether to wait - for the job to complete. Default is True. + gs://bucket/config.json. - service_account: Optional. The service + account to use for the custom job. Cannot be provided at the same + time as 'service_account_project_number'. - + service_account_project_number: Optional. The project number used to + construct the default service account: + f"{service_account_project_number}-compute@developer.gserviceaccount.com" + Cannot be provided at the same time as 'service_account'. - + wait_for_completion: Optional. Whether to wait for the job to + complete. Default is True. """ if method != "vapo": @@ -626,10 +631,28 @@ def optimize( } ] + if config.service_account: + if config.service_account_project_number: + raise ValueError( + "Only one of service_account or" + " service_account_project_number can be provided." + ) + service_account = config.service_account + elif config.project_number: + service_account = ( + f"{config.service_account_project_number}" + "-compute@developer.gserviceaccount.com" + ) + else: + raise ValueError( + "Either service_account or service_account_project_number is" + " required." + ) + job_spec = types.CustomJobSpec( worker_pool_specs=worker_pool_specs, base_output_directory=types.GcsDestination(output_uri_prefix=bucket), - service_account=config.service_account, + service_account=service_account, ) custom_job = types.CustomJob( @@ -643,6 +666,8 @@ def optimize( # Get the job resource name job_resource_name = job.name + if not job_resource_name: + raise ValueError(f"Error creating job: {job}") job_id = job_resource_name.split("/")[-1] logger.info("Job created: %s", job.name) @@ -684,7 +709,7 @@ async def _optimize_dummy( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -706,8 +731,8 @@ async def _optimize_dummy( return_value = types.OptimizeResponse._from_response( response=response_dict, kwargs=parameter_model.model_dump() ) - self._api_client._verify_response(return_value) + self._api_client._verify_response(return_value) return return_value async def _create_custom_job_resource( @@ -740,7 +765,7 @@ async def _create_custom_job_resource( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -762,8 +787,8 @@ async def _create_custom_job_resource( return_value = types.CustomJob._from_response( response=response_dict, kwargs=parameter_model.model_dump() ) - self._api_client._verify_response(return_value) + self._api_client._verify_response(return_value) return return_value async def _get_custom_job( @@ -793,7 +818,7 @@ async def _get_custom_job( # TODO: remove the hack that pops config. request_dict.pop("config", None) - http_options: Optional[genai_types.HttpOptions] = None + http_options: Optional[types.HttpOptions] = None if ( parameter_model.config is not None and parameter_model.config.http_options is not None @@ -815,6 +840,6 @@ async def _get_custom_job( return_value = types.CustomJob._from_response( response=response_dict, kwargs=parameter_model.model_dump() ) - self._api_client._verify_response(return_value) + self._api_client._verify_response(return_value) return return_value diff --git a/vertexai/_genai/types.py b/vertexai/_genai/types.py index 2677db0c00..ba8d68a2fd 100644 --- a/vertexai/_genai/types.py +++ b/vertexai/_genai/types.py @@ -5210,6 +5210,9 @@ class PromptOptimizerVAPOConfig(_common.BaseModel): default=None, description="""The gcs path to the config file.""" ) service_account: Optional[str] = Field(default=None, description="""""") + service_account_project_number: Optional[Union[int, str]] = Field( + default=None, description="""""" + ) wait_for_completion: Optional[bool] = Field(default=True, description="""""") @@ -5222,6 +5225,9 @@ class PromptOptimizerVAPOConfigDict(TypedDict, total=False): service_account: Optional[str] """""" + service_account_project_number: Optional[Union[int, str]] + """""" + wait_for_completion: Optional[bool] """""" @@ -5248,7 +5254,7 @@ def text_must_not_be_empty(cls, value: str) -> str: ) return value - @computed_field + @computed_field # type: ignore[prop-decorator] @property def variables(self) -> set[str]: return set(re.findall(self._VARIABLE_NAME_REGEX, self.text)) @@ -5259,11 +5265,11 @@ def _split_template_by_variables(self) -> list[Tuple[str, str]]: for match in re.finditer(self._VARIABLE_NAME_REGEX, self.text): start, end = match.span() var_name = match.group(1) - if start > last_end: + if start > last_end and self.text: parts.append(("text", self.text[last_end:start])) parts.append(("var", var_name)) last_end = end - if last_end < len(self.text): + if last_end < len(self.text) and self.text: parts.append(("text", self.text[last_end:])) return parts @@ -5336,7 +5342,7 @@ def _parse_multimodal_json_string_into_parts( """Parses a multimodal JSON string and returns its list of Parts.""" try: content = genai_types.Content.model_validate_json(value) - return content.parts + return content.parts if content.parts is not None else [genai_types.Part()] except Exception: return [genai_types.Part(text=value)] @@ -5441,7 +5447,7 @@ def assemble(self, **kwargs: Any) -> str: return final_content_obj.model_dump_json(exclude_none=True) def __str__(self) -> str: - return self.text + return self.text if self.text else "" def __repr__(self) -> str: return f"PromptTemplate(text='{self.text}')" @@ -5615,7 +5621,7 @@ def _prepare_fields_and_construct_text(cls, data: Any) -> Any: def __str__(self) -> str: """Returns the fully constructed prompt template text.""" - return self.text + return self.text if self.text else "" class PromptTemplateDict(TypedDict, total=False): @@ -6512,9 +6518,13 @@ class AgentEngine(_common.BaseModel): model_config = ConfigDict(extra="allow") def __repr__(self) -> str: - return f"AgentEngine(api_resource.name='{self.api_resource.name}')" + return ( + f"AgentEngine(api_resource.name='{self.api_resource.name}')" + if self.api_resource is not None + else "AgentEngine(api_resource.name=None)" + ) - def operation_schemas(self) -> list[Dict[str, Any]]: + def operation_schemas(self) -> Optional[list[Dict[str, Any]]]: """Returns the schemas of all registered operations for the agent.""" if not isinstance(self.api_resource, ReasoningEngine): raise ValueError("api_resource is not initialized.") @@ -6526,7 +6536,7 @@ def delete( self, force: bool = False, config: Optional[DeleteAgentEngineConfigOrDict] = None, - ): + ) -> None: """Deletes the agent engine. Args: @@ -6539,7 +6549,7 @@ def delete( """ if not isinstance(self.api_resource, ReasoningEngine): raise ValueError("api_resource is not initialized.") - self.api_client.delete(name=self.api_resource.name, force=force, config=config) + self.api_client.delete(name=self.api_resource.name, force=force, config=config) # type: ignore[union-attr] class AgentEngineDict(TypedDict, total=False): diff --git a/vertexai/agent_engines/__init__.py b/vertexai/agent_engines/__init__.py index 19aa4113d6..025643eb96 100644 --- a/vertexai/agent_engines/__init__.py +++ b/vertexai/agent_engines/__init__.py @@ -70,6 +70,7 @@ def create( env_vars: Optional[ Union[Sequence[str], Dict[str, Union[str, aip_types.SecretRef]]] ] = None, + build_options: Optional[Dict[str, Sequence[str]]] = None, ) -> AgentEngine: """Creates a new Agent Engine. @@ -86,6 +87,9 @@ def create( |-- user_code/ | |-- utils.py | |-- ... + |-- installation_scripts/ + | |-- install_package.sh + | |-- ... |-- ... To build an Agent Engine with the above files, run: @@ -105,6 +109,12 @@ def create( "./user_src_dir/user_code", # a directory ... ], + build_options={ + "installation": [ + "./user_src_dir/installation_scripts/install_package.sh", + ... + ], + }, ) Args: @@ -131,6 +141,9 @@ def create( a valid key to `os.environ`. If it is a dictionary, the keys are the environment variable names, and the values are the corresponding values. + build_options (Dict[str, Sequence[str]]): + Optional. The build options for the Agent Engine. This includes + options such as installation scripts. Returns: AgentEngine: The Agent Engine that was created. @@ -153,6 +166,7 @@ def create( gcs_dir_name=gcs_dir_name, extra_packages=extra_packages, env_vars=env_vars, + build_options=build_options, ) @@ -237,6 +251,7 @@ def update( env_vars: Optional[ Union[Sequence[str], Dict[str, Union[str, aip_types.SecretRef]]] ] = None, + build_options: Optional[Dict[str, Sequence[str]]] = None, ) -> "AgentEngine": """Updates an existing Agent Engine. @@ -280,6 +295,9 @@ def update( a valid key to `os.environ`. If it is a dictionary, the keys are the environment variable names, and the values are the corresponding values. + build_options (Dict[str, Sequence[str]]): + Optional. The build options for the Agent Engine. This includes + options such as installation scripts. Returns: AgentEngine: The Agent Engine that was updated. @@ -290,8 +308,8 @@ def update( FileNotFoundError: If `extra_packages` includes a file or directory that does not exist. ValueError: if none of `display_name`, `description`, - `requirements`, `extra_packages`, or `agent_engine` were - specified. + `requirements`, `extra_packages`, `agent_engine`, or `build_options` + were specified. IOError: If requirements is a string that corresponds to a nonexistent file. """ @@ -304,6 +322,7 @@ def update( gcs_dir_name=gcs_dir_name, extra_packages=extra_packages, env_vars=env_vars, + build_options=build_options, ) diff --git a/vertexai/agent_engines/_agent_engines.py b/vertexai/agent_engines/_agent_engines.py index f76dcb43e3..4f3b096cea 100644 --- a/vertexai/agent_engines/_agent_engines.py +++ b/vertexai/agent_engines/_agent_engines.py @@ -88,6 +88,7 @@ ) _AGENT_FRAMEWORK_ATTR = "agent_framework" _DEFAULT_AGENT_FRAMEWORK = "custom" +_BUILD_OPTIONS_INSTALLATION = "installation_scripts" _DEFAULT_METHOD_NAME_MAP = { _STANDARD_API_MODE: _DEFAULT_METHOD_NAME, _ASYNC_API_MODE: _DEFAULT_ASYNC_METHOD_NAME, @@ -331,6 +332,7 @@ def create( env_vars: Optional[ Union[Sequence[str], Dict[str, Union[str, aip_types.SecretRef]]] ] = None, + build_options: Optional[Dict[str, Sequence[str]]] = None, ) -> "AgentEngine": """Creates a new Agent Engine. @@ -347,6 +349,9 @@ def create( |-- user_code/ | |-- utils.py | |-- ... + |-- installation_scripts/ + | |-- install_package.sh + | |-- ... |-- ... To build an Agent Engine with the above files, run: @@ -366,6 +371,12 @@ def create( "./user_src_dir/user_code", # a directory ... ], + build_options={ + "installation_scripts": [ + "./user_src_dir/installation_scripts/install_package.sh", + ... + ], + }, ) Args: @@ -392,6 +403,14 @@ def create( a valid key to `os.environ`. If it is a dictionary, the keys are the environment variable names, and the values are the corresponding values. + build_options (Dict[str, Sequence[str]]): + Optional. The build options for the Agent Engine. + The following keys are supported: + - installation_scripts: + Optional. The paths to the installation scripts to be + executed in the Docker image. + The scripts must be located in the `installation_scripts` + subdirectory and the path must be added to `extra_packages`. Returns: AgentEngine: The Agent Engine that was created. @@ -430,7 +449,10 @@ def create( agent_engine=agent_engine, requirements=requirements, ) - extra_packages = _validate_extra_packages_or_raise(extra_packages) + extra_packages = _validate_extra_packages_or_raise( + extra_packages=extra_packages, + build_options=build_options, + ) sdk_resource = cls.__new__(cls) base.VertexAiResourceNounWithFutureManager.__init__(sdk_resource) @@ -539,6 +561,7 @@ def update( env_vars: Optional[ Union[Sequence[str], Dict[str, Union[str, aip_types.SecretRef]]] ] = None, + build_options: Optional[Dict[str, Sequence[str]]] = None, ) -> "AgentEngine": """Updates an existing Agent Engine. @@ -580,6 +603,14 @@ def update( a valid key to `os.environ`. If it is a dictionary, the keys are the environment variable names, and the values are the corresponding values. + build_options (Dict[str, Sequence[str]]): + Optional. The build options for the Agent Engine. + The following keys are supported: + - installation_scripts: + Optional. The paths to the installation scripts to be + executed in the Docker image. + The scripts must be located in the `installation_scripts` + subdirectory and the path must be added to `extra_packages`. Returns: AgentEngine: The Agent Engine that was updated. @@ -614,12 +645,13 @@ def update( display_name, description, env_vars, + build_options, ] ): raise ValueError( "At least one of `agent_engine`, `requirements`, " - "`extra_packages`, `display_name`, `description`, or `env_vars` " - "must be specified." + "`extra_packages`, `display_name`, `description`, " + "`env_vars`, or `build_options` must be specified." ) if requirements is not None: requirements = _validate_requirements_or_raise( @@ -627,7 +659,10 @@ def update( requirements=requirements, ) if extra_packages is not None: - extra_packages = _validate_extra_packages_or_raise(extra_packages) + extra_packages = _validate_extra_packages_or_raise( + extra_packages=extra_packages, + build_options=build_options, + ) if agent_engine is not None: agent_engine = _validate_agent_engine_or_raise(agent_engine) @@ -885,9 +920,17 @@ def _validate_requirements_or_raise( return requirements -def _validate_extra_packages_or_raise(extra_packages: Sequence[str]) -> Sequence[str]: +def _validate_extra_packages_or_raise( + extra_packages: Sequence[str], + build_options: Optional[Dict[str, Sequence[str]]] = None, +) -> Sequence[str]: """Tries to validates the extra packages.""" extra_packages = extra_packages or [] + if build_options and _BUILD_OPTIONS_INSTALLATION in build_options: + _utils.validate_installation_scripts_or_raise( + script_paths=build_options[_BUILD_OPTIONS_INSTALLATION], + extra_packages=extra_packages, + ) for extra_package in extra_packages: if not os.path.exists(extra_package): raise FileNotFoundError( diff --git a/vertexai/agent_engines/_utils.py b/vertexai/agent_engines/_utils.py index e5363992aa..4cea417fe3 100644 --- a/vertexai/agent_engines/_utils.py +++ b/vertexai/agent_engines/_utils.py @@ -116,6 +116,7 @@ class _RequirementsValidationResult(TypedDict): _WARNINGS_KEY = "warnings" _WARNING_MISSING = "missing" _WARNING_INCOMPATIBLE = "incompatible" +_INSTALLATION_SUBDIR = "installation_scripts" def to_proto( @@ -767,3 +768,64 @@ def _import_autogen_tools_or_warn() -> Optional[types.ModuleType]: "call `pip install google-cloud-aiplatform[ag2]`." ) return None + + +def validate_installation_scripts_or_raise( + script_paths: Sequence[str], + extra_packages: Sequence[str], +): + """Validates the installation scripts' path explicitly provided by the user. + + Args: + script_paths (Sequence[str]): + Required. The paths to the installation scripts. + extra_packages (Sequence[str]): + Required. The extra packages to be updated. + + Raises: + ValueError: If a user-defined script is not under the expected + subdirectory, or not in `extra_packages`, or if an extra package is + in the installation scripts subdirectory, but is not specified as an + installation script. + """ + for script_path in script_paths: + if not script_path.startswith(_INSTALLATION_SUBDIR): + LOGGER.warning( + f"User-defined installation script '{script_path}' is not in " + f"the expected '{_INSTALLATION_SUBDIR}' subdirectory. " + f"Ensure it is placed in '{_INSTALLATION_SUBDIR}' within your " + f"`extra_packages`." + ) + raise ValueError( + f"Required installation script '{script_path}' " + f"is not under '{_INSTALLATION_SUBDIR}'" + ) + + if script_path not in extra_packages: + LOGGER.warning( + f"User-defined installation script '{script_path}' is not in " + f"extra_packages. Ensure it is added to `extra_packages`." + ) + raise ValueError( + f"User-defined installation script '{script_path}' " + f"does not exist in `extra_packages`" + ) + + for extra_package in extra_packages: + if ( + extra_package.startswith(_INSTALLATION_SUBDIR) + and extra_package not in script_paths + ): + LOGGER.warning( + f"Extra package '{extra_package}' is in the installation " + "scripts subdirectory, but is not specified as an installation " + "script in `build_options`. " + "Ensure it is added to installation_scripts for " + "automatic execution." + ) + raise ValueError( + f"Extra package '{extra_package}' is in the installation " + "scripts subdirectory, but is not specified as an installation " + "script in `build_options`." + ) + return