Skip to content

Commit b91a8aa

Browse files
vertex-sdk-bot authored and copybara-github committed
fix: prediction stream raw predict url for non dedicated endpoint
PiperOrigin-RevId: 726231575
1 parent 0d73929 commit b91a8aa

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

google/cloud/aiplatform/models.py

+2-1
Original file line number | Diff line number | Diff line change
@@ -2583,6 +2583,7 @@ def stream_raw_predict(
25832583
timeout: Optional[float] = None,
25842584
) -> Iterator[requests.models.Response]:
25852585
"""Makes a streaming prediction request using arbitrary headers.
2586+
For custom model, this method is only supported for dedicated endpoint.
25862587
25872588
Example usage:
25882589
```
@@ -2632,7 +2633,7 @@ def stream_raw_predict(
26322633
if self.stream_raw_predict_request_url is None:
26332634
self.stream_raw_predict_request_url = f"https://{self.location}-{constants.base.API_BASE_PATH}/v1/projects/{self.project}/locations/{self.location}/endpoints/{self.name}:streamRawPredict"
26342635

2635-
url = self.raw_predict_request_url
2636+
url = self.stream_raw_predict_request_url
26362637

26372638
if use_dedicated_endpoint:
26382639
self._sync_gca_resource_if_skipped()

0 commit comments

Comments
 (0)