
Commit a4b6c60

speedstorm1 authored and copybara-github committed
feat: add support for version 2.33 for RoV Bigquery read/write, remove dead code from version 2.4
PiperOrigin-RevId: 671554025
1 parent 58f1294 commit a4b6c60

File tree: 7 files changed, +263 -344 lines changed


google/cloud/aiplatform/vertex_ray/__init__.py

+2 -2
@@ -19,7 +19,7 @@
 import sys
 
 from google.cloud.aiplatform.vertex_ray.bigquery_datasource import (
-    BigQueryDatasource,
+    _BigQueryDatasource,
 )
 from google.cloud.aiplatform.vertex_ray.client_builder import (
     VertexRayClientBuilder as ClientBuilder,
@@ -52,7 +52,7 @@
 )
 
 __all__ = (
-    "BigQueryDatasource",
+    "_BigQueryDatasource",
    "data",
    "ClientBuilder",
    "get_job_submission_client_cluster_info",
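
Note on the rename above: exporting the class as _BigQueryDatasource marks it as internal to the package. A minimal sketch of the effect on caller code follows (the "before" import is hypothetical caller code, not part of this commit); reads and writes are presumably meant to go through the public helpers in the data submodule instead of the datasource class directly.

# Before: the datasource class was exported under its public name.
# from google.cloud.aiplatform.vertex_ray import BigQueryDatasource

# After this commit, only the underscored (internal) name is exported:
from google.cloud.aiplatform.vertex_ray import _BigQueryDatasource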

google/cloud/aiplatform/vertex_ray/bigquery_datasink.py

+100 -109
@@ -35,11 +35,8 @@
 from ray.data._internal.remote_fn import cached_remote_fn
 from ray.data.block import Block, BlockAccessor
 
-try:
-    from ray.data.datasource.datasink import Datasink
-except ImportError:
-    # If datasink cannot be imported, Ray 2.9.3 is not installed
-    Datasink = None
+from ray.data.datasource.datasink import Datasink
+
 
 DEFAULT_MAX_RETRY_CNT = 10
 RATE_LIMIT_EXCEEDED_SLEEP_TIME = 11
@@ -49,110 +46,104 @@
     gapic_version=_BQ_GAPIC_VERSION, user_agent=f"ray-on-vertex/{_BQ_GAPIC_VERSION}"
 )
 
-if Datasink is None:
-    _BigQueryDatasink = None
-else:
-    # BigQuery write for Ray 2.9.3
-    class _BigQueryDatasink(Datasink):
-        def __init__(
-            self,
-            dataset: str,
-            project_id: str = None,
-            max_retry_cnt: int = DEFAULT_MAX_RETRY_CNT,
-            overwrite_table: Optional[bool] = True,
-        ) -> None:
-            self.dataset = dataset
-            self.project_id = project_id or initializer.global_config.project
-            self.max_retry_cnt = max_retry_cnt
-            self.overwrite_table = overwrite_table
-
-        def on_write_start(self) -> None:
-            # Set up datasets to write
-            client = bigquery.Client(project=self.project_id, client_info=bq_info)
-            dataset_id = self.dataset.split(".", 1)[0]
-            try:
-                client.get_dataset(dataset_id)
-            except exceptions.NotFound:
-                client.create_dataset(f"{self.project_id}.{dataset_id}", timeout=30)
-                print("[Ray on Vertex AI]: Created dataset " + dataset_id)
-
-            # Delete table if overwrite_table is True
-            if self.overwrite_table:
-                print(
-                    f"[Ray on Vertex AI]: Attempting to delete table {self.dataset}"
-                    + " if it already exists since kwarg overwrite_table = True."
-                )
-                client.delete_table(
-                    f"{self.project_id}.{self.dataset}", not_found_ok=True
-                )
-            else:
-                print(
-                    "[Ray on Vertex AI]: The write will append to table "
-                    + f"{self.dataset} if it already exists "
-                    + "since kwarg overwrite_table = False."
-                )
-
-        def write(
-            self,
-            blocks: Iterable[Block],
-            ctx: TaskContext,
-        ) -> Any:
-            def _write_single_block(
-                block: Block, project_id: str, dataset: str
-            ) -> None:
-                block = BlockAccessor.for_block(block).to_arrow()
-
-                client = bigquery.Client(project=project_id, client_info=bq_info)
-                job_config = bigquery.LoadJobConfig(autodetect=True)
-                job_config.source_format = bigquery.SourceFormat.PARQUET
-                job_config.write_disposition = bigquery.WriteDisposition.WRITE_APPEND
-
-                with tempfile.TemporaryDirectory() as temp_dir:
-                    fp = os.path.join(temp_dir, f"block_{uuid.uuid4()}.parquet")
-                    pq.write_table(block, fp, compression="SNAPPY")
-
-                    retry_cnt = 0
-                    while retry_cnt <= self.max_retry_cnt:
-                        with open(fp, "rb") as source_file:
-                            job = client.load_table_from_file(
-                                source_file, dataset, job_config=job_config
-                            )
-                        try:
-                            logging.info(job.result())
-                            break
-                        except exceptions.Forbidden as e:
-                            retry_cnt += 1
-                            if retry_cnt > self.max_retry_cnt:
-                                break
-                            print(
-                                "[Ray on Vertex AI]: A block write encountered"
-                                + f" a rate limit exceeded error {retry_cnt} time(s)."
-                                + " Sleeping to try again."
-                            )
-                            logging.debug(e)
-                            time.sleep(RATE_LIMIT_EXCEEDED_SLEEP_TIME)
-
-                    # Raise exception if retry_cnt exceeds max_retry_cnt
-                    if retry_cnt > self.max_retry_cnt:
-                        print(
-                            f"[Ray on Vertex AI]: Maximum ({self.max_retry_cnt}) retry count exceeded."
-                            + " Ray will attempt to retry the block write via fault tolerance."
-                            + " For more information, see https://docs.ray.io/en/latest/ray-core/fault_tolerance/tasks.html"
-                        )
-                        raise RuntimeError(
-                            f"[Ray on Vertex AI]: Write failed due to {retry_cnt}"
-                            + " repeated API rate limit exceeded responses. Consider"
-                            + " specifiying the max_retry_cnt kwarg with a higher value."
-                        )
-
-            _write_single_block = cached_remote_fn(_write_single_block)
 
-            # Launch a remote task for each block within this write task
-            ray.get(
-                [
-                    _write_single_block.remote(block, self.project_id, self.dataset)
-                    for block in blocks
-                ]
+# BigQuery write for Ray 2.33.0 and 2.9.3
+class _BigQueryDatasink(Datasink):
+    def __init__(
+        self,
+        dataset: str,
+        project_id: Optional[str] = None,
+        max_retry_cnt: int = DEFAULT_MAX_RETRY_CNT,
+        overwrite_table: Optional[bool] = True,
+    ) -> None:
+        self.dataset = dataset
+        self.project_id = project_id or initializer.global_config.project
+        self.max_retry_cnt = max_retry_cnt
+        self.overwrite_table = overwrite_table
+
+    def on_write_start(self) -> None:
+        # Set up datasets to write
+        client = bigquery.Client(project=self.project_id, client_info=bq_info)
+        dataset_id = self.dataset.split(".", 1)[0]
+        try:
+            client.get_dataset(dataset_id)
+        except exceptions.NotFound:
+            client.create_dataset(f"{self.project_id}.{dataset_id}", timeout=30)
+            print("[Ray on Vertex AI]: Created dataset " + dataset_id)
+
+        # Delete table if overwrite_table is True
+        if self.overwrite_table:
+            print(
+                f"[Ray on Vertex AI]: Attempting to delete table {self.dataset}"
+                + " if it already exists since kwarg overwrite_table = True."
+            )
+            client.delete_table(f"{self.project_id}.{self.dataset}", not_found_ok=True)
+        else:
+            print(
+                "[Ray on Vertex AI]: The write will append to table "
+                + f"{self.dataset} if it already exists "
+                + "since kwarg overwrite_table = False."
             )
 
-            return "ok"
+    def write(
+        self,
+        blocks: Iterable[Block],
+        ctx: TaskContext,
+    ) -> Any:
+        def _write_single_block(block: Block, project_id: str, dataset: str) -> None:
+            block = BlockAccessor.for_block(block).to_arrow()
+
+            client = bigquery.Client(project=project_id, client_info=bq_info)
+            job_config = bigquery.LoadJobConfig(autodetect=True)
+            job_config.source_format = bigquery.SourceFormat.PARQUET
+            job_config.write_disposition = bigquery.WriteDisposition.WRITE_APPEND
+
+            with tempfile.TemporaryDirectory() as temp_dir:
+                fp = os.path.join(temp_dir, f"block_{uuid.uuid4()}.parquet")
+                pq.write_table(block, fp, compression="SNAPPY")
+
+                retry_cnt = 0
+                while retry_cnt <= self.max_retry_cnt:
+                    with open(fp, "rb") as source_file:
+                        job = client.load_table_from_file(
+                            source_file, dataset, job_config=job_config
+                        )
+                    try:
+                        logging.info(job.result())
+                        break
+                    except exceptions.Forbidden as e:
+                        retry_cnt += 1
+                        if retry_cnt > self.max_retry_cnt:
+                            break
+                        print(
+                            "[Ray on Vertex AI]: A block write encountered"
+                            + f" a rate limit exceeded error {retry_cnt} time(s)."
+                            + " Sleeping to try again."
+                        )
+                        logging.debug(e)
+                        time.sleep(RATE_LIMIT_EXCEEDED_SLEEP_TIME)
+
+                # Raise exception if retry_cnt exceeds max_retry_cnt
+                if retry_cnt > self.max_retry_cnt:
+                    print(
+                        f"[Ray on Vertex AI]: Maximum ({self.max_retry_cnt}) retry count exceeded."
+                        + " Ray will attempt to retry the block write via fault tolerance."
+                        + " For more information, see https://docs.ray.io/en/latest/ray-core/fault_tolerance/tasks.html"
+                    )
+                    raise RuntimeError(
+                        f"[Ray on Vertex AI]: Write failed due to {retry_cnt}"
+                        + " repeated API rate limit exceeded responses. Consider"
+                        + " specifiying the max_retry_cnt kwarg with a higher value."
+                    )
+
+        _write_single_block = cached_remote_fn(_write_single_block)
+
+        # Launch a remote task for each block within this write task
+        ray.get(
+            [
+                _write_single_block.remote(block, self.project_id, self.dataset)
+                for block in blocks
+            ]
+        )
+
+        return "ok"
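
For context, a minimal sketch of how the rewritten datasink might be driven from a Ray Dataset (not part of this commit; assumes Ray >= 2.9 where Dataset.write_datasink is available, an initialized aiplatform project supplying the default project_id, and a hypothetical "my_dataset.my_table" target):

import ray
from google.cloud.aiplatform.vertex_ray.bigquery_datasink import _BigQueryDatasink

# Build a small in-memory dataset; each block is written via one BigQuery load job.
ds = ray.data.from_items([{"id": 1, "name": "a"}, {"id": 2, "name": "b"}])

sink = _BigQueryDatasink(
    dataset="my_dataset.my_table",  # hypothetical "<dataset>.<table>" in the active project
    max_retry_cnt=10,               # retries per block on rate-limit (Forbidden) errors
    overwrite_table=True,           # drop any existing table first instead of appending
)
ds.write_datasink(sink)             # on_write_start() runs once, then write() per write task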
