feat: Make count_tokens generally available on TextEmbeddingModel.

vertex-sdk-bot · copybara-github · commit efb84134094a · 2024-07-19T14:57:11.000-07:00
PiperOrigin-RevId: 654133506
diff --git a/tests/unit/aiplatform/test_language_models.py b/tests/unit/aiplatform/test_language_models.py
@@ -4526,7 +4526,48 @@ def test_text_embedding(self):
                     == expected_embedding["statistics"]["truncated"]
                 )
 
-    def test_text_embedding_preview_count_tokens(self):
+    def test_text_embedding_count_tokens_ga(self):
+        """Tests count_tokens on the GA TextEmbeddingModel."""
+        aiplatform.init(
+            project=_TEST_PROJECT,
+            location=_TEST_LOCATION,
+        )
+        with mock.patch.object(
+            target=model_garden_service_client.ModelGardenServiceClient,
+            attribute="get_publisher_model",
+            return_value=gca_publisher_model.PublisherModel(
+                _TEXT_EMBEDDING_GECKO_PUBLISHER_MODEL_DICT
+            ),
+        ):
+            model = language_models.TextEmbeddingModel.from_pretrained(
+                "textembedding-gecko@001"
+            )
+
+            gca_count_tokens_response = (
+                gca_prediction_service_v1beta1.CountTokensResponse(
+                    total_tokens=_TEST_COUNT_TOKENS_RESPONSE["total_tokens"],
+                    total_billable_characters=_TEST_COUNT_TOKENS_RESPONSE[
+                        "total_billable_characters"
+                    ],
+                )
+            )
+
+            with mock.patch.object(
+                target=prediction_service_client_v1beta1.PredictionServiceClient,
+                attribute="count_tokens",
+                return_value=gca_count_tokens_response,
+            ):
+                response = model.count_tokens(["What is life?"])
+
+                assert (
+                    response.total_tokens == _TEST_COUNT_TOKENS_RESPONSE["total_tokens"]
+                )
+                assert (
+                    response.total_billable_characters
+                    == _TEST_COUNT_TOKENS_RESPONSE["total_billable_characters"]
+                )
+
+    def test_text_embedding_count_tokens_preview(self):
         """Tests the text embedding model."""
         aiplatform.init(
             project=_TEST_PROJECT,
diff --git a/vertexai/language_models/_language_models.py b/vertexai/language_models/_language_models.py
@@ -2417,7 +2417,11 @@ class _TunableTextEmbeddingModelMixin(_PreviewTunableTextEmbeddingModelMixin):
     pass
 
 
-class TextEmbeddingModel(_TextEmbeddingModel, _TunableTextEmbeddingModelMixin):
+class TextEmbeddingModel(
+    _TextEmbeddingModel,
+    _TunableTextEmbeddingModelMixin,
+    _CountTokensMixin,
+):
     __module__ = "vertexai.language_models"