
Commit f7ef5df

WIP: expose dimensions in the Embedders
1 parent 2d7abb8 commit f7ef5df

11 files changed: +73, -26 lines changed

examples/customize/embeddings/cohere_embeddings.py

Lines changed: 8 additions & 2 deletions

@@ -4,8 +4,14 @@
 api_key = None

 embeder = CohereEmbeddings(
-    model="embed-english-v3.0",
+    model="embed-v4.0",
     api_key=api_key,
 )
-res = embeder.embed_query("my question")
+res = embeder.embed_query(
+    "my question",
+    # optionally, set output dimensions if it's supported by the model
+    dimensions=256,
+    input_type="search_query",
+)
+print("Embedding dimensions", len(res))
 print(res[:10])
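
The same CohereEmbeddings instance can also embed document text. The sketch below is not part of this commit; it assumes Cohere's "search_document" input type, forwarded to the client through **kwargs exactly like the input_type="search_query" argument above.

# Sketch only: embed a document chunk with the embedder configured above.
doc_embedding = embeder.embed_query(
    "Neo4j is a graph database.",
    dimensions=256,
    input_type="search_document",
)
print("Embedding dimensions", len(doc_embedding))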

examples/customize/embeddings/custom_embeddings.py

Lines changed: 1 addition & 1 deletion

@@ -8,7 +8,7 @@ class CustomEmbeddings(Embedder):
     def __init__(self, dimension: int = 10, **kwargs: Any):
         self.dimension = dimension

-    def embed_query(self, input: str) -> list[float]:
+    def embed_query(self, input: str, **kwargs) -> list[float]:
         return [random.random() for _ in range(self.dimension)]

examples/customize/embeddings/mistalai_embeddings.py

Lines changed: 6 additions & 1 deletion

@@ -8,5 +8,10 @@
 api_key = None

 embeder = MistralAIEmbeddings(model="mistral-embed", api_key=api_key)
-res = embeder.embed_query("my question")
+res = embeder.embed_query(
+    "my question",
+    # optionally, set output dimensions
+    dimensions=256,
+)
+print("Embedding dimensions", len(res))
 print(res[:10])

examples/customize/embeddings/openai_embeddings.py

Lines changed: 8 additions & 2 deletions

@@ -7,6 +7,12 @@
 # set api key here on in the OPENAI_API_KEY env var
 api_key = None

-embeder = OpenAIEmbeddings(model="text-embedding-ada-002", api_key=api_key)
-res = embeder.embed_query("my question")
+embeder = OpenAIEmbeddings(model="text-embedding-3-small", api_key=api_key)
+res = embeder.embed_query(
+    "my question",
+    # optionally, set output dimensions
+    # dimensions=256,
+)
+
+print("Embedding dimensions", len(res))
 print(res[:10])
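
For reference, enabling the commented-out argument shrinks the output. The sketch below is not part of the commit and assumes text-embedding-3-small honours the dimensions parameter, which OpenAI documents for the text-embedding-3 family (native size 1536).

# Sketch: request a reduced output size from the same embedder.
res_small = embeder.embed_query("my question", dimensions=256)
print("Embedding dimensions", len(res_small))  # expected 256 rather than the native 1536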

examples/customize/embeddings/vertexai_embeddings.py

Lines changed: 5 additions & 1 deletion

@@ -5,5 +5,9 @@
 from neo4j_graphrag.embeddings import VertexAIEmbeddings

 embeder = VertexAIEmbeddings(model="text-embedding-005")
-res = embeder.embed_query("my question")
+res = embeder.embed_query(
+    "my question",
+    dimensions=256,
+)
+print("Embedding dimensions", len(res))
 print(res[:10])

src/neo4j_graphrag/embeddings/base.py

Lines changed: 4 additions & 1 deletion

@@ -24,11 +24,14 @@ class Embedder(ABC):
     """

     @abstractmethod
-    def embed_query(self, text: str) -> list[float]:
+    def embed_query(
+        self, text: str, dimensions: int | None = None, **kwargs
+    ) -> list[float]:
         """Embed query text.

         Args:
             text (str): Text to convert to vector embedding
+            dimensions (Optional[int]): The number of dimensions the resulting output embeddings should have. Only for models supporting it.

         Returns:
             list[float]: A vector embedding.
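
Since the abstract signature now takes an optional dimensions argument plus **kwargs, custom embedders should mirror it. A minimal sketch of a conforming subclass, modelled on the custom_embeddings.py example above (the RandomEmbeddings name is hypothetical):

import random
from typing import Any

from neo4j_graphrag.embeddings.base import Embedder


class RandomEmbeddings(Embedder):
    def __init__(self, default_dimension: int = 10, **kwargs: Any):
        self.default_dimension = default_dimension

    def embed_query(
        self, text: str, dimensions: int | None = None, **kwargs: Any
    ) -> list[float]:
        # Honour the requested output size when given; fall back to the default otherwise.
        size = dimensions or self.default_dimension
        return [random.random() for _ in range(size)]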

src/neo4j_graphrag/embeddings/cohere.py

Lines changed: 14 additions & 3 deletions

@@ -32,12 +32,23 @@ def __init__(self, model: str = "", **kwargs: Any) -> None:
                 Please install it with `pip install "neo4j-graphrag[cohere]"`."""
             )
         self.model = model
-        self.client = cohere.Client(**kwargs)
+        self.client = cohere.ClientV2(**kwargs)

-    def embed_query(self, text: str, **kwargs: Any) -> list[float]:
+    def embed_query(
+        self, text: str, dimensions: int | None = None, **kwargs: Any
+    ) -> list[float]:
+        """
+        Generate embeddings for a given query using a Cohere text embedding model.
+
+        Args:
+            text (str): The text to generate an embedding for.
+            dimensions (Optional[int]): The number of dimensions the resulting output embeddings should have. Only for models supporting it.
+            **kwargs (Any): Additional keyword arguments to pass to the Cohere ClientV2.embed method.
+        """
         response = self.client.embed(
             texts=[text],
             model=self.model,
+            output_dimension=dimensions,
             **kwargs,
         )
-        return response.embeddings[0]  # type: ignore
+        return response.embeddings.float[0]  # type: ignore

src/neo4j_graphrag/embeddings/mistral.py

Lines changed: 6 additions & 3 deletions

@@ -48,16 +48,19 @@ def __init__(self, model: str = "mistral-embed", **kwargs: Any) -> None:
         self.model = model
         self.mistral_client = Mistral(api_key=api_key, **kwargs)

-    def embed_query(self, text: str, **kwargs: Any) -> list[float]:
+    def embed_query(
+        self, text: str, dimensions: int | None = None, **kwargs: Any
+    ) -> list[float]:
         """
         Generate embeddings for a given query using a Mistral AI text embedding model.

         Args:
             text (str): The text to generate an embedding for.
-            **kwargs (Any): Additional keyword arguments to pass to the Mistral AI client.
+            dimensions (Optional[int]): The number of dimensions the resulting output embeddings should have. Only for models supporting it.
+            **kwargs (Any): Additional keyword arguments to pass to the embeddings.create method.
         """
         embeddings_batch_response = self.mistral_client.embeddings.create(
-            model=self.model, inputs=[text], **kwargs
+            model=self.model, inputs=[text], output_dimension=dimensions, **kwargs
         )
         if embeddings_batch_response is None or not embeddings_batch_response.data:
             raise EmbeddingsGenerationError("Failed to retrieve embeddings.")

src/neo4j_graphrag/embeddings/openai.py

Lines changed: 8 additions & 2 deletions

@@ -51,15 +51,21 @@ def _initialize_client(self, **kwargs: Any) -> Any:
         """
         pass

-    def embed_query(self, text: str, **kwargs: Any) -> list[float]:
+    def embed_query(
+        self, text: str, dimensions: int | None = None, **kwargs: Any
+    ) -> list[float]:
         """
         Generate embeddings for a given query using an OpenAI text embedding model.

         Args:
             text (str): The text to generate an embedding for.
+            dimensions (Optional[int]): The number of dimensions the resulting output embeddings should have. Only for models supporting it.
+
             **kwargs (Any): Additional arguments to pass to the OpenAI embedding generation function.
         """
-        response = self.client.embeddings.create(input=text, model=self.model, **kwargs)
+        response = self.client.embeddings.create(
+            input=text, model=self.model, dimensions=dimensions, **kwargs
+        )
         embedding: list[float] = response.data[0].embedding
         return embedding
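
Because dimensions now lives on the Embedder base interface, code that only sees the abstract type can request a target size without knowing which provider backs it; in this commit Cohere, Mistral AI and OpenAI each map it to their own client parameter. A minimal sketch with a hypothetical helper name:

from neo4j_graphrag.embeddings.base import Embedder


def embed_at_size(
    embedder: Embedder, text: str, dimensions: int | None = None
) -> list[float]:
    # Works with any concrete embedder that follows the updated base signature.
    return embedder.embed_query(text, dimensions=dimensions)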

src/neo4j_graphrag/embeddings/sentence_transformers.py

Lines changed: 1 addition & 1 deletion

@@ -35,7 +35,7 @@ def __init__(
         self.np = np
         self.model = sentence_transformers.SentenceTransformer(model, *args, **kwargs)

-    def embed_query(self, text: str) -> Any:
+    def embed_query(self, text: str, **kwargs) -> Any:
         result = self.model.encode([text])
         if isinstance(result, self.torch.Tensor) or isinstance(result, self.np.ndarray):
             return result.flatten().tolist()
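
Here **kwargs is accepted only to keep the interface uniform; it is not forwarded to model.encode, so a requested size is currently ignored. A usage sketch against this WIP state, assuming SentenceTransformerEmbeddings is importable from neo4j_graphrag.embeddings and wraps the all-MiniLM-L6-v2 model:

from neo4j_graphrag.embeddings import SentenceTransformerEmbeddings

embedder = SentenceTransformerEmbeddings(model="all-MiniLM-L6-v2")
res = embedder.embed_query("my question", dimensions=256)  # captured by **kwargs, not used
print("Embedding dimensions", len(res))  # stays at the model's native 384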
