jinaai
/

jina-embeddings-v4

@@ -407,9 +407,9 @@ class JinaEmbeddingsV4Model(Qwen2_5_VLForConditionalGeneration):
                 )
         return task
-    def encode_texts(
         self,
-        texts: List[str],
         task: Optional[str] = None,
         max_length: int = 8192,
         batch_size: int = 8,
@@ -417,12 +417,12 @@ class JinaEmbeddingsV4Model(Qwen2_5_VLForConditionalGeneration):
         return_numpy: bool = False,
         truncate_dim: Optional[int] = None,
         prompt_name: Optional[str] = None,
-    ) -> List[torch.Tensor]:
         """
         Encodes a list of texts into embeddings.
         Args:
-            texts: List of text strings to encode
             max_length: Maximum token length for text processing
             batch_size: Number of texts to process at once
             vector_type: Type of embedding vector to generate ('single_vector' or 'multi_vector')
@@ -431,7 +431,7 @@ class JinaEmbeddingsV4Model(Qwen2_5_VLForConditionalGeneration):
             prompt_name: Type of text being encoded ('query' or 'passage')
         Returns:
-            List of text embeddings as tensors or numpy arrays
         """
         prompt_name = prompt_name or "query"
         encode_kwargs = self._validate_encoding_params(
@@ -446,6 +446,9 @@ class JinaEmbeddingsV4Model(Qwen2_5_VLForConditionalGeneration):
             prefix=encode_kwargs.pop("prefix"),
         )
         embeddings = self._process_batches(
             data=texts,
             processor_fn=processor_fn,
@@ -456,7 +459,7 @@ class JinaEmbeddingsV4Model(Qwen2_5_VLForConditionalGeneration):
             **encode_kwargs,
         )
-        return embeddings
     def _load_images_if_needed(
         self, images: List[Union[str, Image.Image]]
@@ -472,21 +475,21 @@ class JinaEmbeddingsV4Model(Qwen2_5_VLForConditionalGeneration):
             loaded_images.append(image)
         return loaded_images
-    def encode_images(
         self,
-        images: List[Union[str, Image.Image]],
         task: Optional[str] = None,
         batch_size: int = 8,
         vector_type: Optional[str] = None,
         return_numpy: bool = False,
         truncate_dim: Optional[int] = None,
         max_pixels: Optional[int] = None,
-    ) -> List[torch.Tensor]:
         """
-        Encodes a list of images into embeddings.
         Args:
-            images: List of PIL images, URLs, or local file paths to encode
             batch_size: Number of images to process at once
             vector_type: Type of embedding vector to generate ('single_vector' or 'multi_vector')
             return_numpy: Whether to return numpy arrays instead of torch tensors
@@ -494,7 +497,7 @@ class JinaEmbeddingsV4Model(Qwen2_5_VLForConditionalGeneration):
             max_pixels: Maximum number of pixels to process per image
         Returns:
-            List of image embeddings as tensors or numpy arrays
         """
         if max_pixels:
             default_max_pixels = self.processor.image_processor.max_pixels
@@ -503,6 +506,11 @@ class JinaEmbeddingsV4Model(Qwen2_5_VLForConditionalGeneration):
             )
         encode_kwargs = self._validate_encoding_params(vector_type, truncate_dim)
         task = self._validate_task(task)
         images = self._load_images_if_needed(images)
         embeddings = self._process_batches(
             data=images,
@@ -517,7 +525,7 @@ class JinaEmbeddingsV4Model(Qwen2_5_VLForConditionalGeneration):
         if max_pixels:
             self.processor.image_processor.max_pixels = default_max_pixels
-        return embeddings
     @classmethod
     def from_pretrained(

                 )
         return task
+    def encode_text(
         self,
+        texts: Union[str, List[str]],
         task: Optional[str] = None,
         max_length: int = 8192,
         batch_size: int = 8,
         return_numpy: bool = False,
         truncate_dim: Optional[int] = None,
         prompt_name: Optional[str] = None,
+    ) -> Union[List[torch.Tensor], torch.Tensor]:
         """
         Encodes a single text or a list of texts into embedding(s).
         Args:
+            texts: text or list of text strings to encode
             max_length: Maximum token length for text processing
             batch_size: Number of texts to process at once
             vector_type: Type of embedding vector to generate ('single_vector' or 'multi_vector')
             prompt_name: Type of text being encoded ('query' or 'passage')
         Returns:
+            List of text embeddings (tensors or numpy arrays) when more than one text is given; a single embedding (not wrapped in a list) when exactly one text is given, whether passed as a string or as a one-element list
         """
         prompt_name = prompt_name or "query"
         encode_kwargs = self._validate_encoding_params(
             prefix=encode_kwargs.pop("prefix"),
         )
+        if isinstance(texts, str):
+            texts = [texts]
         embeddings = self._process_batches(
             data=texts,
             processor_fn=processor_fn,
             **encode_kwargs,
         )
+        return embeddings if len(texts) > 1 else embeddings[0]
     def _load_images_if_needed(
         self, images: List[Union[str, Image.Image]]
             loaded_images.append(image)
         return loaded_images
+    def encode_image(
         self,
+        images: Union[str, Image.Image, List[Union[str, Image.Image]]],
         task: Optional[str] = None,
         batch_size: int = 8,
         vector_type: Optional[str] = None,
         return_numpy: bool = False,
         truncate_dim: Optional[int] = None,
         max_pixels: Optional[int] = None,
+    ) -> Union[List[torch.Tensor], torch.Tensor]:
         """
+        Encodes a list of images or a single image into embedding(s).
         Args:
+            images: image(s) to encode, can be PIL Image(s), URL(s), or local file path(s)
             batch_size: Number of images to process at once
             vector_type: Type of embedding vector to generate ('single_vector' or 'multi_vector')
             return_numpy: Whether to return numpy arrays instead of torch tensors
             max_pixels: Maximum number of pixels to process per image
         Returns:
+            List of image embeddings (tensors or numpy arrays) when more than one image is given; a single embedding (not wrapped in a list) when exactly one image is given, whether passed directly or as a one-element list
         """
         if max_pixels:
             default_max_pixels = self.processor.image_processor.max_pixels
             )
         encode_kwargs = self._validate_encoding_params(vector_type, truncate_dim)
         task = self._validate_task(task)
+        # Convert single image to list
+        if isinstance(images, (str, Image.Image)):
+            images = [images]
         images = self._load_images_if_needed(images)
         embeddings = self._process_batches(
             data=images,
         if max_pixels:
             self.processor.image_processor.max_pixels = default_max_pixels
+        return embeddings if len(images) > 1 else embeddings[0]
     @classmethod
     def from_pretrained(