ibm-granite
/

granite-vision-3.3-2b-embedding

@@ -23,7 +23,7 @@ def floor_by_factor(number: float, factor: int) -> int:
 class GraniteVisionEmbProcessor(LlavaNextProcessor):
     """
-    Processor for ColPali.
     """
     visual_prompt_prefix: ClassVar[str] = "<|user|>\n<image>\nDescribe the image.\n"
@@ -300,7 +300,7 @@ class GraniteVisionEmbProcessor(LlavaNextProcessor):
             images: List[Image.Image],
     ) -> BatchFeature:
         """
-        Process images for ColPali.
         """
         # texts_doc = [self.apply_chat_template(self.format_data_wo_role(self.visual_prompt_prefix, img),tokenize=False ) for img in images]
         texts_doc = [self.visual_prompt_prefix for _ in images]
@@ -394,7 +394,7 @@ class GraniteVisionEmbProcessor(LlavaNextProcessor):
     ) -> torch.Tensor:
         """
         Compute the late-interaction/MaxSim score (ColBERT-like) for the given multi-vector
-        query embeddings (`qs`) and passage embeddings (`ps`). For ColPali, a passage is the
         image of a document page.
         Because the embedding tensors are multi-vector and can thus have different shapes, they

 class GraniteVisionEmbProcessor(LlavaNextProcessor):
     """
+    Processor for GraniteVisionEmb.
     """
     visual_prompt_prefix: ClassVar[str] = "<|user|>\n<image>\nDescribe the image.\n"
             images: List[Image.Image],
     ) -> BatchFeature:
         """
+        Process images, pairing each one with the visual prompt prefix.
         """
         # texts_doc = [self.apply_chat_template(self.format_data_wo_role(self.visual_prompt_prefix, img),tokenize=False ) for img in images]
         texts_doc = [self.visual_prompt_prefix for _ in images]
     ) -> torch.Tensor:
         """
         Compute the late-interaction/MaxSim score (ColBERT-like) for the given multi-vector
+        query embeddings (`qs`) and passage embeddings (`ps`). For GraniteVisionEmb, a passage
         is the image of a document page.
         Because the embedding tensors are multi-vector and can thus have different shapes, they