Skip text projection when feature dim equals embed dim (BLIP-2)

Mark-ZhouWX · Mark-ZhouWX · commit e4e13f5cb37a · 2023-12-18T15:38:58.000+08:00
diff --git a/official/cv/segment-anything/segment_anything/modeling/prompt_encoder.py b/official/cv/segment-anything/segment_anything/modeling/prompt_encoder.py
@@ -56,7 +56,10 @@ def __init__(
         self.no_mask_embed = nn.Embedding(1, embed_dim)
 
         self.text_embeddings = nn.Embedding(1, embed_dim)
-        self.text_proj = nn.Dense(in_channels=text_feature_dim, out_channels=embed_dim)
+        # self.text_proj = nn.Dense(in_channels=text_feature_dim, out_channels=embed_dim)
+
+        self.text_proj = nn.Dense(in_channels=text_feature_dim, out_channels=embed_dim) \
+            if text_feature_dim != embed_dim else nn.Identity()  # CLIP text features need a projection, while BLIP-2 features do not
 
     def get_dense_pe(self) -> ms.Tensor:
         """