newocean-group
diff --git a/‎README.md
Lines changed: 2 additions & 0 deletions b/‎README.md
Lines changed: 2 additions & 0 deletions
diff --git a/‎SA_1B/sa_11027.jpg
668 KB b/‎SA_1B/sa_11027.jpg
668 KB
diff --git a/‎cls_embeddings.ipynb
Lines changed: 270 additions & 0 deletions b/‎cls_embeddings.ipynb
Lines changed: 270 additions & 0 deletions
diff --git a/‎src/model.py
Lines changed: 37 additions & 0 deletions b/‎src/model.py
Lines changed: 37 additions & 0 deletions
@@ -53,6 +53,8 @@ To use the model, follow these steps:
 ### 🔍 Demo
 I have attached a .ipynb [file](demo.ipynb) in the repository. Refer to it to learn how to use the model.
 
+Additionally, I have provided another .ipynb [file](cls_embeddings.ipynb) that illustrates the process of learning class embeddings for the model.
+
 **Note**: You may need to adjust the threshold value to achieve the best results.
 
 ### 💡 Conclusion
 
@@ -453,3 +453,40 @@ def forward_for_training_model_with_ref_points_lst_lst(
             out["dn_aux_outputs"] = self._set_aux_loss(dn_out_logits, dn_out_bboxes)
             out["dn_meta"] = dn_meta
         return out, visual_embeds_list
+
+    def forward_for_cls_embeddings(
+        self,
+        tensor_list: NestedTensor,
+        embeds,
+    ):
+        # memory
+        memory, mask_flatten, spatial_shapes, level_start_index, valid_ratios = (
+            self.image_encoder(tensor_list)
+        )
+
+        # box decoder
+        out_bboxes, out_logits, dn_out_bboxes, dn_out_logits, dn_meta = (
+            self.box_decoder(
+                memory=memory,
+                mask_flatten=mask_flatten,
+                spatial_shapes=spatial_shapes,
+                level_start_index=level_start_index,
+                valid_ratios=valid_ratios,
+                visual_embed=embeds,
+                targets=None,
+            )
+        )
+        out = {"pred_logits": out_logits[-1], "pred_boxes": out_bboxes[-1]}
+        out["aux_outputs"] = self._set_aux_loss(out_logits[:-1], out_bboxes[:-1])
+        if dn_meta is not None:
+
+            out["dn_aux_outputs"] = self._set_aux_loss(dn_out_logits, dn_out_bboxes)
+            out["dn_meta"] = dn_meta
+        return out, embeds
+
+    @torch.jit.unused
+    def _set_aux_loss(self, outputs_class, outputs_coord):
+        return [
+            {"pred_logits": a, "pred_boxes": b}
+            for a, b in zip(outputs_class[:-1], outputs_coord[:-1])
+        ]