Update lvd_pipeline.py
Browse files - lvd_pipeline.py +2 -1
lvd_pipeline.py
CHANGED
@@ -758,7 +758,8 @@ class GroundedTextToVideoSDPipeline(DiffusionPipeline, TextualInversionLoaderMix
|
|
758 |
# we represent the location information as (xmin,ymin,xmax,ymax)
|
759 |
boxes = torch.zeros(max_objs, 4, device=device,
|
760 |
dtype=self.text_encoder.dtype)
|
761 |
-
|
|
|
762 |
text_embeddings = torch.zeros(
|
763 |
max_objs, self.unet.cross_attention_dim, device=device, dtype=self.text_encoder.dtype
|
764 |
)
|
|
|
758 |
# we represent the location information as (xmin,ymin,xmax,ymax)
|
759 |
boxes = torch.zeros(max_objs, 4, device=device,
|
760 |
dtype=self.text_encoder.dtype)
|
761 |
+
if n_objs:
|
762 |
+
boxes[:n_objs] = torch.tensor(lvd_gligen_boxes_frame)
|
763 |
text_embeddings = torch.zeros(
|
764 |
max_objs, self.unet.cross_attention_dim, device=device, dtype=self.text_encoder.dtype
|
765 |
)
|