Update pipeline_stable_diffusion_3_ipa.py
pipeline_stable_diffusion_3_ipa.py CHANGED
@@ -1195,16 +1195,16 @@ class StableDiffusion3Pipeline(DiffusionPipeline, SD3LoraLoaderMixin, FromSingle
 
 #clip_image_embeds_cat_list = torch.cat(image_prompt_embeds_list).mean(dim=0)
 clip_image_embeds_cat_list = torch.cat(image_prompt_embeds_list, dim=1)
-print('catted embeds list with
-seq_len, _ = clip_image_embeds_cat_list.shape
-clip_image_embeds_cat_list_repeat = clip_image_embeds_cat_list.repeat(1, 1, 1)
-clip_image_embeds_view = clip_image_embeds_cat_list
-print('catted embeds
-clip_image_embeds_view = clip_image_embeds_view.view(1, seq_len, -1)
-print('catted viewed: ',clip_image_embeds_view.shape)
+print('catted embeds list with meanout shape: ',clip_image_embeds_cat_list.shape)
+#seq_len, _ = clip_image_embeds_cat_list.shape
+#clip_image_embeds_cat_list_repeat = clip_image_embeds_cat_list.repeat(1, 1, 1)
+clip_image_embeds_view = clip_image_embeds_cat_list.unsqueeze(0) # Added unsqueeze here instead
+print('catted embeds unsqueeze shape: ',clip_image_embeds_view.shape)
+#clip_image_embeds_view = clip_image_embeds_view.view(1, seq_len, -1)
+#print('catted viewed: ',clip_image_embeds_view.shape)
 zeros_tensor = torch.zeros_like(clip_image_embeds_view)
 #zeros_tensor = torch.zeros_like(clip_image_embeds_view[:, :image_prompt_embeds_list[0].shape[1], :]) # Make zeros tensor match the sequence length of a single image embedding
-print('zeros: ',zeros_tensor.shape)
+print('zeros shape: ',zeros_tensor.shape)
 clip_image_embeds = torch.cat([zeros_tensor, clip_image_embeds_view], dim=0)
 print('embeds shape: ', clip_image_embeds.shape)
 
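In short, the commit drops the seq_len/view()-based reshape and instead adds a leading batch dimension with unsqueeze(0) on the concatenated image embeddings, which are then stacked against a matching zeros tensor along dim=0. Below is a minimal shape sketch of the new path, assuming each entry of image_prompt_embeds_list is a 2-D (seq_len, embed_dim) tensor; the shapes here are illustrative, not the pipeline's actual ones.

import torch

seq_len, embed_dim, num_images = 4, 8, 3
# Hypothetical per-image embeddings standing in for image_prompt_embeds_list.
image_prompt_embeds_list = [torch.randn(seq_len, embed_dim) for _ in range(num_images)]

# Concatenate per-image embeddings along dim=1, then add a leading batch
# dimension with unsqueeze(0) instead of the removed seq_len-based view().
clip_image_embeds_cat_list = torch.cat(image_prompt_embeds_list, dim=1)   # (4, 24)
clip_image_embeds_view = clip_image_embeds_cat_list.unsqueeze(0)          # (1, 4, 24)

# Stack a matching all-zeros tensor in front along dim=0
# (presumably the unconditional/negative branch for guidance).
zeros_tensor = torch.zeros_like(clip_image_embeds_view)
clip_image_embeds = torch.cat([zeros_tensor, clip_image_embeds_view], dim=0)

print(clip_image_embeds.shape)  # torch.Size([2, 4, 24])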