Spaces:

rynmurdock
/

Blue_Tigers

Runtime error

rynmurdock committed on Jun 3, 2024

Commit

ce6d022

verified ·

1 Parent(s): 82ddb45

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -132,8 +132,8 @@ processor = AutoProcessor.from_pretrained('google/paligemma-3b-pt-224')
 @spaces.GPU()
 def to_wanted_embs(image_outputs, input_ids, attention_mask, cache_position=None):
-    inputs_embeds = pali.get_input_embeddings()(input_ids)
-    selected_image_feature = image_outputs.to(dtype).to(device)
     image_features = pali.multi_modal_projector(selected_image_feature)
     if cache_position is None:
@@ -190,9 +190,9 @@ def generate_gpu(in_im_embs, prompt='the scene'):
                 )
         im_emb = im_emb.detach().to('cpu').to(torch.float32)
         im = torchvision.transforms.ToTensor()(output.frames[0][len(output.frames[0])//2]).unsqueeze(0)
-        im = torch.nn.functional.interpolate(im, (224, 224))
         im = (im - .5) * 2
-        gemb = pali.vision_tower(im.to(device).to(dtype)).last_hidden_state.detach().to('cpu').to(torch.float32)
     return output, im_emb, gemb

 @spaces.GPU()
 def to_wanted_embs(image_outputs, input_ids, attention_mask, cache_position=None):
+    inputs_embeds = pali.get_input_embeddings()(input_ids.to('cuda'))
+    selected_image_feature = image_outputs.to(dtype).to('cuda')
     image_features = pali.multi_modal_projector(selected_image_feature)
     if cache_position is None:
                 )
         im_emb = im_emb.detach().to('cpu').to(torch.float32)
         im = torchvision.transforms.ToTensor()(output.frames[0][len(output.frames[0])//2]).unsqueeze(0)
+        im = torch.nn.functional.interpolate(im, (224, 224)).to(dtype).to('cuda')
         im = (im - .5) * 2
+        gemb = pali.vision_tower(im).last_hidden_state.detach().to('cpu').to(torch.float32)
     return output, im_emb, gemb