Spaces:

ByteDance-Seed
/

Seed1.5-VL

Running

chenjoya committed 21 days ago

Commit

1bcebf0

verified ·

1 Parent(s): 4693a25

Fix screenshot case (#2)

Files changed (1) hide show

infer.py CHANGED Viewed

@@ -1,4 +1,5 @@
 # Copyright (2025) [Seed-VL-Cookbook] Bytedance Seed
 import json
 import time
 import math
@@ -9,8 +10,8 @@ import torch
 import decord
 import numpy as np
 from PIL import Image, ImageSequence
-from torchvision.io import read_image, encode_jpeg, ImageReadMode
-from torchvision.transforms.functional import resize
 from torchvision.transforms import InterpolationMode
@@ -210,7 +211,18 @@ class SeedVLInfer:
                         },
                     })
             else:
-                image = read_image(path, ImageReadMode.RGB)
                 if online and path.endswith('.webp'):
                     streaming_timestamp = i
                 if streaming_timestamp is not None:

 # Copyright (2025) [Seed-VL-Cookbook] Bytedance Seed
+import cv2
 import json
 import time
 import math
 import decord
 import numpy as np
 from PIL import Image, ImageSequence
+from torchvision.io import read_image, encode_jpeg
+from torchvision.transforms.functional import resize, pil_to_tensor
 from torchvision.transforms import InterpolationMode
                         },
                     })
             else:
+                try:
+                    image = read_image(path, "RGB")
+                except:
+                    try:
+                        image = pil_to_tensor(Image.open(path).convert('RGB'))
+                    except:
+                        image = torch.from_numpy(
+                            cv2.cvtColor(
+                                cv2.imread(path),
+                                cv2.COLOR_BGR2RGB
+                            )
+                        ).permute(2, 0, 1)
                 if online and path.endswith('.webp'):
                     streaming_timestamp = i
                 if streaming_timestamp is not None: