|
import io |
|
import os |
|
import sys |
|
import time |
|
import numpy as np |
|
import cv2 |
|
import torch |
|
import torchvision |
|
from fastapi import FastAPI, File, UploadFile |
|
from PIL import Image |
|
import uvicorn |
|
|
|
# FastAPI application object; the route below registers itself on it.
app = FastAPI()

# The ZoeDepth sources are expected in a local checkout named "ZoeDepth".
# Clone the repository on first start if that directory does not exist.
zoe_path = "ZoeDepth"
if not os.path.exists(zoe_path):
    # os.system returns the command's exit status. Fail loudly here instead of
    # falling through to a confusing ImportError on the zoedepth imports below.
    if os.system("git clone https://github.com/isl-org/ZoeDepth.git") != 0:
        raise RuntimeError("git clone of ZoeDepth failed")

# Make the `zoedepth` package inside the checkout importable.
sys.path.append(os.path.abspath(zoe_path))

# These imports must stay below the sys.path change above.
from zoedepth.models.builder import build_model  # noqa: E402
from zoedepth.utils.config import get_config  # noqa: E402

# Run on the GPU when one is available, otherwise on the CPU.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# NOTE(review): pretrained_resource=None presumably means no ZoeDepth
# checkpoint is loaded, and `version="tiny"` is passed through as a config
# override -- confirm both are what is intended for inference.
config = get_config("zoedepth", version="tiny", pretrained_resource=None)

# Build the model with the imported builder (the name `ZoeDepth` is not
# defined anywhere in this module), and place it on the same device that the
# request handler moves its input tensors to.
model = build_model(config).to(device)
model.eval()
|
|
|
@app.post("/analyze_path/")
async def analyze_path(file: UploadFile = File(...)):
    """Estimate a depth map for an uploaded image and derive a command from it.

    The upload is decoded to RGB, flipped around both axes, resized to
    256x256 and passed to ``model.infer``. The predicted depth is resized
    back to the uploaded image's height and width and handed to
    ``detect_path``. Timings of both stages are printed to stdout.

    Args:
        file: The uploaded image file.

    Returns:
        A dict ``{"command": <value returned by detect_path>}``.
    """
    image_bytes = await file.read()
    image = Image.open(io.BytesIO(image_bytes)).convert("RGB")

    image_np = np.array(image)
    # flipCode -1 flips around both the horizontal and the vertical axis.
    flipped_image = cv2.flip(image_np, -1)

    transform = torchvision.transforms.Compose([
        torchvision.transforms.Resize((256, 256)),
        torchvision.transforms.ToTensor(),
    ])
    # Resize only accepts PIL images or tensors, not NumPy arrays, so the
    # flipped array is wrapped back into a PIL image before the transform.
    flipped_pil = Image.fromarray(flipped_image)
    img_tensor = transform(flipped_pil).unsqueeze(0).to(device)

    # perf_counter is monotonic, which makes it the right clock for durations.
    start_time = time.perf_counter()

    with torch.no_grad():
        depth_map = model.infer(img_tensor)
        # Bicubic interpolation needs a 4-D (N, C, H, W) tensor. Only add the
        # channel axis when the model returned a 3-D (N, H, W) result;
        # unsqueezing an already 4-D output would make it 5-D.
        if depth_map.dim() == 3:
            depth_map = depth_map.unsqueeze(1)
        depth_map = torch.nn.functional.interpolate(
            depth_map,
            size=(image_np.shape[0], image_np.shape[1]),
            mode="bicubic",
            align_corners=False,
        ).squeeze().cpu().numpy()

    end_time = time.perf_counter()
    print(f"⏳ ZoeDepth xử lý trong {end_time - start_time:.4f} giây")

    start_detect_time = time.perf_counter()
    command = detect_path(depth_map)
    end_detect_time = time.perf_counter()
    print(f"⏳ detect_path() xử lý trong {end_detect_time - start_detect_time:.4f} giây")

    return {"command": command}
|
|
|
def detect_path(
    depth_map: np.ndarray,
    *,
    scan_offset: int = 20,
    center_half_width: int = 20,
    forward_threshold: float = 200,
) -> str:
    """Choose a movement command from a single row of a depth map.

    One row, ``scan_offset`` rows above the bottom edge, is inspected. The
    mean of a window around the horizontal center is compared with
    ``forward_threshold``; if it does not exceed the threshold, the means of
    the left and right halves of the row are compared with each other.

    Args:
        depth_map: 2-D array of depth values (rows x columns).
        scan_offset: Distance in rows from the bottom edge to the scanned
            row. The row index is clamped into the map, so maps shorter than
            the offset use their top row.
        center_half_width: Half-width in columns of the center window. The
            window is clipped at the row's edges.
        forward_threshold: The center mean must be strictly greater than this
            to return ``"forward"``. It must be in the same units as
            ``depth_map``.

    Returns:
        ``"forward"`` if the center mean exceeds ``forward_threshold``;
        otherwise ``"left"`` or ``"right"`` for whichever half has the larger
        mean; ``"backward"`` when the two halves are equal or cannot be
        compared.

    Raises:
        ValueError: If ``depth_map`` is not 2-D (from unpacking its shape).
        IndexError: If ``depth_map`` has no rows.
    """
    h, w = depth_map.shape
    center_x = w // 2

    # Clamp the row index into [0, h - 1]. A negative index would silently
    # wrap to another row or raise IndexError on short maps.
    scan_y = min(max(h - scan_offset, 0), h - 1)
    row = depth_map[scan_y]

    # Clip the window start at 0. A negative slice start would wrap to the
    # right-hand end of the row instead of covering the center.
    window_start = max(center_x - center_half_width, 0)
    center_region = np.mean(row[window_start:center_x + center_half_width])
    if center_region > forward_threshold:
        return "forward"

    left_cols = row[:center_x]
    right_cols = row[center_x:]
    # A one-column row has an empty left half; the mean of nothing is NaN and
    # compares false both ways, so report "backward" directly.
    if left_cols.size == 0 or right_cols.size == 0:
        return "backward"

    left_region = np.mean(left_cols)
    right_region = np.mean(right_cols)
    if left_region > right_region:
        return "left"
    if right_region > left_region:
        return "right"
    return "backward"
|
|
|
|
|
# Script entry point: when this file is executed directly, serve `app` with
# uvicorn on every network interface, port 7860.
if __name__ == "__main__":
    uvicorn.run(
        app,
        port=7860,
        host="0.0.0.0",
    )
|
|