Spaces:

adpro
/

midas

Running

App Files Files Community

adpro committed 29 days ago

Commit

64c49d0

verified ·

1 Parent(s): e8e141f

Update app.py

Browse files

Files changed (1) hide show

app.py +28 -25

app.py CHANGED Viewed

@@ -8,33 +8,39 @@ from fastapi import FastAPI, File, UploadFile
 from PIL import Image
 import uvicorn
 app = FastAPI()
 # 🟢 Chọn thiết bị xử lý (GPU nếu có)
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
-# 🟢 Tải model DPT-Hybrid thay cho ZoeDepth để tăng tốc
 feature_extractor = DPTFeatureExtractor.from_pretrained("Intel/dpt-swinv2-tiny-256")
 model = DPTForDepthEstimation.from_pretrained("Intel/dpt-swinv2-tiny-256").to(device)
 model.eval()
 @app.post("/analyze_path/")
 async def analyze_path(file: UploadFile = File(...)):
-        # 🟢 Bắt đầu đo thời gian dự đoán Depth Map
     start_time = time.time()
     # 🟢 Đọc file ảnh từ ESP32
     image_bytes = await file.read()
     image = Image.open(io.BytesIO(image_bytes)).convert("RGB")
     # 🔵 Resize ảnh để xử lý nhanh hơn
-    image = image.resize((192, 192))  # Giảm kích thước giúp tăng tốc độ xử lý
     image_np = np.array(image)
     flipped_image = cv2.flip(image_np, -1)
     # 🟢 Chuẩn bị ảnh cho mô hình
     inputs = feature_extractor(images=flipped_image, return_tensors="pt").to(device)
     # 🟢 Dự đoán Depth Map với DPT-Hybrid
     with torch.no_grad():
         outputs = model(**inputs)
@@ -43,6 +49,13 @@ async def analyze_path(file: UploadFile = File(...)):
     predicted_depth = outputs.predicted_depth.squeeze().cpu().numpy()
     depth_map = (predicted_depth * 255 / predicted_depth.max()).astype("uint8")
     end_time = time.time()
     print(f"⏳ DPT xử lý trong {end_time - start_time:.4f} giây")
@@ -50,9 +63,9 @@ async def analyze_path(file: UploadFile = File(...)):
     start_detect_time = time.time()
     command = detect_path(depth_map)
     end_detect_time = time.time()
-    print(f"⏳ detect_path() xử lý trong {end_detect_time - start_detect_time:.4f} giây Lệnh: {command}")
-    return {"command": command}
 def detect_path(depth_map):
     """Phân tích đường đi từ ảnh Depth Map"""
@@ -60,31 +73,21 @@ def detect_path(depth_map):
     center_x = w // 2
     scan_y = int(h * 0.8)  # Quét dòng 80% từ trên xuống
-    # 🟢 Chia ảnh thành 3 vùng: trái, giữa, phải
-    left_region = np.mean(depth_map[scan_y, :center_x - 40])
-    right_region = np.mean(depth_map[scan_y, center_x + 40:])
     center_region = np.mean(depth_map[scan_y, center_x - 40:center_x + 40])
-    # 🟢 Ngưỡng phát hiện vật cản (càng thấp, càng nhạy)
-    threshold = 80
-    # 🟢 Không có vật cản ở cả 3 vùng → đi thẳng
-    if left_region > threshold and center_region > threshold and right_region > threshold:
-        return "forward"
-    # 🟢 Nếu chỉ có giữa trống → đi thẳng
     if center_region > threshold:
         return "forward"
-    # 🟢 Nếu chỉ có trái hoặc phải trống → chọn hướng có vùng trống lớn nhất
-    if left_region > right_region:
         return "left"
     elif right_region > left_region:
         return "right"
-    # 🟢 Nếu tất cả đều có vật cản → lùi lại
-    return "backward"
 # 🟢 Chạy server FastAPI
 if __name__ == "__main__":
-    uvicorn.run(app, host="0.0.0.0", port=7860)

 from PIL import Image
 import uvicorn
+# 🟢 Tạo FastAPI
 app = FastAPI()
 # 🟢 Chọn thiết bị xử lý (GPU nếu có)
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+# 🟢 Tải model DPT-Hybrid để tăng tốc
 feature_extractor = DPTFeatureExtractor.from_pretrained("Intel/dpt-swinv2-tiny-256")
 model = DPTForDepthEstimation.from_pretrained("Intel/dpt-swinv2-tiny-256").to(device)
 model.eval()
+# 🟢 Biến lưu ảnh Depth Map để hiển thị trên Gradio
+depth_map_global = None
 @app.post("/analyze_path/")
 async def analyze_path(file: UploadFile = File(...)):
+    """Xử lý ảnh Depth Map và trả về lệnh điều hướng"""
+    global depth_map_global  # Dùng biến toàn cục để hiển thị trên Gradio
     start_time = time.time()
     # 🟢 Đọc file ảnh từ ESP32
     image_bytes = await file.read()
     image = Image.open(io.BytesIO(image_bytes)).convert("RGB")
     # 🔵 Resize ảnh để xử lý nhanh hơn
+    image = image.resize((256, 256))
     image_np = np.array(image)
     flipped_image = cv2.flip(image_np, -1)
     # 🟢 Chuẩn bị ảnh cho mô hình
     inputs = feature_extractor(images=flipped_image, return_tensors="pt").to(device)
     # 🟢 Dự đoán Depth Map với DPT-Hybrid
     with torch.no_grad():
         outputs = model(**inputs)
     predicted_depth = outputs.predicted_depth.squeeze().cpu().numpy()
     depth_map = (predicted_depth * 255 / predicted_depth.max()).astype("uint8")
+    # 🔵 Chuyển depth_map thành ảnh có thể hiển thị
+    depth_colored = cv2.applyColorMap(depth_map, cv2.COLORMAP_INFERNO)
+    depth_pil = Image.fromarray(depth_colored)
+    # 🟢 Lưu ảnh Depth Map để hiển thị trên Gradio
+    depth_map_global = depth_pil
     end_time = time.time()
     print(f"⏳ DPT xử lý trong {end_time - start_time:.4f} giây")
     start_detect_time = time.time()
     command = detect_path(depth_map)
     end_detect_time = time.time()
+    print(f"⏳ detect_path() xử lý trong {end_detect_time - start_detect_time:.4f} giây")
+    return command  # Trả về lệnh điều hướng (không kèm ảnh)
 def detect_path(depth_map):
     """Phân tích đường đi từ ảnh Depth Map"""
     center_x = w // 2
     scan_y = int(h * 0.8)  # Quét dòng 80% từ trên xuống
+    left_region = np.mean(depth_map[scan_y, :center_x])
+    right_region = np.mean(depth_map[scan_y, center_x:])
     center_region = np.mean(depth_map[scan_y, center_x - 40:center_x + 40])
+    # 🟢 Cải thiện logic xử lý
+    threshold = 100  # Ngưỡng phân biệt vật cản
     if center_region > threshold:
         return "forward"
+    elif left_region > right_region:
         return "left"
     elif right_region > left_region:
         return "right"
+    else:
+        return "backward"
 # 🟢 Chạy server FastAPI
 if __name__ == "__main__":
+    uvicorn.run(app, host="0.0.0.0", port=7860)