# CodeCraft / app.py
from fastapi import FastAPI, File, UploadFile, HTTPException
from fastapi.responses import FileResponse
from fastapi.middleware.cors import CORSMiddleware
import uvicorn
import cv2
import numpy as np
from ultralytics import YOLO
import os
import shutil
import uuid
import base64
# Create FastAPI app
app = FastAPI(
title="YOLO Intrusion Detection API",
description="API for detecting intrusions using YOLOv8 model",
version="1.0.0"
)
# Add CORS middleware
app.add_middleware(
CORSMiddleware,
allow_origins=["*"],
allow_credentials=True,
allow_methods=["*"],
allow_headers=["*"],
)
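# NOTE: allowing every origin is convenient for a demo deployment; restrict
# allow_origins before exposing this API in production.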
# Load YOLO model
model_name = 'yolov8n.pt'
model = None # Will be loaded on startup
# Define trapezoidal restricted area
trapezoid_pts = np.array([[250, 150], [400, 150], [450, 300], [200, 300]], np.int32)
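# NOTE: the polygon is defined in pixel coordinates and does not scale with the input
# resolution; adjust these points to match the restricted zone in your camera view.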
# Create temp directory for uploads if it doesn't exist
os.makedirs("temp", exist_ok=True)
def is_inside_trapezoid(box, trapezoid_pts):
"""Check if the center of a detected object is inside the trapezoidal area."""
x1, y1, x2, y2 = box
cx, cy = int((x1 + x2) / 2), int((y1 + y2) / 2) # Calculate center of detected object
# Use point-in-polygon check
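    # With measureDist=False, pointPolygonTest returns +1 (inside), 0 (on the edge), or -1 (outside),
    # so ">= 0" counts points on the boundary as inside the restricted area.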
return cv2.pointPolygonTest(trapezoid_pts, (cx, cy), False) >= 0
def process_image(frame):
"""Process a single image and return the annotated image and intrusion data."""
global model
# Perform object detection
results = model.predict(frame, conf=0.5)
annotated_frame = results[0].plot() # Draw bounding boxes
# Draw trapezoidal restricted area
cv2.polylines(annotated_frame, [trapezoid_pts.reshape((-1, 1, 2))], isClosed=True, color=(0, 0, 255), thickness=2)
isAlert = {'alert': [False, ""], 'personCount': 0}
classInIntrusion = ['person', 'bicycle', 'car', 'motorcycle']
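    # Indices 0-3 intentionally mirror the first four COCO class ids reported by yolov8n
    # (0=person, 1=bicycle, 2=car, 3=motorcycle), which the checks below rely on.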
detections = []
# Loop through detected objects
for r in results:
for box, cls, conf in zip(r.boxes.xyxy, r.boxes.cls, r.boxes.conf):
class_id = int(cls.item()) # Convert to integer
confidence = float(conf.item())
x1, y1, x2, y2 = map(int, box.tolist())
            # Resolve the readable class name from the model's own id->name mapping
            class_name = r.names.get(class_id, f"class_{class_id}")
            # Check the restricted area once per detection and reuse the result
            in_area = is_inside_trapezoid(box.tolist(), trapezoid_pts)
            # Add to detections list
            detections.append({
                "class": class_name,
                "confidence": confidence,
                "bbox": [x1, y1, x2, y2],
                "in_restricted_area": in_area
            })
            if class_id == 0:  # Person
                isAlert['personCount'] += 1
            if class_id in [0, 1, 2, 3] and in_area:  # Person, bicycle, car, or motorcycle inside the area
                isAlert['alert'] = [True, classInIntrusion[class_id]]
                # Mark the intrusion with a red box
                cv2.rectangle(annotated_frame, (x1, y1), (x2, y2), (0, 0, 255), 3)
# Add alert text on the frame
alert_text = f"Intrusion Alert: {isAlert['alert'][0]}, Object: {isAlert['alert'][1]}, Persons: {isAlert['personCount']}"
cv2.putText(annotated_frame, alert_text, (10, 30), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0, 0, 255), 2)
# Convert the response
response = {
"intrusion_detected": isAlert['alert'][0],
"intruding_object": isAlert['alert'][1],
"person_count": isAlert['personCount'],
"detections": detections
}
return annotated_frame, response
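# Minimal offline usage sketch for process_image (hypothetical file names; assumes the
# YOLO model has already been loaded, e.g. by the startup handler below):
#   frame = cv2.imread("sample.jpg")
#   annotated, info = process_image(frame)
#   cv2.imwrite("annotated.jpg", annotated)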
def encode_image_to_base64(image):
"""Convert an OpenCV image to base64 encoded string."""
_, buffer = cv2.imencode('.jpg', image)
return base64.b64encode(buffer).decode('utf-8')
@app.on_event("startup")
async def startup_event():
"""Load the YOLO model when the app starts."""
global model
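    # ultralytics downloads the yolov8n.pt weights automatically on first use
    # if they are not already cached locally.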
model = YOLO(model_name)
print(f"Model {model_name} loaded successfully")
@app.get("/")
async def root():
"""Root endpoint."""
return {
"message": "YOLO Intrusion Detection API is running",
"documentation": "/docs",
"endpoints": {
"process_image": "/process_image/",
"process_video": "/process_video/",
"health": "/health/"
}
}
@app.get("/health/")
async def health_check():
"""Health check endpoint."""
return {"status": "healthy", "model": model_name}
@app.post("/process_image/")
async def api_process_image(file: UploadFile = File(...), return_image: bool = True):
"""
Process an image file and detect intrusions.
Args:
file: The image file to process
return_image: If True, returns the annotated image as base64
Returns:
JSON with detection results and optionally the annotated image
"""
# Check file extension
if not file.filename.lower().endswith(('.png', '.jpg', '.jpeg')):
        raise HTTPException(status_code=400, detail="Only PNG, JPG, and JPEG images are supported")
# Read and process image
contents = await file.read()
nparr = np.frombuffer(contents, np.uint8)
img = cv2.imdecode(nparr, cv2.IMREAD_COLOR)
if img is None:
raise HTTPException(status_code=400, detail="Could not decode image")
# Process the image
annotated_img, results = process_image(img)
# Optionally include the annotated image
if return_image:
results["image"] = encode_image_to_base64(annotated_img)
return results
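# Example client call (a sketch, assuming the API runs locally on port 7860 and the
# third-party `requests` package is installed; "sample.jpg" is a placeholder file name):
#   import requests
#   with open("sample.jpg", "rb") as f:
#       resp = requests.post(
#           "http://localhost:7860/process_image/",
#           params={"return_image": "false"},
#           files={"file": ("sample.jpg", f, "image/jpeg")},
#       )
#   print(resp.json())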
@app.post("/process_video/")
async def api_process_video(file: UploadFile = File(...)):
"""
Process a video file and detect intrusions.
Args:
file: The video file to process
Returns:
JSON with detection results and path to processed video
"""
# Check file extension
if not file.filename.lower().endswith(('.mp4', '.avi', '.mov')):
raise HTTPException(status_code=400, detail="Only MP4, AVI, and MOV videos are supported")
# Create a unique temporary file name
temp_input = f"temp/input_{uuid.uuid4()}.mp4"
temp_output = f"temp/output_{uuid.uuid4()}.mp4"
# Save uploaded file
with open(temp_input, "wb") as buffer:
shutil.copyfileobj(file.file, buffer)
# Process the video
cap = cv2.VideoCapture(temp_input)
if not cap.isOpened():
os.remove(temp_input)
raise HTTPException(status_code=400, detail="Could not open video file")
# Get video properties
width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
    fps = cap.get(cv2.CAP_PROP_FPS) or 30.0  # Fall back to 30 FPS if the container does not report a frame rate
# Create output video file
fourcc = cv2.VideoWriter_fourcc(*'mp4v')
out = cv2.VideoWriter(temp_output, fourcc, fps, (width, height))
# Process frames
final_results = {
"intrusion_detected": False,
"intruding_objects": set(),
"max_person_count": 0,
"frames_processed": 0,
"total_detections": 0
}
while True:
ret, frame = cap.read()
if not ret:
break
# Process the frame
annotated_frame, frame_results = process_image(frame)
# Update final results
final_results["frames_processed"] += 1
final_results["total_detections"] += len(frame_results["detections"])
if frame_results["intrusion_detected"]:
final_results["intrusion_detected"] = True
if frame_results["intruding_object"]:
final_results["intruding_objects"].add(frame_results["intruding_object"])
final_results["max_person_count"] = max(
final_results["max_person_count"],
frame_results["person_count"]
)
# Write the frame
out.write(annotated_frame)
# Release resources
cap.release()
out.release()
# Convert set to list for JSON serialization
final_results["intruding_objects"] = list(final_results["intruding_objects"])
# Clean up input file
os.remove(temp_input)
return {
"results": final_results,
"video_path": f"/download_video/{os.path.basename(temp_output)}"
}
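# Example client call for the video endpoint (a sketch under the same local assumptions
# as above; "clip.mp4" is a placeholder file name):
#   with open("clip.mp4", "rb") as f:
#       resp = requests.post("http://localhost:7860/process_video/",
#                            files={"file": ("clip.mp4", f, "video/mp4")})
#   summary = resp.json()
#   processed = requests.get("http://localhost:7860" + summary["video_path"])
#   open("processed.mp4", "wb").write(processed.content)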
@app.get("/download_video/{filename}")
async def download_video(filename: str):
"""
Download the processed video file.
Args:
filename: The name of the processed video file
Returns:
The video file
"""
    # Resolve against temp/ using only the base name to avoid path traversal
    file_path = os.path.join("temp", os.path.basename(filename))
if not os.path.exists(file_path):
raise HTTPException(status_code=404, detail="Video not found")
return FileResponse(file_path, media_type="video/mp4", filename="processed_video.mp4")
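# NOTE: processed outputs are kept in temp/ and are not deleted after download;
# clear the directory periodically if the app runs for a long time.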
# For local development:
# if __name__ == "__main__":
#     uvicorn.run("app:app", host="0.0.0.0", port=7860, reload=True)