Spaces:

tstone87
/

stance-detection

Running

App Files Files Community

stance-detection / app.py

tstone87

Update app.py

6ab3263 verified 4 months ago

raw

history blame

5.3 kB

	import sys
	import gradio as gr
	import os
	import tempfile
	import cv2
	import requests
	from ultralytics import YOLO

	# Strip the "--import" flag from argv; the original author notes that Spaces
	# might pass it as an extra CLI argument.
	sys.argv = list(filter(lambda token: token != "--import", sys.argv))

	# Weights file for the YOLO11 pose model (per the original note, it is
	# downloaded automatically if needed).
	POSE_WEIGHTS = "yolo11n-pose.pt"
	model = YOLO(POSE_WEIGHTS)

	def process_input(uploaded_file, youtube_link, image_url, sensitivity):
	    """Run pose prediction on one input and return the annotated result.

	    Exactly one input source is used, chosen by priority:
	    YouTube link > Image URL > Uploaded file.

	    Args:
	        uploaded_file: Uploaded file object exposing a ``.name`` path (a plain
	            path string is accepted too), or None.
	        youtube_link: YouTube URL; ignored when empty or whitespace-only.
	        image_url: Image URL; ignored when empty or whitespace-only.
	        sensitivity: Slider value, passed to the model as the confidence
	            threshold (``conf``).

	    Returns:
	        A 4-tuple ``(download_file_path, display_file_path, status_message,
	        dummy_state)``. Both paths are None on failure, and ``status_message``
	        then describes the error. ``dummy_state`` is always ``""``; it exists
	        only because the Gradio handlers declare four outputs.
	    """
	    youtube_link = (youtube_link or "").strip()
	    image_url = (image_url or "").strip()
	    input_path = None
	    downloaded = False  # True when input_path is a file we fetched ourselves.

	    # Priority 1: YouTube link
	    if youtube_link:
	        try:
	            from pytube import YouTube

	            stream = (
	                YouTube(youtube_link)
	                .streams.filter(file_extension="mp4", progressive=True)
	                .order_by("resolution")
	                .desc()
	                .first()
	            )
	            if stream is None:
	                return None, None, "No suitable mp4 stream found.", ""
	            input_path = stream.download()
	        except Exception as e:
	            return None, None, f"Error downloading video: {e}", ""
	        downloaded = True
	    # Priority 2: Image URL
	    elif image_url:
	        try:
	            input_path = _download_image(image_url)
	        except Exception as e:
	            return None, None, f"Error downloading image: {e}", ""
	        downloaded = True
	    # Priority 3: Uploaded file
	    elif uploaded_file is not None:
	        # Accept both file-like objects with ``.name`` and plain path strings.
	        input_path = getattr(uploaded_file, "name", uploaded_file)
	    else:
	        return None, None, "Please provide an input using one of the methods.", ""

	    try:
	        try:
	            # Pass the slider value as the confidence threshold.
	            results = model.predict(source=input_path, save=True, conf=sensitivity)
	        except Exception as e:
	            return None, None, f"Error running prediction: {e}", ""

	        try:
	            first = results[0]
	            # Prefer a path reported by the result object when it has one.
	            # NOTE(review): confirm that the installed ultralytics version
	            # actually exposes ``save_path``; otherwise the fallback below
	            # is always used.
	            output_path = getattr(first, "save_path", None)
	            if output_path is None:
	                annotated = first.plot()  # returns a numpy array
	                # Unique name so concurrent requests never overwrite each
	                # other's annotated image.
	                fd, output_path = tempfile.mkstemp(prefix="annotated_", suffix=".jpg")
	                os.close(fd)
	                if not cv2.imwrite(output_path, annotated):
	                    _remove_quietly(output_path)
	                    raise RuntimeError("could not write the annotated image")
	        except Exception as e:
	            return None, None, f"Error processing the file: {e}", ""

	        return output_path, output_path, "Success!", ""
	    finally:
	        # Clean up the temporary input if it was downloaded, on every exit
	        # path (success or error), so failed runs do not leak files.
	        if downloaded:
	            _remove_quietly(input_path)


	def _download_image(url, timeout=30):
	    """Stream *url* into a uniquely named temporary .jpg file and return its path.

	    Raises RuntimeError on a non-200 response; network errors from
	    ``requests`` propagate unchanged.
	    """
	    # The timeout keeps an unresponsive server from blocking the handler
	    # forever; the context manager releases the connection.
	    with requests.get(url, stream=True, timeout=timeout) as response:
	        if response.status_code != 200:
	            raise RuntimeError(f"HTTP {response.status_code}")
	        tmp = tempfile.NamedTemporaryFile(suffix=".jpg", delete=False)
	        try:
	            with tmp:
	                for chunk in response.iter_content(chunk_size=65536):
	                    tmp.write(chunk)
	        except Exception:
	            # Do not leave a partial download behind.
	            _remove_quietly(tmp.name)
	            raise
	        return tmp.name


	def _remove_quietly(path):
	    """Delete *path* if it exists; cleanup is best-effort and never raises."""
	    if path and os.path.exists(path):
	        try:
	            os.remove(path)
	        except OSError:
	            pass

	# Assemble the Gradio UI; the custom CSS styles the image inside the
	# "result_img" element.
	with gr.Blocks(css="""
	.result_img > img {
	width: 100%;
	height: auto;
	object-fit: contain;
	}
	""") as demo:
	    # Page header: a banner image scaled to 25% width, then the title.
	    gr.HTML("<div style='text-align:center;'><img src='/crowdresult.jpg' style='width:25%;'/></div>")
	    gr.Markdown("## Pose Detection with YOLO11-pose")

	    # Two-column layout.
	    with gr.Row():
	        # Left column: one tab per input method, plus the sensitivity slider.
	        with gr.Column(scale=1):
	            with gr.Tabs():
	                with gr.TabItem("Upload File"):
	                    file_input = gr.File(label="Upload Image/Video")
	                with gr.TabItem("YouTube Link"):
	                    youtube_input = gr.Textbox(label="YouTube Link", placeholder="https://...")
	                with gr.TabItem("Image URL"):
	                    image_url_input = gr.Textbox(label="Image URL", placeholder="https://...")
	            sensitivity_slider = gr.Slider(
	                label="Sensitivity (Confidence Threshold)",
	                minimum=0.1,
	                maximum=1.0,
	                step=0.05,
	                value=0.5,
	            )
	        # Right column: annotated result, download link and status line.
	        with gr.Column(scale=2):
	            output_display = gr.Image(label="Annotated Output", elem_classes="result_img")
	            output_file = gr.File(label="Download Annotated Output")
	            output_text = gr.Textbox(label="Status", interactive=False)

	    # Default values fed to process_input for the two input slots that the
	    # triggering component does not occupy (uploaded_file, youtube_link,
	    # image_url, in that order).
	    placeholder_defaults = (None, "", "")

	    def _connect(source, slot):
	        """Re-run process_input whenever *source* changes.

	        *source* is passed in argument position *slot*; the other two input
	        positions receive fresh gr.State placeholders, and a fourth gr.State
	        absorbs the dummy output.
	        """
	        feed = [
	            source if index == slot else gr.State(default)
	            for index, default in enumerate(placeholder_defaults)
	        ]
	        source.change(
	            fn=process_input,
	            inputs=[*feed, sensitivity_slider],
	            outputs=[output_file, output_display, output_text, gr.State()],
	        )

	    # Automatic triggers, one per input type, registered in tab order.
	    for slot, source in enumerate((file_input, youtube_input, image_url_input)):
	        _connect(source, slot)

	# Launch the app only when this file is executed as a script.
	if __name__ == "__main__":
	    demo.launch()