# Hugging Face page residue (not code), preserved as comments:
# pacomesimon's picture
# ft:tabs_reordering
# 44960ec
import cv2
import numpy as np
import gradio as gr
import time
from collections import deque
import matplotlib.pyplot as plt
from ultralytics import YOLO
import os
# Dummy comment to test push
def compare_images_optical_flow(img1, img2):
    """
    Compare two frames via dense (Farneback) optical flow.

    Args:
        img1: First frame (BGR, HxWx3 uint8).
        img2: Second frame, same shape as img1.

    Returns:
        A float32 HxW array of per-pixel flow magnitudes. NOTE: the result
        is NOT normalized to 0-1 here; callers (see compute_optical_flow)
        apply cv2.normalize themselves.
    """
    # Farneback flow operates on single-channel images.
    gray1 = cv2.cvtColor(img1, cv2.COLOR_BGR2GRAY)
    gray2 = cv2.cvtColor(img2, cv2.COLOR_BGR2GRAY)
    # Standard Farneback parameters: pyr_scale 0.5, 3 levels, win 15,
    # 3 iterations, poly_n 5, poly_sigma 1.2, no flags.
    flow = cv2.calcOpticalFlowFarneback(gray1, gray2, None, 0.5, 3, 15, 3, 5, 1.2, 0)
    # Euclidean magnitude of the (dx, dy) flow field.
    return np.sqrt(flow[..., 0] ** 2 + flow[..., 1] ** 2)
# YOLO-World open-vocabulary detector; the small ("s") variant keeps
# inference feasible on CPU-only embedded systems.
model = YOLO("yolov8s-world.pt")
# Define custom classes
# Text prompts the open-vocabulary model will detect by default; the
# object-detection stream may override these from a textbox at runtime.
CUSTOM_CLASSES = ["one bird", "one airplane", "one kite","a flying object","sky"]
model.set_classes(CUSTOM_CLASSES)
def detect_birds(image):
    """Run the YOLO-World model on one frame and return the annotated frame.

    Uses a low confidence threshold (0.1) because the targets (distant
    birds/objects) are small; verbose logging is suppressed.
    """
    predictions = model(image, conf=0.1, verbose=False)
    return predictions[0].plot()
# Per-stage wall-clock timings (seconds), plotted in the histogram tab.
optical_flow_runtime = []
object_detection_runtime = []
change_detection_runtime = []
# Bundled demo videos offered as Gradio examples.
example_videos_folder = "./example_videos"
EXAMPLE_VIDEOS_LIST = os.listdir(example_videos_folder)
EXAMPLE_VIDEOS_LIST = [os.path.join(example_videos_folder, v)
                       for v in EXAMPLE_VIDEOS_LIST]
# All producers resize frames to this size before buffering.
HEIGHT_STANDARD = 480
WIDTH_STANDARD = 640
# Rolling pair of the two most recent frames (producer -> optical flow).
frame_stack = deque(maxlen=2)
# Single-slot hand-off from optical flow to a detection consumer:
# holds (curr_frame, prev_frame, flow_magnitude_normalized).
detection_stack = deque(maxlen=1)
# Mid-gray placeholder shown before any real frame is available.
fall_back_frame = np.zeros((256, 256, 3), dtype=np.uint8) + 127
flow_magnitude_normalized = np.zeros((256, 256), dtype=np.uint8)
# Cross-generator coordination flags (single shared dict, mutated in place).
FLAGS = {
    "OBJECT_DETECTING": False,
}
# Stack of selected video paths; video_stream always reads CAP[-1].
CAP = []
# Function to compute optical flow
def compute_optical_flow(mean_norm = None):
global FLAGS, flow_magnitude_normalized, frame_stack
if mean_norm is None:
mean_norm = .4
else:
mean_norm = float(mean_norm)
FLAGS["OBJECT_DETECTING"] = False
while True:
if (len(frame_stack) > 1) and not(FLAGS["OBJECT_DETECTING"]): #
prev_frame, curr_frame = frame_stack
original_height, original_width = curr_frame.shape[:2]
start_time = time.time() # Start timing
prev_frame_resized, curr_frame_resized = [
cv2.resize(
frame,
(original_width // 4, original_height // 4)
) for frame in [prev_frame, curr_frame]
]
flow_magnitude = compare_images_optical_flow(prev_frame_resized,
curr_frame_resized)
end_time = time.time() # End timing
optical_flow_runtime.append(end_time - start_time) # Append the elapsed time
flow_magnitude_normalized = cv2.normalize(flow_magnitude, None, 0, 1, cv2.NORM_MINMAX, cv2.CV_32F)
flow_magnitude_normalized = cv2.resize(
flow_magnitude_normalized,
(original_width, original_height)
)
yield flow_magnitude_normalized
if flow_magnitude_normalized.mean() < mean_norm:
detection_stack.append((curr_frame,prev_frame, flow_magnitude_normalized))
else:
yield np.stack((flow_magnitude_normalized,flow_magnitude_normalized*0, flow_magnitude_normalized*0), axis=-1)
# Function to perform object detection
def object_detection_stream(classes = ""):
    """Infinite generator: YOLO-World detection stage.

    Pops frame triples queued by the optical-flow stage, runs the detector
    on the current frame, and yields the latest annotated frame (re-yielding
    the previous one while the queue is empty).

    Args:
        classes: Comma-separated open-vocabulary class prompts; blank falls
            back to the default bird/airplane/kite/flying-object/sky set.

    Yields:
        The most recent annotated frame (gray fallback before the first
        detection).
    """
    if classes.strip() == "":
        classes = "one bird, one airplane, one kite,a flying object,sky"
    # Fix: strip whitespace so e.g. " one airplane" matches the clean
    # prompts used at module load (set_classes(CUSTOM_CLASSES)).
    classes_list = [c.strip() for c in classes.split(",")]
    global FLAGS, fall_back_frame, model
    model.set_classes(classes_list)
    detected_frame = fall_back_frame.copy()
    while True:
        if len(detection_stack) > 0:
            # Pause the optical-flow producer while inference runs.
            FLAGS["OBJECT_DETECTING"] = True
            curr_frame, prev_frame, flow_magnitude_normalized = detection_stack.pop()
            start_time = time.time()  # Start timing
            detected_frame = detect_birds(curr_frame)
            object_detection_runtime.append(time.time() - start_time)
            FLAGS["OBJECT_DETECTING"] = False
        yield detected_frame
        # Defensive reset so the producer can never be left blocked.
        FLAGS["OBJECT_DETECTING"] = False
def change_detection_stream(useless_var = None):
    """Infinite generator: contour-based change detection stage.

    Pops (frame, prev_frame, flow-magnitude) triples queued by the optical
    flow stage, binarizes the motion map, and draws a green box around each
    external contour. The `useless_var` argument exists only so Gradio can
    wire a dummy input component to this stream.
    """
    boxed = fall_back_frame.copy()
    while True:
        if len(detection_stack) > 0:
            FLAGS["OBJECT_DETECTING"] = True
            frame, _prev, motion = detection_stack.pop()
            t0 = time.time()  # Start timing
            # Binarize the 0-1 motion map at its midpoint (127/255).
            _, binary = cv2.threshold((motion*255).astype(np.uint8),
                                      127, 255, 0)
            found = cv2.findContours(binary, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
            # OpenCV 4 returns (contours, hierarchy); OpenCV 3 returned
            # (image, contours, hierarchy) — handle both.
            outlines = found[0] if len(found) == 2 else found[1]
            boxed = frame.copy()
            for outline in outlines:
                x, y, w, h = cv2.boundingRect(outline)
                cv2.rectangle(boxed, (x, y), (x + w, y + h), (0, 255, 0), 2)
            change_detection_runtime.append(time.time() - t0)  # Append the elapsed time
            FLAGS["OBJECT_DETECTING"] = False
        yield boxed
        FLAGS["OBJECT_DETECTING"] = False
def video_stream(frame_rate = ""):
    """Infinite generator: file-based frame producer.

    Reads the most recently selected video (CAP[-1]) and yields RGB frames,
    reopening the file when it ends (loops forever). Each frame is also
    resized to 640x480 and pushed onto `frame_stack` for the optical-flow
    consumer.

    Args:
        frame_rate: Frames-per-second as a Textbox string; blank -> 2.0.

    Yields:
        Full-resolution RGB frames at roughly `frame_rate` fps, or a single
        gray fallback frame when no video has been selected yet.
    """
    if frame_rate.strip() == "":
        frame_rate = 2.0
    else:
        frame_rate = float(frame_rate)
    if len(CAP) > 0:
        while True:
            cap = cv2.VideoCapture(CAP[-1])
            try:
                ret, frame = cap.read()
                while ret:
                    frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
                    frame_stack.append(
                        cv2.resize(
                            frame,
                            (WIDTH_STANDARD, HEIGHT_STANDARD)  # Resize the frame
                        )
                    )
                    yield frame
                    ret, frame = cap.read()
                    time.sleep(1/frame_rate)
            finally:
                # Fix: release the capture before reopening / on generator
                # close — the original leaked one VideoCapture per loop.
                cap.release()
    else:
        yield fall_back_frame
def yield_frame(s):
    """Infinite generator: repeatedly yields the oldest buffered frame.

    The `s` parameter is unused (Gradio wiring placeholder). NOTE(review):
    raises IndexError if called before any frame is buffered — confirm
    callers guarantee a non-empty frame_stack.
    """
    while True:
        yield frame_stack[0]
def video_stream_HIKvision(video_address, frame_rate = ""):
    """Infinite generator: RTSP/FFMPEG frame producer (Hikvision cameras).

    Opens `video_address` via the FFMPEG backend and yields RGB frames,
    pushing a 640x480 copy of each onto `frame_stack` for the optical-flow
    consumer. Yields the gray fallback frame whenever a read fails.

    Args:
        video_address: RTSP URL (or file path) to open.
        frame_rate: Frames-per-second as a Textbox string; blank -> 2.0.

    Yields:
        Full-resolution RGB frames at roughly `frame_rate` fps.
    """
    if frame_rate.strip() == "":
        frame_rate = 2.0
    else:
        frame_rate = float(frame_rate)
    cap = cv2.VideoCapture(video_address, cv2.CAP_FFMPEG)
    while True:
        ret, frame = cap.read()
        if ret:
            frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
            frame_stack.append(
                cv2.resize(
                    frame,
                    (WIDTH_STANDARD, HEIGHT_STANDARD)  # Resize the frame
                )
            )
            yield frame
            # Fix: the original issued an extra cap.read() here whose result
            # was immediately overwritten at the top of the loop, silently
            # dropping every other frame.
            time.sleep(1/frame_rate)
        else:
            yield fall_back_frame
# Gradio interface
# UI layout: six tabs pairing a video source (file / webcam / RTSP) with
# either YOLO-World object detection or contour-based change detection,
# plus a runtime-histogram tab. Each gr.Interface wraps one of the
# infinite generator functions above and streams its yields as images.
with gr.Blocks() as demo:
    gr.Markdown("### Birds Detection Real Time (suitable for CPU Embedded Systems)")
    # --- Tab 1: video file -> optical flow -> YOLO-World detection ---
    with gr.Tab("Using a custom Video"):
        with gr.Row():
            with gr.Column():
                with gr.Row():
                    video = gr.Video(label="Video Source")
                with gr.Row():
                    examples = gr.Examples(
                        examples=EXAMPLE_VIDEOS_LIST,
                        inputs=[video],
                    )
            with gr.Column():
                webcam_img = gr.Interface(video_stream,
                                          inputs=gr.Textbox(label="Acquisition: Enter the frame rate", value = 2.0), #
                                          outputs="image")
        with gr.Row():
            with gr.Column():
                optical_flow_img = gr.Interface(compute_optical_flow,
                                                inputs=gr.Slider(label="Optical Flow: Noise Tolerance", minimum=0.0, maximum=1.0, value=0.4),
                                                outputs=gr.Image(),#,"image",
                                                )
            with gr.Column():
                detection_img = gr.Interface(object_detection_stream,
                                             inputs=gr.Textbox(label="Classes: Enter the classes", value = "one bird, one airplane, one kite,a flying object,sky"),
                                             outputs="image")
        # Selecting a video pushes its path; video_stream reads CAP[-1].
        video.change(
            fn=lambda video: CAP.append(video),
            inputs=[video],
        )
    # --- Tab 2: video file -> optical flow -> change detection ---
    with gr.Tab("Using a custom Video (Change Detection)"):
        with gr.Row():
            with gr.Column():
                with gr.Row():
                    video_CD = gr.Video(label="Video Source")
                with gr.Row():
                    examples_CD = gr.Examples(
                        examples=EXAMPLE_VIDEOS_LIST,
                        inputs=[video_CD],
                    )
            with gr.Column():
                webcam_img_CD = gr.Interface(video_stream,
                                             inputs=gr.Textbox(label="Acquisition: Enter the frame rate", value = 2.0), #
                                             outputs="image")
        with gr.Row():
            with gr.Column():
                optical_flow_img_CD = gr.Interface(compute_optical_flow,
                                                   inputs=gr.Slider(label="Optical Flow: Noise Tolerance", minimum=0.0, maximum=1.0, value=0.4),
                                                   outputs=gr.Image(),#,"image",
                                                   )
            with gr.Column():
                detection_img_CD = gr.Interface(change_detection_stream,
                                                inputs=gr.Textbox(label="Change detection", value = "DUMMY"),
                                                outputs="image")
        video_CD.change(
            fn=lambda video: CAP.append(video),
            inputs=[video_CD],
        )
    # --- Tab 3: webcam -> optical flow -> YOLO-World detection ---
    with gr.Tab("Using a Real Time Camera"):
        with gr.Row():
            with gr.Column():
                webcam_img_RT = gr.Image(label="Webcam", sources="webcam")
                # Webcam frames feed frame_stack directly (no video_stream).
                webcam_img_RT.stream(lambda s: frame_stack.append(
                                                   cv2.resize(
                                                       s,
                                                       (WIDTH_STANDARD, HEIGHT_STANDARD)
                                                   )
                                               ),
                                     webcam_img_RT,
                                     time_limit=15, stream_every=1.0,
                                     concurrency_limit=30
                                     )
            with gr.Column():
                optical_flow_img_RT = gr.Interface(compute_optical_flow,
                                                   inputs=gr.Slider(label="Optical Flow: Noise Tolerance", minimum=0.0, maximum=1.0, value=0.4),
                                                   outputs="image",
                                                   )
        with gr.Row():
            with gr.Column():
                detection_img_RT = gr.Interface(object_detection_stream,
                                                inputs=gr.Textbox(label="Classes: Enter the classes",
                                                                  value = "one bird, one airplane, one kite,a flying object,sky"),
                                                outputs="image")
    # --- Tab 4: webcam -> optical flow -> change detection ---
    with gr.Tab("Using a Real Time Camera (Change Detection)"):
        with gr.Row():
            with gr.Column():
                webcam_img_RT_CD = gr.Image(label="Webcam", sources="webcam")
                webcam_img_RT_CD.stream(lambda s: frame_stack.append(
                                                      cv2.resize(
                                                          s,
                                                          (WIDTH_STANDARD, HEIGHT_STANDARD)
                                                      )
                                                  ),
                                        webcam_img_RT_CD,
                                        time_limit=15, stream_every=1.0,
                                        concurrency_limit=30
                                        )
            with gr.Column():
                optical_flow_img_RT_CD = gr.Interface(compute_optical_flow,
                                                      inputs=gr.Slider(label="Optical Flow: Noise Tolerance", minimum=0.0, maximum=1.0, value=0.4),
                                                      outputs="image",
                                                      )
        with gr.Row():
            with gr.Column():
                detection_img_RT_CD = gr.Interface(change_detection_stream,
                                                   inputs=gr.Textbox(label="Changes will be detected here",
                                                                     value = "DUMMY"),
                                                   outputs="image")
    # --- Tab 5: RTSP camera -> optical flow -> YOLO-World detection ---
    with gr.Tab("Using a Hikvision Camera"):
        with gr.Row():
            with gr.Column():
                with gr.Row():
                    video_address = gr.Textbox(label="Video Source Address")
                with gr.Row():
                    example_addresses = gr.Examples(
                        examples=EXAMPLE_VIDEOS_LIST+[
                            'rtsp://admin:Admin123@192.168.254.200:554/Streaming/Channels/101',
                            'rtsp://admin:Admin123@192.168.254.201:554/Streaming/Channels/101',
                            'rtsp://admin:Admin123@192.168.254.202:554/Streaming/Channels/101',
                            'rtsp://admin:Admin123@192.168.254.203:554/Streaming/Channels/101'
                        ],
                        inputs=[video_address],
                    )
            with gr.Column():
                webcam_img_HIKvision = gr.Interface(video_stream_HIKvision,
                                                    inputs=[video_address, gr.Textbox(label="Acquisition: Enter the frame rate", value = 2.0)], #
                                                    outputs="image")
        with gr.Row():
            with gr.Column():
                optical_flow_img = gr.Interface(compute_optical_flow,
                                                inputs=gr.Slider(label="Optical Flow: Noise Tolerance", minimum=0.0, maximum=1.0, value=0.4),
                                                outputs=gr.Image(),#,"image",
                                                )
            with gr.Column():
                detection_img = gr.Interface(object_detection_stream,
                                             inputs=gr.Textbox(label="Classes: Enter the classes", value = "one bird, one airplane, one kite,a flying object,sky"),
                                             outputs="image")
    # --- Tab 6: RTSP camera -> optical flow -> change detection ---
    with gr.Tab("Using a Hikvision Camera (Change Detection)"):
        with gr.Row():
            with gr.Column():
                with gr.Row():
                    video_address_CD = gr.Textbox(label="Hikvision Camera Address (RTSP)")
                with gr.Row():
                    example_addresses_CD = gr.Examples(
                        examples=EXAMPLE_VIDEOS_LIST+[
                            'rtsp://admin:Admin123@192.168.254.200:554/Streaming/Channels/101',
                            'rtsp://admin:Admin123@192.168.254.201:554/Streaming/Channels/101',
                            'rtsp://admin:Admin123@192.168.254.202:554/Streaming/Channels/101',
                            'rtsp://admin:Admin123@192.168.254.203:554/Streaming/Channels/101'
                        ],
                        inputs=[video_address_CD],
                    )
            with gr.Column():
                hikvision_stream_CD = gr.Interface(
                    video_stream_HIKvision,
                    inputs=[
                        video_address_CD,
                        gr.Textbox(label="Acquisition: Enter the frame rate", value=2.0)
                    ],
                    outputs="image"
                )
        with gr.Row():
            with gr.Column():
                optical_flow_img_HIK_CD = gr.Interface(
                    compute_optical_flow,
                    inputs=gr.Slider(label="Optical Flow: Noise Tolerance", minimum=0.0, maximum=1.0, value=0.4),
                    outputs="image"
                )
            with gr.Column():
                detection_img_HIK_CD = gr.Interface(
                    change_detection_stream,
                    inputs=gr.Textbox(label="Changes will be detected here", value="DUMMY"),
                    outputs="image"
                )
    # --- Tab 7: runtime histograms of the three pipeline stages ---
    with gr.Tab("Runtime Histograms"):
        def plot_histogram(data, title, color):
            # Renders a histogram to a PNG on disk, then reads it back as an
            # image array (gray placeholder if saving failed).
            plt.figure(figsize=(9, 5))
            plt.hist(data, bins=30, color=color, alpha=0.7)
            plt.title(title)
            plt.xlabel('Runtime (seconds)')
            plt.ylabel('Frequency')
            plt.grid(True)
            plt.tight_layout()
            filename = title.replace(" ", "_").lower() + ".png"
            plt.savefig(filename)
            if os.path.exists(filename):
                img_plt = cv2.imread(filename)
                return img_plt
            else:
                return np.zeros((256, 256, 3), dtype=np.uint8) + 127
        def update_optical_flow_plot():
            return plot_histogram(np.array(optical_flow_runtime), 'Histogram of Optical Flow Runtime', 'blue')
        def update_object_detection_plot():
            return plot_histogram(object_detection_runtime, 'Histogram of Object Detection Runtime', 'green')
        def update_change_detection_plot():
            return plot_histogram(change_detection_runtime, 'Histogram of Change Detection Runtime', 'red')
        with gr.Row():
            optical_flow_image = gr.Image(update_optical_flow_plot, label="Optical Flow Runtime Histogram")
        with gr.Row():
            optical_flow_button = gr.Button("Update Optical Flow Histogram")
            optical_flow_button.click(fn=update_optical_flow_plot, outputs=optical_flow_image)
        with gr.Row():
            object_detection_image = gr.Image(update_object_detection_plot, label="Object Detection Runtime Histogram")
        with gr.Row():
            object_detection_button = gr.Button("Update Object Detection Histogram")
            object_detection_button.click(fn=update_object_detection_plot, outputs=object_detection_image)
        with gr.Row():
            change_detection_image = gr.Image(update_change_detection_plot, label="Change Detection Runtime Histogram")
        with gr.Row():
            change_detection_button = gr.Button("Update Change Detection Histogram")
            change_detection_button.click(fn=update_change_detection_plot, outputs=change_detection_image)
demo.launch(debug=True)