| import onnxruntime as ort |
| import numpy as np |
| import cv2 |
| import os |
|
|
| |
# --- Model session ---------------------------------------------------------
# Load the ONNX detection model, restricted to CPU execution.
model_path = "model.onnx"
session = ort.InferenceSession(model_path, providers=["CPUExecutionProvider"])

# --- I/O folders -----------------------------------------------------------
input_folder = "input_images"
output_folder = "output_images"
os.makedirs(output_folder, exist_ok=True)

# --- Detection constants ---------------------------------------------------
# (width, height) expected by the network input.
MODEL_INPUT_SIZE = (320, 320)

# Class index -> human-readable label, in model output order.
CLASS_NAMES = ["person", "car", "truck", "bicycle", "dog", "cat"]

# Per-class box colors, paired positionally with CLASS_NAMES.
# NOTE(review): OpenCV draws in BGR channel order — confirm the intended hues.
_COLOR_VALUES = [
    (255, 0, 0),
    (0, 255, 0),
    (0, 0, 255),
    (255, 255, 0),
    (255, 0, 255),
    (0, 255, 255),
]
CLASS_COLORS = dict(zip(CLASS_NAMES, _COLOR_VALUES))

# Fallback color for labels without an assigned color.
DEFAULT_COLOR = (200, 200, 200)
|
|
def preprocess_image(image_path):
    """Load an image and prepare it as an ONNX model input tensor.

    Args:
        image_path: Path to an image file readable by OpenCV.

    Returns:
        Tuple ``(input_tensor, original_image)`` where ``input_tensor`` is a
        float32 array of shape (1, 3, H, W), RGB, scaled to [0, 1], and
        ``original_image`` is the unmodified BGR image for drawing on.

    Raises:
        ValueError: If the file cannot be decoded as an image.
    """
    image = cv2.imread(image_path)
    if image is None:
        # cv2.imread silently returns None for unreadable or non-image
        # files; fail loudly here instead of crashing later with an
        # opaque AttributeError on .copy().
        raise ValueError(f"Could not read image: {image_path}")
    original_image = image.copy()
    image = cv2.resize(image, MODEL_INPUT_SIZE)
    image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)  # OpenCV loads BGR
    image = image.astype(np.float32) / 255.0        # scale to [0, 1]
    image = np.transpose(image, (2, 0, 1))          # HWC -> CHW
    image = np.expand_dims(image, axis=0)           # add batch dimension
    return image, original_image
|
|
def postprocess_output(output, orig_image, conf_threshold=0.5):
    """Draw detection boxes and labels from model output onto an image.

    Args:
        output: Model outputs as a sequence ``[boxes, scores, class_indices]``.
            Boxes appear to be normalized to [0, 1] relative to the original
            image size — TODO confirm against the exported model.
        orig_image: BGR image of shape (H, W, 3); annotated in place.
        conf_threshold: Minimum score for a detection to be drawn
            (default 0.5, matching the previous hard-coded value).

    Returns:
        The annotated image (the same array as ``orig_image``).
    """
    height, width, _ = orig_image.shape

    boxes = output[0]
    scores = output[1]
    class_indices = output[2]

    for i in range(len(scores)):
        if scores[i] <= conf_threshold:
            continue

        # Scale normalized box coordinates to pixel coordinates.
        x1, y1, x2, y2 = boxes[i]
        x1, y1, x2, y2 = int(x1 * width), int(y1 * height), int(x2 * width), int(y2 * height)

        class_id = int(class_indices[i])
        # Bound-check both sides: a negative id would otherwise index
        # CLASS_NAMES from the end and silently yield a wrong label.
        label = CLASS_NAMES[class_id] if 0 <= class_id < len(CLASS_NAMES) else "Unknown"
        confidence = scores[i]

        color = CLASS_COLORS.get(label, DEFAULT_COLOR)

        cv2.rectangle(orig_image, (x1, y1), (x2, y2), color, 2)

        label_text = f"{label}: {confidence:.2f}"
        text_size = cv2.getTextSize(label_text, cv2.FONT_HERSHEY_SIMPLEX, 0.5, 2)[0]
        # Clamp so the label stays inside the image when a box touches
        # the top edge (y1 - 10 would otherwise be negative).
        text_x = x1
        text_y = max(y1 - 10, text_size[1] + 5)

        # Filled background rectangle behind the text for readability.
        cv2.rectangle(orig_image, (text_x, text_y - text_size[1] - 5),
                      (text_x + text_size[0] + 5, text_y + 5), color, -1)
        cv2.putText(orig_image, label_text, (text_x, text_y),
                    cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 2)

    return orig_image
|
|
| |
# Extensions OpenCV can decode; anything else (hidden files, subfolders,
# stray text files) is skipped instead of crashing cv2.imread downstream.
IMAGE_EXTENSIONS = (".jpg", ".jpeg", ".png", ".bmp", ".tiff", ".webp")

for image_name in os.listdir(input_folder):
    image_path = os.path.join(input_folder, image_name)

    # Guard: only process regular files with a known image extension.
    if not os.path.isfile(image_path) or not image_name.lower().endswith(IMAGE_EXTENSIONS):
        print(f"Skipping non-image entry: {image_name}")
        continue

    output_path = os.path.join(output_folder, image_name)

    image_tensor, orig_image = preprocess_image(image_path)

    # Run inference; passing None as output names fetches all outputs.
    inputs = {session.get_inputs()[0].name: image_tensor}
    outputs = session.run(None, inputs)

    processed_image = postprocess_output(outputs, orig_image)
    cv2.imwrite(output_path, processed_image)

    print(f"Processed: {image_name}")

print("Processing complete! Results saved in", output_folder)
|
|