YogaPoseClassify / ml_pose_classifier.py

Training and testing script (Python)

b26156a verified 6 months ago

44.8 kB

	#!/usr/bin/env python3
	"""
	Machine learning pose classification script.

	Features:
	1. Train classifiers on pose landmark inputs
	2. Use selected landmark coordinates as features
	3. Use folder names as class labels
	4. Train and evaluate models

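	Usage:
	python ml_pose_classifier.py [--data DATA_DIR] [--model MODEL_TYPE] [--test-size RATIO]
	[--save-model PATH] [--load-model PATH] [--predict JSON_FILE] [--evaluate TEST_DIR]
	Run with --help for the full list of options.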
	"""

	import json
	import argparse
	import numpy as np
	import time
	from pathlib import Path
	from sklearn.ensemble import RandomForestClassifier, GradientBoostingClassifier
	from sklearn.svm import SVC
	from sklearn.linear_model import LogisticRegression
	from sklearn.model_selection import train_test_split, cross_val_score
	from sklearn.metrics import classification_report, confusion_matrix, accuracy_score
	from sklearn.preprocessing import StandardScaler, LabelEncoder
	# from sklearn.pipeline import Pipeline # not used
	from sklearn.neural_network import MLPRegressor
	import joblib
	import matplotlib.pyplot as plt
	# seaborn is optional; used only for confusion matrix plotting
	# Optional dependencies: each flag records whether the corresponding feature
	# can be used, so the rest of the script can degrade gracefully.
	try:
	    import seaborn as sns
	    SEABORN_AVAILABLE = True
	except ImportError:
	    SEABORN_AVAILABLE = False

	# ONNX related imports
	try:
	    from skl2onnx import convert_sklearn
	    from skl2onnx.common.data_types import FloatTensorType
	    # onnx is not required here; we import it lazily where needed
	    ONNX_AVAILABLE = True
	except ImportError:
	    ONNX_AVAILABLE = False

	# ONNX Runtime: nothing is imported because ONNX runtime testing is not
	# implemented in this script, so the flag is a constant (the former
	# try/except guarded no import and its handler could never run).
	ONNX_RUNTIME_AVAILABLE = False


	class PoseClassifier:
	    """Pose classifier trained on per-joint landmark coordinates.

	    Bundles a scikit-learn estimator with the StandardScaler and LabelEncoder
	    fitted alongside it, and provides JSON data loading, training, prediction,
	    directory evaluation, persistence and ONNX / TFLite export.

	    With ``model_type='distilled_rf'`` a RandomForest teacher is trained first
	    and an MLPRegressor student is fitted to the teacher's class
	    probabilities; when a student exists it is preferred for prediction and
	    export.
	    """

	    def __init__(self, model_type='random_forest'):
	        """
	        Initialize the pose classifier.

	        Args:
	            model_type: model type ('random_forest', 'svm', 'gradient_boost',
	                'logistic', 'distilled_rf')
	        """
	        self.model_type = model_type
	        self.model = None
	        self.student_model = None  # student (MLP) model, set only when distillation is used
	        self.scaler = StandardScaler()
	        self.label_encoder = LabelEncoder()

	        # Joints used as features (named after MediaPipe keypoints)
	        self.target_joints = [
	            'nose',            # Head (nose as reference, but will actually be 0,0,0)
	            'left_shoulder',
	            'right_shoulder',
	            'left_elbow',
	            'right_elbow',
	            'left_wrist',
	            'right_wrist',
	            'left_hip',
	            'right_hip',
	            'left_knee',
	            'right_knee',
	            'left_ankle',
	            'right_ankle',
	        ]

	        # One x/y/z column per joint, in joint order.
	        self.feature_columns = [
	            f'{joint}_{axis}'
	            for joint in self.target_joints
	            for axis in ('x', 'y', 'z')
	        ]

	        print(f"Target joints: {len(self.target_joints)}")
	        print(f"Feature dimension: {len(self.feature_columns)}")
	        print("Joint list:", ', '.join(self.target_joints))

	    @staticmethod
	    def _softmax(scores):
	        """Return the row-wise softmax of a 2-D array (each row sums to 1)."""
	        scores = np.asarray(scores, dtype=float)
	        # Subtract the row maximum before exponentiating for numerical stability.
	        exp_scores = np.exp(scores - np.max(scores, axis=1, keepdims=True))
	        return exp_scores / np.sum(exp_scores, axis=1, keepdims=True)

	    def _get_model(self):
	        """Create a classifier based on the selected model type.

	        Raises:
	            ValueError: if ``self.model_type`` is not a supported type.
	        """
	        # 'distilled_rf' uses the same RandomForest as its teacher model.
	        if self.model_type in ('random_forest', 'distilled_rf'):
	            return RandomForestClassifier(
	                n_estimators=100,
	                max_depth=15,
	                min_samples_split=5,
	                min_samples_leaf=2,
	                random_state=42,
	                n_jobs=-1,
	            )
	        if self.model_type == 'svm':
	            return SVC(
	                C=1.0,
	                kernel='rbf',
	                gamma='scale',
	                random_state=42,
	            )
	        if self.model_type == 'gradient_boost':
	            return GradientBoostingClassifier(
	                n_estimators=100,
	                learning_rate=0.1,
	                max_depth=6,
	                random_state=42,
	            )
	        if self.model_type == 'logistic':
	            # C is the INVERSE regularization strength: C=10 regularizes less
	            # than the default of 1.0. The deprecated `multi_class` argument is
	            # not passed; the lbfgs solver already fits a multinomial model
	            # for multi-class targets.
	            return LogisticRegression(
	                C=10.0,
	                max_iter=2000,
	                solver='lbfgs',
	                random_state=42,
	                n_jobs=-1,
	            )
	        raise ValueError(f"Unsupported model type: {self.model_type}")

	    def _extract_features(self, landmarks):
	        """Flatten a landmarks mapping into the model's feature vector.

	        Args:
	            landmarks: mapping of joint name -> mapping with 'x', 'y', 'z'.

	        Returns:
	            tuple: (features, available_joints, missing_joints). Missing
	            joints and missing coordinates are filled with 0.0.
	        """
	        features = []
	        available_joints = []
	        missing_joints = []
	        for joint in self.target_joints:
	            if joint in landmarks:
	                joint_data = landmarks[joint]
	                features.extend([
	                    joint_data.get('x', 0.0),
	                    joint_data.get('y', 0.0),
	                    joint_data.get('z', 0.0),
	                ])
	                available_joints.append(joint)
	            else:
	                # If a joint is missing, fill with zeros
	                features.extend([0.0, 0.0, 0.0])
	                missing_joints.append(joint)
	        return features, available_joints, missing_joints

	    def load_data(self, data_dir):
	        """
	        Load pose data from JSON files.

	        Only sub-directories whose name starts with ``label_`` are read; the
	        directory name is used as the class label. Directories and files are
	        visited in sorted order so the sample order (and therefore the seeded
	        train/test split) is reproducible across filesystems.

	        Args:
	            data_dir: Data directory containing label folders

	        Returns:
	            tuple: (feature data, labels) as numpy arrays
	        """
	        data_path = Path(data_dir)
	        all_features = []
	        all_labels = []

	        print(f"Loading data from: {data_path}")

	        for label_dir in sorted(data_path.iterdir()):
	            if not label_dir.is_dir() or not label_dir.name.startswith('label_'):
	                continue

	            label = label_dir.name
	            json_files = sorted(label_dir.glob('*.json'))

	            print(f"Processing {label}: {len(json_files)} files")

	            for json_file in json_files:
	                try:
	                    with open(json_file, 'r', encoding='utf-8') as f:
	                        data = json.load(f)
	                    features, _, missing_joints = self._extract_features(
	                        data.get('landmarks', {})
	                    )
	                except Exception as e:
	                    # Best effort: one unreadable or malformed file must not abort loading.
	                    print(f"Error reading file {json_file}: {e}")
	                    continue

	                if len(features) == len(self.feature_columns):
	                    all_features.append(features)
	                    all_labels.append(label)
	                else:
	                    print(f"Skipping file {json_file}: feature dimension mismatch")

	                if missing_joints:
	                    print(f"File {json_file.name} missing joints: {missing_joints}")

	        print(f"Loaded {len(all_features)} samples")

	        # count samples per label
	        label_counts = {}
	        for label in all_labels:
	            label_counts[label] = label_counts.get(label, 0) + 1

	        print("Label distribution:")
	        for label, count in sorted(label_counts.items()):
	            print(f" {label}: {count} samples")

	        return np.array(all_features), np.array(all_labels)

	    def train(self, X, y, test_size=0.2):
	        """
	        Train the classifier.

	        Labels are encoded, the data is split with stratification, features
	        are standardized with a scaler fitted on the training split, and the
	        selected model (or teacher + student for 'distilled_rf') is fitted.

	        Args:
	            X: feature data
	            y: labels
	            test_size: ratio for test split

	        Returns:
	            dict: training results with keys 'train_accuracy',
	            'test_accuracy', 'cv_scores', 'confusion_matrix', 'target_names',
	            'X_test' (scaled), 'y_test' and 'y_test_pred'.
	        """
	        print(f"\nStarting training for model: {self.model_type}...")
	        print(f"Data shape: {X.shape}")
	        print(f"Number of labels: {len(np.unique(y))}")

	        # Encode labels
	        y_encoded = self.label_encoder.fit_transform(y)

	        # Split data
	        X_train, X_test, y_train, y_test = train_test_split(
	            X, y_encoded, test_size=test_size, random_state=42, stratify=y_encoded
	        )

	        print(f"Train set size: {X_train.shape[0]}")
	        print(f"Test set size: {X_test.shape[0]}")

	        # standardize features (scaler is fitted on the training split only)
	        X_train_scaled = self.scaler.fit_transform(X_train)
	        X_test_scaled = self.scaler.transform(X_test)

	        if self.model_type == 'distilled_rf':
	            print("Using distillation: train RandomForest teacher, then fit an MLPRegressor student to teacher soft labels")
	            # Train teacher
	            teacher = self._get_model()
	            teacher.fit(X_train_scaled, y_train)

	            # Teacher's probability distribution serves as soft labels
	            y_train_proba = teacher.predict_proba(X_train_scaled)

	            # Student: multi-output regression onto the probability vectors
	            student = MLPRegressor(
	                hidden_layer_sizes=(128, 64, 32),
	                activation='relu',
	                solver='adam',
	                max_iter=1000,
	                learning_rate_init=0.001,
	                random_state=42,
	                early_stopping=True,
	                validation_fraction=0.1,
	            )

	            print("Training student model to fit teacher probability outputs...")
	            print(f"Teacher probability output shape: {y_train_proba.shape}")

	            student.fit(X_train_scaled, y_train_proba)

	            # Save models
	            self.model = teacher
	            self.student_model = student

	            # Student outputs are unconstrained regressions; softmax makes
	            # each row sum to 1 (same post-processing as predict()).
	            y_train_pred_proba = self._softmax(student.predict(X_train_scaled))
	            y_test_pred_proba = self._softmax(student.predict(X_test_scaled))

	            y_train_pred = np.argmax(y_train_pred_proba, axis=1)
	            y_test_pred = np.argmax(y_test_pred_proba, axis=1)

	            print(f"Student predicted probability shape: {y_test_pred_proba.shape}")
	            print(f"Student training accuracy: {accuracy_score(y_train, y_train_pred):.4f}")
	        else:
	            # Standard flow: train a single model
	            self.model = self._get_model()
	            self.model.fit(X_train_scaled, y_train)

	            y_train_pred = self.model.predict(X_train_scaled)
	            y_test_pred = self.model.predict(X_test_scaled)

	        # compute accuracies
	        train_accuracy = accuracy_score(y_train, y_train_pred)
	        test_accuracy = accuracy_score(y_test, y_test_pred)

	        # Cross validation always uses self.model, i.e. the teacher when a
	        # student exists.
	        cv_scores = cross_val_score(self.model, X_train_scaled, y_train, cv=5)

	        print("\nTraining results:")
	        print(f"Train accuracy: {train_accuracy:.4f}")
	        print(f"Test accuracy: {test_accuracy:.4f}")
	        print(f"5-fold CV accuracy: {cv_scores.mean():.4f} ± {cv_scores.std():.4f}")

	        # classification report
	        print("\nTest set classification report:")
	        target_names = self.label_encoder.classes_
	        print(classification_report(y_test, y_test_pred, target_names=target_names))

	        # confusion matrix
	        cm = confusion_matrix(y_test, y_test_pred)

	        return {
	            'train_accuracy': train_accuracy,
	            'test_accuracy': test_accuracy,
	            'cv_scores': cv_scores,
	            'confusion_matrix': cm,
	            'target_names': target_names,
	            'X_test': X_test_scaled,
	            'y_test': y_test,
	            'y_test_pred': y_test_pred,
	        }

	    def save_model(self, filepath):
	        """Save the trained model, its preprocessing objects and metadata to disk.

	        The student model is stored too (None unless distillation was used) so
	        that a reloaded 'distilled_rf' classifier predicts with the student.
	        """
	        model_data = {
	            'model': self.model,
	            'student_model': self.student_model,
	            'scaler': self.scaler,
	            'label_encoder': self.label_encoder,
	            'model_type': self.model_type,
	            'target_joints': self.target_joints,
	            'feature_columns': self.feature_columns,
	        }
	        joblib.dump(model_data, filepath)
	        print(f"Model saved to: {filepath}")

	    def load_model(self, filepath):
	        """Load a trained model from disk.

	        NOTE: joblib files are pickles; only load files from a trusted source.
	        """
	        model_data = joblib.load(filepath)
	        self.model = model_data['model']
	        # Files written before the student was persisted lack this key.
	        self.student_model = model_data.get('student_model')
	        self.scaler = model_data['scaler']
	        self.label_encoder = model_data['label_encoder']
	        self.model_type = model_data['model_type']
	        self.target_joints = model_data['target_joints']
	        self.feature_columns = model_data['feature_columns']
	        print(f"Model loaded from: {filepath}")

	    def predict(self, X):
	        """Run prediction on input features.

	        Args:
	            X: 2-D array of unscaled features, one row per sample.

	        Returns:
	            tuple: (labels, probabilities). ``probabilities`` is None when the
	            underlying model has no ``predict_proba``.

	        Raises:
	            ValueError: if no model has been trained or loaded.
	        """
	        if self.model is None and self.student_model is None:
	            raise ValueError("Model not trained or loaded")

	        X_scaled = self.scaler.transform(X)

	        # Prefer the student model when it exists
	        if self.student_model is not None:
	            # Same softmax post-processing as in train(), so the returned
	            # rows are non-negative and sum to 1.
	            proba = self._softmax(self.student_model.predict(X_scaled))
	            preds = np.argmax(proba, axis=1)
	            labels = self.label_encoder.inverse_transform(preds)
	            return labels, proba

	        # Otherwise fall back to original model
	        predictions = self.model.predict(X_scaled)
	        probabilities = None
	        if hasattr(self.model, 'predict_proba'):
	            probabilities = self.model.predict_proba(X_scaled)
	        return self.label_encoder.inverse_transform(predictions), probabilities

	    def predict_single_json(self, json_path):
	        """
	        Predict pose class for a single JSON file.

	        Args:
	            json_path: path to the JSON file

	        Returns:
	            dict: prediction details; on failure a dict with an 'error' key
	            and 'predicted_label' set to None.

	        Raises:
	            ValueError: if no model has been trained or loaded.
	        """
	        if self.model is None and self.student_model is None:
	            raise ValueError("Model not trained or loaded")

	        try:
	            with open(json_path, 'r', encoding='utf-8') as f:
	                data = json.load(f)

	            features, available_joints, missing_joints = self._extract_features(
	                data.get('landmarks', {})
	            )

	            if len(features) != len(self.feature_columns):
	                raise ValueError(f"Feature dimension mismatch: expected {len(self.feature_columns)}, got {len(features)}")

	            # Convert to a single-row array and predict
	            X = np.array([features])
	            predictions, probabilities = self.predict(X)

	            result = {
	                'file_path': str(json_path),
	                'file_name': Path(json_path).name,
	                'predicted_label': predictions[0],
	                'confidence_scores': {},
	                'available_joints': available_joints,
	                'missing_joints': missing_joints,
	                'joint_coverage': f"{len(available_joints)}/{len(self.target_joints)}",
	            }

	            # add per-class confidence scores
	            if probabilities is not None:
	                for i, label in enumerate(self.label_encoder.classes_):
	                    result['confidence_scores'][label] = float(probabilities[0][i])

	                # highest confidence
	                max_prob_idx = np.argmax(probabilities[0])
	                result['max_confidence'] = float(probabilities[0][max_prob_idx])

	            return result

	        except Exception as e:
	            # Errors are reported in the result so batch evaluation can continue.
	            return {
	                'file_path': str(json_path),
	                'file_name': Path(json_path).name,
	                'error': str(e),
	                'predicted_label': None,
	            }

	    def evaluate_test_directory(self, test_dir):
	        """
	        Evaluate all data in a test directory.

	        Each ``label_*`` sub-directory is treated as the true label of the
	        JSON files it contains.

	        Args:
	            test_dir: path to the test data directory

	        Returns:
	            dict: per-label statistics, overall accuracy, a nested-dict
	            confusion matrix (true label -> predicted label -> count),
	            per-file results and timing statistics.

	        Raises:
	            ValueError: if no model is available or the directory is missing.
	        """
	        if self.model is None and self.student_model is None:
	            raise ValueError("Model not trained or loaded")

	        test_path = Path(test_dir)
	        if not test_path.exists():
	            raise ValueError(f"Test directory does not exist: {test_dir}")

	        # start timing
	        start_time = time.time()
	        print(f"Starting evaluation on test dataset: {test_path}")
	        print(f"Start time: {time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(start_time))}")

	        all_results = []
	        label_stats = {}
	        total_prediction_time = 0.0
	        prediction_count = 0
	        default_coverage = f"0/{len(self.target_joints)}"

	        for label_dir in sorted(test_path.iterdir()):
	            if not label_dir.is_dir() or not label_dir.name.startswith('label_'):
	                continue

	            true_label = label_dir.name
	            json_files = sorted(label_dir.glob('*.json'))

	            print(f"Evaluating {true_label}: {len(json_files)} files")

	            stats = {
	                'total': len(json_files),
	                'correct': 0,
	                'incorrect': 0,
	                'errors': 0,
	                'predictions': {},
	                'confidence_scores': [],
	                'prediction_times': [],
	            }
	            label_stats[true_label] = stats

	            for json_file in json_files:
	                # Single prediction timing
	                pred_start_time = time.time()
	                result = self.predict_single_json(json_file)
	                single_prediction_time = time.time() - pred_start_time

	                total_prediction_time += single_prediction_time
	                prediction_count += 1

	                if 'error' in result:
	                    stats['errors'] += 1
	                    print(f" Error: {json_file.name} - {result['error']}")
	                    continue

	                # Plain str so results compare and serialize like the folder names.
	                predicted_label = str(result['predicted_label'])
	                is_correct = predicted_label == true_label

	                if is_correct:
	                    stats['correct'] += 1
	                else:
	                    stats['incorrect'] += 1

	                # Count prediction distribution
	                stats['predictions'][predicted_label] = (
	                    stats['predictions'].get(predicted_label, 0) + 1
	                )

	                # Record confidence and prediction time
	                if 'max_confidence' in result:
	                    stats['confidence_scores'].append(result['max_confidence'])
	                stats['prediction_times'].append(single_prediction_time)

	                # Save detailed result
	                all_results.append({
	                    'file_path': str(json_file),
	                    'file_name': json_file.name,
	                    'true_label': true_label,
	                    'predicted_label': predicted_label,
	                    'is_correct': is_correct,
	                    'confidence': result.get('max_confidence', 0.0),
	                    'confidence_scores': result.get('confidence_scores', {}),
	                    'joint_coverage': result.get('joint_coverage', default_coverage),
	                    'prediction_time': single_prediction_time,
	                })

	        # end timing
	        end_time = time.time()
	        total_execution_time = end_time - start_time

	        # compute aggregate statistics
	        total_samples = sum(s['total'] for s in label_stats.values())
	        total_correct = sum(s['correct'] for s in label_stats.values())
	        total_errors = sum(s['errors'] for s in label_stats.values())
	        total_tested = total_samples - total_errors

	        overall_accuracy = total_correct / total_tested if total_tested > 0 else 0.0
	        avg_prediction_time = total_prediction_time / prediction_count if prediction_count > 0 else 0.0

	        # Build the confusion matrix. Columns include every label that was
	        # actually predicted, because the model may predict a class that has
	        # no folder in the test directory.
	        column_labels = sorted(
	            set(label_stats) | {r['predicted_label'] for r in all_results}
	        )
	        matrix = {
	            true_label: {pred_label: 0 for pred_label in column_labels}
	            for true_label in label_stats
	        }
	        for r in all_results:
	            matrix[r['true_label']][r['predicted_label']] += 1

	        return {
	            'label_stats': label_stats,
	            'overall_accuracy': overall_accuracy,
	            'total_samples': total_samples,
	            'total_correct': total_correct,
	            'total_errors': total_errors,
	            'total_tested': total_tested,
	            'confusion_matrix': matrix,
	            'detailed_results': all_results,
	            'timing_stats': {
	                'total_execution_time': total_execution_time,
	                'total_prediction_time': total_prediction_time,
	                'avg_prediction_time': avg_prediction_time,
	                'prediction_count': prediction_count,
	                'start_time': start_time,
	                'end_time': end_time,
	                'overhead_time': total_execution_time - total_prediction_time,
	            },
	        }

	    def print_evaluation_report(self, eval_results):
	        """
	        Print a detailed evaluation report.

	        Args:
	            eval_results: dictionary returned by evaluate_test_directory
	        """
	        timing_stats = eval_results.get('timing_stats', {})

	        print("\n" + "=" * 80)
	        print("Test dataset evaluation report")
	        print("=" * 80)

	        # Overall statistics
	        print(f"Total samples: {eval_results['total_samples']}")
	        print(f"Successfully tested: {eval_results['total_tested']}")
	        print(f"Errors: {eval_results['total_errors']}")
	        print(
	            f"Overall accuracy: {eval_results['overall_accuracy']:.4f} "
	            f"({eval_results['total_correct']}/{eval_results['total_tested']})"
	        )

	        # Timing statistics
	        if timing_stats:
	            total_time = timing_stats['total_execution_time']
	            prediction_time = timing_stats['total_prediction_time']
	            avg_time = timing_stats['avg_prediction_time']
	            overhead_time = timing_stats['overhead_time']
	            prediction_count = timing_stats['prediction_count']

	            # A zero elapsed time (empty directory, coarse clock) must not
	            # raise ZeroDivisionError.
	            throughput = prediction_count / total_time if total_time > 0 else 0.0
	            efficiency = (prediction_time / total_time) * 100 if total_time > 0 else 0.0

	            print("\nTiming statistics:")
	            print("-" * 50)
	            print(f"Total execution time: {total_time:.4f} s")
	            print(f"Total prediction time: {prediction_time:.4f} s")
	            print(f"Overhead time: {overhead_time:.4f} s")
	            print(f"Average prediction time: {avg_time * 1000:.2f} ms")
	            print(f"Prediction throughput: {throughput:.2f} preds/s")
	            print(
	                f"Prediction efficiency: {efficiency:.1f}% "
	                f"(prediction time / total)"
	            )

	        # Per-label detailed statistics
	        print("\nPer-label stats:")
	        print("-" * 80)
	        print(
	            f"{'Label':<10} {'Total':<6} {'Correct':<6} {'Wrong':<6} "
	            f"{'Accuracy':<8} {'AvgConf':<10} {'AvgPredTime':<12}"
	        )
	        print("-" * 80)

	        for label, stats in sorted(eval_results['label_stats'].items()):
	            tested = stats['total'] - stats['errors']
	            accuracy = stats['correct'] / tested if tested > 0 else 0.0
	            avg_confidence = (
	                np.mean(stats['confidence_scores']) if stats['confidence_scores'] else 0.0
	            )
	            avg_pred_time = (
	                np.mean(stats['prediction_times'])
	                if stats.get('prediction_times')
	                else 0.0
	            )

	            print(
	                f"{label:<10} {stats['total']:<6} {stats['correct']:<6} {stats['incorrect']:<6} "
	                f"{accuracy:.4f} {avg_confidence:.4f} {avg_pred_time * 1000:.2f}ms"
	            )

	        # Confusion matrix
	        print("\nConfusion matrix:")
	        print("-" * 60)
	        matrix = eval_results['confusion_matrix']
	        row_labels = sorted(eval_results['label_stats'].keys())
	        # Columns: every true label plus any extra label present in the matrix.
	        column_labels = sorted(
	            set(row_labels) | {col for row in matrix.values() for col in row}
	        )

	        # Header row. The text is bound to a name first because a backslash
	        # inside an f-string expression is a SyntaxError before Python 3.12.
	        corner = 'True\\Pred'
	        print(f"{corner:<12}", end="")
	        for label in column_labels:
	            print(f"{label:<10}", end="")
	        print()

	        # Data rows
	        for true_label in row_labels:
	            print(f"{true_label:<12}", end="")
	            row = matrix.get(true_label, {})
	            for pred_label in column_labels:
	                count = row.get(pred_label, 0)
	                print(f"{count:<10}", end="")
	            print()

	        # Per-label prediction distribution
	        print("\nPer-label prediction distribution:")
	        print("-" * 80)
	        for true_label, stats in sorted(eval_results['label_stats'].items()):
	            if stats['predictions']:
	                print(f"{true_label}:")
	                total_predictions = sum(stats['predictions'].values())
	                for pred_label, count in sorted(stats['predictions'].items()):
	                    percentage = (count / total_predictions) * 100
	                    print(f" -> {pred_label}: {count} ({percentage:.1f}%)")

	        # Error analysis
	        print("\nError analysis:")
	        print("-" * 40)
	        incorrect_results = [r for r in eval_results['detailed_results'] if not r['is_correct']]

	        if incorrect_results:
	            # Sort by confidence and show top mistaken predictions
	            incorrect_results.sort(key=lambda x: x['confidence'], reverse=True)
	            print("Highest-confidence incorrect predictions (top 10):")
	            for i, result in enumerate(incorrect_results[:10]):
	                pred_time = result.get('prediction_time', 0) * 1000  # ms
	                print(
	                    f"{i + 1:2d}. {result['file_name']}: {result['true_label']} -> {result['predicted_label']} "
	                    f"(conf: {result['confidence']:.4f}, time: {pred_time:.2f}ms)"
	                )
	        else:
	            print("No incorrect predictions found.")

	        # Performance analysis
	        if timing_stats and eval_results['detailed_results']:
	            print("\nPerformance analysis:")
	            print("-" * 40)
	            prediction_times = [
	                r['prediction_time']
	                for r in eval_results['detailed_results']
	                if 'prediction_time' in r
	            ]
	            if prediction_times:
	                min_time = min(prediction_times) * 1000
	                max_time = max(prediction_times) * 1000
	                median_time = np.median(prediction_times) * 1000
	                std_time = np.std(prediction_times) * 1000

	                print("Prediction time distribution:")
	                print(f" Fastest: {min_time:.2f}ms")
	                print(f" Slowest: {max_time:.2f}ms")
	                print(f" Median: {median_time:.2f}ms")
	                print(f" Stddev: {std_time:.2f}ms")

	        print("\n" + "=" * 80)

	    def plot_confusion_matrix(self, cm, target_names, save_path=None):
	        """Plot a confusion matrix, optionally saving it before showing it.

	        Args:
	            cm: 2-D integer array of counts (rows: true, columns: predicted).
	            target_names: class names used as tick labels.
	            save_path: if given, the figure is written there at 300 dpi.
	        """
	        fig = plt.figure(figsize=(10, 8))
	        if SEABORN_AVAILABLE:
	            sns.heatmap(
	                cm,
	                annot=True,
	                fmt='d',
	                cmap='Blues',
	                xticklabels=target_names,
	                yticklabels=target_names,
	            )
	        else:
	            # Fallback using matplotlib only
	            im = plt.imshow(cm, interpolation='nearest', cmap=plt.cm.Blues)
	            plt.colorbar(im)
	            tick_marks = np.arange(len(target_names))
	            plt.xticks(tick_marks, target_names, rotation=45, ha='right')
	            plt.yticks(tick_marks, target_names)
	            # Annotate cells; white text on the darker half of the color range
	            thresh = cm.max() / 2.0 if cm.size else 0
	            for i in range(cm.shape[0]):
	                for j in range(cm.shape[1]):
	                    plt.text(
	                        j, i, format(cm[i, j], 'd'),
	                        ha="center", va="center",
	                        color="white" if cm[i, j] > thresh else "black",
	                    )

	        plt.title(f"{self.model_type.title()} model confusion matrix")
	        plt.xlabel('Predicted')
	        plt.ylabel('True')

	        if save_path:
	            plt.savefig(save_path, dpi=300, bbox_inches='tight')
	            print(f"Confusion matrix saved to: {save_path}")

	        plt.show()
	        # Release the figure so repeated calls do not accumulate open figures.
	        plt.close(fig)

	    def export_to_onnx(self, model_type='random_forest', output_path=None):
	        """
	        Export the trained model to ONNX format (only models supported by Barracuda).
	        Note: Barracuda does not support LinearClassifier layers (e.g., LogisticRegression/SVM) — only tree models are supported.

	        When a student model exists it is exported instead of ``self.model``.
	        A companion ``<stem>_labels.json`` file with the class names and the
	        scaler parameters is written next to the ONNX file.

	        Args:
	            model_type: requested model type; if it differs from the trained
	                type a warning is printed and the trained model is exported.
	            output_path: destination file; defaults to
	                ``pose_classifier_<name>.onnx``.

	        Returns:
	            The output path on success, None on any failure.
	        """
	        if not ONNX_AVAILABLE:
	            print("Error: ONNX export is unavailable. Please install skl2onnx and onnx packages:")
	            print("pip install skl2onnx onnx")
	            return None

	        if self.model is None:
	            print("Error: Model is not trained yet. Please train the model first.")
	            return None

	        # Check if current model type matches requested export type
	        if self.model_type != model_type:
	            print(f"Warning: Currently trained {self.model_type} model, but requested to export {model_type} model")
	            print(f"Will export currently trained {self.model_type} model")
	            model_name = self.model_type
	        else:
	            model_name = model_type

	        # Barracuda only supports tree models, not LinearClassifier
	        if model_name in ('logistic', 'svm'):
	            print(f"❌ Barracuda/Unity does not support ONNX import for {model_name} models (LinearClassifier layer).")
	            print("Please use random_forest or gradient_boost for export.")
	            return None

	        # If student_model exists -> export student_model (MLP), otherwise export self.model
	        if self.student_model is not None:
	            model_to_export = self.student_model
	            export_name = 'distilled_mlp'
	            print("Detected student_model. Exporting student (MLP) to ONNX (suitable for Unity/Barracuda).")
	        else:
	            model_to_export = self.model
	            export_name = model_name

	        # Generate output file path
	        if output_path is None:
	            output_path = f"pose_classifier_{export_name}.onnx"

	        print(f"About to export model to: {output_path}, export target: {export_name}")

	        try:
	            feature_count = len(self.target_joints) * 3
	            initial_type = [('float_input', FloatTensorType([None, feature_count]))]

	            onnx_model = convert_sklearn(
	                model_to_export,
	                initial_types=initial_type,
	                target_opset=12,
	            )

	            with open(output_path, "wb") as f:
	                f.write(onnx_model.SerializeToString())

	            print(f"✅ Successfully exported {export_name} model to ONNX format: {output_path}")

	            # Derive the companion path from the file stem rather than by
	            # string replacement: when the output name has no '.onnx' suffix
	            # a replacement would yield the same path and overwrite the model.
	            onnx_file = Path(output_path)
	            label_mapping_path = onnx_file.with_name(onnx_file.stem + '_labels.json')
	            label_mapping = {
	                'label_encoder_classes': self.label_encoder.classes_.tolist(),
	                'model_type': export_name,
	                'feature_count': feature_count,
	                'target_joints': self.target_joints,
	                'description': f'Pose classifier - {len(self.target_joints)} landmarks with x,y,z coordinates',
	                'scaler_mean': self.scaler.mean_.tolist(),
	                'scaler_scale': self.scaler.scale_.tolist(),
	            }

	            with open(label_mapping_path, 'w', encoding='utf-8') as f:
	                json.dump(label_mapping, f, ensure_ascii=False, indent=2)

	            print(f"✅ Label mapping and scaler parameters saved to: {label_mapping_path}")

	            print("⚠️ Note: The exported ONNX expects inputs to be standardized with scaler_mean/scaler_scale.")

	            return output_path

	        except Exception as e:
	            print(f"❌ ONNX export failed: {str(e)}")
	            import traceback
	            traceback.print_exc()
	            return None

	    def export_to_tflite(self, output_path=None):
	        """
	        Export student_model (MLP) to TFLite format.
	        Dependencies: skl2onnx, onnx, onnx-tf, tensorflow

	        The conversion goes sklearn -> ONNX -> TensorFlow SavedModel -> TFLite.
	        Intermediate artifacts live in a temporary directory that is removed
	        even when a conversion step raises.

	        Args:
	            output_path: destination file; defaults to
	                ``pose_classifier_distilled_mlp.tflite``.

	        Returns:
	            The output path on success, None when no student model exists or
	            a dependency is missing.
	        """
	        if self.student_model is None:
	            print("❌ Only exporting student_model (MLPRegressor) to TFLite is supported. Please train with --model distilled_rf first.")
	            return None

	        try:
	            import onnx
	            from skl2onnx import convert_sklearn
	            from skl2onnx.common.data_types import FloatTensorType
	            from onnx_tf.backend import prepare
	            import tensorflow as tf
	        except ImportError:
	            print("❌ You need to install skl2onnx, onnx, onnx-tf, tensorflow.")
	            print("pip install skl2onnx onnx onnx-tf tensorflow")
	            return None

	        import tempfile

	        feature_count = len(self.target_joints) * 3
	        initial_type = [('float_input', FloatTensorType([None, feature_count]))]

	        if output_path is None:
	            output_path = "pose_classifier_distilled_mlp.tflite"

	        with tempfile.TemporaryDirectory(prefix="pose_tflite_") as work_dir:
	            # 1. Export to ONNX
	            print("Exporting student_model to ONNX...")
	            onnx_model = convert_sklearn(
	                self.student_model,
	                initial_types=initial_type,
	                target_opset=12,
	            )
	            onnx_path = str(Path(work_dir) / "temp_student.onnx")
	            with open(onnx_path, "wb") as f:
	                f.write(onnx_model.SerializeToString())
	            print(f"✅ ONNX export successful: {onnx_path}")

	            # 2. ONNX -> TensorFlow SavedModel
	            print("Converting ONNX to TensorFlow SavedModel...")
	            tf_model = prepare(onnx.load(onnx_path))
	            tf_saved_path = str(Path(work_dir) / "temp_student_tf")
	            tf_model.export_graph(tf_saved_path)
	            print(f"✅ SavedModel export successful: {tf_saved_path}")

	            # 3. SavedModel -> TFLite
	            print("Converting SavedModel to TFLite...")
	            converter = tf.lite.TFLiteConverter.from_saved_model(tf_saved_path)
	            tflite_model = converter.convert()

	        with open(output_path, "wb") as f:
	            f.write(tflite_model)
	        print(f"✅ TFLite export successful: {output_path}")

	        return output_path

	def main():
	    """Command-line entry point.

	    Modes are checked in this order: ``--test-onnx`` (placeholder, not
	    implemented), ``--evaluate``, ``--predict``; otherwise the model is
	    trained (or loaded with ``--load-model``) and optionally exported to
	    ONNX and/or TFLite.
	    """
	    model_choices = ['random_forest', 'svm', 'gradient_boost', 'logistic', 'distilled_rf']

	    parser = argparse.ArgumentParser(description="Pose classification machine learning script")
	    parser.add_argument("--data", "-d", default="PoseData", help="Pose data directory (default: PoseData)")
	    parser.add_argument(
	        "--model",
	        "-m",
	        choices=model_choices,
	        default='random_forest',
	        help="Model type (default: random_forest)",
	    )
	    parser.add_argument("--test-size", "-t", type=float, default=0.2, help="Test set ratio (default: 0.2)")
	    parser.add_argument("--save-model", "-s", help="Path to save the trained model")
	    parser.add_argument("--load-model", "-l", help="Path to load an already trained model")
	    parser.add_argument("--predict", "-p", help="Path of a single JSON file to predict")
	    parser.add_argument("--evaluate", "-e", help="Path of a test directory to evaluate all JSON files")
	    parser.add_argument("--no-plot", action="store_true", help="Do not display confusion matrix plot")
	    parser.add_argument("--train", action="store_true", help="Force training even if --load-model is provided")
	    parser.add_argument("--export-onnx", help="Export model to ONNX format; specify output file path")
	    parser.add_argument(
	        "--export-model-type",
	        choices=model_choices,
	        default=None,
	        help="Model type to export (default: the type of the trained/loaded model)",
	    )
	    parser.add_argument("--test-onnx", help="Test an ONNX model; specify ONNX file path")
	    parser.add_argument("--onnx-labels", help="ONNX label mapping JSON path (auto-detect if not provided)")
	    parser.add_argument("--onnx-test-data", help="ONNX batch test data directory (if not provided, single-sample test)")
	    parser.add_argument(
	        "--export-tflite",
	        help="Export model to TFLite format; specify output path (supported for distilled_rf student model only)",
	    )

	    args = parser.parse_args()

	    def resolve_model_path():
	        """Return --load-model, else the default pickle for --model if it exists, else None."""
	        if args.load_model:
	            return args.load_model
	        default_model = f"pose_classifier_{args.model}.pkl"
	        if Path(default_model).exists():
	            return default_model
	        print(
	            f"Error: Need to specify model file path (--load-model) or ensure default model file exists: {default_model}"
	        )
	        return None

	    print("Pose classification ML tool")
	    print("=" * 60)

	    # If ONNX test mode
	    if args.test_onnx:
	        print("ONNX model test mode")
	        print(f"ONNX model: {args.test_onnx}")
	        print("=" * 60)

	        # Note: ONNX testing is not implemented in this script; this is a placeholder.
	        print("ONNX test requested but functionality is not implemented in this script.")
	        return

	    # If evaluation mode
	    if args.evaluate:
	        args.load_model = resolve_model_path()
	        if args.load_model is None:
	            return

	        print("Evaluation mode")
	        print(f"Test data directory: {args.evaluate}")
	        print(f"Model file: {args.load_model}")
	        print("=" * 60)

	        # Create classifier and load model
	        classifier = PoseClassifier(model_type=args.model)
	        classifier.load_model(args.load_model)

	        # Perform comprehensive evaluation
	        try:
	            eval_results = classifier.evaluate_test_directory(args.evaluate)
	            classifier.print_evaluation_report(eval_results)
	        except Exception as e:
	            print(f"Error during evaluation: {e}")

	        return

	    # Prediction-only mode
	    if args.predict:
	        args.load_model = resolve_model_path()
	        if args.load_model is None:
	            return

	        print("Prediction mode")
	        print(f"JSON file: {args.predict}")
	        print(f"Model file: {args.load_model}")
	        print("=" * 60)

	        # Create classifier and load model
	        classifier = PoseClassifier(model_type=args.model)
	        classifier.load_model(args.load_model)

	        # Run prediction
	        result = classifier.predict_single_json(args.predict)

	        # Show prediction result
	        print("\nPrediction result:")
	        print(f"File: {result['file_name']}")

	        if 'error' in result:
	            print(f"Error: {result['error']}")
	        else:
	            print(f"Predicted label: {result['predicted_label']}")
	            print(f"Joint coverage: {result['joint_coverage']}")

	            if result['confidence_scores']:
	                print(f"Max confidence: {result['max_confidence']:.4f}")
	                print("\nPer-class confidence:")
	                sorted_scores = sorted(result['confidence_scores'].items(), key=lambda x: x[1], reverse=True)
	                for label, score in sorted_scores:
	                    print(f" {label}: {score:.4f}")

	            if result['missing_joints']:
	                print(f"\nMissing joints: {', '.join(result['missing_joints'])}")

	        return

	    # Training mode
	    print("Training mode")
	    print(f"Data directory: {args.data}")
	    print(f"Model type: {args.model}")
	    print(f"Test size: {args.test_size}")
	    print("=" * 60)

	    # Create classifier
	    classifier = PoseClassifier(model_type=args.model)

	    # If loading an existing model and not forcing training
	    if args.load_model and not args.train:
	        print(f"Loading existing model: {args.load_model}")
	        classifier.load_model(args.load_model)
	        print("Model loaded, skipping training step")
	    else:
	        # The data directory is only needed when actually training.
	        if not Path(args.data).exists():
	            print(f"Error: data directory does not exist: {args.data}")
	            return

	        # Load data
	        X, y = classifier.load_data(args.data)
	        if len(X) == 0:
	            print("Error: no valid data found")
	            return

	        # Train model
	        results = classifier.train(X, y, test_size=args.test_size)

	        # Plot confusion matrix (if not disabled)
	        if not args.no_plot:
	            try:
	                classifier.plot_confusion_matrix(
	                    results['confusion_matrix'], results['target_names'], save_path=f"confusion_matrix_{args.model}.png"
	                )
	            except Exception as e:
	                print(f"Error while plotting confusion matrix: {e}")

	        # Save model (explicit path, or the default path for this model type)
	        classifier.save_model(args.save_model or f"pose_classifier_{args.model}.pkl")

	        print("\nTraining complete!")
	        print(f"Final test accuracy: {results['test_accuracy']:.4f}")

	    # Export ONNX if requested
	    if args.export_onnx:
	        # Without an explicit type, export whatever model is in memory so no
	        # spurious type-mismatch warning is printed.
	        export_type = args.export_model_type or classifier.model_type
	        print(f"\nExporting {export_type} model to ONNX format...")
	        onnx_path = classifier.export_to_onnx(model_type=export_type, output_path=args.export_onnx)
	        if onnx_path:
	            print(f"✅ ONNX model exported: {onnx_path}")

	    # Export TFLite if requested
	    if args.export_tflite:
	        print("\nExporting student_model to TFLite format...")
	        tflite_path = classifier.export_to_tflite(output_path=args.export_tflite)
	        if tflite_path:
	            print(f"✅ TFLite model exported: {tflite_path}")



	# Run the command-line interface only when executed as a script.
	if __name__ == "__main__":
	    main()