Spaces:

karlopintaric
/

instrument-recognizer-api

Running

App Files Files Community

instrument-recognizer-api / src /modeling /metrics.py

Karlo Pintaric

Upload 25 files

fdc1efd 11 months ago

raw

history blame contribute delete

No virus

6.68 kB

	import numpy as np
	from sklearn.metrics import (
	accuracy_score,
	average_precision_score,
	f1_score,
	hamming_loss,
	precision_recall_curve,
	zero_one_loss,
	)


	def hamming_score(preds, targets, thresholds: np.ndarray = None):
	    """Compute the Hamming score (``1 - Hamming loss``) of thresholded predictions.

	    The scores in ``preds`` are binarized with ``thresholds`` and the result is
	    compared with ``targets`` through ``sklearn.metrics.hamming_loss``. A higher
	    score means fewer individual label assignments are wrong.

	    :param preds: The predicted scores. Must support element-wise comparison with
	        ``thresholds`` and ``.astype`` on the result (e.g. a numpy array).
	    :type preds: numpy array
	    :param targets: The ground truth labels.
	    :type targets: numpy array
	    :param thresholds: Decision thresholds applied to ``preds``. When ``None``,
	        they are computed with ``optimize_accuracy(preds, targets)``.
	    :type thresholds: numpy array, optional
	    :return: ``1 - hamming_loss(targets, binarized_preds)``.
	    :rtype: float
	    """
	    if thresholds is None:
	        thresholds = optimize_accuracy(preds, targets)

	    # Use ``>=`` so a score equal to its threshold counts as positive: this is the
	    # rule optimize_accuracy applies while selecting the thresholds, and scoring
	    # with a different rule would evaluate predictions the search never saw.
	    preds = (preds >= thresholds).astype(int)
	    return 1 - hamming_loss(targets, preds)


	def zero_one_score(preds, targets, thresholds: np.ndarray = None):
	    """
	    Compute the zero-one score (``1 - zero-one loss``) of thresholded predictions.

	    The scores in ``preds`` are binarized with ``thresholds`` and the result is
	    compared with ``targets`` through ``sklearn.metrics.zero_one_loss`` called
	    with ``normalize=True``, so the returned value is a fraction between 0 and 1,
	    with 1 being a perfect match.

	    :param preds: The predicted scores. Must support element-wise comparison with
	        ``thresholds`` and ``.astype`` on the result (e.g. a numpy array).
	    :type preds: numpy array
	    :param targets: The ground truth labels.
	    :type targets: numpy array
	    :param thresholds: Decision thresholds applied to ``preds``. When ``None``,
	        they are computed with ``optimize_accuracy(preds, targets)``.
	    :type thresholds: numpy array, optional
	    :return: ``1 - zero_one_loss(targets, binarized_preds, normalize=True)``.
	    :rtype: float
	    """
	    if thresholds is None:
	        thresholds = optimize_accuracy(preds, targets)

	    # Use ``>=`` so a score equal to its threshold counts as positive: this is the
	    # rule optimize_accuracy applies while selecting the thresholds.
	    preds = (preds >= thresholds).astype(int)
	    return 1 - zero_one_loss(targets, preds, normalize=True)


	def mean_f1_score(preds, targets, thresholds: np.ndarray = None):
	    """Compute the sample-averaged F1 score of thresholded predictions.

	    The scores in ``preds`` are binarized with ``thresholds`` and passed to
	    ``sklearn.metrics.f1_score`` with ``average="samples"`` and
	    ``zero_division=0``. The score ranges from 0 to 1, with 1 being a perfect
	    match.

	    :param preds: The predicted scores. Must support element-wise comparison with
	        ``thresholds`` and ``.astype`` on the result (e.g. a numpy array).
	    :type preds: numpy array
	    :param targets: The ground truth labels.
	    :type targets: numpy array
	    :param thresholds: Decision thresholds applied to ``preds``. When ``None``,
	        they are computed with ``optimize_f1_score(preds, targets)``.
	    :type thresholds: numpy array, optional
	    :return: The F1 score averaged over samples.
	    :rtype: float
	    """
	    if thresholds is None:
	        thresholds = optimize_f1_score(preds, targets)

	    # precision_recall_curve (used by optimize_f1_score) reports each threshold
	    # for the rule ``score >= threshold`` and its thresholds are actual score
	    # values, so a strict ``>`` would always drop the boundary sample and
	    # evaluate a different operating point than the one that was optimized.
	    preds = (preds >= thresholds).astype(int)
	    return f1_score(targets, preds, average="samples", zero_division=0)


	def per_instr_f1_score(preds, targets, thresholds: np.ndarray = None):
	    """Compute the F1 score of thresholded predictions separately for each label.

	    The scores in ``preds`` are binarized with ``thresholds`` and passed to
	    ``sklearn.metrics.f1_score`` with ``average=None`` and ``zero_division=0``,
	    which yields one F1 value per label (instrument) instead of a single
	    aggregate. Each value ranges from 0 to 1, with 1 being a perfect match.

	    :param preds: The predicted scores. Must support element-wise comparison with
	        ``thresholds`` and ``.astype`` on the result (e.g. a numpy array).
	    :type preds: numpy array
	    :param targets: The ground truth labels.
	    :type targets: numpy array
	    :param thresholds: Decision thresholds applied to ``preds``. When ``None``,
	        they are computed with ``optimize_f1_score(preds, targets)``.
	    :type thresholds: numpy array, optional
	    :return: The F1 score of every label.
	    :rtype: numpy array
	    """
	    if thresholds is None:
	        thresholds = optimize_f1_score(preds, targets)

	    # precision_recall_curve (used by optimize_f1_score) reports each threshold
	    # for the rule ``score >= threshold`` and its thresholds are actual score
	    # values, so a strict ``>`` would always drop the boundary sample and
	    # evaluate a different operating point than the one that was optimized.
	    preds = (preds >= thresholds).astype(int)
	    return f1_score(targets, preds, average=None, zero_division=0)


	def mean_average_precision(preds, targets):
	    """
	    Compute the sample-averaged Average Precision of the predicted scores.

	    Thin wrapper around ``sklearn.metrics.average_precision_score`` called with
	    ``average="samples"``: the scores are used as-is (no thresholding), and the
	    averaging mode requested from scikit-learn is per sample rather than per
	    class. A higher value indicates a better ranking of the true labels.

	    :param preds: The predicted probabilities or scores.
	    :type preds: numpy array
	    :param targets: The ground truth labels.
	    :type targets: numpy array
	    :return: The computed average precision score.
	    :rtype: float
	    """
	    map_score = average_precision_score(y_true=targets, y_score=preds, average="samples")
	    return map_score


	def optimize_f1_score(preds, targets):
	    """
	    Find, for each label, the decision threshold that maximizes the F1 score.

	    For every column of ``preds`` the precision/recall curve is computed with
	    ``sklearn.metrics.precision_recall_curve``, the F1 score is evaluated at each
	    candidate threshold, and the threshold with the highest F1 is kept. The
	    thresholds are meant to be applied as ``score >= threshold``, which is the
	    rule ``precision_recall_curve`` uses to compute its curve.

	    :param preds: The predicted probabilities, indexed as ``[sample, label]``.
	    :type preds: numpy array
	    :param targets: The ground truth labels, indexed as ``[sample, label]``.
	    :type targets: numpy array
	    :return: The optimized threshold of every label.
	    :rtype: numpy array
	    """
	    n_labels = preds.shape[1]
	    label_thresholds = np.empty(n_labels)

	    for i in range(n_labels):
	        precision, recall, thresholds = precision_recall_curve(targets[:, i], preds[:, i])
	        # The curve ends with an extra (precision=1, recall=0) point that has no
	        # matching threshold; drop it so indices line up with ``thresholds``.
	        precision, recall = precision[:-1], recall[:-1]

	        # F1 is 0 when precision + recall == 0. A plain division yields NaN there
	        # (e.g. when the top-scored sample is a negative), and np.argmax would
	        # then pick the NaN entry instead of the best threshold.
	        denom = precision + recall
	        fscore = np.divide(
	            2 * precision * recall,
	            denom,
	            out=np.zeros_like(denom, dtype=float),
	            where=denom > 0,
	        )

	        label_thresholds[i] = thresholds[np.argmax(fscore)]

	    return label_thresholds


	def optimize_accuracy(preds, targets):
	"""
	Determine the optimal threshold for each label, based on the predicted probabilities and the true targets,
	in order to maximize the accuracy of the predictions.

	:param preds: A 2D NumPy array containing the predicted probabilities for each label.
	:type preds: numpy.ndarray
	:param targets: A 2D NumPy array containing the true binary targets for each label.
	:type targets: numpy.ndarray
	:raises ValueError: If the input arrays are not 2D arrays or have incompatible shapes.
	:return: A 1D NumPy array containing the optimal threshold for each label.
	:rtype: numpy.ndarray
	"""

	# Vary the threshold for each label and calculate accuracy for each threshold
	thresholds = np.arange(0.0001, 1, 0.0001)
	best_thresholds = np.empty(preds.shape[1])
	for i in range(preds.shape[1]):
	accuracies = []
	for th in thresholds:
	y_pred = (preds[:, i] >= th).astype(int) # Convert probabilities to binary predictions using the threshold
	acc = accuracy_score(targets[:, i], y_pred)
	accuracies.append(acc)
	# Find the threshold that gives the highest accuracy for this label
	best_idx = np.argmax(accuracies)
	best_thresholds[i] = thresholds[best_idx]

	return best_thresholds