Sifal
/

pokemon_classification

Image Classification

Model card Files Files and versions Community

pokemon_classification / inference.py

Sifal's picture

Upload 9 files

c7f0510 verified 11 days ago

history blame contribute delete

2.23 kB

	import torch
	import argparse
	from utils.inference_utils import preprocess_image, predict
	from utils.train_utils import initialize_model
	from utils.interpretability import lime_interpret_image_inference
	from utils.data import CLASS_NAMES


	def main():
	parser = argparse.ArgumentParser(description="Image Inference")
	parser.add_argument(
	"--model_name",
	type=str,
	help="Model name (resnet, alexnet, vgg, squeezenet, densenet)",
	default="resnet",
	)
	parser.add_argument(
	"--model_weights",
	type=str,
	help="Path to the model weights",
	default="./trained_models/pokemon_resnet.pth",
	)
	parser.add_argument(
	"--image_path",
	type=str,
	help="Path to the image",
	default="./pokemonclassification/PokemonData/Chansey/57ccf27cba024fac9531baa9f619ec62.jpg",
	)
	parser.add_argument(
	"--num_classes", type=int, help="Number of classes", default=150
	)
	parser.add_argument(
	"--lime_interpretability",
	action="store_true",
	help="Whether to run interpretability or not",
	)
	parser.add_argument(
	"--classify",
	action="store_true",
	help="Whether to classify the image when saving the lime filter")

	args = parser.parse_args()

	if args.lime_interpretability:
	assert (
	args.model_name == "resnet"
	), "Interpretability is only supported for ResNet model for now"

	device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

	# Initialize the model
	model = initialize_model(args.model_name, args.num_classes)
	model = model.to(device)

	# Load the model weights
	model.load_state_dict(torch.load(args.model_weights, map_location=device))

	# Preprocess the image
	image = preprocess_image(args.image_path, (224, 224)).to(device)

	# Perform inference
	preds = torch.max(predict(model, image), 1)[1]
	print(f"Predicted class: {CLASS_NAMES[preds.item()]}")

	if args.lime_interpretability:
	lime_interpret_image_inference(args, model, image, device)


	if __name__ == "__main__":
	main()