Spaces:

jkang
/

demo-artist-classifier

Runtime error

demo-artist-classifier / gradcam_utils.py

jaekookang

first upload

af72b72 almost 3 years ago

4.77 kB

	'''
	Grad-CAM visualization utilities

	- Based on https://keras.io/examples/vision/grad_cam/

	---
	- 2021-12-18 jkang first created
	- 2022-01-16
	- copied from https://huggingface.co/spaces/jkang/demo-gradcam-imagenet/blob/main/utils.py
	- updated for artis/trend classifier
	'''
	import matplotlib.cm as cm

	import os
	import re
	from glob import glob
	import numpy as np
	import tensorflow as tf
	tfk = tf.keras
	K = tfk.backend

	# Disable GPU for testing
	# os.environ['CUDA_VISIBLE_DEVICES'] = '-1'


	def get_imagenet_classes():
	'''Retrieve all 1000 imagenet classes/labels as dictionaries'''
	classes = tfk.applications.imagenet_utils.decode_predictions(
	np.expand_dims(np.arange(1000), 0), top=1000
	)
	idx2lab = {cla[2]: cla[1] for cla in classes[0]}
	lab2idx = {idx2lab[idx]: idx for idx in idx2lab}
	return idx2lab, lab2idx


	def search_by_name(str_part):
	'''Search imagenet class by partial matching string'''
	results = [key for key in list(lab2idx.keys()) if re.search(str_part, key)]
	if len(results) != 0:
	return [(key, lab2idx[key]) for key in results]
	else:
	return []


	def get_xception_model():
	'''Get model to use'''
	base_model = tfk.applications.xception.Xception
	preprocessor = tfk.applications.xception.preprocess_input
	decode_predictions = tfk.applications.xception.decode_predictions
	last_conv_layer_name = "block14_sepconv2_act"

	model = base_model(weights='imagenet')
	grad_model = tfk.models.Model(
	inputs=[model.inputs],
	outputs=[model.get_layer(last_conv_layer_name).output,
	model.output]
	)
	return model, grad_model, preprocessor, decode_predictions


	def get_img_4d_array(image_file, image_size=(299, 299)):
	'''Load image as 4d array'''
	img = tfk.preprocessing.image.load_img(
	image_file, target_size=image_size) # PIL obj
	img_array = tfk.preprocessing.image.img_to_array(
	img) # float32 numpy array
	img_array = np.expand_dims(img_array, axis=0) # 3d -> 4d (1,299,299,3)
	return img_array


	def make_gradcam_heatmap(grad_model, img_array, pred_idx=None):
	'''Generate heatmap to overlay with
	- img_array: 4d numpy array
	- pred_idx: eg. index out of 1000 imagenet classes
	if None, argmax is chosen from prediction
	'''
	# Get gradient of pred class w.r.t. last conv activation
	with tf.GradientTape() as tape:
	last_conv_act, predictions = grad_model(img_array)
	if pred_idx == None:
	pred_idx = tf.argmax(predictions[0])
	class_channel = predictions[:, pred_idx] # (1,1000) => (1,)

	# d(class_channel/last_conv_act)
	grads = tape.gradient(class_channel, last_conv_act)
	pooled_grads = tf.reduce_mean(grads, axis=(
	0, 1, 2)) # (1,10,10,2048) => (2048,)

	# (10,10,2048) x (2048,1) => (10,10,1)
	heatmap = last_conv_act[0] @ pooled_grads[..., tf.newaxis]
	heatmap = tf.squeeze(heatmap) # (10,10)

	# Normalize heatmap between 0 and 1
	heatmap = tf.maximum(heatmap, 0) / tf.math.reduce_max(heatmap)
	return heatmap, pred_idx.numpy(), predictions.numpy().squeeze()


	def align_image_with_heatmap(img_array, heatmap, alpha=0.3, cmap='jet'):
	'''Align the image with gradcam heatmap
	- img_array: 4d numpy array
	- heatmap: output of `def make_gradcam_heatmap()` as 2d numpy array
	'''
	img_array = img_array.squeeze() # 4d => 3d

	# Rescale to 0-255 range
	heatmap_scaled = np.uint8(255 * heatmap)
	img_array_scaled = np.uint8(255 * img_array)

	colormap = cm.get_cmap(cmap)
	colors = colormap(np.arange(256))[:, :3] # mapping RGB to heatmap
	heatmap_colored = colors[heatmap_scaled] # ? still unclear

	# Make RGB colorized heatmap
	heatmap_colored = (tfk.preprocessing.image.array_to_img(heatmap_colored) # array => PIL
	.resize((img_array.shape[1], img_array.shape[0])))
	heatmap_colored = tfk.preprocessing.image.img_to_array(
	heatmap_colored) # PIL => array

	# Overlay image with heatmap
	overlaid_img = heatmap_colored * alpha + img_array_scaled
	overlaid_img = tfk.preprocessing.image.array_to_img(overlaid_img)
	return overlaid_img


	if __name__ == '__main__':
	# Test GradCAM
	examples = sorted(glob(os.path.join('examples', '*.jpg')))
	idx2lab, lab2idx = get_imagenet_classes()

	model, grad_model, preprocessor, decode_predictions = get_xception_model()

	img_4d_array = get_img_4d_array(examples[0])
	img_4d_array = preprocessor(img_4d_array)

	heatmap = make_gradcam_heatmap(grad_model, img_4d_array, pred_idx=None)

	img_pil = align_image_with_heatmap(
	img_4d_array, heatmap, alpha=0.3, cmap='jet')

	img_pil.save('test.jpg')
	print('done')