Spaces:

Vvaann
/

Assignment_13-RESNET

Sleeping

App Files Files Community

Assignment_13-RESNET / app.py

Vvaann

Update app.py

5b33f29 verified almost 2 years ago

raw

history blame contribute delete

3.61 kB

	import torch
	import torchvision
	from torchvision import transforms
	import numpy as np
	import gradio as gr
	from PIL import Image
	from pytorch_grad_cam import GradCAM
	from pytorch_grad_cam.utils.image import show_cam_on_image
	from resnet_lightning import ResNet18Model
	import gradio as gr

	model = ResNet18Model.load_from_checkpoint("epoch=19-step=3920.ckpt")

	inv_normalize = transforms.Normalize(
	mean = [-0.50/0.23, -0.50/0.23, -0.50/0.23],
	std= [1/0.23, 1/0.23,1/0.23]
	)

	classes = ('plane', 'car', 'bird', 'cat', 'deer',
	'dog', 'frog', 'horse', 'ship', 'truck')

	model_layer_names = ["1", "2", "3"]

	def get_layer(layer_name):
	print("layer name:", layer_name)
	if layer_name == 1:
	return [model.layer1[-1]]
	elif layer_name == 2:
	return [model.layer2[-1]]
	elif layer_name == 3:
	return [model.layer3[-1]]
	else:
	return None

	def resize_image_pil(image, new_width, new_height):
	img = Image.fromarray(np.array(image))
	width, height = img.size

	width_scale = new_width/width
	height_scale = new_height/height
	scale = min(width_scale, height_scale)
	resized = img.resize((int(widthscale), int(heightscale)), Image.NEAREST)
	resized = resized.crop((0,0,new_width, new_height))

	return resized


	def inference(input_img, show_gradcam, layer_name, num_classes, transparancy = 0.5):
	print(show_gradcam, layer_name, num_classes, transparancy)
	input_img = resize_image_pil(input_img,32,32)
	input_img = np.array(input_img)
	org_img = input_img

	input_img= input_img.reshape((32,32,3))
	transform = transforms.ToTensor()
	input_img = transform(input_img)
	input_img = input_img.unsqueeze(0)
	outputs = model(input_img)
	# print(outputs)
	softmax = torch.nn.Softmax(dim=0)
	o = softmax(outputs.flatten())

	output_numpy = np.squeeze(np.asarray(outputs.detach().numpy()))
	index_sort = np.argsort(output_numpy)[::-1]

	confidences = {}
	for i in range(int(num_classes)):
	confidences[classes[index_sort[i]]] = float(o[index_sort[i]])


	prediction= torch.max(outputs, 1)

	if show_gradcam:
	target_layers = get_layer(layer_name)
	print("target layer",target_layers)
	cam = GradCAM(model=model, target_layers=target_layers)
	grayscale_cam = cam(input_tensor= input_img)
	grayscale_cam = grayscale_cam[0, :]
	visualization = show_cam_on_image(org_img/255,grayscale_cam,use_rgb=True,
	image_weight=transparancy)
	else:
	visualization = org_img


	return classes[int(prediction[0].item())], visualization, confidences

	demo = gr.Interface(
	inference,
	inputs = [
	gr.Image(width=256,height=256,label="Input image"),
	gr.Number(value=3, maximum=10, minimum=1,step=1.0, precision=0,label="Number of classes to display"),
	gr.Checkbox(True, label="Show GradCAM Image"),
	gr.Dropdown(model_layer_names, value=3, label="Which layer for Gradcam"),
	gr.Slider(0, 1, value=0.5,label="Overall opacity of the overlay"),
	],
	outputs = [
	gr.Label(label="Class", container=True, show_label= True),
	gr.Image(width= 256, height=256,label="Output Image"),
	gr.Label(label="Confidences", container=True, show_label= True),
	],
	title = "CIFAR 10 trained on ResNet model in pytorch lightning with Gradcam",
	description = " A simple gradio inference to infer on resnet18 model",
	examples = [["cat.jpg",1, True, 10, 0.4]]
	)

	if __name__ == "__main__":
	demo.launch()