Spaces:

luxmorocco
/

Doctoria_CXR

Sleeping

App Files Files Community

Doctoria_CXR / app.py

luxmorocco

Update app.py

d05d494 verified 11 months ago

raw

history blame

12.1 kB

	import streamlit as st
	import matplotlib.pyplot as plt
	import matplotlib.patches as patches
	from torchvision import transforms
	from PIL import Image
	import torch
	from torchvision.models.detection import fasterrcnn_resnet50_fpn
	from torchvision.models.detection.faster_rcnn import FastRCNNPredictor
	import cv2
	import numpy as np
	from matplotlib.colors import LinearSegmentedColormap

	# Function Definitions

	label_names = [
	"Aortic_enlargement", "Atelectasis", "Calcification", "Cardiomegaly",
	"Consolidation", "ILD", "Infiltration", "Lung_Opacity", "Nodule/Mass",
	"Other_lesion", "Pleural_effusion", "Pleural_thickening", "Pneumothorax",
	"Pulmonary_fibrosis"
	]

	class VinDetector(pl.LightningModule):
	def __init__(self, **kwargs):
	super().__init__()

	self.model = models.detection.fasterrcnn_resnet50_fpn(pretrained=True)
	num_classes = 15
	in_features = self.model.roi_heads.box_predictor.cls_score.in_features
	self.model.roi_heads.box_predictor = FastRCNNPredictor(in_features, num_classes)

	self.learning_rate = 1e-3
	self.batch_size = 4

	def forward(self, x):
	return self.model(x)

	def prepare_data(self):

	df = pd.read_csv('../input/vinbigdata-chest-xray-abnormalities-detection/train.csv')
	df = df[df['class_id'] != 14].reset_index(drop=True)
	self.train_dataset = VBDDataset(df, '../input/vinbigdata-chest-xray-original-png/train', get_train_transform())

	def train_dataloader(self):

	return DataLoader(self.train_dataset, batch_size=self.batch_size, shuffle=True, pin_memory=True, num_workers=4, collate_fn=collate_fn)

	def training_step(self, batch, batch_idx):
	images, targets = batch
	targets = [{k: v for k, v in t.items()} for t in targets]

	loss_dict = self.model(images, targets)
	loss = sum(loss for loss in loss_dict.values())
	self.log('Loss', loss, on_step=True, on_epoch=True, prog_bar=True)
	return {"loss": loss}

	def configure_optimizers(self):
	optimizer = torch.optim.SGD(self.model.parameters(), lr=self.learning_rate, momentum=0.95, weight_decay=1e-5, nesterov=True)
	scheduler = torch.optim.lr_scheduler.CosineAnnealingLR(optimizer, T_max=6, eta_min=0, verbose=True)
	return [optimizer], [scheduler]


	#VBDDataset Class
	class VBDDataset(Dataset):

	def __init__(self, dataframe, image_dir, transforms=None, phase='train'):
	super().__init__()


	self.image_ids = dataframe['image_id'].unique()
	self.df = dataframe
	self.image_dir = image_dir
	self.transforms = transforms
	self.phase = phase

	def __getitem__(self, idx):

	image_id = self.image_ids[idx]
	records = self.df[self.df['image_id'] == image_id]


	image = cv2.imread(f'{self.image_dir}/{image_id}.png', cv2.IMREAD_COLOR)
	image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB).astype(np.float32)
	image /= 255.0


	if self.phase == 'test':
	if self.transforms:
	sample = {
	'image': image,
	}
	sample = self.transforms(**sample)
	image = sample['image']
	return image, image_id


	boxes = records[['x_min', 'y_min', 'x_max', 'y_max']].values


	area = (boxes[:, 3] - boxes[:, 1]) * (boxes[:, 2] - boxes[:, 0])
	area = torch.as_tensor(area, dtype=torch.float32)


	labels = torch.squeeze(torch.as_tensor((records.class_id.values+1,), dtype=torch.int64))
	iscrowd = torch.zeros((records.shape[0],), dtype=torch.int64)


	target = {}
	target['boxes'] = boxes
	target['labels'] = labels
	target['area'] = area
	target['image_id'] = torch.tensor([idx])
	target['iscrowd'] = iscrowd


	if self.transforms:
	sample = {
	'image': image,
	'bboxes': target['boxes'],
	'labels': labels
	}
	sample = self.transforms(**sample)
	image = sample['image']

	target['boxes'] = torch.as_tensor(sample['bboxes'])

	return image, target

	def __len__(self):

	return self.image_ids.shape[0]


	def get_train_transform():
	return A.Compose([
	A.Flip(0.5),
	ToTensorV2(p=1.0)
	], bbox_params={'format': 'pascal_voc', 'label_fields': ['labels']})

	def get_valid_transform():
	return A.Compose([
	ToTensorV2(p=1.0)
	])


	def collate_fn(batch):
	return tuple(zip(*batch))



	def format_prediction_string(labels, boxes, scores):
	pred_strings = []
	for j in zip(labels, scores, boxes):
	pred_strings.append("{0} {1:.4f} {2} {3} {4} {5}".format(
	j[0], j[1], j[2][0], j[2][1], j[2][2], j[2][3]))
	return " ".join(pred_strings)

	def generate_diagnostic_report(predictions, labels, threshold=0.5):
	# Initialize an empty report string
	report = "Diagnostic Report:\n\n"
	findings_present = False

	# Loop through each detection
	for element in range(len(predictions['boxes'])):
	score = predictions['scores'][element].cpu().numpy()
	if score > threshold:
	label_index = predictions['labels'][element].cpu().numpy() - 1
	label_name = labels[label_index]
	report += f"- {label_name} detected with probability {score:.2f}\n"
	findings_present = True

	# If no findings above the threshold, report no significant abnormalities
	if not findings_present:
	report += "No significant abnormalities detected."

	return report

	def draw_boxes_cv2(image, boxes, labels, scores, threshold=0.5, font_scale=1.0, thickness=3):
	# Define your labels and their corresponding colors
	label_names = [
	"Aortic_enlargement", "Atelectasis", "Calcification", "Cardiomegaly",
	"Consolidation", "ILD", "Infiltration", "Lung_Opacity", "Nodule/Mass",
	"Other_lesion", "Pleural_effusion", "Pleural_thickening", "Pneumothorax",
	"Pulmonary_fibrosis"
	]

	label2color = [
	[59, 238, 119], [222, 21, 229], [94, 49, 164], [206, 221, 133], [117, 75, 3],
	[210, 224, 119], [211, 176, 166], [63, 7, 197], [102, 65, 77], [194, 134, 175],
	[209, 219, 50], [255, 44, 47], [89, 125, 149], [110, 27, 100]
	]

	for i, box in enumerate(boxes):
	if scores[i] > threshold:
	# Subtract 1 from label_index to match the zero-indexed Python list
	label_index = labels[i] - 1
	label_name = label_names[label_index] if label_index < len(label_names) else "Unknown"
	color = label2color[label_index] if label_index < len(label2color) else (255, 255, 255) # Default to white for unknown labels

	label_text = f'{label_name}: {scores[i]:.2f}'
	cv2.rectangle(image, (int(box[0]), int(box[1])), (int(box[2]), int(box[3])), color, thickness)
	cv2.putText(image, label_text, (int(box[0]), int(box[1] - 10)), cv2.FONT_HERSHEY_SIMPLEX, font_scale, color, thickness)

	return image

	# Heatmap Generation Function
	def plot_image_with_colored_mask_overlay_and_original(image, predictions):
	# Assuming predictions are in the same format as Faster R-CNN outputs
	boxes = predictions['boxes'].cpu().numpy()
	scores = predictions['scores'].cpu().numpy()

	# Create a blank mask matching image size
	mask = np.zeros(image.shape[:2], dtype=np.float32)

	# Fill mask based on bounding boxes and scores
	for box, score in zip(boxes, scores):
	if score > 0.5: # Threshold can be adjusted
	x_min, y_min, x_max, y_max = map(int, box)
	mask[y_min:y_max, x_min:x_max] += score # Increase mask intensity with score

	# Normalize mask
	normed_mask = cv2.normalize(mask, None, alpha=0, beta=1, norm_type=cv2.NORM_MINMAX, dtype=cv2.CV_32F)

	# Create a custom colormap with transparency
	colors = [(0, 0, 0, 0), (0, 0, 1, 1), (0, 1, 0, 1), (1, 1, 0, 1), (1, 0, 0, 1)]
	cmap_name = 'doctoria_heatmap'
	custom_cmap = LinearSegmentedColormap.from_list(cmap_name, colors, N=256)

	# Apply custom colormap
	heatmap = custom_cmap(normed_mask)

	# Convert heatmap to BGR format with uint8 type
	heatmap_bgr = (heatmap[:, :, 2::-1] * 255).astype(np.uint8)

	# Overlay heatmap on original image
	overlayed_image = image.copy()
	overlayed_image[mask > 0] = overlayed_image[mask > 0] * 0.5 + heatmap_bgr[mask > 0] * 0.5

	# Plotting
	fig, axs = plt.subplots(1, 2, figsize=[12, 6])

	# Original image
	axs[0].imshow(cv2.cvtColor(image, cv2.COLOR_BGR2RGB))
	axs[0].set_title('Original Image')
	axs[0].axis('off')

	# Image with heatmap
	axs[1].imshow(cv2.cvtColor(overlayed_image, cv2.COLOR_BGR2RGB))
	axs[1].set_title('Image with Heatmap Overlay')
	axs[1].axis('off')

	# Adding colorbar
	sm = plt.cm.ScalarMappable(cmap=custom_cmap, norm=plt.Normalize(0, 1))
	sm.set_array([])
	fig.colorbar(sm, ax=axs[1], orientation='vertical', fraction=0.046, pad=0.04)

	plt.show()


	# Load the model
	def create_model(num_classes):
	model = fasterrcnn_resnet50_fpn(pretrained=False)
	in_features = model.roi_heads.box_predictor.cls_score.in_features
	model.roi_heads.box_predictor = FastRCNNPredictor(in_features, num_classes)
	return model


	# Streamlit app title
	st.title("Doctoria CXR")

	# Sidebar for user input
	st.sidebar.title("Upload Chest X-ray Image")

	# File uploader allows user to add their own image
	uploaded_file = st.sidebar.file_uploader("Upload Chest X-ray image", type=["png", "jpg", "jpeg"])

	# Load the model (use your model loading function)
	# Ensure the model path is correct and accessible

	#model = create_model(num_classes=15)
	#model.load_state_dict(torch.load('Doctoria CXR Thoraric Full Model.pth', map_location=torch.device('cpu')))
	#model.eval()

	def load_model(model_path):
	# Create an instance of the VinDetector model
	model = VinDetector(num_classes=14) # Adjust num_classes as needed

	# Load the saved state_dict
	model.load_state_dict(torch.load(model_path, map_location=torch.device('cpu')))

	model.eval() # Set the model to evaluation mode
	return model

	model = load_model('Doctoria CXR Thoraric Full Model.pth')

	def process_image(image_path):
	# Load and transform the image
	image = Image.open(image_path).convert('RGB')
	transform = get_transform()
	image = transform(image).unsqueeze(0)

	# Perform inference
	with torch.no_grad():
	prediction = model(image)

	return prediction, image

	# When the user uploads a file
	if uploaded_file is not None:
	# Display the uploaded image
	st.image(uploaded_file, caption="Uploaded X-ray", use_column_width=True)
	st.write("")

	# Process the uploaded image
	prediction, image_tensor = process_image(uploaded_file)

	# Convert tensor to PIL Image for display
	image_pil = transforms.ToPILImage()(image_tensor.squeeze(0)).convert("RGB")

	# Visualization and report generation
	image_np = np.array(image_pil)
	for element in range(len(prediction[0]['boxes'])):
	box = prediction[0]['boxes'][element].cpu().numpy()
	score = prediction[0]['scores'][element].cpu().numpy()
	label_index = prediction[0]['labels'][element].cpu().numpy()
	if score > 0.5:
	draw_boxes_cv2(image_np, [box], [label_index], [score], font_scale=3) # Increased font size

	image_pil_processed = Image.fromarray(image_np)

	# Display processed image
	st.image(image_pil_processed, caption="Processed X-ray with Abnormalities Marked", use_column_width=True)

	# Generate the diagnostic report
	report = generate_diagnostic_report(prediction[0], label_names, 0.5)
	st.write(report)

	# Instructions
	st.sidebar.write("Instructions:")
	st.sidebar.write("1. Upload an X-ray image.")
	st.sidebar.write("2. View the processed image and diagnostic report.")