File size: 2,079 Bytes
fc9bdaf
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
import torch
import gradio as gr
import matplotlib.pyplot as plt
from PIL import Image
from transformers import SamModel, SamProcessor

device = 'cuda' if torch.cuda.is_available() else 'cpu'
processor = SamProcessor.from_pretrained('facebook/sam-vit-base')
model = SamModel.from_pretrained('hmdliu/sidewalks-seg-base')
model.to(device)

def segment_sidewalk(image, threshold):
    # init data
    width, height = image.size
    prompt = [0, 0, width, height]
    inputs = processor(image, input_boxes=[[prompt]], return_tensors='pt')
    # make prediction
    outputs = model(pixel_values=inputs['pixel_values'].to(device),
                    input_boxes=inputs['input_boxes'].to(device),
                    multimask_output=False)
    prob_map = torch.sigmoid(outputs.pred_masks.squeeze()).cpu().detach()
    prediction = (prob_map > threshold).float()
    prob_map, prediction = prob_map.numpy(), prediction.numpy()
    # visualize results
    save_image(image, 'image.png')
    save_image(prob_map, 'prob.png', cmap='jet')
    save_image(prediction, 'mask.png', cmap='gray')
    return Image.open('image.png'), Image.open('mask.png'), Image.open('prob.png')

def save_image(image, path, **kwargs):
    plt.figure(figsize=(8, 8))
    plt.imshow(image, interpolation='nearest', **kwargs)
    plt.axis('off')
    plt.tight_layout()
    plt.savefig(path, bbox_inches='tight', pad_inches=0)
    plt.close()

with gr.Blocks() as demo:
    with gr.Row():
        with gr.Column():
            image_input = gr.Image(type='pil', label='TIFF Image')
            threshold_slider = gr.Slider(minimum=0, maximum=1, step=0.01, value=0.5, label='Prediction Threshold')
            segment_button = gr.Button('Segment')
        with gr.Column():
            prediction = gr.Image(type='pil', label='Segmentation Result')
            prob_map = gr.Image(type='pil', label='Probability Map')
    segment_button.click(
        segment_image, 
        inputs=[image_input, threshold_slider], 
        outputs=[image_input, prediction, prob_map]
    )
demo.launch(debug=True, show_error=True)