Spaces:

ockkjs
/

Gradio3

Sleeping

App Files Files Community

ockkjs committed on Nov 7

Commit

1eb0080

1 Parent(s): 9178aac

first commit

Browse files

Files changed (7) hide show

.gitattributes +3 -0
.idea/.gitignore +5 -0
app.py +108 -0
labels.txt +19 -0
requirements.txt +6 -0
road-2.jpg +3 -0
road-3.jpeg +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+*.jpg filter=lfs diff=lfs merge=lfs -text
+*.jpeg filter=lfs diff=lfs merge=lfs -text
+*.png filter=lfs diff=lfs merge=lfs -text

.idea/.gitignore ADDED Viewed

	@@ -0,0 +1,5 @@

+# Default ignored files
+/shelf/
+/workspace.xml
+# Editor-based HTTP Client requests
+/httpRequests/

app.py ADDED Viewed

	@@ -0,0 +1,108 @@

+import gradio as gr
+from matplotlib import gridspec
+import matplotlib.pyplot as plt
+import numpy as np
+from PIL import Image
+import torch
+from transformers import AutoImageProcessor, AutoModelForSemanticSegmentation
+MODEL_ID = "nvidia/segformer-b4-finetuned-cityscapes-1024-1024"
+processor = AutoImageProcessor.from_pretrained(MODEL_ID)
+model = AutoModelForSemanticSegmentation.from_pretrained(MODEL_ID)
+def ade_palette():
+    """Return the RGB palette used to colorize segmentation classes.
+
+    The function keeps its historical name, but the palette is indexed by
+    the class ids listed in labels.txt, which has 19 entries. The palette
+    must therefore provide 19 colors: with fewer, colorizing class index 18
+    fails because that index has no palette row.
+
+    Returns:
+        A list of 19 ``[R, G, B]`` lists with values in 0-255; position ``i``
+        is the color for class index ``i``.
+    """
+    return [
+        [0, 0, 0],
+        [255, 0, 0],
+        [171, 242, 0],
+        [153, 138, 0],
+        [255, 228, 0],
+        [0, 216, 255],
+        [90, 180, 56],
+        [155, 102, 200],
+        [33, 147, 176],
+        [255, 183, 76],
+        [67, 123, 89],
+        [190, 60, 45],
+        [134, 114, 200],
+        [56, 45, 189],
+        [200, 56, 123],
+        [87, 92, 200],
+        [120, 56, 123],
+        [45, 78, 123],
+        # 19th color (class index 18, the last line of labels.txt); this
+        # entry was missing, leaving the palette one row short of the labels.
+        [119, 11, 32],
+    ]
+# Class names, one per line of labels.txt; list position is the class index.
+with open("labels.txt", "r", encoding="utf-8") as fp:
+    labels_list = [raw_line.rstrip("\n") for raw_line in fp]
+# Palette as a uint8 array so it can be indexed directly with label arrays.
+colormap = np.asarray(ade_palette(), dtype=np.uint8)
+def label_to_color_image(label):
+    """Look up the palette color for every entry of a 2-D label array.
+
+    Args:
+        label: Array of class indices; must have exactly two dimensions.
+
+    Returns:
+        ``colormap`` indexed by ``label``, i.e. one palette row per entry.
+
+    Raises:
+        ValueError: If ``label`` is not 2-D, or if its largest value has no
+            corresponding row in ``colormap``.
+    """
+    if label.ndim != 2:
+        raise ValueError("Expect 2-D input label")
+
+    palette_size = len(colormap)
+    largest_label = np.max(label)
+    if largest_label >= palette_size:
+        raise ValueError("label value too large.")
+
+    return colormap[label]
+def draw_plot(pred_img, seg_np):
+    """Build a figure with the overlay image on the left and a legend on the right.
+
+    Args:
+        pred_img: Image shown in the left panel (passed to ``imshow``).
+        seg_np: Array of class indices; it is cast to uint8 and its unique
+            values select which legend rows are drawn.
+
+    Returns:
+        The matplotlib figure containing both panels.
+    """
+    # Local import: the figure is built without pyplot so it is never added
+    # to pyplot's global figure registry. Figures made with plt.figure() stay
+    # registered until plt.close() is called, which this app never did, so
+    # every request leaked one figure.
+    from matplotlib.figure import Figure
+
+    fig = Figure(figsize=(20, 15))
+    grid_spec = gridspec.GridSpec(1, 2, width_ratios=[6, 1])
+
+    # Left panel: the blended prediction image, without axes.
+    image_ax = fig.add_subplot(grid_spec[0])
+    image_ax.imshow(pred_img)
+    image_ax.axis("off")
+
+    # One palette row per known label, shaped (num_labels, 1, 3) so that
+    # selecting rows yields a vertical strip of color swatches.
+    label_names = np.asarray(labels_list)
+    full_label_map = np.arange(len(label_names)).reshape(len(label_names), 1)
+    full_color_map = label_to_color_image(full_label_map)
+    unique_labels = np.unique(seg_np.astype("uint8"))
+
+    # Right panel: swatches for the classes present, names on the right side.
+    legend_ax = fig.add_subplot(grid_spec[1])
+    legend_ax.imshow(
+        full_color_map[unique_labels].astype(np.uint8), interpolation="nearest"
+    )
+    legend_ax.yaxis.tick_right()
+    legend_ax.set_yticks(range(len(unique_labels)))
+    legend_ax.set_yticklabels(label_names[unique_labels])
+    legend_ax.set_xticks([])
+    legend_ax.set_xticklabels([])
+    legend_ax.tick_params(width=0.0, labelsize=25)
+    return fig
+def run_inference(input_img):
+    """Segment an image and return the overlay-plus-legend figure.
+
+    Args:
+        input_img: The image from the Gradio input. A NumPy array is
+            converted to a PIL image; any other value is used as a PIL
+            image directly.
+
+    Returns:
+        The figure produced by ``draw_plot`` for the blended overlay and the
+        predicted class map.
+
+    Raises:
+        gr.Error: If no image was provided.
+    """
+    # Submitting the form without an image yields None; report that clearly
+    # instead of failing later with an AttributeError on ``None.mode``.
+    if input_img is None:
+        raise gr.Error("Please provide an input image.")
+
+    # input: numpy array from gradio -> PIL
+    img = Image.fromarray(input_img.astype(np.uint8)) if isinstance(input_img, np.ndarray) else input_img
+    if img.mode != "RGB":
+        img = img.convert("RGB")
+    inputs = processor(images=img, return_tensors="pt")
+    with torch.no_grad():
+        outputs = model(**inputs)
+        logits = outputs.logits  # (1, C, h/4, w/4)
+    # resize to original; PIL's size is (width, height), so reverse it to (H, W)
+    upsampled = torch.nn.functional.interpolate(
+        logits, size=img.size[::-1], mode="bilinear", align_corners=False
+    )
+    # per-pixel class index = channel with the highest score
+    seg = upsampled.argmax(dim=1)[0].cpu().numpy().astype(np.uint8)  # (H,W)
+    # colorize & overlay: 50/50 blend of the input image and the class colors
+    color_seg = colormap[seg]                                # (H,W,3)
+    pred_img = (np.array(img) * 0.5 + color_seg * 0.5).astype(np.uint8)
+    fig = draw_plot(pred_img, seg)
+    return fig
+# Gradio UI: one image input wired to run_inference, whose returned figure
+# is shown in a plot output.
+demo = gr.Interface(
+    fn=run_inference,
+    inputs=gr.Image(type="numpy", label="Input Image"),
+    outputs=gr.Plot(label="Overlay + Legend"),
+    # Sample images committed alongside this file.
+    examples=[
+        "road-2.jpg",
+        "road-3.jpeg",
+    ],
+    flagging_mode="never",
+    cache_examples=False,
+)
+# Start the app only when this file is run as a script, not when imported.
+if __name__ == "__main__":
+    demo.launch()

labels.txt ADDED Viewed

	@@ -0,0 +1,19 @@

+road
+sidewalk
+building
+wall
+fence
+pole
+traffic light
+traffic sign
+vegetation
+terrain
+sky
+person
+rider
+car
+truck
+bus
+train
+motorcycle
+bicycle

requirements.txt ADDED Viewed

	@@ -0,0 +1,6 @@

+torch
+transformers>=4.41.0
+gradio>=5.0.0
+Pillow
+numpy
+matplotlib

road-2.jpg ADDED Viewed

Git LFS Details

SHA256: 45b47a2019280cf41797fe32a41db266bc3311a46767c88e068e712d4230860c
Pointer size: 130 Bytes
Size of remote file: 90.8 kB

road-3.jpeg ADDED Viewed

Git LFS Details

SHA256: 8f3938362d0a5279e15e5667ee3f0617f826cbc334d151d59b69ee6b988cca56
Pointer size: 130 Bytes
Size of remote file: 12.6 kB