Spaces:

modelscope
/

ReplaceAnything

Running on L4

App Files Files Community

tastelikefeet committed on Jan 11, 2024

Commit

239f98e

1 Parent(s): 4d1c498

init

Browse files

Files changed (7) hide show

app.py +302 -0
css/0.png +0 -0
css/style.css +59 -0
models/DOWNLOAD_MODEL_HERE.txt +2 -0
models/sam_vit_h_4b8939.pth +3 -0
requirements.txt +2 -0
versions.py +5 -0

app.py ADDED Viewed

	@@ -0,0 +1,302 @@

+##!/usr/bin/python3
+# -*- coding: utf-8 -*-
+# @Time    : 2023-06-01
+# @Author  : ashui(Binghui Chen)
+from sympy import im
+from versions import RELEASE_NOTE, VERSION
+import time
+import cv2
+import gradio as gr
+import numpy as np
+import random
+import math
+import uuid
+import torch
+from torch import autocast
+from src.util import resize_image, HWC3, call_with_messages, upload_np_2_oss
+from src.virtualmodel import call_virtualmodel
+from src.person_detect import call_person_detect
+from src.background_generation import call_bg_genration
+import sys, os
+from PIL import Image, ImageFilter, ImageOps, ImageDraw
+from segment_anything import SamPredictor, sam_model_registry
+mobile_sam = sam_model_registry['vit_h'](checkpoint='models/sam_vit_h_4b8939.pth').to("cuda")
+mobile_sam.eval()
+mobile_predictor = SamPredictor(mobile_sam)
+colors = [(255, 0, 0), (0, 255, 0)]
+markers = [1, 5]
+# - - - - - examples  - - - - -  #
+# 输入图地址, 文本, 背景图地址, index, []
+image_examples = [
+                            ["imgs/000.jpg", "一位年轻女性身穿短袖，展示一台手机", None, 0, []],
+                            ["imgs/001.jpg", "一位年轻女性身穿短袖，手持杯子", None, 1, []],
+                            ["imgs/003.png", "一名女子身穿黑色西服，背景蓝色", "imgs/003_bg.jpg", 2, []],
+                            ["imgs/002.png", "一名年轻女性身穿裙子摆拍，背景是蓝色的", "imgs/002_bg.png", 3, []],
+                            ["imgs/bg_gen/base_imgs/1cdb9b1e6daea6a1b85236595d3e43d6.png", "水滴飞溅", None, 4, []],
+                            ["imgs/bg_gen/base_imgs/1cdb9b1e6daea6a1b85236595d3e43d6.png", "", "imgs/bg_gen/ref_imgs/df9a93ac2bca12696a9166182c4bf02ad9679aa5.jpg", 5, []],
+                            ["imgs/bg_gen/base_imgs/IMG_2941.png", "在沙漠地面上", None, 6, []],
+                            ["imgs/bg_gen/base_imgs/b2b1ed243364473e49d2e478e4f24413.png","白色地面，白色背景，光线射入，佳能",None,7,[]],
+                        ]
+img = "image_gallery/"
+files = os.listdir(img)
+files = sorted(files)
+showcases = []
+for idx, name in enumerate(files):
+        temp = os.path.join(os.path.dirname(__file__), img, name)
+        showcases.append(temp)
+def process(input_image, original_image, original_mask, selected_points, source_background, prompt, face_prompt):
+    if original_image is None or original_mask is None or len(selected_points)==0:
+        raise gr.Error('请上传输入图片并通过点击鼠标选择需要保留的物体.')
+    # load example image
+    if isinstance(original_image, int):
+            image_name = image_examples[original_image][0]
+            original_image = cv2.imread(image_name)
+            original_image = cv2.cvtColor(original_image, cv2.COLOR_BGR2RGB)
+    original_mask = np.clip(255 - original_mask, 0, 255).astype(np.uint8)
+    request_id = str(uuid.uuid4())
+    input_image_url = upload_np_2_oss(original_image, request_id+".png")
+    input_mask_url = upload_np_2_oss(original_mask, request_id+"_mask.png")
+    source_background_url = "" if source_background is None else upload_np_2_oss(source_background, request_id+"_bg.png")
+    # person detect: [[x1,y1,x2,y2,score],]
+    det_res = call_person_detect(input_image_url)
+    res = []
+    if len(det_res)>0:
+        if len(prompt)==0:
+            raise gr.Error('请输入prompt')
+        res = call_virtualmodel(input_image_url, input_mask_url, source_background_url, prompt, face_prompt)
+    else:
+        ### 这里接入主图背景生成
+        if len(prompt)==0:
+            prompt=None
+        ref_image_url=None if source_background_url =='' else source_background_url
+        original_mask=original_mask[:,:,:1]
+        base_image=np.concatenate([original_image, original_mask],axis=2)
+        base_image_url=upload_np_2_oss(base_image, request_id+"_base.png")
+        res=call_bg_genration(base_image_url,ref_image_url,prompt,ref_prompt_weight=0.5)
+    return res, request_id, True
+block = gr.Blocks(
+        css="css/style.css",
+        theme=gr.themes.Soft(
+             radius_size=gr.themes.sizes.radius_none,
+             text_size=gr.themes.sizes.text_md
+         )
+        ).queue(concurrency_count=3)
+with block:  # components and event handlers below are declared inside this Blocks context
+    with gr.Row():
+        with gr.Column():
+            gr.HTML(f"""
+                    </br>
+                    <div class="baselayout" style="text-shadow: white 0.01rem 0.01rem 0.4rem; position:fixed; z-index: 9999; top:0; left:0;right:0; background-size:100% 100%">
+                        <h1 style="text-align:center; color:white; font-size:3rem; position: relative;"> ReplaceAnything (V{VERSION})</h1>
+                    </div>
+                    </br>
+                    </br>
+                    <div style="text-align: center;">
+                        <h1 >ReplaceAnything as you want: Ultra-high quality content replacement</h1>
+                        <div style="display: flex; justify-content: center; align-items: center; text-align: center;">
+                            <a href=""></a>
+                            <a href='https://aigcdesigngroup.github.io/replace-anything/'><img src='https://img.shields.io/badge/Project_Page-ReplaceAnything-green' alt='Project Page'></a>
+                            <a href='https://github.com/AIGCDesignGroup/ReplaceAnything'><img src='https://img.shields.io/badge/Github-Repo-blue'></a>
+                        </div>
+                        </br>
+                        <h3> 我们发现，在严格保持某个“物体ID”不变的情况下生成新的内容有着很大的市场需求，同时也是具有挑战性的。为此，我们提出了ReplaceAnything框架。它可以用于很多场景，比如<b>人体替换、服装替换、物体替换以及背景替换</b>等等。</h3>
+                        <h5 style="margin: 0; color: red">如果你认为该项目有所帮助的话，不妨给我们Github点个Star以便获取最新的项目进展.</h5>
+                        </br>
+                    </div>
+            """)  # header banner; the f-string interpolates VERSION into the title
+    with gr.Tabs(elem_classes=["Tab"]):
+        with gr.TabItem("作品广场"):  # "showcase gallery" tab
+            gr.Gallery(value=showcases,  # paths collected from image_gallery/ at import time
+                        height=800,
+                        columns=4,
+                        object_fit="scale-down"
+                        )
+        with gr.TabItem("创作图像"):  # "create image" tab
+            with gr.Accordion(label="🧭 操作指南:", open=True, elem_id="accordion"):  # usage guide, open by default
+                with gr.Row(equal_height=True):
+                    with gr.Row(elem_id="ShowCase"):
+                            gr.Image(value="showcase/ra.gif")
+                    gr.Markdown("""
+                    - ⭐️ <b>step1：</b>在“输入图像”中上传or选择Example里面的一张图片
+                    - ⭐️ <b>step2：</b>通过点击鼠标选择图像中希望保留的物体
+                    - ⭐️ <b>step3：</b>输入对应的参数，例如prompt等，点击Run进行生成
+                    - ⭐️ <b>step4 (可选)：</b>此外支持换背景操作，上传目标风格背景，执行完step3后点击Run进行生成
+                    """)  # steps: choose an image, click the object to keep, enter prompt and Run, optionally add a background
+            with gr.Row():
+                with gr.Column():
+                    with gr.Column(elem_id="Input"):
+                        with gr.Row():
+                            with gr.Tabs(elem_classes=["feedback"]):
+                                with gr.TabItem("输入图像"):  # "input image" tab
+                                    input_image = gr.Image(type="numpy", label="输入图",scale=2)
+                        original_image = gr.State(value=None,label="索引")  # uploaded image array, or an int row index when an example is picked
+                        original_mask = gr.State(value=None)  # mask returned by get_point / undo_points
+                        selected_points = gr.State([],label="点选坐标")  # list of (point, label) pairs appended by get_point
+                        with gr.Row(elem_id="Seg"):
+                            radio = gr.Radio(['前景点选', '背景点选'], label='分割点选: ', value='前景点选',scale=2)  # foreground / background click mode
+                            undo_button = gr.Button('撤销点选至上一步', elem_id="btnSEG",scale=1)  # undo the last click
+                    prompt = gr.Textbox(label="Prompt (支持中英文)", placeholder="请输入期望的文本描述",value='',lines=1)
+                    run_button = gr.Button("生成图像（Run）",elem_id="btn")
+                    with gr.Accordion("更多输入参数 (推荐使用)", open=False, elem_id="accordion1"):  # extra inputs, collapsed by default
+                        with gr.Row(elem_id="Image"):
+                            with gr.Tabs(elem_classes=["feedback1"]):
+                                with gr.TabItem("风格背景图输入(可选项)"):  # optional style background image
+                                    source_background = gr.Image(type="numpy", label="背景图")
+                        face_prompt = gr.Textbox(label="人脸 Prompt (支持中英文)", value='good face, beautiful face, best quality')
+                with gr.Column():
+                    with gr.Tabs(elem_classes=["feedback"]):
+                        with gr.TabItem("输出结果"):  # "output" tab
+                            result_gallery = gr.Gallery(label='Output', show_label=False, elem_id="gallery", preview=True)
+                            recommend=gr.Button("推荐至作品广场",elem_id="recBut")  # recommend results to the showcase gallery
+                            request_id=gr.State(value="")  # id string returned by process()
+                            gallery_flag=gr.State(value=False)  # set True by process(); upload_to_img_gallery returns False after uploading
+            with gr.Row():
+                with gr.Box():
+                    def process_example(input_image, prompt, source_background, original_image, selected_points):
+                        return input_image, prompt, source_background, original_image, []
+                    example = gr.Examples(
+                        label="输入图示例",
+                        examples=image_examples,
+                        inputs=[input_image, prompt, source_background, original_image, selected_points],
+                        outputs=[input_image, prompt, source_background, original_image, selected_points],
+                        fn=process_example,
+                        run_on_click=True,
+                        examples_per_page=10
+                    )
+     # once user upload an image, the original image is stored in `original_image`
+    def store_img(img):
+        # 图片太大传输太慢了
+        if min(img.shape[0], img.shape[1]) > 1024:
+            img = resize_image(img, 1024)
+        return img, img, [], None  # when new image is uploaded, `selected_points` should be empty
+    input_image.upload(
+        store_img,
+        [input_image],
+        [input_image, original_image, selected_points, source_background]
+    )
+    # user click the image to get points, and show the points on the image
+    def segmentation(img, sel_pix):
+        # online show seg mask
+        points = []
+        labels = []
+        for p, l in sel_pix:
+            points.append(p)
+            labels.append(l)
+        mobile_predictor.set_image(img if isinstance(img, np.ndarray) else np.array(img))
+        with torch.no_grad():
+            with autocast("cuda"):
+                masks, _, _ = mobile_predictor.predict(point_coords=np.array(points), point_labels=np.array(labels), multimask_output=False)
+        output_mask = np.ones((masks.shape[1], masks.shape[2], 3))*255
+        for i in range(3):
+                output_mask[masks[0] == True, i] = 0.0
+        mask_all = np.ones((masks.shape[1], masks.shape[2], 3))
+        color_mask = np.random.random((1, 3)).tolist()[0]
+        for i in range(3):
+                mask_all[masks[0] == True, i] = color_mask[i]
+        masked_img = img / 255 * 0.3 + mask_all * 0.7
+        masked_img = masked_img*255
+        ## draw points
+        for point, label in sel_pix:
+            cv2.drawMarker(masked_img, point, colors[label], markerType=markers[label], markerSize=20, thickness=5)
+        return masked_img, output_mask
+    def get_point(img, sel_pix, point_type, evt: gr.SelectData):
+        if point_type == '前景点选':
+            sel_pix.append((evt.index, 1))   # append the foreground_point
+        elif point_type == '背景点选':
+            sel_pix.append((evt.index, 0))    # append the background_point
+        else:
+            sel_pix.append((evt.index, 1))    # default foreground_point
+        if isinstance(img, int):
+            image_name = image_examples[img][0]
+            img = cv2.imread(image_name)
+            img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
+        # online show seg mask
+        masked_img, output_mask = segmentation(img, sel_pix)
+        return masked_img.astype(np.uint8), output_mask
+    input_image.select(
+        get_point,
+        [original_image, selected_points, radio],
+        [input_image, original_mask],
+    )
+    # undo the selected point
+    def undo_points(orig_img, sel_pix):
+        # draw points
+        output_mask = None
+        if len(sel_pix) != 0:
+            if isinstance(orig_img, int):   # if orig_img is int, the image if select from examples
+                temp = cv2.imread(image_examples[orig_img][0])
+                temp = cv2.cvtColor(temp, cv2.COLOR_BGR2RGB)
+            else:
+                temp = orig_img.copy()
+            sel_pix.pop()
+            # online show seg mask
+            if len(sel_pix) !=0:
+                temp, output_mask = segmentation(temp, sel_pix)
+            return temp.astype(np.uint8), output_mask
+        else:
+            gr.Error("暂无“上一步”可撤销")
+    undo_button.click(
+        undo_points,
+        [original_image, selected_points],
+        [input_image, original_mask]
+    )
+    def upload_to_img_gallery(img, res, re_id, flag):
+        if flag:
+            if isinstance(img, int):
+                image_name = image_examples[img][0]
+                img = cv2.imread(image_name)
+                img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
+            _ = upload_np_2_oss(img, name=re_id+"_ori.jpg", gallery=True)
+            for idx, r in enumerate(res):
+                r = cv2.imread(r['name'])
+                r = cv2.cvtColor(r, cv2.COLOR_BGR2RGB)
+                _ = upload_np_2_oss(r, name=re_id+f"_res_{idx}.jpg", gallery=True)
+            flag=False
+            gr.Info("图片已经被上传完毕，待审核")
+        else:
+            gr.Info("暂无图片可推荐，或者已经推荐过一次了")
+        return flag
+    recommend.click(
+        upload_to_img_gallery,
+        [original_image, result_gallery, request_id, gallery_flag],
+        [gallery_flag]
+    )
+    ips=[input_image, original_image, original_mask, selected_points, source_background, prompt, face_prompt]
+    run_button.click(fn=process, inputs=ips, outputs=[result_gallery, request_id, gallery_flag])
+block.launch(server_name='0.0.0.0', share=False, server_port=7687)

css/0.png ADDED Viewed

css/style.css ADDED Viewed

	@@ -0,0 +1,59 @@

+.baselayout{  /* header banner div in app.py (class="baselayout") */
+  background: url('https://img.alicdn.com/imgextra/i1/O1CN016hd0V91ilWY5Xr24B_!!6000000004453-2-tps-2882-256.png') no-repeat;
+}
+#btn {  /* run button (elem_id="btn") */
+        background-color: #336699;
+        color: white;
+}
+#recBut {  /* "recommend to gallery" button (elem_id="recBut") */
+        background-color: #bb5252;
+        color: white;
+        width: 30%;
+        margin: auto;
+}
+#btnSEG {  /* undo-click button (elem_id="btnSEG") */
+        background-color: #D5F3F4;
+        color: black;
+}
+#btnCHAT {  /* NOTE(review): no element with this id appears in app.py as shown -- confirm it is still needed */
+        background-color: #B6DBF2;
+        color: black;
+}
+#accordion {  /* usage-guide accordion (elem_id="accordion") */
+        background-color: transparent;
+}
+#accordion1 {  /* extra-parameters accordion (elem_id="accordion1") */
+        background-color: #ecedee;
+}
+.feedback button.selected{  /* selected tab button in the input/output tabs (elem_classes "feedback") */
+        background-color: #6699CC;
+        color: white !important;
+}
+.feedback1 button.selected{  /* selected tab button in the background-image tabs (elem_classes "feedback1") */
+        background-color: #839ab2;
+        color: white !important;
+}
+.Tab button.selected{  /* selected tab button in the top-level tabs (elem_classes "Tab") */
+        color: red;
+        font-weight: bold;
+}
+#Image {  /* row holding the background-image input (elem_id="Image") */
+        width: 60%;
+        margin:auto;
+}
+#ShowCase {  /* row holding the demo gif (elem_id="ShowCase") */
+        width: 30%;
+        flex:none !important;
+}
+#Input {  /* column around the input image and click controls (elem_id="Input") */
+        border-style:solid;
+        border-width:1px;
+        border-color:#000000
+}
+#Seg {  /* row with the click-mode radio and undo button (elem_id="Seg") */
+        min-width: min(100px, 100%) !important;
+        width: 100%;
+        margin:auto;
+}

models/DOWNLOAD_MODEL_HERE.txt ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ 模型链接
2	+ https://vision-poster.oss-cn-shanghai.aliyuncs.com/ashui/sam_vit_h_4b8939.pth?OSSAccessKeyId=LTAI5tSPYbksBzcmooNHCYif&Expires=3599001703148669&Signature=TYznO77DKFjGNn92SnR9RbucOlU%3D

models/sam_vit_h_4b8939.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a7bf3b02f3ebf1267aba913ff637d9a2d5c33d3173bb679e46d9f338c26f262e
+size 2564550879

requirements.txt ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ dashscope
2	+ git+https://gitee.com/lllcho/segment-anything.git

versions.py ADDED Viewed

	@@ -0,0 +1,5 @@

+VERSION = '1.0.0'  # imported by app.py and interpolated into the page title
+RELEASE_NOTE = '''V1.0.0: 2023/12/20
+ - init
+'''  # imported by app.py alongside VERSION