# width="{width}" height="{height}" video_html = f"""

""" return video_html def retrieve_component(retrieve_function, text, splits_choice, nvids, n_component=24): if text == DEFAULT_TEXT or text == "" or text is None: return [None for _ in range(n_component)] # cannot produce more than n_compoenent nvids = min(nvids, n_component) if "Unseen" in splits_choice: splits = ["test"] else: splits = ["train", "val", "test"] datas = retrieve_function(text, splits=splits, nmax=nvids) htmls = [get_video_html(data, idx) for idx, data in enumerate(datas)] # get n_component exactly if asked less # pad with dummy blocks htmls = htmls + [None for _ in range(max(0, n_component - nvids))] return htmls if not os.path.exists("data"): gdown.download_folder( "https://drive.google.com/drive/folders/1MgPFgHZ28AMd01M1tJ7YW_1-ut3-4j08", use_cookies=False, ) device = torch.device("cuda" if torch.cuda.is_available() else "cpu") # LOADING model = load_model(device) splits = ["train", "val", "test"] all_unit_motion_embs = load_unit_motion_embs_splits(splits, device) all_keyids = load_keyids_splits(splits) h3d_index = load_json("amass-annotations/humanml3d.json") amass_to_babel = load_json("amass-annotations/amass_to_babel.json") keyid_to_url = partial(humanml3d_keyid_to_babel_rendered_url, h3d_index, amass_to_babel) retrieve_function = partial( retrieve, model, keyid_to_url, all_unit_motion_embs, all_keyids ) # DEMO theme = gr.themes.Default(primary_hue="blue", secondary_hue="gray") retrieve_and_show = partial(retrieve_component, retrieve_function) with gr.Blocks(css=CSS, theme=theme) as demo: gr.Markdown(WEBSITE) videos = [] with gr.Row(): with gr.Column(scale=3): with gr.Column(scale=2): text = gr.Textbox( placeholder="Type the motion you want to search with a sentence", show_label=True, label="Text prompt", value=DEFAULT_TEXT, ) with gr.Column(scale=1): btn = gr.Button("Retrieve", variant="primary") clear = gr.Button("Clear", variant="secondary") with gr.Row(): with gr.Column(scale=1): splits_choice = gr.Radio( ["All motions", "Unseen 
motions"], label="Gallery of motion", value="All motions", info="The motion gallery is coming from HumanML3D", ) with gr.Column(scale=1): # nvideo_slider = gr.Slider(minimum=4, maximum=24, step=4, value=8, label="Number of videos") nvideo_slider = gr.Radio( [4, 8, 12, 16, 24], label="Videos", value=8, info="Number of videos to display", ) with gr.Column(scale=2): def retrieve_example(text, splits_choice, nvideo_slider): return retrieve_and_show(text, splits_choice, nvideo_slider) examples = gr.Examples( examples=[[x, None, None] for x in EXAMPLES], inputs=[text, splits_choice, nvideo_slider], examples_per_page=20, run_on_click=False, cache_examples=False, fn=retrieve_example, outputs=[], ) i = -1 # should indent for _ in range(6): with gr.Row(): for _ in range(4): i += 1 video = gr.HTML() videos.append(video) # connect the examples to the output # a bit hacky examples.outputs = videos def load_example(example_id): processed_example = examples.non_none_processed_examples[example_id] return gr.utils.resolve_singleton(processed_example) examples.dataset.click( load_example, inputs=[examples.dataset], outputs=examples.inputs_with_examples, # type: ignore show_progress=False, postprocess=False, queue=False, ).then(fn=retrieve_example, inputs=examples.inputs, outputs=videos) btn.click( fn=retrieve_and_show, inputs=[text, splits_choice, nvideo_slider], outputs=videos, ) text.submit( fn=retrieve_and_show, inputs=[text, splits_choice, nvideo_slider], outputs=videos, ) splits_choice.change( fn=retrieve_and_show, inputs=[text, splits_choice, nvideo_slider], outputs=videos, ) nvideo_slider.change( fn=retrieve_and_show, inputs=[text, splits_choice, nvideo_slider], outputs=videos, ) def clear_videos(): return [None for x in range(24)] + [DEFAULT_TEXT] clear.click(fn=clear_videos, outputs=videos + [text]) demo.launch()

TMR: Text-to-Motion Retrieval Using Contrastive 3D Human Motion Synthesis

Mathis Petrovich, Michael J. Black, Gül Varol

arXiv 2023

Description

TMR: Text-to-Motion Retrieval Using Contrastive 3D Human Motion Synthesis

Mathis Petrovich, Michael J. Black, Gül Varol

arXiv 2023

Paper | Code | Webpage | BibTeX

Description