Spaces:

cmu-gil
/

BrickGPT-Demo

Running on Zero

File size: 9,247 Bytes

def3000
 
5218da5
def3000
 
 
 
 
 
 
 
bce7f3d
def3000
972de2b
def3000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5d131e0
cc9cd8f
def3000
 
972de2b
5218da5
 
 
 
def3000
 
f75356d
 
def3000
 
 
 
 
 
 
972de2b
 
def3000
 
 
 
6e12b3d
972de2b
 
def3000
 
 
5218da5
def3000
 
 
7105ff7
def3000
 
 
 
 
 
 
 
 
 
 
 
 
 
b24c174
6e12b3d
287f91c
def3000
 
 
972de2b
cc9cd8f
 
 
b24c174
7825517
972de2b
b24c174
 
5218da5
b24c174
 
 
 
 
5218da5
cc9cd8f
 
b24c174
 
 
 
 
 
 
972de2b
 
b24c174
 
 
 
 
 
 
 
 
972de2b
5218da5
 
b24c174
972de2b
b24c174
 
972de2b
b24c174
5218da5
 
 
 
 
972de2b
5218da5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
972de2b
5218da5
 
 
972de2b
5218da5
b24c174
def3000
 
972de2b
def3000
 
972de2b
def3000

import json
import os
import shutil
import subprocess
import time
import uuid
import zipfile
from dataclasses import fields
from urllib.request import urlretrieve

import gradio as gr
import spaces
import transformers
from brickgpt.models import BrickGPT, BrickGPTConfig


def setup():
    # Set up Gurobi licence
    licence_filename = 'gurobi.lic'
    licence_lines = []
    for secret_name in ['WLSACCESSID', 'WLSSECRET', 'LICENSEID']:
        secret = os.environ.get(secret_name)
        if not secret:
            raise ValueError(f'Env variable {secret_name} not found. Please set it in the Hugging Face Space settings.')
        licence_lines.append(f'{secret_name}={secret}\n')
    with open(licence_filename, 'w') as f:
        f.writelines(licence_lines)
    os.environ['GRB_LICENSE_FILE'] = os.path.abspath(licence_filename)

    # Download LDraw part library and set LDraw library path
    ldraw_zip_url = 'https://library.ldraw.org/library/updates/complete.zip'
    ldraw_zip_filename = 'complete.zip'
    urlretrieve(ldraw_zip_url, ldraw_zip_filename)
    with zipfile.ZipFile(ldraw_zip_filename) as zip_ref:
        zip_ref.extractall()
    os.environ['LDRAW_LIBRARY_PATH'] = os.path.abspath('ldraw')


def main():
    """
    Build the BrickGPT Gradio demo and launch it.

    When the ``IS_HF_SPACE`` environment variable equals ``'1'``, the environment is prepared with ``setup()``
    first. The queue's default concurrency limit is read from the ``CONCURRENCY_LIMIT`` environment variable
    and falls back to 1 when that variable is unset.
    """
    running_in_space = os.environ.get('IS_HF_SPACE') == '1'
    if running_in_space:
        print('Running in Hugging Face Space, setting up environment...')
        setup()

    cfg = BrickGPTConfig(max_regenerations=5, device='cuda')
    brick_generator = BrickGenerator(cfg)

    def whole_number(label, field_name, minimum):
        # Integer input whose default value and help text both come from the config field `field_name`
        return gr.Number(
            value=getattr(cfg, field_name),
            label=label,
            info=get_help_string(field_name),
            precision=0,
            minimum=minimum,
            step=1,
        )

    # Input widgets (main inputs first, then the advanced generation settings)
    prompt_box = gr.Textbox(
        label='Prompt',
        placeholder='Enter a prompt to generate a brick model.',
        max_length=500,
    )
    opt_out_box = gr.Checkbox(
        label='Do not save my data',
        info='We may collect model inputs and outputs to help us improve the model. '
             'Your data will never be shared or used for any other purpose. '
             'If you wish to opt out of data collection, please check the box below.',
    )
    temperature_slider = gr.Slider(
        0.01,
        2.0,
        value=cfg.temperature,
        step=0.01,
        label='Temperature',
        info=get_help_string('temperature'),
    )
    seed_field = gr.Number(
        value=42,
        label='Seed',
        info='Random seed for generation.',
        precision=0,
        minimum=0,
        maximum=2 ** 32 - 1,
        step=1,
    )
    bricks_field = whole_number('Max bricks', 'max_bricks', 1)
    rejections_field = whole_number('Max brick rejections', 'max_brick_rejections', 0)
    regenerations_field = whole_number('Max regenerations', 'max_regenerations', 0)

    # Output widgets
    image_view = gr.Image(label='Output image', format='png')
    bricks_view = gr.Textbox(
        label='Output bricks',
        lines=5,
        max_lines=5,
        show_copy_button=True,
        info='The brick structure in text format. Each line of the form "hxw (x,y,z)" represents a '
             '1-unit-tall rectangular brick with dimensions hxw placed at coordinates (x,y,z).',
    )

    # Assemble the interface around the generator callback
    description = (
        'Official demo for [BrickGPT](https://avalovelace1.github.io/BrickGPT/), the first approach for generating physically stable toy brick models from text prompts.\n\n'
        'The model is restricted to creating structures made of 1-unit-tall cuboid bricks on a 20x20x20 grid. It was trained on a dataset of 21 object categories: '
        '*basket, bed, bench, birdhouse, bookshelf, bottle, bowl, bus, camera, car, chair, guitar, jar, mug, piano, pot, sofa, table, tower, train, vessel.* '
        'Performance on prompts from outside these categories may be limited. This demo does not include texturing or coloring.'
    )
    app = gr.Interface(
        fn=brick_generator.generate_bricks,
        title='BrickGPT Demo',
        description=description,
        inputs=[prompt_box, opt_out_box],
        additional_inputs=[
            temperature_slider,
            seed_field,
            bricks_field,
            rejections_field,
            regenerations_field,
        ],
        outputs=[image_view, bricks_view],
        flagging_mode='never',
        deep_link=False,
    )

    # Precomputed examples: clicking one fills in the inputs and shows the stored result without running the model
    with app:
        with gr.Row():
            gallery = get_examples()
            hidden_name = gr.Textbox(visible=False, label='Name')
            hidden_image = gr.Image(visible=False, label='Result')
            example_rows = []
            for title, entry in gallery.items():
                example_rows.append(
                    [title, entry['prompt'], entry['temperature'], entry['seed'], entry['output_img']]
                )
            gr.Examples(
                examples=example_rows,
                inputs=[hidden_name, prompt_box, temperature_slider, seed_field, hidden_image],
                outputs=[image_view, bricks_view],
                # First value is the example name, last value is the stored image
                fn=lambda *values: (values[-1], gallery[values[0]]['output_txt']),
                run_on_click=True,
            )

    raw_limit = os.environ.get('CONCURRENCY_LIMIT')
    if raw_limit is None:
        limit = 1
    else:
        limit = int(raw_limit)
    app.queue(default_concurrency_limit=limit)
    app.launch(share=True)


class BrickGenerator:
    """
    Callback object for the demo: generates a brick structure from a prompt, renders it, and optionally
    stores the result.
    """

    def __init__(self, model_cfg: BrickGPTConfig):
        """
        :param model_cfg: Configuration from which a BrickGPT model is constructed on every generation call.
        """
        self.model_cfg = model_cfg
        self.model = None  # Instantiated inside generate_bricks, not here

    @spaces.GPU(duration=600)
    def generate_bricks(
            self,
            prompt: str,
            do_not_save_data: bool,
            temperature: float | None,
            seed: int | None,
            max_bricks: int | None,
            max_brick_rejections: int | None,
            max_regenerations: int | None,
    ) -> tuple[str, str]:
        """
        Generate a brick model for ``prompt``, render it to a PNG and return both representations.

        A new BrickGPT instance is built from the stored config on every call; any argument that is not None
        overrides the corresponding attribute on that instance. The generated structure is written as an LDR
        file under ``out/`` and rendered by running ``render_bricks.py`` in a subprocess. Unless the user
        opted out, the image and a JSON metadata record are also copied to the persistent data directory.

        :param prompt: Text prompt describing the model to generate.
        :param do_not_save_data: If True, nothing is written to the persistent data directory.
        :param temperature: Override for the model's temperature, or None to keep the configured value.
        :param seed: Seed passed to ``transformers.set_seed``, or None to leave the random state untouched.
        :param max_bricks: Override for the model's ``max_bricks``, or None.
        :param max_brick_rejections: Override for the model's ``max_brick_rejections``, or None.
        :param max_regenerations: Override for the model's ``max_regenerations``, or None.
        :return: Tuple of (path to the rendered PNG, brick structure in text format).
        :raises subprocess.CalledProcessError: If the rendering subprocess exits with a non-zero status.
        """
        self.model = BrickGPT(self.model_cfg)

        # Set model parameters
        if temperature is not None:
            self.model.temperature = temperature
        if max_bricks is not None:
            self.model.max_bricks = max_bricks
        if max_brick_rejections is not None:
            self.model.max_brick_rejections = max_brick_rejections
        if max_regenerations is not None:
            self.model.max_regenerations = max_regenerations
        if seed is not None:
            transformers.set_seed(seed)

        # Generate bricks
        print(f'Generating bricks for prompt: "{prompt}"')
        start_time = time.time()
        output = self.model(prompt)
        bricks = output['bricks']

        # Write output LDR to file; a fresh UUID keeps outputs of different requests apart
        output_dir = os.path.abspath('out')
        output_uuid = str(uuid.uuid4())
        os.makedirs(output_dir, exist_ok=True)
        ldr_filename = os.path.join(output_dir, f'{output_uuid}.ldr')
        with open(ldr_filename, 'w') as f:
            f.write(bricks.to_ldr())
        generation_time = time.time() - start_time
        print(f'Finished generation in {generation_time:.1f}s!')

        # Render brick model to image
        print('Rendering image...')
        img_filename = os.path.join(output_dir, f'{output_uuid}.png')
        subprocess.run(['python', 'render_bricks.py', '--in_file', ldr_filename, '--out_file', img_filename],
                       check=True)  # Run render as a subprocess to prevent issues with Blender
        rendering_time = time.time() - start_time - generation_time
        print(f'Finished rendering in {rendering_time:.1f}s!')

        # Serialise once; the same text goes into the metadata record and the return value
        bricks_txt = bricks.to_txt()

        # Save data persistently
        if not do_not_save_data:
            data_dir = '/data/apun/brickgpt_demo_out'
            os.makedirs(data_dir, exist_ok=True)

            # Copy output image to persistent storage
            img_copy_filename = os.path.join(data_dir, f'{output_uuid}.png')
            shutil.copy(img_filename, img_copy_filename)

            # Save metadata (effective model settings, timings and the generated structure)
            metadata_filename = os.path.join(data_dir, f'{output_uuid}.json')
            with open(metadata_filename, 'w') as f:
                json.dump({
                    'prompt': prompt,
                    'temperature': self.model.temperature,
                    'seed': seed,
                    'max_bricks': self.model.max_bricks,
                    'max_brick_rejections': self.model.max_brick_rejections,
                    'max_regenerations': self.model.max_regenerations,
                    'start_timestamp': time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(start_time)),
                    'generation_time': generation_time,
                    'rendering_time': rendering_time,
                    'output_txt': bricks_txt,
                }, f)
            print(f'Saved data to {metadata_filename}.')

        return img_filename, bricks_txt


def get_help_string(field_name: str) -> str:
    """
    Look up the help text attached to a BrickGPTConfig field.

    :param field_name: Name of a field in BrickGPTConfig.
    :return: Help string for the field, taken from the ``help`` entry of the field's metadata.
    :raises ValueError: If BrickGPTConfig has no field named ``field_name``.
    :raises KeyError: If the field exists but its metadata has no ``help`` entry.
    """
    for data_field in fields(BrickGPTConfig):
        if data_field.name == field_name:
            return data_field.metadata['help']
    # Raise a descriptive error rather than letting a bare next() leak StopIteration,
    # which could silently terminate an enclosing iteration.
    raise ValueError(f'BrickGPTConfig has no field named {field_name!r}.')


def get_examples(example_dir: str = os.path.abspath('examples')) -> dict[str, dict[str, str]]:
    """
    Load the example definitions stored in ``examples.json`` inside ``example_dir``.

    :param example_dir: Directory containing ``examples.json`` and the example images.
    :return: Mapping from example name to its properties, with each ``output_img`` entry joined onto
        ``example_dir``.
    """
    with open(os.path.join(example_dir, 'examples.json')) as manifest:
        loaded = json.load(manifest)

    # Re-assigning an existing key keeps its position, so the key order of each entry is unchanged
    return {
        title: {**entry, 'output_img': os.path.join(example_dir, entry['output_img'])}
        for title, entry in loaded.items()
    }


# Build and launch the demo only when this file is executed as a script, not when it is imported
if __name__ == '__main__':
    main()