Spaces:

Vipitis
/

ShaderCoder

Runtime error

App Files Files Community

Vipitis commited on Jun 3, 2023

Commit

fee32de

•

1 Parent(s): 0680c21

generate function body button

Browse files

Files changed (5) hide show

app.py +101 -11
build/my-languages.exp +0 -0
build/my-languages.lib +0 -0
build/my-languages.so +0 -0
requirements.txt +2 -1

app.py CHANGED Viewed

@@ -142,18 +142,30 @@ If I find an efficient way, the shaders might run in real time and be interactiv
 ## TODO:
  - [x] use embedded Shadertoy for reference/attribution (done, but some errors)
- - [] working render implementation on CPU only space (use the browser for WebGPU?)
  - [~] generate variations of return statements [ShaderEval task1](https://huggingface.co/spaces/Vipitis/ShaderEval) (missing all of the generation parameters)
  - [] generation history stating which function and orig/generated returns. (use State ??). do it as comments in the code?
- - [] generate whole functions
  - [] generate whole shaders (via prompts?)
 """
 passes_dataset = datasets.load_dataset("Vipitis/Shadertoys")
-single_passes = passes_dataset.filter(lambda x: not x["has_inputs"] and x["num_passes"] == 1 and x["code"].count("return") >= 1) #filter easier than having a custom loader script?
 all_single_passes = datasets.concatenate_datasets([single_passes["train"], single_passes["test"]])
 num_samples = len(all_single_passes)
 async def get_image(code, time= 0.0, resolution=(512, 420)):
     shader = ShadertoyCustom(code, resolution, OffscreenCanvas, run_offscreen) #pass offscreen canvas here.
     shader._uniform_data["time"] = time #set any time you want
     shader._canvas.request_draw(shader._draw_frame)
@@ -172,11 +184,25 @@ def grab_sample(sample_idx):
     sample_auhtor = sample_pass["author"]
     source_iframe = construct_embed(sample_source)
     print(f"{source_iframe=}")
-    return sample_pass, sample_code, source_iframe #, sample_title, sample_auhtor
-PIPE = None #gloabl var in CAPS indicates constant? so why are we changing it?
-def _make_pipeline(model_cp = "gpt2"): #bad default model for testing
     tokenizer = AutoTokenizer.from_pretrained(model_cp, trust_remote_code=True)
     model = AutoModelForCausalLM.from_pretrained(model_cp, trust_remote_code=True)
     pipe = pipeline("text-generation", model=model, tokenizer=tokenizer, trust_remote_code=True)
@@ -184,6 +210,7 @@ def _make_pipeline(model_cp = "gpt2"): #bad default model for testing
     print(f"loaded model {model_cp} as a pipline")
     return pipe
 def process_retn(retn):
     return retn.split(";")[0].strip()
@@ -231,11 +258,67 @@ def alter_return(orig_code, func_idx=0, pipeline=PIPE): #default pipeline can't
     return altered_code
 def add_history(func_id, orig_rtn, gened_rtn, history):
     # is this a list? or a JSON dict?
     history[func_id] =  (orig_rtn, gened_rtn)
     return history, history
 def construct_embed(source_url):
     shader_id = source_url.split("/")[-1]
     return f'<iframe width="640" height="360" frameborder="0" src="https://www.shadertoy.com/embed/{shader_id}?gui=true&t=0&paused=true&muted=true" allowfullscreen></iframe>'
@@ -244,23 +327,30 @@ with gr.Blocks() as site:
     text_md = gr.Markdown(text)
     model_cp = gr.Textbox(value="Vipitis/santacoder-finetuned-Shadertoys-fine", label="Model Checkpoint (Enter to load!)", interactive=True)
     sample_idx = gr.Slider(minimum=0, maximum=num_samples, value=3211, label="pick sample from dataset", step=1.0)
-    run_button = gr.Button("generate a alternate return statement for one function", label="generate code")
     render_button = gr.Button("render frame0 (can carsh the sapce on invalid shadercode)",label="render frame")
     time_slider = gr.Slider(minimum=0, maximum=10, value=0, label="time (update on release, also used to pick other functions as a bodge)", step=0.02)
     with gr.Row():
         with gr.Column():
             source_embed = gr.HTML('<iframe width="640" height="360" frameborder="0" src="https://www.shadertoy.com/embed/WsBcWV?gui=true&t=0&paused=true&muted=true" allowfullscreen></iframe>', label="How this shader originally renders")
-            rendered_frame = gr.Image(shape=(512, 420), label=f"rendered frame preview")
-        sample_code = gr.Code(label="Current Code (will update changes you generate)", language=None, readonly=True, lines=20)
     sample_pass = gr.State(value={})
     pipe = gr.State(value=PIPE)
     # hist_state = gr.State(Value={})
     # history_table = gr.JSON()
     model_cp.submit(fn=_make_pipeline, inputs=[model_cp], outputs=[pipe])
-    sample_idx.release(fn=grab_sample, inputs=[sample_idx], outputs=[sample_pass, sample_code, source_embed])
-    run_button.click(fn=alter_return, inputs=[sample_code, time_slider, pipe], outputs=[sample_code])
     # run_button.click(fn=add_history, inputs=[time_slider, sample_pass, sample_code, hist_state], outputs=[history_table, hist_state])
     # sample_idx.release(fn=construct_embed, inputs=[sample_idx], outputs=[source_embed]) #twice to make have different outputs?
     time_slider.release(fn=lambda code, time: asyncio.run(get_image(code, time)), inputs=[sample_code, time_slider], outputs=rendered_frame)

 ## TODO:
  - [x] use embedded Shadertoy for reference/attribution (done, but some errors)
+ - [] working render implementation on CPU only space (use the browser for WebGPU?, maybe via an iFrame too?)
  - [~] generate variations of return statements [ShaderEval task1](https://huggingface.co/spaces/Vipitis/ShaderEval) (missing all of the generation parameters)
  - [] generation history stating which function and orig/generated returns. (use State ??). do it as comments in the code?
+ - [x?] generate whole functions (only works once)
  - [] generate whole shaders (via prompts?)
 """
 passes_dataset = datasets.load_dataset("Vipitis/Shadertoys")
+single_passes = passes_dataset.filter(lambda x: not x["has_inputs"] and x["num_passes"] == 1) #could also include shaders with no extra functions.
 all_single_passes = datasets.concatenate_datasets([single_passes["train"], single_passes["test"]])
 num_samples = len(all_single_passes)
+import tree_sitter
+from tree_sitter import Language, Parser
+Language.build_library("build/my-languages.so", ['tree-sitter-glsl'])
+GLSL_LANGUAGE = Language('build/my-languages.so', 'glsl')
+parser = Parser()
+parser.set_language(GLSL_LANGUAGE)
 async def get_image(code, time= 0.0, resolution=(512, 420)):
+    tree = parser.parse(bytes(code, "utf8"))
+    if tree.root_node.has_error:
+        print("ERROR in the tree, aborting.")
+        return None
     shader = ShadertoyCustom(code, resolution, OffscreenCanvas, run_offscreen) #pass offscreen canvas here.
     shader._uniform_data["time"] = time #set any time you want
     shader._canvas.request_draw(shader._draw_frame)
     sample_auhtor = sample_pass["author"]
     source_iframe = construct_embed(sample_source)
     print(f"{source_iframe=}")
+    sample_funcs = _parse_functions(sample_code)
+    funcs = _parse_functions(sample_code)
+    func_identifiers = [(idx,n.child_by_field_name("declarator").text.decode()) for idx, n in enumerate(funcs)]
+    print(f"updating drop down to:{func_identifiers}")
+    return sample_pass, sample_code, source_iframe, funcs, gr.Dropdown.update(choices=func_identifiers) #, sample_title, sample_auhtor
+def _parse_functions(in_code):
+    """
+    returns all functions in the code as their actual nodes.
+    """
+    tree = parser.parse(bytes(in_code, "utf8"))
+    funcs = [n for n in tree.root_node.children if n.type == "function_definition"]
+    return funcs
+PIPE = None
+def _make_pipeline(model_cp = "Vipitis/santacoder-finetuned-Shadertoys-fine"): #bad default model for testing
     tokenizer = AutoTokenizer.from_pretrained(model_cp, trust_remote_code=True)
     model = AutoModelForCausalLM.from_pretrained(model_cp, trust_remote_code=True)
     pipe = pipeline("text-generation", model=model, tokenizer=tokenizer, trust_remote_code=True)
     print(f"loaded model {model_cp} as a pipline")
     return pipe
 def process_retn(retn):
     return retn.split(";")[0].strip()
     return altered_code
+def _line_chr2char(text, line_idx, chr_idx):
+    """
+    returns the character index at the given line and character index.
+    """
+    lines = text.split("\n")
+    char_idx = 0
+    for i in range(line_idx):
+        char_idx += len(lines[i]) + 1
+    char_idx += chr_idx
+    return char_idx
+def alter_body(old_code, func_id, funcs_list, pipeline=PIPE):
+    """
+    Replaces the body of a function with a generated one.
+    Args:
+        old_code (str): The original code.
+        func_node (Node): The node of the function to replace the body of.
+        pipeline (Pipeline): The pipeline to use for generation.
+    Returns:
+        str: The altered code.
+    """
+    print(f"{func_id=}")
+    func_id = int(func_id.split(",")[0]) #undo their string casting?
+    func_node = funcs_list[func_id]
+    print(f"using for generation: {func_node=}")
+    if pipeline is None:
+        print("no pipeline found, loading default one")
+        pipeline = _make_pipeline("Vipitis/santacoder-finetuned-Shadertoys-fine")
+    func_start_idx = _line_chr2char(old_code, func_node.start_point[0], func_node.start_point[1])
+    body_node = func_node.child_by_field_name("body")
+    body_start_idx = _line_chr2char(old_code, body_node.start_point[0], body_node.start_point[1])
+    body_end_idx = _line_chr2char(old_code, body_node.end_point[0], body_node.end_point[1])
+    print(f"{old_code[body_start_idx:body_end_idx]=}")
+    model_context = old_code[:body_start_idx]
+    generation = pipeline(model_context, max_new_tokens=(body_end_idx - body_start_idx)*2, return_full_text=False)[0]["generated_text"]
+    print(f"{generation=}")
+    first_gened_func = _parse_functions(old_code[func_start_idx:body_start_idx] + generation)[0] # truncate generation to a single function?
+    # strip just the body.
+    generated_body = first_gened_func.child_by_field_name("body").text.decode()
+    print(f"{generated_body=}")
+    altered_code = old_code[:body_start_idx] + generated_body + old_code[body_end_idx:]
+    return altered_code
 def add_history(func_id, orig_rtn, gened_rtn, history):
     # is this a list? or a JSON dict?
     history[func_id] =  (orig_rtn, gened_rtn)
     return history, history
+def list_dropdown(in_code):
+    funcs = _parse_functions(in_code)
+    # print(f"updating drop down to:{func_identifiers=}")
+    func_identifiers = [(idx,n.child_by_field_name("declarator").text.decode()) for idx, n in enumerate(funcs)]
+    # funcs = [n for n in funcs] #wrapped as set to avoid json issues?
+    print(f"updating drop down to:{func_identifiers}")
+    return funcs, gr.Dropdown.update(choices=func_identifiers)
 def construct_embed(source_url):
     shader_id = source_url.split("/")[-1]
     return f'<iframe width="640" height="360" frameborder="0" src="https://www.shadertoy.com/embed/{shader_id}?gui=true&t=0&paused=true&muted=true" allowfullscreen></iframe>'
     text_md = gr.Markdown(text)
     model_cp = gr.Textbox(value="Vipitis/santacoder-finetuned-Shadertoys-fine", label="Model Checkpoint (Enter to load!)", interactive=True)
     sample_idx = gr.Slider(minimum=0, maximum=num_samples, value=3211, label="pick sample from dataset", step=1.0)
+    func_dropdown = gr.Dropdown(label="chose a function to modify") #breaks if I add a string in before that?
+    with gr.Row():
+        gen_return_button = gr.Button("generate a alternate return statement", label="generate return")
+        gen_func_button = gr.Button("generate an alternate function body", label="generate function")
+        # update_funcs_button = gr.Button("update functions", label="update functions")
     render_button = gr.Button("render frame0 (can carsh the sapce on invalid shadercode)",label="render frame")
     time_slider = gr.Slider(minimum=0, maximum=10, value=0, label="time (update on release, also used to pick other functions as a bodge)", step=0.02)
     with gr.Row():
         with gr.Column():
             source_embed = gr.HTML('<iframe width="640" height="360" frameborder="0" src="https://www.shadertoy.com/embed/WsBcWV?gui=true&t=0&paused=true&muted=true" allowfullscreen></iframe>', label="How this shader originally renders")
+            rendered_frame = gr.Image(shape=(512, 420), label=f"rendered frame preview", type="pil") #colors are messed up?
+        sample_code = gr.Code(label="Current Code (will update changes you generate)", language=None)
     sample_pass = gr.State(value={})
     pipe = gr.State(value=PIPE)
+    funcs = gr.State(value=[])
     # hist_state = gr.State(Value={})
     # history_table = gr.JSON()
     model_cp.submit(fn=_make_pipeline, inputs=[model_cp], outputs=[pipe])
+    sample_idx.release(fn=grab_sample, inputs=[sample_idx], outputs=[sample_pass, sample_code, source_embed, funcs, func_dropdown])
+    # sample_idx.release(fn=list_dropdown, inputs=[sample_code], outputs=[funcs, func_dropdown]) #use multiple event handles to call other functions! seems to not work really well. always messes up
+    gen_return_button.click(fn=alter_return, inputs=[sample_code, time_slider, pipe], outputs=[sample_code])
+    gen_func_button.click(fn=alter_body, inputs=[sample_code, func_dropdown, funcs, pipe], outputs=[sample_code])
     # run_button.click(fn=add_history, inputs=[time_slider, sample_pass, sample_code, hist_state], outputs=[history_table, hist_state])
     # sample_idx.release(fn=construct_embed, inputs=[sample_idx], outputs=[source_embed]) #twice to make have different outputs?
     time_slider.release(fn=lambda code, time: asyncio.run(get_image(code, time)), inputs=[sample_code, time_slider], outputs=rendered_frame)

build/my-languages.exp ADDED Viewed

Binary file (744 Bytes). View file

build/my-languages.lib ADDED Viewed

Binary file (1.8 kB). View file

build/my-languages.so ADDED Viewed

Binary file (631 kB). View file

requirements.txt CHANGED Viewed

@@ -7,4 +7,5 @@ pillow
 gradio
 numpy
 glfw
-jupylet

 gradio
 numpy
 glfw
+jupylet
+tree-sitter