Spaces:

DHEIVER
/

Pedrita

Sleeping

App Files Community

DHEIVER committed on Jun 29, 2023

Commit

471343c

•

1 Parent(s): a9f0202

Update app.py

Browse files

Files changed (1) hide show

app.py +16 -17

app.py CHANGED Viewed

@@ -2,57 +2,56 @@ import gradio as gr
 from transformers import AutoTokenizer, AutoModelForCausalLM, set_seed, pipeline
-title = "Gerador de Código"
-description = "Este é um espaço para converter texto em inglês para código Python usando o modelo [codeparrot-small-text-to-code](https://huggingface.co/codeparrot/codeparrot-small-text-to-code),\
-            um modelo de geração de código Python pré-treinado em um conjunto de dados de docstrings e código Python extraído de notebooks Jupyter disponível em [github-jupyter-text](https://huggingface.co/datasets/codeparrot/github-jupyter-text)."
 example = [
-    ["Função de utilidade para calcular a precisão de predições usando métricas do sklearn", 65, 0.6, 42],
-    ["Vamos implementar uma função que calcula o tamanho de um arquivo chamado filepath", 60, 0.6, 42],
-    ["Vamos implementar o algoritmo de ordenação Bubble Sort em uma função auxiliar:", 87, 0.6, 42],
     ]
-# Altere o modelo para o modelo pré-treinado
 tokenizer = AutoTokenizer.from_pretrained("codeparrot/codeparrot-small-text-to-code")
 model = AutoModelForCausalLM.from_pretrained("codeparrot/codeparrot-small-text-to-code")
-def criar_docstring(gen_prompt):
     return "\"\"\"\n" + gen_prompt + "\n\"\"\"\n\n"
-def gerar_codigo(gen_prompt, max_tokens, temperatura=0.6, seed=42):
     set_seed(seed)
     pipe = pipeline("text-generation", model=model, tokenizer=tokenizer)
-    prompt = criar_docstring(gen_prompt)
-    generated_text = pipe(prompt, do_sample=True, top_p=0.95, temperature=temperatura, max_new_tokens=max_tokens)[0]['generated_text']
     return generated_text
 iface = gr.Interface(
-    fn=gerar_codigo,
     inputs=[
-        gr.Textbox(label="Instruções em inglês", placeholder="Digite as instruções em inglês..."),
         gr.inputs.Slider(
             minimum=8,
             maximum=256,
             step=1,
             default=8,
-            label="Número de tokens para gerar",
         ),
         gr.inputs.Slider(
             minimum=0,
             maximum=2.5,
             step=0.1,
             default=0.6,
-            label="Temperatura",
         ),
         gr.inputs.Slider(
             minimum=0,
             maximum=1000,
             step=1,
             default=42,
-            label="Semente aleatória para a geração"
         )
     ],
-    outputs=gr.Code(label="Código Python gerado", language="python", lines=10),
     examples=example,
     layout="horizontal",
     theme="peach",

 from transformers import AutoTokenizer, AutoModelForCausalLM, set_seed, pipeline
+title = "Python Code Generator"
+description = "This is a space to convert English text to Python code using the [codeparrot-small-text-to-code](https://huggingface.co/codeparrot/codeparrot-small-text-to-code) model, a pre-trained Python code generation model trained on a dataset of docstrings and Python code extracted from Jupyter notebooks available at [github-jupyter-text](https://huggingface.co/datasets/codeparrot/github-jupyter-text)."
 example = [
+    ["Utility function to calculate the precision of predictions using sklearn metrics", 65, 0.6, 42],
+    ["Let's implement a function that calculates the size of a file called filepath", 60, 0.6, 42],
+    ["Let's implement the Bubble Sort sorting algorithm in an auxiliary function:", 87, 0.6, 42],
     ]
+# Change the model to the pre-trained model
 tokenizer = AutoTokenizer.from_pretrained("codeparrot/codeparrot-small-text-to-code")
 model = AutoModelForCausalLM.from_pretrained("codeparrot/codeparrot-small-text-to-code")
+def create_docstring(gen_prompt):
     return "\"\"\"\n" + gen_prompt + "\n\"\"\"\n\n"
+def generate_code(gen_prompt, max_tokens, temperature=0.6, seed=42):
     set_seed(seed)
     pipe = pipeline("text-generation", model=model, tokenizer=tokenizer)
+    prompt = create_docstring(gen_prompt)
+    generated_text = pipe(prompt, do_sample=True, top_p=0.95, temperature=temperature, max_new_tokens=max_tokens)[0]['generated_text']
     return generated_text
 iface = gr.Interface(
+    fn=generate_code,
     inputs=[
+        gr.Textbox(label="English instructions", placeholder="Enter English instructions..."),
         gr.inputs.Slider(
             minimum=8,
             maximum=256,
             step=1,
             default=8,
+            label="Number of tokens to generate",
         ),
         gr.inputs.Slider(
             minimum=0,
             maximum=2.5,
             step=0.1,
             default=0.6,
+            label="Temperature",
         ),
         gr.inputs.Slider(
             minimum=0,
             maximum=1000,
             step=1,
             default=42,
+            label="Random seed for generation"
         )
     ],
+    outputs=gr.Code(label="Generated Python code", language="python", lines=10),
     examples=example,
     layout="horizontal",
     theme="peach",