import gradio as gr
import os

# Save your HF API token from https://huggingface.co/settings/tokens as an
# env variable named "auth_token" to avoid rate limiting.
auth_token = os.getenv("auth_token")

# Load a model from the Hugging Face Hub as an interface, then use it as an API.
# You can remove the api_key parameter if you don't care about rate limiting.
api = gr.Interface.load("huggingface/EleutherAI/gpt-j-6B", api_key=auth_token)


def complete_with_gpt(text: str) -> str:
    """Return *text* with its last 50 characters replaced by the model output.

    Only the trailing 50 characters are sent to the model as the prompt; the
    untouched prefix ``text[:-50]`` is prepended to whatever ``api`` returns.
    When *text* is 50 characters or shorter, the prefix is empty and the whole
    text is used as the prompt.

    NOTE(review): this presumably relies on ``api`` returning the prompt
    followed by its continuation (so no input is lost) - confirm against the
    loaded interface.
    """
    return text[:-50] + api(text[-50:])


with gr.Blocks() as demo:
    textbox = gr.Textbox(placeholder="Type here...", lines=4)
    btn = gr.Button("Autocomplete")

    # Define what will run when the button is clicked; here the textbox is
    # used as both an input and an output, so the completion replaces the
    # text in place.
    btn.click(fn=complete_with_gpt, inputs=textbox, outputs=textbox, queue=False)

demo.launch()