import gradio as gr
from huggingface_hub import InferenceClient

# For more information on `huggingface_hub` Inference API support, please
# check the `huggingface_hub` inference guide in the Hugging Face docs.
client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")


def respond(
    message,
    history: list[tuple[str, str]],
    system_message,
    max_tokens,
    temperature,
    top_p=0.95,
) -> tuple[str, list]:
    """Return a fixed placeholder reply for the chat interface.

    This is a stub: none of the arguments are read and the module-level
    ``client`` is not called.

    Args:
        message: The latest user message.
        history: Earlier ``(user, assistant)`` turns; ignored here.
        system_message: Value of the first additional input. In this file
            that is the ``gr.Markdown`` notice, so presumably its text is
            what arrives here -- TODO confirm.
        max_tokens: Value of the "Max new tokens" slider.
        temperature: Value of the "Temperature" slider.
        top_p: Nucleus-sampling parameter. It has a default because the UI
            below provides only three additional inputs; without one, every
            call would fail with a missing-argument ``TypeError``.

    Returns:
        The tuple ``("test", [])``.
    """
    # NOTE(review): a tuple return may only be appropriate when the
    # ChatInterface declares `additional_outputs`; confirm against the
    # installed gradio version before replacing this stub.
    return "test", []


# For information on how to customize the ChatInterface, peruse the gradio
# docs for `gr.ChatInterface`.
demo = gr.ChatInterface(
    respond,
    # These are passed to `respond` positionally, after `message` and
    # `history`, in the order listed.
    additional_inputs=[
        gr.Markdown(
            "Please enter your message. Add privacy tags (...) around the words "
            "you want to hide. Only the most recent message submitted will be "
            "taken into account (no history is retained)."
        ),
        gr.Slider(minimum=1, maximum=128, value=32, step=1, label="Max new tokens"),
        gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
    ],
)


if __name__ == "__main__":
    demo.launch()