import os import re import base64 import json from typing import Dict, List, Optional, Tuple import gradio as gr from loguru import logger import sambanova_gradio from sambanova_gradio import get_fn import modelscope_studio.components.base as ms import modelscope_studio.components.legacy as legacy import modelscope_studio.components.antd as antd from config import DEMO_LIST, SystemPrompt YOUR_API_TOKEN = os.getenv('SAMBANOVA_API_KEY') History = List[Tuple[str, str]] Messages = List[Dict[str, str]] from tree_sitter_languages import get_parser def check_code_error(code, language='python'): language_ext = {'go': 'go', 'html': 'html', 'python': 'python', 'cpp': 'cpp', # 'sql': 'sql', 'php': 'php', 'javascript': 'javascript', # 'R': 'r', 'typescript': 'typescript', 'ruby': 'ruby', 'bash': 'bash', 'rust': 'rust', # 'D': 'd', 'scala': 'scala', 'csharp': 'c_sharp', 'java': 'java', 'json': 'json', 'julia': 'julia', 'css': 'css', 'jsdoc': 'jsdoc', 'swift': 'swift', 'cli': 'cli', } if language not in language_ext.keys(): return {'result': True, 'error': 'no language in tree_sitter_languages'} try: parser = get_parser(language_ext[language]) code_bytes = code.encode('utf-8') tree = parser.parse(code_bytes) root_node = tree.root_node visit_list = [root_node] ans = [] while visit_list: node = visit_list.pop() if node.type == 'ERROR': return {'result': True, 'error': True, 'root_node': root_node} is_inner = True if node.children else False ans.append([node, is_inner]) for child in node.children: visit_list.append(child) return {'result': True, 'error': False, 'root_node': root_node} except Exception as e: return {'result': False, 'error': str(e)} def history_to_messages(history: History, system: str) -> Messages: messages = [{'role': 'system', 'content': system}] for h in history: messages.append({'role': 'user', 'content': h[0]}) messages.append({'role': 'assistant', 'content': h[1]}) return messages def messages_to_history(messages: Messages) -> History: assert messages[0]['role'] == 'system' history = [] for q, r in zip(messages[1::2], messages[2::2]): history.append([q['content'], r['content']]) return history def remove_code_block(text, language='html'): pattern = r'```' + language.lower() + '\n(.+?)\n```' match = re.search(pattern, text, re.DOTALL) if match: return match.group(1).strip() else: return text.strip() def history_render(history: History): return gr.update(open=True), history def clear_history(): return [] def send_to_sandbox(code): encoded_html = base64.b64encode(code.encode('utf-8')).decode('utf-8') data_uri = f"data:text/html;charset=utf-8;base64,{encoded_html}" return f"" def demo_card_click(e: gr.EventData): index = e._data['component']['index'] return DEMO_LIST[index]['description'] def read_jsonl(fn): with open(fn, encoding="utf-8") as f: return [json.loads(l) for l in f.readlines()] def get_item_by_index(item_list, index, val=None): if val is not None and val in item_list: return val if len(item_list) > index: return item_list[index] return "" def get_item_list(locale="zh", programming_language="", category="", difficulty="", debugInfo=""): samples = read_jsonl(f'./FullStackBench_data/fsb_{locale}_20241204.jsonl') item_list_count = {} item_samples = [] for sample in samples: labels = sample['labels'] content = [sample['content']] sample_dict = [labels['programming_language'], f"/{labels['category']}/{labels['difficulty']}/", content] if (locale != "" and labels['locale'] == locale): if programming_language == "": item = labels['programming_language'] item_list_count[item] = item_list_count.get(item, 0) + 1 item_samples.append(sample_dict) elif category == "" and labels['programming_language'] == programming_language: item = labels['category'] item_list_count[item] = item_list_count.get(item, 0) + 1 item_samples.append(sample_dict) elif difficulty == "" and labels['programming_language'] == programming_language and labels['category'] == category: item = labels['difficulty'] item_list_count[item] = item_list_count.get(item, 0) + 1 item_samples.append(sample_dict) elif labels['programming_language'] == programming_language and labels['category'] == category and labels['difficulty'] == difficulty: item = labels['difficulty'] item_list_count[item] = item_list_count.get(item, 0) + 1 item_samples.append(sample_dict) item_list = list(item_list_count.keys()) item_list_dropdown = [] all_count = 0 for item in item_list: all_count += item_list_count[item] item_list_dropdown.append((f"{item}[{item_list_count[item]}]",item)) item_list_dropdown.insert(0,(f"All[{all_count}]", "")) return item_list, item_list_dropdown, item_samples item_list_locale = ["en", "zh"] item_list_dropdown_locale = [("en[1687]", "en"), ("zh[1687]", "zh")] item_list_programming_language, item_list_dropdown_programming_language, item_samples = get_item_list(locale=item_list_locale[0], programming_language="", category="", difficulty="") item_list_category, item_list_dropdown_category, item_samples = get_item_list(locale=item_list_locale[0], programming_language=get_item_by_index(item_list_programming_language, 0, "python"), category="", difficulty="") item_list_difficulty, item_list_dropdown_difficulty, item_samples = get_item_list(locale=item_list_locale[0], programming_language=get_item_by_index(item_list_programming_language, 0, "python"), category=get_item_by_index(item_list_category, 0, "Basic Programming"), difficulty="") item_list_select, item_list_select_dropdown, item_samples = get_item_list(locale=item_list_locale[0], programming_language=get_item_by_index(item_list_programming_language, 0, "python"), category=get_item_by_index(item_list_category, 0, "Basic Programming"), difficulty=get_item_by_index(item_list_difficulty, 0)) def get_input_examples(): input_examples = [] for demo in DEMO_LIST: input_examples.append(['html', demo['title'], demo['description']]) return input_examples def code_syntax_check_fun(code, language='html'): check_result = check_code_error(code, language=language.lower()) if check_result['result'] == True: if check_result['error'] == True: return 'No pass' elif check_result['error'] == False: return 'Pass' else: return 'No check [no language in check_languages]' else: return check_result['error'] with gr.Blocks(css_paths="app.css", title="Qwen2.5 Coder Artifacts (+SambaNova+FullStackBench)") as demo: history_state = gr.State([]) setting = gr.State({ "system": SystemPrompt, }) with gr.Row(): code_language_example = gr.Textbox(show_label=False, lines=1, container=False, visible=False) input_text_title= gr.TextArea(show_label=False, container=False, visible=False) input_text_example = gr.TextArea(show_label=False, container=False, visible=False) with gr.Tab("Examples_HTML"): input_examples = get_input_examples() gr.Examples( examples=input_examples, inputs=[code_language_example, input_text_title, input_text_example], outputs=None, label='', examples_per_page=10, cache_examples=False, ) with gr.Tab("Examples_from_FullStackBench"): with gr.Row(): with gr.Column(): locale = gr.Dropdown( choices=item_list_dropdown_locale, label="locale", value=get_item_by_index(item_list_locale, 0), ) with gr.Column(): programming_language = gr.Dropdown( choices=item_list_dropdown_programming_language, label="programming_language", value=get_item_by_index(item_list_programming_language, 0, "python"), ) with gr.Column(): category = gr.Dropdown( choices=item_list_dropdown_category, label="category", value=get_item_by_index(item_list_category, 0, "Basic Programming"), ) with gr.Column(): difficulty = gr.Dropdown( choices=item_list_dropdown_difficulty, label="difficulty", value=get_item_by_index(item_list_difficulty, 0), ) with gr.Row(): test_examples = gr.Examples( examples=item_samples, inputs=[code_language_example, input_text_title, input_text_example], outputs=None, label='Examples:', examples_per_page=5, cache_examples=False, ) def locale_select(locale): item_list_programming_language, item_list_dropdown_programming_language, item_samples = get_item_list(locale=locale, programming_language="", category="", difficulty="", debugInfo="locale_1_") item_list_category, item_list_dropdown_category, item_samples = get_item_list(locale=locale, programming_language=get_item_by_index(item_list_programming_language, 0), category="", difficulty="", debugInfo="locale_2_") item_list_difficulty, item_list_dropdown_difficulty, item_samples = get_item_list(locale=locale, programming_language=get_item_by_index(item_list_programming_language, 0), category=get_item_by_index(item_list_category, 0), difficulty="", debugInfo="locale_3_") _, _, item_samples = get_item_list(locale=locale, programming_language=get_item_by_index(item_list_programming_language, 0), category=get_item_by_index(item_list_category, 0), difficulty=get_item_by_index(item_list_difficulty, 0), debugInfo="locale_4_") return (gr.Dropdown(choices=item_list_dropdown_programming_language, value=item_list_dropdown_programming_language[0][1]), gr.Dropdown(choices=item_list_dropdown_category, value=item_list_dropdown_category[0][1]), gr.Dropdown(choices=item_list_dropdown_difficulty, value=item_list_dropdown_difficulty[0][1]), gr.Dataset(samples=item_samples)) locale.select( fn=locale_select, inputs=[locale], outputs=[programming_language, category, difficulty, test_examples.dataset] ) def programming_language_select(locale, programming_language): item_list_category, item_list_dropdown_category, item_samples = get_item_list(locale=locale, programming_language=programming_language, category="", difficulty="", debugInfo="programming_language_1_") item_list_difficulty, item_list_dropdown_difficulty, item_samples = get_item_list(locale=locale, programming_language=programming_language, category=get_item_by_index(item_list_category, 0), difficulty="", debugInfo="programming_language_2_") _, _, item_samples = get_item_list(locale=locale, programming_language=programming_language, category=get_item_by_index(item_list_category, 0), difficulty=get_item_by_index(item_list_difficulty, 0), debugInfo="programming_language_3_") return (gr.Dropdown(choices=item_list_dropdown_category, value=item_list_dropdown_category[0][1]), gr.Dropdown(choices=item_list_dropdown_difficulty, value=item_list_dropdown_difficulty[0][1]), gr.Dataset(samples=item_samples)) programming_language.select( fn=programming_language_select, inputs=[locale, programming_language], outputs=[category, difficulty, test_examples.dataset] ) def category_select(locale, programming_language, category): item_list_difficulty, item_list_dropdown_difficulty, item_samples = get_item_list(locale=locale, programming_language=programming_language, category=category, difficulty="", debugInfo="category_1_") _, _, item_samples = get_item_list(locale=locale, programming_language=programming_language, category=category, difficulty=get_item_by_index(item_list_difficulty, 0), debugInfo="category_2_") return (gr.Dropdown(choices=item_list_dropdown_difficulty, value=item_list_dropdown_difficulty[0][1]), gr.Dataset(samples=item_samples)) category.select( fn=category_select, inputs=[locale, programming_language, category], outputs=[difficulty, test_examples.dataset] ) def difficulty_select(locale, programming_language, category, difficulty): _, _, item_samples = get_item_list(locale=locale, programming_language=programming_language, category=category, difficulty=difficulty, debugInfo="difficulty_1_") return gr.Dataset(samples=item_samples) difficulty.select( fn=difficulty_select, inputs=[locale, programming_language, category, difficulty], outputs=[test_examples.dataset] ) with ms.Application() as app: with antd.ConfigProvider(): with antd.Row(gutter=[32, 12]) as layout: with antd.Col(span=24, md=8): with antd.Flex(vertical=True, gap="middle", wrap=True): header = gr.HTML("""

Qwen2.5-Coder-32B with SambaNova Cloud API

""") input = antd.InputTextarea(size="middle", allow_clear=True, placeholder="Please enter what kind of application you want") code_language = gr.Textbox(label="code language", lines=1) btn = antd.Button("send", type="primary", size="large") with antd.Flex(gap="small", wrap=True): settingPromptBtn = antd.Button( "⚙️ set system Prompt", type="default") codeBtn = antd.Button("🧑‍💻 view code", type="default") historyBtn = antd.Button("📜 history", type="default") clear_btn = antd.Button("clear history", type="default", size="large") with antd.Modal(open=False, title="set system Prompt", width="800px") as system_prompt_modal: systemPromptInput = antd.InputTextarea( SystemPrompt, auto_size=True) settingPromptBtn.click(lambda: gr.update( open=True), inputs=[], outputs=[system_prompt_modal]) system_prompt_modal.ok(lambda input: ({"system": input}, gr.update( open=False)), inputs=[systemPromptInput], outputs=[setting, system_prompt_modal]) system_prompt_modal.cancel(lambda: gr.update( open=False), outputs=[system_prompt_modal]) with antd.Drawer(open=False, title="code", placement="left", width="750px") as code_drawer: code_output = legacy.Markdown() codeBtn.click(lambda: gr.update(open=True), inputs=[], outputs=[code_drawer]) code_drawer.close(lambda: gr.update( open=False), inputs=[], outputs=[code_drawer]) with antd.Drawer(open=False, title="history", placement="left", width="900px") as history_drawer: history_output = legacy.Chatbot(show_label=False, flushing=False, height=960, elem_classes="history_chatbot") historyBtn.click(history_render, inputs=[history_state], outputs=[history_drawer, history_output]) history_drawer.close(lambda: gr.update( open=False), inputs=[], outputs=[history_drawer]) with antd.Col(span=24, md=16): with ms.Div(elem_classes="right_panel"): gr.HTML('
') with antd.Tabs(active_key="empty", render_tab_bar="() => null") as state_tab: with antd.Tabs.Item(key="empty", label="Render_empty"): empty = antd.Empty(description="empty input", elem_classes="right_content") with antd.Tabs.Item(key="loading", label="Render_loading"): loading = antd.Spin(True, tip="coding...", size="large", elem_classes="right_content") with antd.Tabs.Item(key="render_html", label="Render_HTML") as render_html: sandbox = gr.HTML(elem_classes="html_content") with antd.Tabs.Item(key="render_other", label="Render_Code") as render_other: sandbox_other = legacy.Markdown() with antd.Row(): code_syntax_check = gr.Textbox(label="check code syntax: ", lines=1, interactive=False) def generation_code(query: Optional[str], code_language, _setting: Dict[str, str], _history: Optional[History]): if query is None: query = '' if _history is None: _history = [] # Prepare the preprocess and postprocess functions def preprocess(message, history): if code_language.lower() == 'html': messages = [{'role': 'system', 'content': _setting['system']}] else: messages = [{'role': 'system', 'content': ""}] for user_msg, assistant_msg in history: messages.append({'role': 'user', 'content': user_msg}) messages.append({'role': 'assistant', 'content': assistant_msg}) messages.append({'role': 'user', 'content': message}) return {'messages': messages} def postprocess(response_text): return response_text # Get the model from sambanova_gradio fn = get_fn( model_name='Qwen2.5-Coder-32B-Instruct', preprocess=preprocess, postprocess=postprocess, api_key=YOUR_API_TOKEN ) response_text = '' assistant_response = '' local_history = _history.copy() for content in fn(query, local_history): response_text = content # Update code_output yield { code_output: response_text, state_tab: gr.update(active_key="loading"), code_drawer: gr.update(open=True), } assistant_response = response_text local_history.append([query, assistant_response]) code = remove_code_block(assistant_response, language=code_language) if "```html" in assistant_response: sandbox_val = send_to_sandbox(code) state_tab_val = gr.update(active_key="render_html") render_html_val = gr.update(visible=True) render_other_val = gr.update(visible=False) sandbox_other_val = "" else: sandbox_val = "" state_tab_val = gr.update(active_key="render_other") render_html_val = gr.update(visible=False) render_other_val = gr.update(visible=True) sandbox_other_val = content code_syntax_check_val = code_syntax_check_fun(code, language=code_language) yield { code_output: assistant_response, history_state: local_history, sandbox: sandbox_val, state_tab: state_tab_val, code_drawer: gr.update(open=False), render_html: render_html_val, render_other: render_other_val, sandbox_other: sandbox_other_val, code_syntax_check: code_syntax_check_val, } def code_language_example_change(code_language): return code_language code_language_example.change( fn=code_language_example_change, inputs=[code_language_example], outputs=[code_language], ) def input_text_example_change(input_text_example): return input_text_example input_text_example.change( fn=input_text_example_change, inputs=[input_text_example], outputs=[input], ) btn.click(generation_code, inputs=[input, code_language, setting, history_state], outputs=[code_output, history_state, sandbox, state_tab, code_drawer, render_html, render_other, sandbox_other, code_syntax_check]) clear_btn.click(clear_history, inputs=[], outputs=[history_state]) with gr.Row(): DESCRIPTION = f'### This demo from [SambaNova-Qwen2.5-Coder-Artifacts](https://huggingface.co/spaces/sambanovasystems/SambaNova-Qwen2.5-Coder-Artifacts).
' DESCRIPTION += f'More examples from [FullStackBench](https://github.com/bytedance/FullStackBench).
' DESCRIPTION += f'Thanks for their excellent work.' gr.Markdown(DESCRIPTION) if __name__ == "__main__": demo.queue(default_concurrency_limit=20).launch(ssr_mode=False, show_api=False)