stack-llama

Runtime error

App Files Community

lvwerra HF Staff committed on Aug 8, 2023

Commit

ec23712

1 Parent(s): f1751f2

stack-llama-2 (#37)

Browse files

- update to stack-llama-v2 (0bc403488329943436e326a81e639c0d4efbaf54)

Files changed (1) hide show

app.py +12 -9

app.py CHANGED Viewed

@@ -3,13 +3,13 @@ import os
 import shutil
 import gradio as gr
-from huggingface_hub import Repository
 from text_generation import Client
 from share_btn import community_icon_html, loading_icon_html, share_js, share_btn_css
 HF_TOKEN = os.environ.get("TRL_TOKEN", None)
-API_URL = os.environ.get("API_URL")
 theme = gr.themes.Monochrome(
@@ -25,10 +25,15 @@ if HF_TOKEN:
     except:
         pass
-    repo = Repository(
-        local_dir="./data/", clone_from="trl-lib/stack-llama-prompts", use_auth_token=HF_TOKEN, repo_type="dataset"
     )
-    repo.git_pull()
 client = Client(
     API_URL,
@@ -42,8 +47,6 @@ def save_inputs_and_outputs(inputs, outputs, generate_kwargs):
     with open(os.path.join("data", "prompts.jsonl"), "a") as f:
         json.dump({"inputs": inputs, "outputs": outputs, "generate_kwargs": generate_kwargs}, f, ensure_ascii=False)
         f.write("\n")
-        commit_url = repo.push_to_hub()
 def generate(instruction, temperature=0.9, max_new_tokens=256, top_p=0.95, repetition_penalty=1.0,  do_save=True):
     formatted_instruction = PROMPT_TEMPLATE.format(prompt=instruction)
@@ -106,11 +109,11 @@ with gr.Blocks(theme=theme, analytics_enabled=False, css=css) as demo:
             """![](https://huggingface.co/spaces/trl-lib/stack-llama/resolve/main/stackllama_logo.png)
-            StackLLaMa is a 7 billion parameter language model based on [Meta's LLaMA model](https://ai.facebook.com/blog/large-language-model-llama-meta-ai/) that has been trained on pairs of questions and answers from [Stack Exchange](https://stackexchange.com) using Reinforcement Learning from Human Feedback (RLHF) with the [TRL library](https://github.com/lvwerra/trl). For more details, check out our [blog post](https://huggingface.co/blog/stackllama).
             Type in the box below and click the button to generate answers to your most pressing questions!
-            ⚠️ **Intended Use**: this app and its [supporting model](https://huggingface.co/trl-lib/llama-7b-se-rl-peft) are provided as educational tools to explain RLHF with the TRL library; not to serve as replacement for human expertise. For more details on the model's limitations in terms of factuality and biases, see the [model card.](https://huggingface.co/trl-lib/llama-7b-se-rl-peft#intended-uses--limitations)
             ⚠️ **Data Collection**: by default, we are collecting the prompts entered in this app to further improve and evaluate the model. Do not share any personal or sensitive information while using the app! You can opt out of this data collection by removing the checkbox below:
       """

 import shutil
 import gradio as gr
+from huggingface_hub import Repository, CommitScheduler
 from text_generation import Client
 from share_btn import community_icon_html, loading_icon_html, share_js, share_btn_css
 HF_TOKEN = os.environ.get("TRL_TOKEN", None)
+API_URL = "https://api-inference.huggingface.co/models/kashif/stack-llama-2"
 theme = gr.themes.Monochrome(
     except:
         pass
+    # Schedule regular uploads every 10 minutes. Remote repo and local folder are created if they don't already exist.
+    scheduler = CommitScheduler(
+        repo_id="trl-lib/stack-llama-2-prompts",
+        repo_type="dataset",
+        folder_path="./data/",
+        path_in_repo="./",
+        every=10,
     )
 client = Client(
     API_URL,
     with open(os.path.join("data", "prompts.jsonl"), "a") as f:
         json.dump({"inputs": inputs, "outputs": outputs, "generate_kwargs": generate_kwargs}, f, ensure_ascii=False)
         f.write("\n")
 def generate(instruction, temperature=0.9, max_new_tokens=256, top_p=0.95, repetition_penalty=1.0,  do_save=True):
     formatted_instruction = PROMPT_TEMPLATE.format(prompt=instruction)
             """![](https://huggingface.co/spaces/trl-lib/stack-llama/resolve/main/stackllama_logo.png)
+            StackLLaMa-2 is a 7 billion parameter language model based on [Meta's LLaMA 2 model](https://ai.meta.com/llama/) that has been trained on pairs of questions and answers from [Stack Exchange](https://stackexchange.com) using Direct Preference Optimization (DPO) with the [TRL library](https://github.com/lvwerra/trl). For more details, check out our [blog post](https://huggingface.co/blog/dpo-trl).
             Type in the box below and click the button to generate answers to your most pressing questions!
+            ⚠️ **Intended Use**: this app and its [supporting model](https://huggingface.co/kashif/stack-llama-2) are provided as educational tools to explain RLHF with the TRL library; not to serve as replacement for human expertise. For more details on the model's limitations in terms of factuality and biases, see the [model card.](https://huggingface.co/kashif/stack-llama-2#intended-uses--limitations)
             ⚠️ **Data Collection**: by default, we are collecting the prompts entered in this app to further improve and evaluate the model. Do not share any personal or sensitive information while using the app! You can opt out of this data collection by removing the checkbox below:
       """