codellama-playground

Running

lvwerra HF staff

pcuenq HF staff committed on Aug 25, 2023

Commit

6e419a7

•

1 Parent(s): 57659db

Infilling update (untested) (#1)

- Infilling update (untested) (b00b30b03d4f1b8740b97ff52aa4059fb063a042)

Co-authored-by: Pedro Cuenca <pcuenq@users.noreply.huggingface.co>

Files changed (1) hide show

app.py CHANGED Viewed

@@ -13,13 +13,14 @@ HF_TOKEN = os.environ.get("HF_TOKEN", None)
 API_URL = "https://api-inference.huggingface.co/models/codellama/CodeLlama-7b-hf"
-FIM_PREFIX = "<fim_prefix>"
-FIM_MIDDLE = "<fim_middle>"
-FIM_SUFFIX = "<fim_suffix>"
 FIM_INDICATOR = "<FILL_HERE>"
 EOS_STRING = "</s>"
 theme = gr.themes.Monochrome(
     primary_hue="indigo",
@@ -78,7 +79,7 @@ def generate(
     previous_token = ""
     for response in stream:
-        if response.token.text == EOS_STRING:
             if fim_mode:
                 output += suffix
             else:

 API_URL = "https://api-inference.huggingface.co/models/codellama/CodeLlama-7b-hf"
+FIM_PREFIX = "<PRE> "
+FIM_MIDDLE = " <MID>"
+FIM_SUFFIX = "<SUF>"
 FIM_INDICATOR = "<FILL_HERE>"
 EOS_STRING = "</s>"
+EOT_STRING = "<EOT>"
 theme = gr.themes.Monochrome(
     primary_hue="indigo",
     previous_token = ""
     for response in stream:
+        if response.token.text in [EOS_STRING, EOT_STRING]:
             if fim_mode:
                 output += suffix
             else: