Infilling update (untested)
Browse files
Following this code: https://github.com/facebookresearch/codellama/blob/427d6ac90f0b7db206bc4c62f4c5d38f92ca4d10/llama/generation.py#L380
app.py
CHANGED
@@ -13,13 +13,14 @@ HF_TOKEN = os.environ.get("HF_TOKEN", None)
|
|
13 |
|
14 |
API_URL = "https://api-inference.huggingface.co/models/codellama/CodeLlama-7b-hf"
|
15 |
|
16 |
-
FIM_PREFIX = "<PRE>"
|
17 |
-
FIM_MIDDLE = "<MID>"
|
18 |
-
FIM_SUFFIX = "<SUF>"
|
19 |
|
20 |
FIM_INDICATOR = "<FILL_HERE>"
|
21 |
|
22 |
EOS_STRING = "</s>"
|
|
|
23 |
|
24 |
theme = gr.themes.Monochrome(
|
25 |
primary_hue="indigo",
|
@@ -78,7 +79,7 @@ def generate(
|
|
78 |
|
79 |
previous_token = ""
|
80 |
for response in stream:
|
81 |
-
if response.token.text == EOS_STRING:
|
82 |
if fim_mode:
|
83 |
output += suffix
|
84 |
else:
|
|
|
13 |
|
14 |
API_URL = "https://api-inference.huggingface.co/models/codellama/CodeLlama-7b-hf"
|
15 |
|
16 |
+
FIM_PREFIX = "<PRE> "
|
17 |
+
FIM_MIDDLE = " <MID>"
|
18 |
+
FIM_SUFFIX = "<SUF>"
|
19 |
|
20 |
FIM_INDICATOR = "<FILL_HERE>"
|
21 |
|
22 |
EOS_STRING = "</s>"
|
23 |
+
EOT_STRING = "<EOT>"
|
24 |
|
25 |
theme = gr.themes.Monochrome(
|
26 |
primary_hue="indigo",
|
|
|
79 |
|
80 |
previous_token = ""
|
81 |
for response in stream:
|
82 |
+
if response.token.text in [EOS_STRING, EOT_STRING]:
|
83 |
if fim_mode:
|
84 |
output += suffix
|
85 |
else:
|