Update modules/pmbl.py
modules/pmbl.py (+2 -4)
@@ -102,7 +102,7 @@ class PMBL:
             yield chunk
 
     def generate_response_task(self, system_prompt, prompt, n_ctx):
-        llm = Llama(model_path=self.model_path, n_ctx=n_ctx, n_threads=8, n_gpu_layers=-1, mlock=True)
+        llm = Llama(model_path=self.model_path, n_ctx=n_ctx, n_threads=8, n_gpu_layers=-1, use_flash_attn=True, mlock=True)
 
         response = llm(
             system_prompt,
@@ -110,9 +110,7 @@ class PMBL:
             temperature=0.7,
             stop=["</s>", "\nUser:", "\nuser:", "\nSystem:", "\nsystem:"],
             echo=False,
-            stream=True
-            use_flash_attn=True,
-            mlock=True,
+            stream=True
 
 
         )
 
         response_text = ""
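For readability, here is a sketch of the method as it stands after this commit. Everything outside the changed lines is an assumption: the from llama_cpp import Llama import, the __init__ that sets self.model_path, the elided line 109 of the call, and the chunk-accumulation loop are implied by the diff but not shown in it. The commit's effect is twofold: the old call was not valid Python (no comma after stream=True before use_flash_attn=True,), and use_flash_attn/mlock are load-time options that belong on the constructor, not the per-call kwargs. Note that current llama-cpp-python spells the constructor options flash_attn and use_mlock; the use_flash_attn=True and mlock=True kwargs below are reproduced verbatim from the diff and may simply be absorbed by the constructor's **kwargs rather than taking effect.

    from llama_cpp import Llama

    class PMBL:
        def __init__(self, model_path):
            # Assumed: the diff only shows self.model_path being read.
            self.model_path = model_path

        def generate_response_task(self, system_prompt, prompt, n_ctx):
            # Load-time options now live on the constructor rather than
            # on the completion call (new line 105).
            llm = Llama(model_path=self.model_path, n_ctx=n_ctx, n_threads=8,
                        n_gpu_layers=-1, use_flash_attn=True, mlock=True)

            response = llm(
                system_prompt,
                # (line 109, unchanged by this commit, is elided in the diff)
                temperature=0.7,
                stop=["</s>", "\nUser:", "\nuser:", "\nSystem:", "\nsystem:"],
                echo=False,
                stream=True,  # llm(...) returns an iterator of partial completions
            )

            # Assumed accumulation loop: the diff only shows the initializer
            # on line 116. Streamed chunks carry text under choices[0]["text"].
            response_text = ""
            for chunk in response:
                response_text += chunk["choices"][0]["text"]
            return response_text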