undo cuda

modules/pmbl.py (+3, -8)
@@ -1,7 +1,6 @@
 import sqlite3
 from datetime import datetime
 from concurrent.futures import ThreadPoolExecutor
-from llama_cpp import Llama
 
 class PMBL:
     def __init__(self, model_path):
@@ -101,11 +100,9 @@ class PMBL:
 
         for chunk in response.result():
             yield chunk
-
-
+
     def generate_response_task(self, system_prompt, prompt, n_ctx):
         llm = Llama(model_path=self.model_path, n_ctx=n_ctx, n_threads=8, mlock=True)
-        llm = llm.to("cuda")  # Move the model to the GPU
 
         response = llm(
             system_prompt,
@@ -149,11 +146,9 @@ class PMBL:
         conn.commit()
 
         conn.close()
-
-
+
     def generate_topic(self, prompt, response):
         llm = Llama(model_path=self.model_path, n_ctx=1690, n_threads=8, mlock=True)
-        llm = llm.to("cuda")  # Move the model to the GPU
 
         system_prompt = f"Based on the following interaction between a user and an AI assistant, generate a concise topic for the conversation in 2-4 words:\n\nUser: {prompt}\nAssistant: {response}\n\nTopic:"
 
@@ -165,4 +160,4 @@ class PMBL:
             echo=False
         )
 
-        return topic['choices'][0]['text'].strip()
+        return topic['choices'][0]['text'].strip()
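For context on the revert: `llama_cpp.Llama` is not a PyTorch module, so the removed `llm.to("cuda")` calls would raise `AttributeError` at runtime. Note also that the first hunk drops `from llama_cpp import Llama` while `Llama(...)` is still called below, which would raise `NameError` unless the import lives elsewhere. If GPU offload is still wanted, llama-cpp-python exposes it through the `n_gpu_layers` constructor argument instead, assuming a CUDA-enabled build of the library. A minimal sketch, with a hypothetical model path:

from llama_cpp import Llama

# Hypothetical path for illustration; substitute the real GGUF model file.
model_path = "models/example.gguf"

# n_gpu_layers=-1 offloads all layers to the GPU; the argument has no
# effect if llama-cpp-python was built without GPU support.
llm = Llama(
    model_path=model_path,
    n_ctx=1690,
    n_threads=8,
    mlock=True,
    n_gpu_layers=-1,
)

response = llm("Topic:", max_tokens=8, echo=False)
print(response["choices"][0]["text"].strip())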