Update modules/pmbl.py
modules/pmbl.py  +2 -2
@@ -104,7 +104,7 @@ class PMBL:
         for chunk in response.result():
             yield chunk
 
-
+
     def generate_response_task(self, system_prompt, prompt, n_ctx):
         llm = Llama(model_path=self.model_path, n_ctx=n_ctx, n_threads=8, n_gpu_layers=-1, mlock=True)
         llm = llm.to("cuda")  # Move the model to the GPU
@@ -152,7 +152,7 @@ class PMBL:
 
         conn.close()
 
-
+
     def generate_topic(self, prompt, response):
         llm = Llama(model_path=self.model_path, n_ctx=1690, n_threads=8, n_gpu_layers=-1, mlock=True)
         llm = llm.to("cuda")  # Move the model to the GPU
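The `for chunk in response.result(): yield chunk` pair in the first hunk implies that generation runs on a background worker and the caller streams the finished iterable back. A minimal sketch of that pattern, assuming a `concurrent.futures.ThreadPoolExecutor` and a task that returns a list of text chunks (the executor wiring and the chunk format are assumptions; only the method name comes from the diff):

from concurrent.futures import ThreadPoolExecutor

executor = ThreadPoolExecutor(max_workers=1)

def generate_response_task(system_prompt, prompt, n_ctx):
    # Stand-in for the real task, which would run the Llama model;
    # here it simply returns an iterable of text chunks.
    return [system_prompt, " | ", prompt, f" (n_ctx={n_ctx})"]

def generate_response(system_prompt, prompt, n_ctx=1690):
    # Submit the blocking generation call to the worker, then stream
    # whatever iterable the finished future hands back, chunk by chunk.
    response = executor.submit(generate_response_task, system_prompt, prompt, n_ctx)
    for chunk in response.result():
        yield chunk

for chunk in generate_response("You are a helpful assistant.", "Hello!"):
    print(chunk, end="")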
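One caveat worth flagging on the context lines shown above: `llama_cpp.Llama` is not a PyTorch module and exposes no `.to()` method, so `llm = llm.to("cuda")` would raise `AttributeError` at runtime. In llama-cpp-python, GPU offload is selected at construction time through `n_gpu_layers`, with `-1` offloading all layers when the package is built with GPU support. A minimal sketch of that constructor-only approach, using a placeholder model path and the upstream keyword `use_mlock`:

from llama_cpp import Llama

# All device placement happens in the constructor: n_gpu_layers=-1
# offloads every layer (requires a CUDA/Metal-enabled build), and
# use_mlock=True pins the model weights in RAM.
llm = Llama(
    model_path="models/pmbl.gguf",  # hypothetical path
    n_ctx=1690,
    n_threads=8,
    n_gpu_layers=-1,
    use_mlock=True,
)

# One-shot completion; pass stream=True instead to iterate over chunks.
out = llm("Q: What does n_gpu_layers=-1 do? A:", max_tokens=48)
print(out["choices"][0]["text"])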