Commit 4cae7cc · committed by johnsmith253325
1 Parent(s): cebe276
feat: Support ChatGLM3 (resolve #941)
Files changed:
- modules/models/ChatGLM.py (+24 -1)
- modules/models/base_model.py (+5 -0)
- modules/presets.py (+2 -0)
modules/models/ChatGLM.py
CHANGED
@@ -4,6 +4,8 @@ import logging
 import os
 import platform
 
+import gc
+import torch
 import colorama
 
 from ..index_func import *
@@ -18,6 +20,7 @@ class ChatGLM_Client(BaseLLMModel):
         import torch
         from transformers import AutoModel, AutoTokenizer
         global CHATGLM_TOKENIZER, CHATGLM_MODEL
+        self.deinitialize()
         if CHATGLM_TOKENIZER is None or CHATGLM_MODEL is None:
             system_name = platform.system()
             model_path = None
@@ -53,7 +56,12 @@ class ChatGLM_Client(BaseLLMModel):
             model = model.eval()
             CHATGLM_MODEL = model
 
-    def _get_glm_style_input(self):
+    def _get_glm3_style_input(self):
+        history = self.history
+        query = history.pop()["content"]
+        return history, query
+
+    def _get_glm2_style_input(self):
         history = [x["content"] for x in self.history]
         query = history.pop()
         logging.debug(colorama.Fore.YELLOW +
@@ -65,6 +73,12 @@ class ChatGLM_Client(BaseLLMModel):
                    for i in range(0, len(history), 2)]
         return history, query
 
+    def _get_glm_style_input(self):
+        if "glm2" in self.model_name:
+            return self._get_glm2_style_input()
+        else:
+            return self._get_glm3_style_input()
+
     def get_answer_at_once(self):
         history, query = self._get_glm_style_input()
         response, _ = CHATGLM_MODEL.chat(
@@ -82,3 +96,12 @@ class ChatGLM_Client(BaseLLMModel):
             temperature=self.temperature,
         ):
             yield response
+
+    def deinitialize(self):
+        # Free GPU memory
+        global CHATGLM_MODEL, CHATGLM_TOKENIZER
+        CHATGLM_MODEL = None
+        CHATGLM_TOKENIZER = None
+        gc.collect()
+        torch.cuda.empty_cache()
+        logging.info("ChatGLM model deinitialized")
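The core of this change is the split between the ChatGLM2 and ChatGLM3 input formats: ChatGLM/ChatGLM2's chat() and stream_chat() expect the history as a list of [user, assistant] pairs plus a separate query string, while ChatGLM3 accepts the role/content message dicts directly, so _get_glm_style_input() now dispatches on the model name. Below is a minimal, standalone sketch of the two conversions (not part of the commit; the message list is made up for illustration):

def glm2_style(messages):
    # Pair up past turns as [user, assistant] and split off the final user query.
    contents = [m["content"] for m in messages]
    query = contents.pop()
    history = [[contents[i], contents[i + 1]] for i in range(0, len(contents), 2)]
    return history, query

def glm3_style(messages):
    # ChatGLM3 consumes role/content dicts as-is; only the new query is split off.
    history = list(messages)
    query = history.pop()["content"]
    return history, query

msgs = [
    {"role": "user", "content": "Hi"},
    {"role": "assistant", "content": "Hello!"},
    {"role": "user", "content": "What is new in ChatGLM3?"},
]
print(glm2_style(list(msgs)))  # ([['Hi', 'Hello!']], 'What is new in ChatGLM3?')
print(glm3_style(list(msgs)))  # ([{'role': 'user', ...}, {'role': 'assistant', ...}], 'What is new in ChatGLM3?')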
modules/models/base_model.py
CHANGED
@@ -847,6 +847,11 @@ class BaseLLMModel:
         """
         return gr.update()
 
+    def deinitialize(self):
+        """deinitialize the model, implement if needed
+        """
+        pass
+
 
 class Base_Chat_Langchain_Client(BaseLLMModel):
     def __init__(self, model_name, user_name=""):
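base_model.py only gains a no-op deinitialize() hook on BaseLLMModel, so callers can unconditionally ask any model to release its resources, and local-model subclasses such as ChatGLM_Client above override it to actually free VRAM. A hypothetical caller-side sketch (get_model and switch_local_model are illustrative names, not functions from this repo):

def switch_local_model(current_model, new_model_name, get_model):
    # Safe on every BaseLLMModel: the base-class hook is a no-op, while
    # ChatGLM_Client drops its global model/tokenizer and empties the CUDA cache.
    if current_model is not None:
        current_model.deinitialize()
    return get_model(new_model_name)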
modules/presets.py
CHANGED
@@ -87,6 +87,8 @@ LOCAL_MODELS = [
     "chatglm-6b-int4-qe",
     "chatglm2-6b",
     "chatglm2-6b-int4",
+    "chatglm3-6b",
+    "chatglm3-6b-32k",
     "StableLM",
     "MOSS",
     "Llama-2-7B-Chat",
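The two new presets.py entries make chatglm3-6b and chatglm3-6b-32k selectable as local models; ChatGLM_Client then resolves the selected name to a Hugging Face repo or local path and loads it through transformers. A standalone sketch of loading one of the new models outside the webui (assumes a CUDA GPU with enough free VRAM; the path and prompt are illustrative):

from transformers import AutoModel, AutoTokenizer

model_path = "THUDM/chatglm3-6b"  # or a local directory containing the weights
tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True)
model = AutoModel.from_pretrained(model_path, trust_remote_code=True).half().cuda()
model = model.eval()

# ChatGLM3's chat() returns the reply plus the updated history.
response, history = model.chat(tokenizer, "What is new in ChatGLM3?", history=[])
print(response)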