upgrade chatglm to chatglm2

2023-06-30 12:06:28 +08:00 · 2023-06-30 12:06:28 +08:00 · 403667aec1
commit 403667aec1
parent 37172906ef
2 changed files with 13 additions and 4 deletions
--- a/request_llm/bridge_all.py
+++ b/request_llm/bridge_all.py
@ -152,7 +152,7 @@ model_info = {
        "token_cnt": get_token_num_gpt4,
    },

-    # chatglm
+    # 将 chatglm 直接对齐到 chatglm2
    "chatglm": {
        "fn_with_ui": chatglm_ui,
        "fn_without_ui": chatglm_noui,
@ -161,6 +161,15 @@ model_info = {
        "tokenizer": tokenizer_gpt35,
        "token_cnt": get_token_num_gpt35,
    },
+    "chatglm2": {
+        "fn_with_ui": chatglm_ui,
+        "fn_without_ui": chatglm_noui,
+        "endpoint": None,
+        "max_token": 1024,
+        "tokenizer": tokenizer_gpt35,
+        "token_cnt": get_token_num_gpt35,
+    },
+    
    # newbing
    "newbing": {
        "fn_with_ui": newbing_ui,
--- a/request_llm/bridge_chatglm.py
+++ b/request_llm/bridge_chatglm.py
@ -40,12 +40,12 @@ class GetGLMHandle(Process):
        while True:
            try:
                if self.chatglm_model is None:
-                    self.chatglm_tokenizer = AutoTokenizer.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True)
+                    self.chatglm_tokenizer = AutoTokenizer.from_pretrained("THUDM/chatglm2-6b", trust_remote_code=True)
                    device, = get_conf('LOCAL_MODEL_DEVICE')
                    if device=='cpu':
-                        self.chatglm_model = AutoModel.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True).float()
+                        self.chatglm_model = AutoModel.from_pretrained("THUDM/chatglm2-6b", trust_remote_code=True).float()
                    else:
-                        self.chatglm_model = AutoModel.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True).half().cuda()
+                        self.chatglm_model = AutoModel.from_pretrained("THUDM/chatglm2-6b", trust_remote_code=True).half().cuda()
                    self.chatglm_model = self.chatglm_model.eval()
                    break
                else: