lm-sys · silk55 · Oct 31, 2023 · Oct 31, 2023 · Oct 31, 2023 · Oct 31, 2023
diff --git a/docs/model_support.md b/docs/model_support.md
@@ -39,6 +39,7 @@
 - [StabilityAI/stablelm-tuned-alpha-7b](https://huggingface.co/stabilityai/stablelm-tuned-alpha-7b)
 - [THUDM/chatglm-6b](https://huggingface.co/THUDM/chatglm-6b)
 - [THUDM/chatglm2-6b](https://huggingface.co/THUDM/chatglm2-6b)
+- [THUDM/chatglm3-6b](https://huggingface.co/THUDM/chatglm3-6b)
 - [tiiuae/falcon-40b](https://huggingface.co/tiiuae/falcon-40b)
 - [tiiuae/falcon-180B-chat](https://huggingface.co/tiiuae/falcon-180B-chat)
 - [timdettmers/guanaco-33b-merged](https://huggingface.co/timdettmers/guanaco-33b-merged)

diff --git a/fastchat/conversation.py b/fastchat/conversation.py
@@ -140,6 +140,17 @@ def get_prompt(self) -> str:
         elif self.sep_style == SeparatorStyle.CHATGLM:
             # source: https://huggingface.co/THUDM/chatglm-6b/blob/1d240ba371910e9282298d4592532d7f0f3e9f3e/modeling_chatglm.py#L1302-L1308
             # source2: https://huggingface.co/THUDM/chatglm2-6b/blob/e186c891cf64310ac66ef10a87e6635fa6c2a579/modeling_chatglm.py#L926
+            if self.name == "chatglm3":
+                # ChatGLM3 layout: every role tag is written on its own line
+                # and the message, when truthy, follows on the next line.
+                # A falsy message emits only the tag line.
+                if self.system_message and system_prompt:
+                    ret = system_prompt + "\n"
+                else:
+                    ret = ""
+                for role, message in self.messages:
+                    ret += role + "\n" + (message + "\n" if message else "")
+                return ret
             round_add_n = 1 if self.name == "chatglm2" else 0
             if system_prompt:
                 ret = system_prompt + self.sep
@@ -448,6 +459,18 @@ def get_conv_template(name: str) -> Conversation:
     )
 )
 
+# ChatGLM3 default template: role tags are emitted on their own line by get_prompt
+register_conv_template(
+    Conversation(
+        name="chatglm3",
+        system_template="<|system|>\n{system_message}",
+        roles=("<|user|>", "<|assistant|>"),
+        sep_style=SeparatorStyle.CHATGLM,
+        sep=None,  # the chatglm3 branch of get_prompt returns before reading sep
+        stop_token_ids=[2, 64795, 64797],  # NOTE(review): presumably EOS / role-tag ids; confirm against the tokenizer
+    )
+)
+
 # Dolly V2 default template
 register_conv_template(
     Conversation(

diff --git a/fastchat/model/model_adapter.py b/fastchat/model/model_adapter.py
@@ -739,6 +739,8 @@ def get_default_conv_template(self, model_path: str) -> Conversation:
         model_path = model_path.lower()
         if "chatglm2" in model_path.lower():
             return get_conv_template("chatglm2")
+        if "chatglm3" in model_path.lower():
+            return get_conv_template("chatglm3")
         return get_conv_template("chatglm")
 
 

diff --git a/fastchat/model/model_registry.py b/fastchat/model/model_registry.py
@@ -129,7 +129,7 @@ def get_model_info(name: str) -> ModelInfo:
     "an RNN with transformer-level LLM performance",
 )
 register_model_info(
-    ["chatglm-6b", "chatglm2-6b"],
+    ["chatglm-6b", "chatglm2-6b", "chatglm3-6b"],
     "ChatGLM",
     "https://chatglm.cn/blog",
     "an open bilingual dialogue language model by Tsinghua University",

diff --git a/fastchat/serve/gradio_block_arena_anony.py b/fastchat/serve/gradio_block_arena_anony.py
@@ -175,6 +175,7 @@ def share_click(state0, state1, model_selector0, model_selector1, request: gr.Re
     "vicuna-7b": 1.0,
     "llama-2-7b-chat": 1.0,
     "chatglm2-6b": 1.0,
+    "chatglm3-6b": 1.0,
     "mistral-7b-instruct": 1.0,
     # deprecated
     "codellama-13b-instruct": 1.0,