Minimal changes to get Mistral-7B-Instruct-v0.1 working #986

Merged 1 commit on Sep 28, 2023
17 changes: 17 additions & 0 deletions cpp/conv_templates.cc
@@ -46,6 +46,22 @@ Conversation Llama2() {
return conv;
}

Conversation MistralDefault() {
Conversation conv;
conv.name = "mistral_default";
conv.roles = {"[INST]", "[/INST]"};
conv.messages = {};
conv.offset = 0;
conv.separator_style = SeparatorStyle::kSepRoleMsg;
conv.seps = {" "};
conv.role_msg_sep = " ";
conv.role_empty_sep = " ";
conv.stop_tokens = {2};
conv.stop_str = "</s>";
conv.add_bos = true;
return conv;
}

Conversation CodeLlamaCompletion() {
Conversation conv;
conv.name = "codellama_completion";
@@ -546,6 +562,7 @@ Conversation Conversation::FromTemplate(const std::string& name) {
static std::unordered_map<std::string, ConvFactory> factory = {
{"llama_default", LlamaDefault},
{"llama-2", Llama2},
{"mistral_default", MistralDefault},
{"codellama_completion", CodeLlamaCompletion},
{"codellama_instruct", CodeLlamaInstruct},
{"vicuna_v1.1", VicunaV11},
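
For reference, the fields above encode Mistral's instruct prompt format: user turns wrapped in [INST] ... [/INST], a single space as separator, and </s> (token id 2) as the stop condition. Below is a minimal Python sketch of how those fields compose a prompt; it mirrors the Conversation fields but is an illustration, not the actual C++ renderer in mlc-llm:

def render_mistral_prompt(turns, add_bos=True):
    """Compose a prompt from mistral_default's fields (illustrative only).

    Assumes `turns` alternates user/assistant messages and ends with a
    user message awaiting a reply.
    """
    roles = ("[INST]", "[/INST]")  # conv.roles
    sep = " "                      # conv.seps
    role_msg_sep = " "             # conv.role_msg_sep
    pieces = [roles[i % 2] + role_msg_sep + msg for i, msg in enumerate(turns)]
    prompt = sep.join(pieces)
    prompt += sep + roles[1]       # trailing [/INST] cues the model to answer
    return ("<s>" if add_bos else "") + prompt  # conv.add_bos

print(render_mistral_prompt(["Tell me a joke."]))
# <s>[INST] Tell me a joke. [/INST]
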
2 changes: 2 additions & 0 deletions mlc_llm/core.py
@@ -593,6 +593,8 @@ def build_model_from_args(args: argparse.Namespace):
if not use_cache or args.convert_weight_only:
if args.model_category == "llama":
mod, param_manager, params, model_config = llama.get_model(args, config)
elif args.model_category == "mistral":
mod, param_manager, params, model_config = llama.get_model(args, config)
elif args.model_category == "gpt_neox":
mod, param_manager, params, model_config = gpt_neox.get_model(args, config)
elif args.model_category == "gpt_bigcode":
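
Routing the "mistral" category through llama.get_model works because Mistral-7B uses the same decoder-only Llama architecture and exposes the same config fields; its additional sliding_window attention setting is simply not modeled by this minimal change. A quick sanity check (an assumption about the upstream config, not part of this PR) that the fields the Llama builder reads are all present:

from transformers import AutoConfig  # assumes transformers is installed

cfg = AutoConfig.from_pretrained("mistralai/Mistral-7B-Instruct-v0.1")
for field in ("hidden_size", "intermediate_size", "num_hidden_layers",
              "num_attention_heads", "num_key_value_heads",
              "rms_norm_eps", "vocab_size"):
    print(field, getattr(cfg, field))
print("sliding_window", cfg.sliding_window)  # present on Mistral; ignored here
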
2 changes: 1 addition & 1 deletion mlc_llm/utils.py
@@ -13,7 +13,7 @@
from .transform import ReorderTransformFunc

supported_model_types = set(
["llama", "gpt_neox", "gpt_bigcode", "minigpt", "moss", "rwkv", "gptj", "chatglm"]
["llama", "gpt_neox", "gpt_bigcode", "minigpt", "moss", "rwkv", "gptj", "chatglm", "mistral"]
)


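
Adding "mistral" to this set is what lets the build pipeline accept the new model category. A minimal sketch of that gate, assuming the check works as named here (the function name is hypothetical; the real validation lives elsewhere in core.py):

supported_model_types = {
    "llama", "gpt_neox", "gpt_bigcode", "minigpt", "moss",
    "rwkv", "gptj", "chatglm", "mistral",
}

def check_model_category(category: str) -> None:
    # Reject model types the build pipeline has no builder for.
    if category not in supported_model_types:
        raise ValueError(f"Model type {category!r} is not supported.")

check_model_category("mistral")  # passes after this PR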