diff --git a/doc/source/gen_docs.py b/doc/source/gen_docs.py
index 68e381edf6..a41472d187 100644
--- a/doc/source/gen_docs.py
+++ b/doc/source/gen_docs.py
@@ -46,17 +46,15 @@ def get_metrics_from_url(metrics_url):
         })
     return result
 
+
 def main():
-    template_dir = '../templates' 
+    template_dir = '../templates'
     env = Environment(loader=FileSystemLoader(template_dir))
 
     with open('../../xinference/model/llm/llm_family.json', 'r') as model_file:
         models = json.load(model_file)
-        model_by_names = { m['model_name']: m for m in models}
-        model_scope_file = open('../../xinference/model/llm/llm_family_modelscope.json')
-        models_modelscope = json.load(model_scope_file)
-        model_by_names_modelscope = { m['model_name']: m for m in models_modelscope}
+        model_by_names = {m['model_name']: m for m in models}
 
     sorted_models = []
     output_dir = './models/builtin/llm'
@@ -69,10 +67,16 @@ def main():
         sorted_models.append(model)
 
         for model_spec in model['model_specs']:
-            model_spec['model_hubs'] = [{
-                'name': MODEL_HUB_HUGGING_FACE,
-                'url': f"https://huggingface.co/{model_spec['model_id']}"
+            original_model_hubs = model_spec['model_hubs']
+            model_spec['model_hubs'] = [{
+                'name': MODEL_HUB_HUGGING_FACE,
+                'url': f"https://huggingface.co/{original_model_hubs['huggingface']['model_id']}"
             }]
+            if 'modelscope' in original_model_hubs:
+                model_spec['model_hubs'].append({
+                    'name': MODEL_HUB_MODELSCOPE,
+                    'url': f"https://modelscope.cn/models/{original_model_hubs['modelscope']['model_id']}"
+                })
 
         # model engines
         engines = []
@@ -90,22 +94,6 @@ def main():
                     engines.append(engine)
             model_spec['engines'] = sorted(list(set(engines)), reverse=True)
 
-        # manual merge
-        if model_name in model_by_names_modelscope.keys():
-
-            def get_unique_id(spec):
-                return spec['model_format'] + '-' + str(spec['model_size_in_billions'])
-
-            model_by_ids_modelscope = {get_unique_id(s) : s for s in model_by_names_modelscope[model_name]['model_specs']}
-
-            for model_spec in model['model_specs']:
-                spec_id = get_unique_id(model_spec)
-                if spec_id in model_by_ids_modelscope.keys():
-                    model_spec['model_hubs'].append({
-                        'name': MODEL_HUB_MODELSCOPE,
-                        'url': f"https://modelscope.cn/models/{model_by_ids_modelscope[spec_id]['model_id']}"
-                    })
-
         rendered = env.get_template('llm.rst.jinja').render(model)
         output_file_name = f"{model['model_name'].lower()}.rst"
         if output_file_name in current_files:
@@ -125,16 +113,14 @@ def get_unique_id(spec):
         rendered_index = env.get_template('llm_index.rst.jinja').render(models=sorted_models)
         file.write(rendered_index)
 
-
     with open('../../xinference/model/embedding/model_spec.json', 'r') as file:
         models = json.load(file)
-        model_by_names = { m['model_name']: m for m in models}
+        model_by_names = {m['model_name']: m for m in models}
 
     model_scope_file = open('../../xinference/model/embedding/model_spec_modelscope.json')
     models_modelscope = json.load(model_scope_file)
-    model_by_names_modelscope = { s['model_name']: s for s in models_modelscope}
-
+    model_by_names_modelscope = {s['model_name']: s for s in models_modelscope}
 
     sorted_models = []
     output_dir = './models/builtin/embedding'
@@ -147,7 +133,7 @@ def get_unique_id(spec):
 
         model['model_hubs'] = [
             {
-                'name': MODEL_HUB_HUGGING_FACE, 
+                'name': MODEL_HUB_HUGGING_FACE,
                 'url': f"https://huggingface.co/{model['model_id']}"
             }
         ]
@@ -167,7 +153,7 @@ def get_unique_id(spec):
             print(output_file_path)
 
     index_file_path = os.path.join(output_dir, "index.rst")
-    with open(index_file_path, "w") as file: 
+    with open(index_file_path, "w") as file:
         rendered_index = env.get_template('embedding_index.rst.jinja').render(models=sorted_models)
         file.write(rendered_index)
 
@@ -186,7 +172,7 @@ def get_unique_id(spec):
 
     index_file_path = os.path.join(output_dir, "index.rst")
    with open(index_file_path, "w") as file:
-
+
        rendered_index = env.get_template('rerank_index.rst.jinja').render(models=sorted_models)
        file.write(rendered_index)
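Reviewer note: with the manual ModelScope merge gone, the doc generator now
derives hub links directly from each spec's "model_hubs" mapping. Below is a
minimal standalone sketch of that lookup, not code from this PR: HUB_PREFIXES,
hub_links, and the sample spec are hypothetical names, though the URL prefixes
mirror the f-strings above. One difference worth noting: the actual diff adds
the Hugging Face link unconditionally and appends ModelScope only when it is
present, while this sketch treats all hubs uniformly.

    HUB_PREFIXES = {
        "huggingface": "https://huggingface.co/",
        "modelscope": "https://modelscope.cn/models/",
    }

    def hub_links(model_spec: dict) -> list:
        """Return one {'name', 'url'} entry per hub that hosts this spec."""
        links = []
        for hub_name, prefix in HUB_PREFIXES.items():
            hub = model_spec["model_hubs"].get(hub_name)
            if hub is not None:
                links.append({"name": hub_name, "url": prefix + hub["model_id"]})
        return links

    spec = {
        "model_hubs": {
            "huggingface": {"model_id": "org/example-llm"},
            "modelscope": {"model_id": "org/example-llm"},
        }
    }
    for link in hub_links(spec):
        print(link["name"], "->", link["url"])
    # huggingface -> https://huggingface.co/org/example-llm
    # modelscope -> https://modelscope.cn/models/org/example-llm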
diff --git a/xinference/model/llm/__init__.py b/xinference/model/llm/__init__.py
index 1980a4b81f..fbd724b21a 100644
--- a/xinference/model/llm/__init__.py
+++ b/xinference/model/llm/__init__.py
@@ -13,6 +13,7 @@
 #  limitations under the License.
 
 import codecs
+import copy
 import json
 import os
 import warnings
@@ -195,85 +196,7 @@ def _install():
     SUPPORTED_ENGINES["MLX"] = MLX_CLASSES
     SUPPORTED_ENGINES["LMDEPLOY"] = LMDEPLOY_CLASSES
 
-    json_path = os.path.join(
-        os.path.dirname(os.path.abspath(__file__)), "llm_family.json"
-    )
-    for json_obj in json.load(codecs.open(json_path, "r", encoding="utf-8")):
-        model_spec = LLMFamilyV1.parse_obj(json_obj)
-        BUILTIN_LLM_FAMILIES.append(model_spec)
-
-        # register chat_template
-        if "chat" in model_spec.model_ability and isinstance(
-            model_spec.chat_template, str
-        ):
-            # note that the key is the model name,
-            # since there are multiple representations of the same prompt style name in json.
-            BUILTIN_LLM_PROMPT_STYLE[model_spec.model_name] = {
-                "chat_template": model_spec.chat_template,
-                "stop_token_ids": model_spec.stop_token_ids,
-                "stop": model_spec.stop,
-            }
-        # register model family
-        if "chat" in model_spec.model_ability:
-            BUILTIN_LLM_MODEL_CHAT_FAMILIES.add(model_spec.model_name)
-        else:
-            BUILTIN_LLM_MODEL_GENERATE_FAMILIES.add(model_spec.model_name)
-        if "tools" in model_spec.model_ability:
-            BUILTIN_LLM_MODEL_TOOL_CALL_FAMILIES.add(model_spec.model_name)
-
-    modelscope_json_path = os.path.join(
-        os.path.dirname(os.path.abspath(__file__)), "llm_family_modelscope.json"
-    )
-    for json_obj in json.load(codecs.open(modelscope_json_path, "r", encoding="utf-8")):
-        model_spec = LLMFamilyV1.parse_obj(json_obj)
-        BUILTIN_MODELSCOPE_LLM_FAMILIES.append(model_spec)
-
-        # register prompt style, in case that we have something missed
-        # if duplicated with huggingface json, keep it as the huggingface style
-        if (
-            "chat" in model_spec.model_ability
-            and isinstance(model_spec.chat_template, str)
-            and model_spec.model_name not in BUILTIN_LLM_PROMPT_STYLE
-        ):
-            BUILTIN_LLM_PROMPT_STYLE[model_spec.model_name] = {
-                "chat_template": model_spec.chat_template,
-                "stop_token_ids": model_spec.stop_token_ids,
-                "stop": model_spec.stop,
-            }
-        # register model family
-        if "chat" in model_spec.model_ability:
-            BUILTIN_LLM_MODEL_CHAT_FAMILIES.add(model_spec.model_name)
-        else:
-            BUILTIN_LLM_MODEL_GENERATE_FAMILIES.add(model_spec.model_name)
-        if "tools" in model_spec.model_ability:
-            BUILTIN_LLM_MODEL_TOOL_CALL_FAMILIES.add(model_spec.model_name)
-
-    csghub_json_path = os.path.join(
-        os.path.dirname(os.path.abspath(__file__)), "llm_family_csghub.json"
-    )
-    for json_obj in json.load(codecs.open(csghub_json_path, "r", encoding="utf-8")):
-        model_spec = LLMFamilyV1.parse_obj(json_obj)
-        BUILTIN_CSGHUB_LLM_FAMILIES.append(model_spec)
-
-        # register prompt style, in case that we have something missed
-        # if duplicated with huggingface json, keep it as the huggingface style
-        if (
-            "chat" in model_spec.model_ability
-            and isinstance(model_spec.chat_template, str)
-            and model_spec.model_name not in BUILTIN_LLM_PROMPT_STYLE
-        ):
-            BUILTIN_LLM_PROMPT_STYLE[model_spec.model_name] = {
-                "chat_template": model_spec.chat_template,
-                "stop_token_ids": model_spec.stop_token_ids,
-                "stop": model_spec.stop,
-            }
-        # register model family
-        if "chat" in model_spec.model_ability:
-            BUILTIN_LLM_MODEL_CHAT_FAMILIES.add(model_spec.model_name)
-        else:
-            BUILTIN_LLM_MODEL_GENERATE_FAMILIES.add(model_spec.model_name)
-        if "tools" in model_spec.model_ability:
-            BUILTIN_LLM_MODEL_TOOL_CALL_FAMILIES.add(model_spec.model_name)
+    _load_from_json_new("llm_family.json")
 
     for llm_specs in [
         BUILTIN_LLM_FAMILIES,
@@ -298,3 +221,63 @@ def _install():
     # register model description
     for ud_llm in get_user_defined_llm_families():
         LLM_MODEL_DESCRIPTIONS.update(generate_llm_description(ud_llm))
+
+
+def _add_model_spec(model_spec: LLMFamilyV1, LLM_FAMILIES: list[LLMFamilyV1]):
+    LLM_FAMILIES.append(model_spec)
+
+    # register chat_template
+    # register prompt style, in case that we have something missed
+    # if duplicated with huggingface json, keep it as the huggingface style
+    if (
+        "chat" in model_spec.model_ability
+        and isinstance(model_spec.chat_template, str)
+        and model_spec.model_name not in BUILTIN_LLM_PROMPT_STYLE
+    ):
+        # note that the key is the model name,
+        # since there are multiple representations of the same prompt style name in json.
+        BUILTIN_LLM_PROMPT_STYLE[model_spec.model_name] = {
+            "chat_template": model_spec.chat_template,
+            "stop_token_ids": model_spec.stop_token_ids,
+            "stop": model_spec.stop,
+        }
+    # register model family
+    if "chat" in model_spec.model_ability:
+        BUILTIN_LLM_MODEL_CHAT_FAMILIES.add(model_spec.model_name)
+    else:
+        BUILTIN_LLM_MODEL_GENERATE_FAMILIES.add(model_spec.model_name)
+    if "tools" in model_spec.model_ability:
+        BUILTIN_LLM_MODEL_TOOL_CALL_FAMILIES.add(model_spec.model_name)
+
+
+def _load_from_json_new(file_name: str):
+    json_path = os.path.join(os.path.dirname(os.path.abspath(__file__)), file_name)
+    for json_obj in json.load(codecs.open(json_path, "r", encoding="utf-8")):
+        model_specs: list[dict] = json_obj["model_specs"]
+        hub_names = ["huggingface", "modelscope", "csghub"]
+        hub_specs: dict = {}
+        for hub_name in hub_names:
+            hub_specs[hub_name] = []
+
+        hub_families = {
+            "huggingface": BUILTIN_LLM_FAMILIES,
+            "modelscope": BUILTIN_MODELSCOPE_LLM_FAMILIES,
+            "csghub": BUILTIN_CSGHUB_LLM_FAMILIES,
+        }
+
+        for model_spec in model_specs:
+            for hub_name in hub_names:
+                if hub_name in model_spec["model_hubs"]:
+                    hub_spec = copy.deepcopy(model_spec)
+                    hub_spec.update(model_spec["model_hubs"][hub_name])
+                    hub_spec["model_hub"] = hub_name
+                    del hub_spec["model_hubs"]
+                    hub_specs[hub_name].append(hub_spec)
+
+        for hub_name in hub_names:
+            a_hub_specs = hub_specs[hub_name]
+            if len(a_hub_specs) > 0:
+                model_obj = copy.deepcopy(json_obj)
+                model_obj["model_specs"] = a_hub_specs
+                converted_model_spec = LLMFamilyV1.parse_obj(model_obj)
+                _add_model_spec(converted_model_spec, hub_families[hub_name])
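Reviewer note: _load_from_json_new() above is the heart of the refactor. The
three parallel hub JSON files are replaced by one unified file whose specs
carry a "model_hubs" mapping, and each family entry is expanded into per-hub
LLMFamilyV1 objects: hub-specific fields (model_id, model_revision, ...)
override the shared spec fields, and a hub only receives a family if at least
one spec lists it. A minimal sketch of that expansion on plain dicts follows;
expand_by_hub and the sample entry are hypothetical, and the real code parses
each result with LLMFamilyV1.parse_obj as shown above.

    import copy

    # Hub order mirrors the hub_names list in _load_from_json_new.
    HUB_NAMES = ["huggingface", "modelscope", "csghub"]

    def expand_by_hub(family: dict) -> dict:
        """Split one unified family entry into one entry per hub."""
        per_hub = {name: [] for name in HUB_NAMES}
        for spec in family["model_specs"]:
            for hub_name in HUB_NAMES:
                if hub_name in spec["model_hubs"]:
                    hub_spec = copy.deepcopy(spec)
                    # Hub-specific fields win over the shared ones.
                    hub_spec.update(spec["model_hubs"][hub_name])
                    hub_spec["model_hub"] = hub_name
                    del hub_spec["model_hubs"]
                    per_hub[hub_name].append(hub_spec)
        families = {}
        for hub_name, specs in per_hub.items():
            if specs:  # a hub gets a family only if some spec lists it
                family_for_hub = copy.deepcopy(family)
                family_for_hub["model_specs"] = specs
                families[hub_name] = family_for_hub
        return families

    # Hypothetical entry in the new unified llm_family.json shape.
    family = {
        "model_name": "example-llm",
        "model_specs": [{
            "model_format": "pytorch",
            "quantizations": ["none"],
            "model_hubs": {
                "huggingface": {"model_id": "org/example-llm",
                                "model_revision": "abc123"},
                "modelscope": {"model_id": "org/example-llm",
                               "model_revision": "master"},
            },
        }],
    }

    for hub, fam in expand_by_hub(family).items():
        spec = fam["model_specs"][0]
        print(hub, spec["model_id"], spec["model_revision"])
    # huggingface org/example-llm abc123
    # modelscope org/example-llm master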
diff --git a/xinference/model/llm/llm_family.json b/xinference/model/llm/llm_family.json
index d31f0e64f6..d27877a830 100644
--- a/xinference/model/llm/llm_family.json
+++ b/xinference/model/llm/llm_family.json
@@ -18,8 +18,16 @@
         "quantizations": [
           "none"
         ],
-        "model_id": "WisdomShell/CodeShell-7B",
-        "model_revision": "1c79ab7fd316a62ab41d764facd3548a23fa5dee"
+        "model_hubs": {
+          "huggingface": {
+            "model_id": "WisdomShell/CodeShell-7B",
+            "model_revision": "1c79ab7fd316a62ab41d764facd3548a23fa5dee"
+          },
+          "modelscope": {
+            "model_id": "WisdomShell/CodeShell-7B",
+            "model_revision": "master"
+          }
+        }
       }
     ]
   },
@@ -42,8 +50,16 @@
         "quantizations": [
           "none"
         ],
-        "model_id":
"WisdomShell/CodeShell-7B-Chat", - "model_revision": "3cb06f589b7b1e2f8e728c77280b1114191d24de" + "model_hubs": { + "huggingface": { + "model_id": "WisdomShell/CodeShell-7B-Chat", + "model_revision": "3cb06f589b7b1e2f8e728c77280b1114191d24de" + }, + "modelscope": { + "model_id": "WisdomShell/CodeShell-7B-Chat", + "model_revision": "master" + } + } } ], "chat_template": "{% for item in messages %}{% if item['role'] == 'user' %}{{ '## human: ' + item['content'] + '||' }}{% elif item['role'] == 'assistant' %}{{ '## assistant: ' + item['content'] + '||' }}{% endif %}{% endfor %}{{ '## assistant: ' }}", @@ -85,8 +101,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/phi-2-GGUF", - "model_file_name_template": "phi-2.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/phi-2-GGUF", + "model_file_name_template": "phi-2.{quantization}.gguf" + } + } }, { "model_format": "pytorch", @@ -96,8 +116,12 @@ "8-bit", "none" ], - "model_id": "microsoft/phi-2", - "model_revision": "d3186761bf5c4409f7679359284066c25ab668ee" + "model_hubs": { + "huggingface": { + "model_id": "microsoft/phi-2", + "model_revision": "d3186761bf5c4409f7679359284066c25ab668ee" + } + } } ] }, @@ -121,12 +145,20 @@ "8-bit", "none" ], - "model_id": "microsoft/Phi-3-mini-128k-instruct", - "model_revision": "ebee18c488086b396dde649f2aa6548b9b8d2404" + "model_hubs": { + "huggingface": { + "model_id": "microsoft/Phi-3-mini-128k-instruct", + "model_revision": "ebee18c488086b396dde649f2aa6548b9b8d2404" + }, + "modelscope": { + "model_id": "LLM-Research/Phi-3-mini-128k-instruct", + "model_revision": "master" + } + } } ], "chat_template": "{% for message in messages %}{% if message['role'] == 'system' %}{{'<|system|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'user' %}{{'<|user|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'assistant' %}{{'<|assistant|>\n' + message['content'] + '<|end|>\n'}}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% else %}{{ '<|endoftext|>' }}{% endif %}", - "stop_token_ids":[ + "stop_token_ids": [ 32000, 32001, 32007 @@ -156,8 +188,12 @@ "fp16", "q4" ], - "model_id": "microsoft/Phi-3-mini-4k-instruct-gguf", - "model_file_name_template": "Phi-3-mini-4k-instruct-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "microsoft/Phi-3-mini-4k-instruct-gguf", + "model_file_name_template": "Phi-3-mini-4k-instruct-{quantization}.gguf" + } + } }, { "model_format": "pytorch", @@ -167,12 +203,20 @@ "8-bit", "none" ], - "model_id": "microsoft/Phi-3-mini-4k-instruct", - "model_revision": "b86bcaf57ea4dfdec5dbe12a377028b2fab0d480" + "model_hubs": { + "huggingface": { + "model_id": "microsoft/Phi-3-mini-4k-instruct", + "model_revision": "b86bcaf57ea4dfdec5dbe12a377028b2fab0d480" + }, + "modelscope": { + "model_id": "LLM-Research/Phi-3-mini-4k-instruct", + "model_revision": "master" + } + } } ], "chat_template": "{% for message in messages %}{% if message['role'] == 'system' %}{{'<|system|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'user' %}{{'<|user|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'assistant' %}{{'<|assistant|>\n' + message['content'] + '<|end|>\n'}}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% else %}{{ '<|endoftext|>' }}{% endif %}", - "stop_token_ids":[ + "stop_token_ids": [ 32000, 32001, 32007 @@ -205,8 +249,16 @@ "8-bit", "none" ], - "model_id": "THUDM/glm-4-9b-chat", - "model_revision": 
"f6e0743b285dd808084530f070ad08e504386750" + "model_hubs": { + "huggingface": { + "model_id": "THUDM/glm-4-9b-chat", + "model_revision": "f6e0743b285dd808084530f070ad08e504386750" + }, + "modelscope": { + "model_id": "ZhipuAI/glm-4-9b-chat", + "model_revision": "master" + } + } }, { "model_format": "ggufv2", @@ -230,9 +282,18 @@ "BF16", "FP16" ], - "model_file_name_template": "glm-4-9b-chat.{quantization}.gguf", - "model_id": "legraphista/glm-4-9b-chat-GGUF", - "model_revision": "0155a14edf0176863e9a003cdd78ce599e4d62c0" + "model_hubs": { + "huggingface": { + "model_id": "legraphista/glm-4-9b-chat-GGUF", + "model_revision": "0155a14edf0176863e9a003cdd78ce599e4d62c0", + "model_file_name_template": "glm-4-9b-chat.{quantization}.gguf" + }, + "modelscope": { + "model_id": "LLM-Research/glm-4-9b-chat-GGUF", + "model_revision": "master", + "model_file_name_template": "glm-4-9b-chat.{quantization}.gguf" + } + } } ], "chat_template": "[gMASK]{% for item in messages %}{% if item['tools'] is defined %}<|system|>\n你是一个名为 ChatGLM 的人工智能助手。你是基于智谱AI训练的语言模型 GLM-4 模型开发的,你的任务是针对用户的问题和要求提供适当的答复和支持。\n\n# 可用工具{% set tools = item['tools'] %}{% for tool in tools %}{% if tool['type'] == 'function' %}\n\n## {{ tool['function']['name'] }}\n\n{{ tool['function'] | tojson(indent=4) }}\n在调用上述函数时,请使用 Json 格式表示调用的参数。{% elif tool['type'] == 'python' %}\n\n## python\n\n当你向 `python` 发送包含 Python 代码的消息时,该代码将会在一个有状态的 Jupyter notebook 环境中执行。\n`python` 返回代码执行的输出,或在执行 60 秒后返回超时。\n`/mnt/data` 将会持久化存储你的文件。在此会话中,`python` 无法访问互联网。不要使用 `python` 进行任何网络请求或者在线 API 调用,这些在线内容的访问将不会成功。{% elif tool['type'] == 'simple_browser' %}\n\n## simple_browser\n\n你可以使用 `simple_browser` 工具。该工具支持以下函数:\n`search(query: str, recency_days: int)`:使用搜索引擎进行查询并显示结果,可以使用 `recency_days` 参数控制搜索内容的时效性。\n`mclick(ids: list[int])`:获取一系列指定 id 的页面内容。每次调用时,须选择3-10个页面。选择多个角度的页面,同时尽可能选择可信任的信息来源。考虑到部分页面是无法加载的,你也可以多打开一些可能有用的页面而不用担心内容过多。\n`open_url(url: str)`:打开指定的 URL。\n\n使用 `【{引用 id}†{引用文本}】` 来引用内容。\n\n操作步骤:1. 使用 `search` 来获得信息列表; 2. 使用 `mclick` 来获取指定 ID 页面的内容; 3. 
根据获得的内容进行回复。在回复中应当引用信息来源。\n 如果用户提供了 URL,也可以用 `open_url` 直接打开页面。\n如果初次搜索结果没有找到合适的信息,也可以再次使用 `search` 进行搜索。{% elif tool['type'] == 'cogview' %}\n\n## cogview\n\n如果用户的请求中包含了对图像的描述,你可以使用 `cogview` 来生成图像并展示给用户。你需要向 `cogview` 发送图像描述,规则:\n- 发送给 `cogview` 的消息必须使用英语。用户的中文描述必须完全翻译为英语。\n- 应当尽可能详细地描述图像生成的需求,需求描述约 100 英文单词。\n- 保持用户原始描述的意图。不要虚构内容或者没见过的人物。\n- 如无特殊说明,所在地为中国,持有中国立场并遵循中国社会主义价值观。{% endif %}{% endfor %}{% endif %}{% if item['content'] %}<|{{ item['role'] }}|>{{ item['metadata'] }}\n{{ item['content'] }}{% endif %}{% endfor %}{% if add_generation_prompt %}<|assistant|>{% endif %}", @@ -269,8 +330,16 @@ "8-bit", "none" ], - "model_id": "THUDM/glm-4-9b-chat-1m", - "model_revision": "0aa722c7e0745dd21453427dd44c257dd253304f" + "model_hubs": { + "huggingface": { + "model_id": "THUDM/glm-4-9b-chat-1m", + "model_revision": "0aa722c7e0745dd21453427dd44c257dd253304f" + }, + "modelscope": { + "model_id": "ZhipuAI/glm-4-9b-chat-1m", + "model_revision": "master" + } + } }, { "model_format": "ggufv2", @@ -294,9 +363,18 @@ "BF16", "FP16" ], - "model_file_name_template": "glm-4-9b-chat-1m.{quantization}.gguf", - "model_id": "legraphista/glm-4-9b-chat-1m-GGUF", - "model_revision": "782e28bd5eee3c514c07108da15e0b5e06dcf776" + "model_hubs": { + "huggingface": { + "model_id": "legraphista/glm-4-9b-chat-1m-GGUF", + "model_revision": "782e28bd5eee3c514c07108da15e0b5e06dcf776", + "model_file_name_template": "glm-4-9b-chat-1m.{quantization}.gguf" + }, + "modelscope": { + "model_id": "LLM-Research/glm-4-9b-chat-1m-GGUF", + "model_revision": "master", + "model_file_name_template": "glm-4-9b-chat-1m.{quantization}.gguf" + } + } } ], "chat_template": "[gMASK]{% for item in messages %}{% if item['tools'] is defined %}<|system|>\n你是一个名为 GLM-4 的人工智能助手。你是基于智谱AI训练的语言模型 GLM-4 模型开发的,你的任务是针对用户的问题和要求提供适当的答复和支持。\n\n# 可用工具{% set tools = item['tools'] %}{% for tool in tools %}{% if tool['type'] == 'function' %}\n\n## {{ tool['function']['name'] }}\n\n{{ tool['function'] | tojson(indent=4) }}\n在调用上述函数时,请使用 Json 格式表示调用的参数。{% elif tool['type'] == 'python' %}\n\n## python\n\n当你向 `python` 发送包含 Python 代码的消息时,该代码将会在一个有状态的 Jupyter notebook 环境中执行。\n`python` 返回代码执行的输出,或在执行 60 秒后返回超时。\n`/mnt/data` 将会持久化存储你的文件。在此会话中,`python` 无法访问互联网。不要使用 `python` 进行任何网络请求或者在线 API 调用,这些在线内容的访问将不会成功。{% elif tool['type'] == 'simple_browser' %}\n\n## simple_browser\n\n你可以使用 `simple_browser` 工具。该工具支持以下函数:\n`search(query: str, recency_days: int)`:使用搜索引擎进行查询并显示结果,可以使用 `recency_days` 参数控制搜索内容的时效性。\n`mclick(ids: list[int])`:获取一系列指定 id 的页面内容。每次调用时,须选择3-10个页面。选择多个角度的页面,同时尽可能选择可信任的信息来源。考虑到部分页面是无法加载的,你也可以多打开一些可能有用的页面而不用担心内容过多。\n`open_url(url: str)`:打开指定的 URL。\n\n使用 `【{引用 id}†{引用文本}】` 来引用内容。\n\n操作步骤:1. 使用 `search` 来获得信息列表; 2. 使用 `mclick` 来获取指定 ID 页面的内容; 3. 
根据获得的内容进行回复。在回复中应当引用信息来源。\n 如果用户提供了 URL,也可以用 `open_url` 直接打开页面。\n如果初次搜索结果没有找到合适的信息,也可以再次使用 `search` 进行搜索。{% elif tool['type'] == 'cogview' %}\n\n## cogview\n\n如果用户的请求中包含了对图像的描述,你可以使用 `cogview` 来生成图像并展示给用户。你需要向 `cogview` 发送图像描述,规则:\n- 发送给 `cogview` 的消息必须使用英语。用户的中文描述必须完全翻译为英语。\n- 应当尽可能详细地描述图像生成的需求,需求描述约 100 英文单词。\n- 保持用户原始描述的意图。不要虚构内容或者没见过的人物。\n- 如无特殊说明,所在地为中国,持有中国立场并遵循中国社会主义价值观。{% endif %}{% endfor %}{% endif %}{% if item['content'] %}<|{{ item['role'] }}|>{{ item['metadata'] }}\n{{ item['content'] }}{% endif %}{% endfor %}{% if add_generation_prompt %}<|assistant|>{% endif %}", @@ -333,8 +411,16 @@ "8-bit", "none" ], - "model_id": "THUDM/glm-4v-9b", - "model_revision": "01328faefe122fe605c1c127b62e6031d3ffebf7" + "model_hubs": { + "huggingface": { + "model_id": "THUDM/glm-4v-9b", + "model_revision": "01328faefe122fe605c1c127b62e6031d3ffebf7" + }, + "modelscope": { + "model_id": "ZhipuAI/glm-4v-9b", + "model_revision": "master" + } + } } ], "chat_template": "", @@ -370,8 +456,16 @@ "8-bit", "none" ], - "model_id": "THUDM/codegeex4-all-9b", - "model_revision": "8c4ec1d2f2888412640825a7aa23355939a8f4c6" + "model_hubs": { + "huggingface": { + "model_id": "THUDM/codegeex4-all-9b", + "model_revision": "8c4ec1d2f2888412640825a7aa23355939a8f4c6" + }, + "modelscope": { + "model_id": "ZhipuAI/codegeex4-all-9b", + "model_revision": "master" + } + } }, { "model_format": "ggufv2", @@ -384,9 +478,17 @@ "Q6_K_L", "Q8_0" ], - "model_file_name_template": "codegeex4-all-9b-{quantization}.gguf", - "model_id": "THUDM/codegeex4-all-9b-GGUF", - "model_revision": "6a04071c54c943949826d4815ee00717ed8cf153" + "model_hubs": { + "huggingface": { + "model_id": "THUDM/codegeex4-all-9b-GGUF", + "model_revision": "6a04071c54c943949826d4815ee00717ed8cf153", + "model_file_name_template": "codegeex4-all-9b-{quantization}.gguf" + }, + "modelscope": { + "model_id": "ZhipuAI/codegeex4-all-9b-GGUF", + "model_file_name_template": "codegeex4-all-9b-{quantization}.gguf" + } + } } ], "chat_template": "{% for item in messages %}{% if loop.first and item['role'] == 'system' %}{{ '<|system|>\n' + item['content'] }}{% elif loop.first %}{{ '<|system|>\n你是一位智能编程助手,你叫CodeGeeX。你会为用户回答关于编程、代码、计算机方面的任何问题,并提供格式规范、可以执行、准确安全的代码,并在必要时提供详细的解释。' }}{% endif %}{% if item['role'] == 'user' %}{{ '<|user|>\n' + item['content'] }}{% elif item['role'] == 'assistant' %}{{ '<|assistant|>\n' + item['content'] }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% endif %}", @@ -422,8 +524,16 @@ "8-bit", "none" ], - "model_id": "xverse/XVERSE-7B-Chat", - "model_revision": "60acc8c453c067b54df88be98bfdf60585ab5441" + "model_hubs": { + "huggingface": { + "model_id": "xverse/XVERSE-7B-Chat", + "model_revision": "60acc8c453c067b54df88be98bfdf60585ab5441" + }, + "modelscope": { + "model_id": "xverse/XVERSE-7B-Chat", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -433,8 +543,16 @@ "8-bit", "none" ], - "model_id": "xverse/XVERSE-13B-Chat", - "model_revision": "1e4944aaa1d8c8d0cdca28bb8e3a003303d0781b" + "model_hubs": { + "huggingface": { + "model_id": "xverse/XVERSE-13B-Chat", + "model_revision": "1e4944aaa1d8c8d0cdca28bb8e3a003303d0781b" + }, + "modelscope": { + "model_id": "xverse/XVERSE-13B-Chat", + "model_revision": "master" + } + } } ], "chat_template": "{% for item in messages %}{% if loop.first and item['role'] == 'system' %}{{ '<|system|> \n' + item['content'] }}{% endif %}{% if item['role'] == 'user' %}{{ '<|user|> \n' + item['content'] }}{% elif item['role'] == 'assistant' %}{{ '<|assistant|> \n' + 
item['content'] }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>' }}{% endif %}", @@ -466,8 +584,16 @@ "8-bit", "none" ], - "model_id": "xverse/XVERSE-7B", - "model_revision": "3778b254def675586e9218ccb15b78d6ef66a3a7" + "model_hubs": { + "huggingface": { + "model_id": "xverse/XVERSE-7B", + "model_revision": "3778b254def675586e9218ccb15b78d6ef66a3a7" + }, + "modelscope": { + "model_id": "xverse/XVERSE-7B", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -477,8 +603,16 @@ "8-bit", "none" ], - "model_id": "xverse/XVERSE-13B", - "model_revision": "11ac840dda17af81046614229fdd0c658afff747" + "model_hubs": { + "huggingface": { + "model_id": "xverse/XVERSE-13B", + "model_revision": "11ac840dda17af81046614229fdd0c658afff747" + }, + "modelscope": { + "model_id": "xverse/XVERSE-13B", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -488,8 +622,16 @@ "8-bit", "none" ], - "model_id": "xverse/XVERSE-65B", - "model_revision": "7f1b7394f74c630f50612a19ba90bd021c373989" + "model_hubs": { + "huggingface": { + "model_id": "xverse/XVERSE-65B", + "model_revision": "7f1b7394f74c630f50612a19ba90bd021c373989" + }, + "modelscope": { + "model_id": "xverse/XVERSE-65B", + "model_revision": "master" + } + } } ] }, @@ -522,8 +664,17 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/Llama-2-7B-Chat-GGUF", - "model_file_name_template": "llama-2-7b-chat.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Llama-2-7B-Chat-GGUF", + "model_file_name_template": "llama-2-7b-chat.{quantization}.gguf" + }, + "modelscope": { + "model_id": "Xorbits/Llama-2-7b-Chat-GGUF", + "model_revision": "v0.0.1", + "model_file_name_template": "llama-2-7b-chat.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -542,8 +693,17 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/Llama-2-13B-chat-GGUF", - "model_file_name_template": "llama-2-13b-chat.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Llama-2-13B-chat-GGUF", + "model_file_name_template": "llama-2-13b-chat.{quantization}.gguf" + }, + "modelscope": { + "model_id": "Xorbits/Llama-2-13b-Chat-GGUF", + "model_revision": "v0.0.1", + "model_file_name_template": "llama-2-13b-chat.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -570,9 +730,13 @@ "split-b" ] }, - "model_id": "TheBloke/Llama-2-70B-Chat-GGUF", - "model_file_name_template": "llama-2-70b-chat.{quantization}.gguf", - "model_file_name_split_template": "llama-2-70b-chat.{quantization}.gguf-{part}" + "model_file_name_split_template": "llama-2-70b-chat.{quantization}.gguf-{part}", + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Llama-2-70B-Chat-GGUF", + "model_file_name_template": "llama-2-70b-chat.{quantization}.gguf" + } + } }, { "model_format": "pytorch", @@ -582,8 +746,16 @@ "8-bit", "none" ], - "model_id": "meta-llama/Llama-2-7b-chat-hf", - "model_revision": "08751db2aca9bf2f7f80d2e516117a53d7450235" + "model_hubs": { + "huggingface": { + "model_id": "meta-llama/Llama-2-7b-chat-hf", + "model_revision": "08751db2aca9bf2f7f80d2e516117a53d7450235" + }, + "modelscope": { + "model_id": "modelscope/Llama-2-7b-chat-ms", + "model_revision": "v1.0.5" + } + } }, { "model_format": "gptq", @@ -591,7 +763,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Llama-2-7B-Chat-GPTQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Llama-2-7B-Chat-GPTQ" + } + } }, { "model_format": "gptq", @@ -599,7 +775,11 @@ "quantizations": [ "Int4" ], - "model_id": 
"TheBloke/Llama-2-70B-Chat-GPTQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Llama-2-70B-Chat-GPTQ" + } + } }, { "model_format": "awq", @@ -607,7 +787,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Llama-2-70B-Chat-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Llama-2-70B-Chat-AWQ" + } + } }, { "model_format": "awq", @@ -615,7 +799,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Llama-2-7B-Chat-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Llama-2-7B-Chat-AWQ" + } + } }, { "model_format": "pytorch", @@ -625,8 +813,16 @@ "8-bit", "none" ], - "model_id": "meta-llama/Llama-2-13b-chat-hf", - "model_revision": "0ba94ac9b9e1d5a0037780667e8b219adde1908c" + "model_hubs": { + "huggingface": { + "model_id": "meta-llama/Llama-2-13b-chat-hf", + "model_revision": "0ba94ac9b9e1d5a0037780667e8b219adde1908c" + }, + "modelscope": { + "model_id": "modelscope/Llama-2-13b-chat-ms", + "model_revision": "v1.0.2" + } + } }, { "model_format": "gptq", @@ -634,7 +830,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Llama-2-13B-chat-GPTQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Llama-2-13B-chat-GPTQ" + } + } }, { "model_format": "awq", @@ -642,7 +842,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Llama-2-13B-chat-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Llama-2-13B-chat-AWQ" + } + } }, { "model_format": "pytorch", @@ -652,13 +856,21 @@ "8-bit", "none" ], - "model_id": "meta-llama/Llama-2-70b-chat-hf", - "model_revision": "36d9a7388cc80e5f4b3e9701ca2f250d21a96c30" + "model_hubs": { + "huggingface": { + "model_id": "meta-llama/Llama-2-70b-chat-hf", + "model_revision": "36d9a7388cc80e5f4b3e9701ca2f250d21a96c30" + }, + "modelscope": { + "model_id": "modelscope/Llama-2-70b-chat-ms", + "model_revision": "v1.0.1" + } + } } ], "chat_template": "{% if messages[0]['role'] == 'system' %}{% set system_message = '<>\n' + messages[0]['content'] | trim + '\n<>\n\n' %}{% set messages = messages[1:] %}{% else %}{% set system_message = '' %}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if loop.index0 == 0 %}{% set content = system_message + message['content'] %}{% else %}{% set content = message['content'] %}{% endif %}{% if message['role'] == 'user' %}{{ '' + '[INST] ' + content | trim + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ ' ' + content | trim + ' ' + '' }}{% endif %}{% endfor %}", "stop_token_ids": [ - 2 + 2 ], "stop": [] }, @@ -691,8 +903,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/Llama-2-7B-GGUF", - "model_file_name_template": "llama-2-7b.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Llama-2-7B-GGUF", + "model_file_name_template": "llama-2-7b.{quantization}.gguf" + } + } }, { "model_format": "gptq", @@ -700,7 +916,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Llama-2-7B-GPTQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Llama-2-7B-GPTQ" + } + } }, { "model_format": "awq", @@ -708,7 +928,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Llama-2-7B-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Llama-2-7B-AWQ" + } + } }, { "model_format": "ggufv2", @@ -727,8 +951,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/Llama-2-13B-GGUF", - "model_file_name_template": "llama-2-13b.{quantization}.gguf" + "model_hubs": { + 
"huggingface": { + "model_id": "TheBloke/Llama-2-13B-GGUF", + "model_file_name_template": "llama-2-13b.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -755,9 +983,13 @@ "split-b" ] }, - "model_id": "TheBloke/Llama-2-70B-GGUF", - "model_file_name_template": "llama-2-70b.{quantization}.gguf", - "model_file_name_split_template": "llama-2-70b.{quantization}.gguf-{part}" + "model_file_name_split_template": "llama-2-70b.{quantization}.gguf-{part}", + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Llama-2-70B-GGUF", + "model_file_name_template": "llama-2-70b.{quantization}.gguf" + } + } }, { "model_format": "pytorch", @@ -767,8 +999,12 @@ "8-bit", "none" ], - "model_id": "meta-llama/Llama-2-7b-hf", - "model_revision": "6fdf2e60f86ff2481f2241aaee459f85b5b0bbb9" + "model_hubs": { + "huggingface": { + "model_id": "meta-llama/Llama-2-7b-hf", + "model_revision": "6fdf2e60f86ff2481f2241aaee459f85b5b0bbb9" + } + } }, { "model_format": "pytorch", @@ -778,8 +1014,12 @@ "8-bit", "none" ], - "model_id": "meta-llama/Llama-2-13b-hf", - "model_revision": "db6b8eb1feabb38985fdf785a89895959e944936" + "model_hubs": { + "huggingface": { + "model_id": "meta-llama/Llama-2-13b-hf", + "model_revision": "db6b8eb1feabb38985fdf785a89895959e944936" + } + } }, { "model_format": "gptq", @@ -787,7 +1027,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Llama-2-13B-GPTQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Llama-2-13B-GPTQ" + } + } }, { "model_format": "awq", @@ -795,7 +1039,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Llama-2-13B-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Llama-2-13B-AWQ" + } + } }, { "model_format": "pytorch", @@ -805,8 +1053,12 @@ "8-bit", "none" ], - "model_id": "meta-llama/Llama-2-70b-hf", - "model_revision": "cc8aa03a000ff08b4d5c5b39673321a2a396c396" + "model_hubs": { + "huggingface": { + "model_id": "meta-llama/Llama-2-70b-hf", + "model_revision": "cc8aa03a000ff08b4d5c5b39673321a2a396c396" + } + } }, { "model_format": "gptq", @@ -814,7 +1066,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Llama-2-70B-GPTQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Llama-2-70B-GPTQ" + } + } }, { "model_format": "awq", @@ -822,7 +1078,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Llama-2-70B-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Llama-2-70B-AWQ" + } + } } ] }, @@ -846,7 +1106,14 @@ "8-bit", "none" ], - "model_id": "meta-llama/Meta-Llama-3-8B" + "model_hubs": { + "huggingface": { + "model_id": "meta-llama/Meta-Llama-3-8B" + }, + "modelscope": { + "model_id": "LLM-Research/Meta-Llama-3-8B" + } + } }, { "model_format": "ggufv2", @@ -867,8 +1134,12 @@ "Q6_K", "Q8_0" ], - "model_id": "QuantFactory/Meta-Llama-3-8B-GGUF", - "model_file_name_template": "Meta-Llama-3-8B.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "QuantFactory/Meta-Llama-3-8B-GGUF", + "model_file_name_template": "Meta-Llama-3-8B.{quantization}.gguf" + } + } }, { "model_format": "pytorch", @@ -878,7 +1149,14 @@ "8-bit", "none" ], - "model_id": "meta-llama/Meta-Llama-3-70B" + "model_hubs": { + "huggingface": { + "model_id": "meta-llama/Meta-Llama-3-70B" + }, + "modelscope": { + "model_id": "LLM-Research/Meta-Llama-3-70B" + } + } }, { "model_format": "ggufv2", @@ -887,8 +1165,12 @@ "Q4_K_M", "Q5_K_M" ], - "model_id": "NousResearch/Meta-Llama-3-70B-GGUF", - "model_file_name_template": "Meta-Llama-3-70B-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": 
"NousResearch/Meta-Llama-3-70B-GGUF", + "model_file_name_template": "Meta-Llama-3-70B-{quantization}.gguf" + } + } } ] }, @@ -914,8 +1196,12 @@ "Q6_K", "Q8_0" ], - "model_id": "lmstudio-community/Meta-Llama-3-8B-Instruct-GGUF", - "model_file_name_template": "Meta-Llama-3-8B-Instruct-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "lmstudio-community/Meta-Llama-3-8B-Instruct-GGUF", + "model_file_name_template": "Meta-Llama-3-8B-Instruct-{quantization}.gguf" + } + } }, { "model_format": "pytorch", @@ -925,7 +1211,14 @@ "8-bit", "none" ], - "model_id": "meta-llama/Meta-Llama-3-8B-Instruct" + "model_hubs": { + "huggingface": { + "model_id": "meta-llama/Meta-Llama-3-8B-Instruct" + }, + "modelscope": { + "model_id": "LLM-Research/Meta-Llama-3-8B-Instruct" + } + } }, { "model_format": "ggufv2", @@ -935,8 +1228,12 @@ "IQ2_XS", "Q4_K_M" ], - "model_id": "lmstudio-community/Meta-Llama-3-70B-Instruct-GGUF", - "model_file_name_template": "Meta-Llama-3-70B-Instruct-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "lmstudio-community/Meta-Llama-3-70B-Instruct-GGUF", + "model_file_name_template": "Meta-Llama-3-70B-Instruct-{quantization}.gguf" + } + } }, { "model_format": "pytorch", @@ -946,7 +1243,14 @@ "8-bit", "none" ], - "model_id": "meta-llama/Meta-Llama-3-70B-Instruct" + "model_hubs": { + "huggingface": { + "model_id": "meta-llama/Meta-Llama-3-70B-Instruct" + }, + "modelscope": { + "model_id": "LLM-Research/Meta-Llama-3-70B-Instruct" + } + } }, { "model_format": "mlx", @@ -954,7 +1258,11 @@ "quantizations": [ "4-bit" ], - "model_id": "mlx-community/Meta-Llama-3-8B-Instruct-4bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Meta-Llama-3-8B-Instruct-4bit" + } + } }, { "model_format": "mlx", @@ -962,7 +1270,11 @@ "quantizations": [ "8-bit" ], - "model_id": "mlx-community/Meta-Llama-3-8B-Instruct-8bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Meta-Llama-3-8B-Instruct-8bit" + } + } }, { "model_format": "mlx", @@ -970,7 +1282,11 @@ "quantizations": [ "none" ], - "model_id": "mlx-community/Meta-Llama-3-8B-Instruct" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Meta-Llama-3-8B-Instruct" + } + } }, { "model_format": "mlx", @@ -978,7 +1294,11 @@ "quantizations": [ "4-bit" ], - "model_id": "mlx-community/Meta-Llama-3-70B-Instruct-4bit-mlx" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Meta-Llama-3-70B-Instruct-4bit-mlx" + } + } }, { "model_format": "mlx", @@ -986,7 +1306,11 @@ "quantizations": [ "8-bit" ], - "model_id": "mlx-community/Meta-Llama-3-70B-Instruct-8bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Meta-Llama-3-70B-Instruct-8bit" + } + } }, { "model_format": "mlx", @@ -994,7 +1318,11 @@ "quantizations": [ "none" ], - "model_id": "mlx-community/Meta-Llama-3-70B-Instruct-mlx-unquantized" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Meta-Llama-3-70B-Instruct-mlx-unquantized" + } + } }, { "model_format": "gptq", @@ -1002,7 +1330,14 @@ "quantizations": [ "Int4" ], - "model_id": "TechxGenus/Meta-Llama-3-8B-Instruct-GPTQ" + "model_hubs": { + "huggingface": { + "model_id": "TechxGenus/Meta-Llama-3-8B-Instruct-GPTQ" + }, + "modelscope": { + "model_id": "swift/Meta-Llama-3-8B-Instruct-GPTQ-{quantization}" + } + } }, { "model_format": "gptq", @@ -1010,7 +1345,14 @@ "quantizations": [ "Int4" ], - "model_id": "TechxGenus/Meta-Llama-3-70B-Instruct-GPTQ" + "model_hubs": { + "huggingface": { + "model_id": 
"TechxGenus/Meta-Llama-3-70B-Instruct-GPTQ" + }, + "modelscope": { + "model_id": "swift/Meta-Llama-3-70B-Instruct-GPTQ-{quantization}" + } + } } ], "chat_template": "{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = '<|begin_of_text|>' + content %}{% endif %}{{ content }}{% endfor %}{% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}{% endif %}", @@ -1050,7 +1392,14 @@ "8-bit", "none" ], - "model_id": "meta-llama/Meta-Llama-3.1-8B" + "model_hubs": { + "huggingface": { + "model_id": "meta-llama/Meta-Llama-3.1-8B" + }, + "modelscope": { + "model_id": "LLM-Research/Meta-Llama-3.1-8B" + } + } }, { "model_format": "ggufv2", @@ -1071,8 +1420,12 @@ "Q6_K", "Q8_0" ], - "model_id": "QuantFactory/Meta-Llama-3.1-8B-GGUF", - "model_file_name_template": "Meta-Llama-3.1-8B.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "QuantFactory/Meta-Llama-3.1-8B-GGUF", + "model_file_name_template": "Meta-Llama-3.1-8B.{quantization}.gguf" + } + } }, { "model_format": "pytorch", @@ -1082,7 +1435,14 @@ "8-bit", "none" ], - "model_id": "meta-llama/Meta-Llama-3.1-70B" + "model_hubs": { + "huggingface": { + "model_id": "meta-llama/Meta-Llama-3.1-70B" + }, + "modelscope": { + "model_id": "LLM-Research/Meta-Llama-3.1-70B" + } + } }, { "model_format": "pytorch", @@ -1092,7 +1452,14 @@ "8-bit", "none" ], - "model_id": "meta-llama/Meta-Llama-3.1-405B" + "model_hubs": { + "huggingface": { + "model_id": "meta-llama/Meta-Llama-3.1-405B" + }, + "modelscope": { + "model_id": "LLM-Research/Meta-Llama-3.1-405B" + } + } } ] }, @@ -1126,8 +1493,16 @@ "Q6_K", "Q8_0" ], - "model_id": "lmstudio-community/Meta-Llama-3.1-8B-Instruct-GGUF", - "model_file_name_template": "Meta-Llama-3.1-8B-Instruct-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "lmstudio-community/Meta-Llama-3.1-8B-Instruct-GGUF", + "model_file_name_template": "Meta-Llama-3.1-8B-Instruct-{quantization}.gguf" + }, + "modelscope": { + "model_id": "LLM-Research/Meta-Llama-3.1-8B-Instruct-GGUF", + "model_file_name_template": "Meta-Llama-3.1-8B-Instruct-{quantization}.gguf" + } + } }, { "model_format": "pytorch", @@ -1135,7 +1510,14 @@ "quantizations": [ "none" ], - "model_id": "meta-llama/Meta-Llama-3.1-8B-Instruct" + "model_hubs": { + "huggingface": { + "model_id": "meta-llama/Meta-Llama-3.1-8B-Instruct" + }, + "modelscope": { + "model_id": "LLM-Research/Meta-Llama-3.1-8B-Instruct" + } + } }, { "model_format": "pytorch", @@ -1143,7 +1525,11 @@ "quantizations": [ "4-bit" ], - "model_id": "unsloth/Meta-Llama-3.1-8B-Instruct-bnb-4bit" + "model_hubs": { + "huggingface": { + "model_id": "unsloth/Meta-Llama-3.1-8B-Instruct-bnb-4bit" + } + } }, { "model_format": "gptq", @@ -1151,7 +1537,14 @@ "quantizations": [ "Int4" ], - "model_id": "hugging-quants/Meta-Llama-3.1-8B-Instruct-GPTQ-INT4" + "model_hubs": { + "huggingface": { + "model_id": "hugging-quants/Meta-Llama-3.1-8B-Instruct-GPTQ-INT4" + }, + "modelscope": { + "model_id": "LLM-Research/Meta-Llama-3.1-8B-Instruct-GPTQ-INT4" + } + } }, { "model_format": "awq", @@ -1159,7 +1552,14 @@ "quantizations": [ "Int4" ], - "model_id": "hugging-quants/Meta-Llama-3.1-8B-Instruct-AWQ-INT4" + "model_hubs": { + "huggingface": { + "model_id": "hugging-quants/Meta-Llama-3.1-8B-Instruct-AWQ-INT4" + }, + "modelscope": { + "model_id": 
"LLM-Research/Meta-Llama-3.1-8B-Instruct-AWQ-INT4" + } + } }, { "model_format": "ggufv2", @@ -1188,9 +1588,13 @@ "00002-of-00002" ] }, - "model_id": "lmstudio-community/Meta-Llama-3.1-70B-Instruct-GGUF", - "model_file_name_template": "Meta-Llama-3.1-70B-Instruct-{quantization}.gguf", - "model_file_name_split_template": "Meta-Llama-3.1-70B-Instruct-{quantization}-{part}.gguf" + "model_file_name_split_template": "Meta-Llama-3.1-70B-Instruct-{quantization}-{part}.gguf", + "model_hubs": { + "huggingface": { + "model_id": "lmstudio-community/Meta-Llama-3.1-70B-Instruct-GGUF", + "model_file_name_template": "Meta-Llama-3.1-70B-Instruct-{quantization}.gguf" + } + } }, { "model_format": "pytorch", @@ -1198,7 +1602,14 @@ "quantizations": [ "none" ], - "model_id": "meta-llama/Meta-Llama-3.1-70B-Instruct" + "model_hubs": { + "huggingface": { + "model_id": "meta-llama/Meta-Llama-3.1-70B-Instruct" + }, + "modelscope": { + "model_id": "LLM-Research/Meta-Llama-3.1-70B-Instruct" + } + } }, { "model_format": "pytorch", @@ -1206,7 +1617,11 @@ "quantizations": [ "4-bit" ], - "model_id": "unsloth/Meta-Llama-3.1-70B-Instruct-bnb-4bit" + "model_hubs": { + "huggingface": { + "model_id": "unsloth/Meta-Llama-3.1-70B-Instruct-bnb-4bit" + } + } }, { "model_format": "gptq", @@ -1214,7 +1629,14 @@ "quantizations": [ "Int4" ], - "model_id": "hugging-quants/Meta-Llama-3.1-70B-Instruct-GPTQ-INT4" + "model_hubs": { + "huggingface": { + "model_id": "hugging-quants/Meta-Llama-3.1-70B-Instruct-GPTQ-INT4" + }, + "modelscope": { + "model_id": "LLM-Research/Meta-Llama-3.1-70B-Instruct-GPTQ-INT4" + } + } }, { "model_format": "awq", @@ -1222,7 +1644,14 @@ "quantizations": [ "Int4" ], - "model_id": "hugging-quants/Meta-Llama-3.1-70B-Instruct-AWQ-INT4" + "model_hubs": { + "huggingface": { + "model_id": "hugging-quants/Meta-Llama-3.1-70B-Instruct-AWQ-INT4" + }, + "modelscope": { + "model_id": "LLM-Research/Meta-Llama-3.1-70B-Instruct-AWQ-INT4" + } + } }, { "model_format": "mlx", @@ -1230,7 +1659,11 @@ "quantizations": [ "4-bit" ], - "model_id": "mlx-community/Meta-Llama-3.1-8B-Instruct-4bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Meta-Llama-3.1-8B-Instruct-4bit" + } + } }, { "model_format": "mlx", @@ -1238,7 +1671,11 @@ "quantizations": [ "8-bit" ], - "model_id": "mlx-community/Meta-Llama-3.1-8B-Instruct-8bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Meta-Llama-3.1-8B-Instruct-8bit" + } + } }, { "model_format": "mlx", @@ -1246,7 +1683,11 @@ "quantizations": [ "none" ], - "model_id": "mlx-community/Meta-Llama-3.1-8B-Instruct" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Meta-Llama-3.1-8B-Instruct" + } + } }, { "model_format": "mlx", @@ -1254,7 +1695,11 @@ "quantizations": [ "4-bit" ], - "model_id": "mlx-community/Meta-Llama-3.1-70B-Instruct-4bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Meta-Llama-3.1-70B-Instruct-4bit" + } + } }, { "model_format": "mlx", @@ -1262,7 +1707,11 @@ "quantizations": [ "8-bit" ], - "model_id": "mlx-community/Meta-Llama-3.1-70B-Instruct-8bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Meta-Llama-3.1-70B-Instruct-8bit" + } + } }, { "model_format": "mlx", @@ -1270,7 +1719,11 @@ "quantizations": [ "none" ], - "model_id": "mlx-community/Meta-Llama-3.1-70B-Instruct-bf16" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Meta-Llama-3.1-70B-Instruct-bf16" + } + } }, { "model_format": "pytorch", @@ -1280,7 +1733,14 @@ "8-bit", "none" ], - "model_id": 
"meta-llama/Meta-Llama-3.1-405B-Instruct" + "model_hubs": { + "huggingface": { + "model_id": "meta-llama/Meta-Llama-3.1-405B-Instruct" + }, + "modelscope": { + "model_id": "LLM-Research/Meta-Llama-3.1-405B-Instruct" + } + } }, { "model_format": "gptq", @@ -1288,7 +1748,14 @@ "quantizations": [ "Int4" ], - "model_id": "hugging-quants/Meta-Llama-3.1-405B-Instruct-GPTQ-INT4" + "model_hubs": { + "huggingface": { + "model_id": "hugging-quants/Meta-Llama-3.1-405B-Instruct-GPTQ-INT4" + }, + "modelscope": { + "model_id": "LLM-Research/Meta-Llama-3.1-405B-Instruct-GPTQ-INT4" + } + } }, { "model_format": "awq", @@ -1296,7 +1763,14 @@ "quantizations": [ "Int4" ], - "model_id": "hugging-quants/Meta-Llama-3.1-405B-Instruct-AWQ-INT4" + "model_hubs": { + "huggingface": { + "model_id": "hugging-quants/Meta-Llama-3.1-405B-Instruct-AWQ-INT4" + }, + "modelscope": { + "model_id": "LLM-Research/Meta-Llama-3.1-405B-Instruct-AWQ-INT4" + } + } } ], "chat_template": "{{- '<|begin_of_text|>' }}\n{%- if custom_tools is defined %}\n {%- set tools = custom_tools %}\n{%- endif %}\n{%- if not tools_in_user_message is defined %}\n {%- set tools_in_user_message = true %}\n{%- endif %}\n{%- if not date_string is defined %}\n {%- set date_string = \"26 Jul 2024\" %}\n{%- endif %}\n{%- if not tools is defined %}\n {%- set tools = none %}\n{%- endif %}\n\n{#- This block extracts the system message, so we can slot it into the right place. #}\n{%- if messages[0]['role'] == 'system' %}\n {%- set system_message = messages[0]['content']|trim %}\n {%- set messages = messages[1:] %}\n{%- else %}\n {%- set system_message = \"\" %}\n{%- endif %}\n\n{#- System message + builtin tools #}\n{{- \"<|start_header_id|>system<|end_header_id|>\n\n\" }}\n{%- if builtin_tools is defined or tools is not none %}\n {{- \"Environment: ipython\n\" }}\n{%- endif %}\n{%- if builtin_tools is defined %}\n {{- \"Tools: \" + builtin_tools | reject('equalto', 'code_interpreter') | join(\", \") + \"\n\n\"}}\n{%- endif %}\n{{- \"Cutting Knowledge Date: December 2023\n\" }}\n{{- \"Today Date: \" + date_string + \"\n\n\" }}\n{%- if tools is not none and not tools_in_user_message %}\n {{- \"You have access to the following functions. To call a function, please respond with JSON for a function call.\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' }}\n {{- \"Do not use variables.\n\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\n\n\" }}\n {%- endfor %}\n{%- endif %}\n{{- system_message }}\n{{- \"<|eot_id|>\" }}\n\n{#- Custom tools are passed in a user message with some extra guidance #}\n{%- if tools_in_user_message and not tools is none %}\n {#- Extract the first user message so we can plug it in here #}\n {%- if messages | length != 0 %}\n {%- set first_user_message = messages[0]['content']|trim %}\n {%- set messages = messages[1:] %}\n {%- else %}\n {{- raise_exception(\"Cannot put tools in the first user message when there's no first user message!\") }}\n{%- endif %}\n {{- '<|start_header_id|>user<|end_header_id|>\n\n' -}}\n {{- \"Given the following functions, please respond with a JSON for a function call \" }}\n {{- \"with its proper arguments that best answers the given prompt.\n\n\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' 
}}\n {{- \"Do not use variables.\n\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\n\n\" }}\n {%- endfor %}\n {{- first_user_message + \"<|eot_id|>\"}}\n{%- endif %}\n\n{%- for message in messages %}\n {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}\n {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' }}\n {%- elif 'tool_calls' in message %}\n {%- if not message.tool_calls|length == 1 %}\n {{- raise_exception(\"This model only supports single tool-calls at once!\") }}\n {%- endif %}\n {%- set tool_call = message.tool_calls[0].function %}\n {%- if builtin_tools is defined and tool_call.name in builtin_tools %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}}\n {{- \"<|python_tag|>\" + tool_call.name + \".call(\" }}\n {%- for arg_name, arg_val in tool_call.arguments | items %}\n {{- arg_name + '=\"' + arg_val + '\"' }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- endif %}\n {%- endfor %}\n {{- \")\" }}\n {%- else %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}}\n {{- '{\"name\": \"' + tool_call.name + '\", ' }}\n {{- '\"parameters\": ' }}\n {{- tool_call.arguments | tojson }}\n {{- \"}\" }}\n {%- endif %}\n {%- if builtin_tools is defined %}\n {#- This means we're in ipython mode #}\n {{- \"<|eom_id|>\" }}\n {%- else %}\n {{- \"<|eot_id|>\" }}\n {%- endif %}\n {%- elif message.role == \"tool\" or message.role == \"ipython\" %}\n {{- \"<|start_header_id|>ipython<|end_header_id|>\n\n\" }}\n {%- if message.content is mapping or message.content is iterable %}\n {{- message.content | tojson }}\n {%- else %}\n {{- message.content }}\n {%- endif %}\n {{- \"<|eot_id|>\" }}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }}\n{%- endif %}\n", @@ -1329,8 +1803,12 @@ "8-bit", "none" ], - "model_id": "facebook/opt-125m", - "model_revision": "3d2b5f275bdf882b8775f902e1bfdb790e2cfc32" + "model_hubs": { + "huggingface": { + "model_id": "facebook/opt-125m", + "model_revision": "3d2b5f275bdf882b8775f902e1bfdb790e2cfc32" + } + } } ] }, @@ -1353,8 +1831,17 @@ "quantizations": [ "Q4_K_M" ], - "model_id": "Xorbits/Qwen-7B-Chat-GGUF", - "model_file_name_template": "Qwen-7B-Chat.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "Xorbits/Qwen-7B-Chat-GGUF", + "model_file_name_template": "Qwen-7B-Chat.{quantization}.gguf" + }, + "modelscope": { + "model_id": "Xorbits/Qwen-7B-Chat-GGUF", + "model_revision": "v0.0.1", + "model_file_name_template": "Qwen-7B-Chat.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -1362,8 +1849,17 @@ "quantizations": [ "Q4_K_M" ], - "model_id": "Xorbits/Qwen-14B-Chat-GGUF", - "model_file_name_template": "Qwen-14B-Chat.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "Xorbits/Qwen-14B-Chat-GGUF", + "model_file_name_template": "Qwen-14B-Chat.{quantization}.gguf" + }, + "modelscope": { + "model_id": "Xorbits/Qwen-14B-Chat-GGUF", + "model_revision": "v0.0.1", + "model_file_name_template": "Qwen-14B-Chat.{quantization}.gguf" + } + } }, { "model_format": "pytorch", @@ -1373,8 +1869,16 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen-1_8B-Chat", - "model_revision": "c3db8007171847931da7efa4b2ed4309afcce021" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen-1_8B-Chat", + "model_revision": "c3db8007171847931da7efa4b2ed4309afcce021" + }, + "modelscope": { + "model_id": "qwen/Qwen-1_8B-Chat", + 
"model_revision": "v1.0.0" + } + } }, { "model_format": "pytorch", @@ -1384,8 +1888,16 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen-7B-Chat", - "model_revision": "218aa3240fd5a5d1e80bb6c47d5d774361913706" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen-7B-Chat", + "model_revision": "218aa3240fd5a5d1e80bb6c47d5d774361913706" + }, + "modelscope": { + "model_id": "qwen/Qwen-7B-Chat", + "model_revision": "v1.1.9" + } + } }, { "model_format": "pytorch", @@ -1395,8 +1907,16 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen-14B-Chat", - "model_revision": "fab8385c8f7e7980ef61944729fe134ccbbca263" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen-14B-Chat", + "model_revision": "fab8385c8f7e7980ef61944729fe134ccbbca263" + }, + "modelscope": { + "model_id": "qwen/Qwen-14B-Chat", + "model_revision": "v1.0.7" + } + } }, { "model_format": "pytorch", @@ -1406,8 +1926,16 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen-72B-Chat", - "model_revision": "2cd9f76279337941ec1a4abeec6f8eb3c38d0f55" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen-72B-Chat", + "model_revision": "2cd9f76279337941ec1a4abeec6f8eb3c38d0f55" + }, + "modelscope": { + "model_id": "qwen/Qwen-72B-Chat", + "model_revision": "master" + } + } }, { "model_format": "gptq", @@ -1416,7 +1944,15 @@ "Int4", "Int8" ], - "model_id": "Qwen/Qwen-7B-Chat-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen-7B-Chat-{quantization}" + }, + "modelscope": { + "model_id": "qwen/Qwen-7B-Chat-{quantization}", + "model_revision": "v1.1.7" + } + } }, { "model_format": "gptq", @@ -1425,7 +1961,15 @@ "Int4", "Int8" ], - "model_id": "Qwen/Qwen-1_8B-Chat-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen-1_8B-Chat-{quantization}" + }, + "modelscope": { + "model_id": "qwen/Qwen-1_8B-Chat-{quantization}", + "model_revision": "master" + } + } }, { "model_format": "gptq", @@ -1434,7 +1978,15 @@ "Int4", "Int8" ], - "model_id": "Qwen/Qwen-14B-Chat-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen-14B-Chat-{quantization}" + }, + "modelscope": { + "model_id": "qwen/Qwen-14B-Chat-{quantization}", + "model_revision": "v1.0.7" + } + } }, { "model_format": "gptq", @@ -1443,7 +1995,15 @@ "Int4", "Int8" ], - "model_id": "Qwen/Qwen-72B-Chat-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen-72B-Chat-{quantization}" + }, + "modelscope": { + "model_id": "qwen/Qwen-72B-Chat-{quantization}", + "model_revision": "master" + } + } } ], "chat_template": "{% for item in messages %}{% if loop.first and item['role'] == 'system' %}{{ '<|im_start|>system\n' + item['content'] + '<|im_end|>\n' }}{% elif loop.first %}{{ '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}{% endif %}{% if item['role'] == 'user' %}{{ '<|im_start|>user\n' + item['content'] + '<|im_end|>' }}{% elif item['role'] == 'assistant' %}{{ '<|im_start|>assistant\n' + item['content'] + '<|im_end|>' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", @@ -1480,7 +2040,14 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen1.5-0.5B-Chat" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-0.5B-Chat" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-0.5B-Chat" + } + } }, { "model_format": "pytorch", @@ -1490,7 +2057,14 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen1.5-1.8B-Chat" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-1.8B-Chat" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-1.8B-Chat" + } + } 
}, { "model_format": "pytorch", @@ -1500,7 +2074,14 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen1.5-4B-Chat" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-4B-Chat" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-4B-Chat" + } + } }, { "model_format": "pytorch", @@ -1510,7 +2091,14 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen1.5-7B-Chat" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-7B-Chat" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-7B-Chat" + } + } }, { "model_format": "pytorch", @@ -1520,7 +2108,14 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen1.5-14B-Chat" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-14B-Chat" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-14B-Chat" + } + } }, { "model_format": "pytorch", @@ -1530,7 +2125,14 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen1.5-32B-Chat" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-32B-Chat" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-32B-Chat" + } + } }, { "model_format": "pytorch", @@ -1540,7 +2142,14 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen1.5-72B-Chat" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-72B-Chat" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-72B-Chat" + } + } }, { "model_format": "pytorch", @@ -1550,7 +2159,14 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen1.5-110B-Chat" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-110B-Chat" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-110B-Chat" + } + } }, { "model_format": "gptq", @@ -1559,7 +2175,14 @@ "Int4", "Int8" ], - "model_id": "Qwen/Qwen1.5-0.5B-Chat-GPTQ-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-0.5B-Chat-GPTQ-{quantization}" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-0.5B-Chat-GPTQ-{quantization}" + } + } }, { "model_format": "gptq", @@ -1568,7 +2191,14 @@ "Int4", "Int8" ], - "model_id": "Qwen/Qwen1.5-1.8B-Chat-GPTQ-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-1.8B-Chat-GPTQ-{quantization}" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-1.8B-Chat-GPTQ-{quantization}" + } + } }, { "model_format": "gptq", @@ -1577,7 +2207,14 @@ "Int4", "Int8" ], - "model_id": "Qwen/Qwen1.5-4B-Chat-GPTQ-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-4B-Chat-GPTQ-{quantization}" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-4B-Chat-GPTQ-{quantization}" + } + } }, { "model_format": "gptq", @@ -1586,7 +2223,14 @@ "Int4", "Int8" ], - "model_id": "Qwen/Qwen1.5-7B-Chat-GPTQ-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-7B-Chat-GPTQ-{quantization}" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-7B-Chat-GPTQ-{quantization}" + } + } }, { "model_format": "gptq", @@ -1595,7 +2239,14 @@ "Int4", "Int8" ], - "model_id": "Qwen/Qwen1.5-14B-Chat-GPTQ-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-14B-Chat-GPTQ-{quantization}" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-14B-Chat-GPTQ-{quantization}" + } + } }, { "model_format": "gptq", @@ -1603,7 +2254,14 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/Qwen1.5-32B-Chat-GPTQ-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-32B-Chat-GPTQ-{quantization}" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-32B-Chat-GPTQ-{quantization}" + } + } }, { "model_format": "gptq", @@ -1612,7 +2270,14 @@ "Int4", "Int8" ], - "model_id": "Qwen/Qwen1.5-72B-Chat-GPTQ-{quantization}" + 
"model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-72B-Chat-GPTQ-{quantization}" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-72B-Chat-GPTQ-{quantization}" + } + } }, { "model_format": "gptq", @@ -1620,7 +2285,14 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/Qwen1.5-110B-Chat-GPTQ-Int4" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-110B-Chat-GPTQ-Int4" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-110B-Chat-GPTQ-Int4" + } + } }, { "model_format": "awq", @@ -1628,7 +2300,14 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/Qwen1.5-0.5B-Chat-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-0.5B-Chat-AWQ" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-0.5B-Chat-AWQ" + } + } }, { "model_format": "awq", @@ -1636,7 +2315,14 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/Qwen1.5-1.8B-Chat-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-1.8B-Chat-AWQ" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-1.8B-Chat-AWQ" + } + } }, { "model_format": "awq", @@ -1644,7 +2330,14 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/Qwen1.5-4B-Chat-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-4B-Chat-AWQ" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-4B-Chat-AWQ" + } + } }, { "model_format": "awq", @@ -1652,7 +2345,14 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/Qwen1.5-7B-Chat-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-7B-Chat-AWQ" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-7B-Chat-AWQ" + } + } }, { "model_format": "awq", @@ -1660,7 +2360,14 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/Qwen1.5-14B-Chat-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-14B-Chat-AWQ" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-14B-Chat-AWQ" + } + } }, { "model_format": "awq", @@ -1668,7 +2375,14 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/Qwen1.5-32B-Chat-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-32B-Chat-AWQ" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-32B-Chat-AWQ" + } + } }, { "model_format": "awq", @@ -1676,7 +2390,14 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/Qwen1.5-72B-Chat-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-72B-Chat-AWQ" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-72B-Chat-AWQ" + } + } }, { "model_format": "awq", @@ -1684,7 +2405,14 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/Qwen1.5-110B-Chat-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-110B-Chat-AWQ" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-110B-Chat-AWQ" + } + } }, { "model_format": "ggufv2", @@ -1699,8 +2427,16 @@ "q6_k", "q8_0" ], - "model_id": "Qwen/Qwen1.5-0.5B-Chat-GGUF", - "model_file_name_template": "qwen1_5-0_5b-chat-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-0.5B-Chat-GGUF", + "model_file_name_template": "qwen1_5-0_5b-chat-{quantization}.gguf" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-0.5B-Chat-GGUF", + "model_file_name_template": "qwen1_5-0_5b-chat-{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -1715,8 +2451,16 @@ "q6_k", "q8_0" ], - "model_id": "Qwen/Qwen1.5-1.8B-Chat-GGUF", - "model_file_name_template": "qwen1_5-1_8b-chat-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-1.8B-Chat-GGUF", + "model_file_name_template": "qwen1_5-1_8b-chat-{quantization}.gguf" + }, + "modelscope": { + "model_id": 
"qwen/Qwen1.5-1.8B-Chat-GGUF", + "model_file_name_template": "qwen1_5-1_8b-chat-{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -1731,8 +2475,16 @@ "q6_k", "q8_0" ], - "model_id": "Qwen/Qwen1.5-4B-Chat-GGUF", - "model_file_name_template": "qwen1_5-4b-chat-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-4B-Chat-GGUF", + "model_file_name_template": "qwen1_5-4b-chat-{quantization}.gguf" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-4B-Chat-GGUF", + "model_file_name_template": "qwen1_5-4b-chat-{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -1747,8 +2499,16 @@ "q6_k", "q8_0" ], - "model_id": "Qwen/Qwen1.5-7B-Chat-GGUF", - "model_file_name_template": "qwen1_5-7b-chat-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-7B-Chat-GGUF", + "model_file_name_template": "qwen1_5-7b-chat-{quantization}.gguf" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-7B-Chat-GGUF", + "model_file_name_template": "qwen1_5-7b-chat-{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -1763,8 +2523,16 @@ "q6_k", "q8_0" ], - "model_id": "Qwen/Qwen1.5-14B-Chat-GGUF", - "model_file_name_template": "qwen1_5-14b-chat-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-14B-Chat-GGUF", + "model_file_name_template": "qwen1_5-14b-chat-{quantization}.gguf" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-14B-Chat-GGUF", + "model_file_name_template": "qwen1_5-14b-chat-{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -1779,8 +2547,16 @@ "q6_k", "q8_0" ], - "model_id": "Qwen/Qwen1.5-32B-Chat-GGUF", - "model_file_name_template": "qwen1_5-32b-chat-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-32B-Chat-GGUF", + "model_file_name_template": "qwen1_5-32b-chat-{quantization}.gguf" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-32B-Chat-GGUF", + "model_file_name_template": "qwen1_5-32b-chat-{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -1790,14 +2566,22 @@ "q3_k_m", "q4_k_m" ], - "model_id": "Qwen/Qwen1.5-72B-Chat-GGUF", - "model_file_name_template": "qwen1_5-72b-chat-{quantization}.gguf", "model_file_name_split_template": "qwen1_5-72b-chat-{quantization}.gguf.{part}", "quantization_parts": { "q4_k_m": [ "a", "b" ] + }, + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-72B-Chat-GGUF", + "model_file_name_template": "qwen1_5-72b-chat-{quantization}.gguf" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-72B-Chat-GGUF", + "model_file_name_template": "qwen1_5-72b-chat-{quantization}.gguf" + } } } ], @@ -1835,7 +2619,14 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen1.5-MoE-A2.7B-Chat" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-MoE-A2.7B-Chat" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-MoE-A2.7B-Chat" + } + } }, { "model_format": "gptq", @@ -1843,7 +2634,14 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/Qwen1.5-MoE-A2.7B-Chat-GPTQ-Int4" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen1.5-MoE-A2.7B-Chat-GPTQ-Int4" + }, + "modelscope": { + "model_id": "qwen/Qwen1.5-MoE-A2.7B-Chat-GPTQ-Int4" + } + } } ], "chat_template": "{%- macro json_to_python_type(json_spec) %}\n {%- set basic_type_map = {\n \"string\": \"str\",\n \"number\": \"float\",\n \"integer\": \"int\",\n \"boolean\": \"bool\"\n} %}\n {%- if basic_type_map[json_spec.type] is defined %}\n {{- basic_type_map[json_spec.type] }}\n {%- elif json_spec.type == \"array\" %}\n {{- \"list[\" + 
json_to_python_type(json_spec|items) + \"]\" }}\n {%- elif json_spec.type == \"object\" %}\n {%- if json_spec.additionalProperties is defined %}\n {{- \"dict[str, \" + json_to_python_type(json_spec.additionalProperties) + ']' }}\n {%- else %}\n {{- \"dict\" }}\n {%- endif %}\n {%- elif json_spec.type is iterable %}\n {{- \"Union[\" }}\n {%- for t in json_spec.type %}\n {{- json_to_python_type({\"type\": t}) }}\n {%- if not loop.last %}\n {{- \",\" }}\n {%- endif %}\n {%- endfor %}\n {{- \"]\" }}\n {%- else %}\n {{- \"Any\" }}\n {%- endif %}\n{%- endmacro %}\n\n{%- if tools %}\n {{- '<|im_start|>system\n' }}\n {%- if messages[0]['role'] == 'system' %}\n {{- messages[0]['content'] + '\n\n' }}\n {%- endif %}\n {{- '# Tools\n\n' }}\n {{- \"You are a function calling AI model. You are provided with function signatures within <tools></tools> XML tags. You may call one or more functions to assist with the user query. Don't make assumptions about what values to plug into functions. Here are the available tools: <tools> \" }}\n {%- for tool in tools %}\n {%- if tool.function is defined %}\n {%- set tool = tool.function %}\n {%- endif %}\n {{- '{\"type\": \"function\", \"function\": ' }}\n {{- '{\"name\": \"' + tool.name + '\", ' }}\n {{- '\"description\": \"' + tool.name + '(' }}\n {%- for param_name, param_fields in tool.parameters.properties|items %}\n {{- param_name + \": \" + json_to_python_type(param_fields) }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- endif %}\n {%- endfor %}\n {{- \")\" }}\n {%- if tool.return is defined %}\n {{- \" -> \" + json_to_python_type(tool.return) }}\n {%- endif %}\n {{- \" - \" + tool.description + \"\n\n\" }}\n {%- for param_name, param_fields in tool.parameters.properties|items %}\n {%- if loop.first %}\n {{- \" Args:\n\" }}\n {%- endif %}\n {{- \" \" + param_name + \"(\" + json_to_python_type(param_fields) + \"): \" + param_fields.description|trim }}\n {%- endfor %}\n {%- if tool.return is defined and tool.return.description is defined %}\n {{- \"\n Returns:\n \" + tool.return.description }}\n {%- endif %}\n {{- '\"' }}\n {{- ', \"parameters\": ' }}\n {%- if tool.parameters.properties | length == 0 %}\n {{- \"{}\" }}\n {%- else %}\n {{- tool.parameters|tojson }}\n {%- endif %}\n {{- \"}\" }}\n {%- if not loop.last %}\n {{- \"\n\" }}\n {%- endif %}\n {%- endfor %}\n {{- \" </tools>\" }}\n {{- 'Use the following pydantic model json schema for each tool call you will make: {\"properties\": {\"arguments\": {\"title\": \"Arguments\", \"type\": \"object\"}, \"name\": {\"title\": \"Name\", \"type\": \"string\"}}, \"required\": [\"arguments\", \"name\"], \"title\": \"FunctionCall\", \"type\": \"object\"}\n' }}\n {{- \"For each function call return a json object with function name and arguments within <tool_call></tool_call> XML tags as follows:\n\" }}\n {{- \"<tool_call>\n\" }}\n {{- '{\"name\": <function-name>, \"arguments\": <args-json-object>}\n' }}\n {{- '</tool_call><|im_end|>\n' }}\n{%- else %}\n {%- if messages[0]['role'] != 'system' %}\n {{- '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}\n {%- else %}\n {{- '<|im_start|>system\n' + messages[0]['content'] + '<|im_end|>\n' }}\n {%- endif %}\n{%- endif %}\n{%- for message in messages %}\n {%- if message.role == \"user\" or (message.role == \"system\" and not loop.first) or (message.role == \"assistant\" and message.tool_calls is not defined) %}\n {{- '<|im_start|>' + message.role + '\n' + message.content + '<|im_end|>' + '\n' }}\n {%- elif message.role == \"assistant\" %}\n {{- '<|im_start|>' + message.role + '\n<tool_call>\n' }}\n {%- for tool_call in message.tool_calls %}\n {%- if tool_call.function is defined
%}\n {%- set tool_call = tool_call.function %}\n {%- endif %}\n {{- '{' }}\n {{- '\"name\": \"' }}\n {{- tool_call.name }}\n {%- if tool_call.arguments is defined %}\n {{- ', ' }}\n {{- '\"arguments\": ' }}\n {{- tool_call.arguments|tojson }}\n {%- endif %}\n {{- '\"}' }}\n {{- '\n</tool_call>' }}\n {%- endfor %}\n {{- '<|im_end|>\n' }}\n {%- elif message.role == \"tool\" %}\n {%- if not message.name is defined %}\n {{- raise_exception(\"Tool response dicts require a 'name' key indicating the name of the called function!\") }}\n {%- endif %}\n {{- '<|im_start|>user\n<tool_response>\n' }}\n {{- '{\"name\": \"' }}\n {{- message.name }}\n {{- '\", \"content\": ' }}\n {{- message.content|tojson + '}' }}\n {{- '\n</tool_response><|im_end|>\n' }}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|im_start|>assistant\n' }}\n{%- endif %}", @@ -1879,7 +2677,14 @@ "8-bit", "none" ], - "model_id": "Qwen/CodeQwen1.5-7B" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/CodeQwen1.5-7B" + }, + "modelscope": { + "model_id": "qwen/CodeQwen1.5-7B" + } + } } ] }, @@ -1909,8 +2714,16 @@ "q6_k", "q8_0" ], - "model_id": "Qwen/CodeQwen1.5-7B-Chat-GGUF", - "model_file_name_template": "codeqwen-1_5-7b-chat-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/CodeQwen1.5-7B-Chat-GGUF", + "model_file_name_template": "codeqwen-1_5-7b-chat-{quantization}.gguf" + }, + "modelscope": { + "model_id": "qwen/CodeQwen1.5-7B-Chat-GGUF", + "model_file_name_template": "codeqwen-1_5-7b-chat-{quantization}.gguf" + } + } }, { "model_format": "pytorch", @@ -1920,7 +2733,14 @@ "8-bit", "none" ], - "model_id": "Qwen/CodeQwen1.5-7B-Chat" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/CodeQwen1.5-7B-Chat" + }, + "modelscope": { + "model_id": "qwen/CodeQwen1.5-7B-Chat" + } + } }, { "model_format": "awq", @@ -1928,7 +2748,14 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/CodeQwen1.5-7B-Chat-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/CodeQwen1.5-7B-Chat-AWQ" + }, + "modelscope": { + "model_id": "qwen/CodeQwen1.5-7B-Chat-AWQ" + } + } } ], "chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", @@ -1965,7 +2792,17 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen2-0.5B-Instruct" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-0.5B-Instruct" + }, + "modelscope": { + "model_id": "qwen/Qwen2-0.5B-Instruct" + }, + "csghub": { + "model_id": "Qwen/Qwen2-0.5B-Instruct" + } + } }, { "model_format": "pytorch", @@ -1975,7 +2812,14 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen2-1.5B-Instruct" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-1.5B-Instruct" + }, + "modelscope": { + "model_id": "qwen/Qwen2-1.5B-Instruct" + } + } }, { "model_format": "pytorch", @@ -1985,7 +2829,14 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen2-7B-Instruct" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-7B-Instruct" + }, + "modelscope": { + "model_id": "qwen/Qwen2-7B-Instruct" + } + } }, { "model_format": "pytorch", @@ -1995,7 +2846,14 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen2-72B-Instruct" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-72B-Instruct" + }, + "modelscope": { + "model_id": "qwen/Qwen2-72B-Instruct" + } + } }, { "model_format": "gptq", @@ -2004,7 +2862,14 @@
"Int4", "Int8" ], - "model_id": "Qwen/Qwen2-0.5B-Instruct-GPTQ-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-0.5B-Instruct-GPTQ-{quantization}" + }, + "modelscope": { + "model_id": "qwen/Qwen2-0.5B-Instruct-GPTQ-{quantization}" + } + } }, { "model_format": "gptq", @@ -2013,7 +2878,14 @@ "Int4", "Int8" ], - "model_id": "Qwen/Qwen2-1.5B-Instruct-GPTQ-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-1.5B-Instruct-GPTQ-{quantization}" + }, + "modelscope": { + "model_id": "qwen/Qwen2-1.5B-Instruct-GPTQ-{quantization}" + } + } }, { "model_format": "gptq", @@ -2022,7 +2894,14 @@ "Int4", "Int8" ], - "model_id": "Qwen/Qwen2-7B-Instruct-GPTQ-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-7B-Instruct-GPTQ-{quantization}" + }, + "modelscope": { + "model_id": "qwen/Qwen2-7B-Instruct-GPTQ-{quantization}" + } + } }, { "model_format": "gptq", @@ -2031,7 +2910,14 @@ "Int4", "Int8" ], - "model_id": "Qwen/Qwen2-72B-Instruct-GPTQ-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-72B-Instruct-GPTQ-{quantization}" + }, + "modelscope": { + "model_id": "qwen/Qwen2-72B-Instruct-GPTQ-{quantization}" + } + } }, { "model_format": "awq", @@ -2039,7 +2925,14 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/Qwen2-0.5B-Instruct-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-0.5B-Instruct-AWQ" + }, + "modelscope": { + "model_id": "qwen/Qwen2-0.5B-Instruct-AWQ" + } + } }, { "model_format": "awq", @@ -2047,7 +2940,14 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/Qwen2-1.5B-Instruct-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-1.5B-Instruct-AWQ" + }, + "modelscope": { + "model_id": "qwen/Qwen2-1.5B-Instruct-AWQ" + } + } }, { "model_format": "awq", @@ -2055,7 +2955,14 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/Qwen2-7B-Instruct-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-7B-Instruct-AWQ" + }, + "modelscope": { + "model_id": "qwen/Qwen2-7B-Instruct-AWQ" + } + } }, { "model_format": "awq", @@ -2063,7 +2970,14 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/Qwen2-72B-Instruct-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-72B-Instruct-AWQ" + }, + "modelscope": { + "model_id": "qwen/Qwen2-72B-Instruct-AWQ" + } + } }, { "model_format": "fp8", @@ -2071,7 +2985,11 @@ "quantizations": [ "fp8" ], - "model_id": "neuralmagic/Qwen2-0.5B-Instruct-FP8" + "model_hubs": { + "huggingface": { + "model_id": "neuralmagic/Qwen2-0.5B-Instruct-FP8" + } + } }, { "model_format": "fp8", @@ -2079,7 +2997,11 @@ "quantizations": [ "fp8" ], - "model_id": "neuralmagic/Qwen2-0.5B-Instruct-FP8" + "model_hubs": { + "huggingface": { + "model_id": "neuralmagic/Qwen2-0.5B-Instruct-FP8" + } + } }, { "model_format": "fp8", @@ -2087,7 +3009,11 @@ "quantizations": [ "fp8" ], - "model_id": "neuralmagic/Qwen2-1.5B-Instruct-FP8" + "model_hubs": { + "huggingface": { + "model_id": "neuralmagic/Qwen2-1.5B-Instruct-FP8" + } + } }, { "model_format": "fp8", @@ -2095,7 +3021,14 @@ "quantizations": [ "fp8" ], - "model_id": "neuralmagic/Qwen2-7B-Instruct-FP8" + "model_hubs": { + "huggingface": { + "model_id": "neuralmagic/Qwen2-7B-Instruct-FP8" + }, + "modelscope": { + "model_id": "liuzhenghua/Qwen2-7B-FP8-Instruct" + } + } }, { "model_format": "fp8", @@ -2103,7 +3036,14 @@ "quantizations": [ "fp8" ], - "model_id": "neuralmagic/Qwen2-72B-Instruct-FP8" + "model_hubs": { + "huggingface": { + "model_id": "neuralmagic/Qwen2-72B-Instruct-FP8" + }, + 
"modelscope": { + "model_id": "liuzhenghua/Qwen2-72B-FP8-Instruct" + } + } }, { "model_format": "mlx", @@ -2111,7 +3051,14 @@ "quantizations": [ "4-bit" ], - "model_id": "Qwen/Qwen2-0.5B-Instruct-MLX" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-0.5B-Instruct-MLX" + }, + "modelscope": { + "model_id": "qwen/Qwen2-0.5B-Instruct-MLX" + } + } }, { "model_format": "mlx", @@ -2119,7 +3066,14 @@ "quantizations": [ "4-bit" ], - "model_id": "Qwen/Qwen2-1.5B-Instruct-MLX" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-1.5B-Instruct-MLX" + }, + "modelscope": { + "model_id": "qwen/Qwen2-1.5B-Instruct-MLX" + } + } }, { "model_format": "mlx", @@ -2127,7 +3081,14 @@ "quantizations": [ "4-bit" ], - "model_id": "Qwen/Qwen2-7B-Instruct-MLX" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-7B-Instruct-MLX" + }, + "modelscope": { + "model_id": "qwen/Qwen2-7B-Instruct-MLX" + } + } }, { "model_format": "mlx", @@ -2135,7 +3096,11 @@ "quantizations": [ "4-bit" ], - "model_id": "mlx-community/Qwen2-72B-Instruct-4bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Qwen2-72B-Instruct-4bit" + } + } }, { "model_format": "ggufv2", @@ -2151,8 +3116,20 @@ "q8_0", "fp16" ], - "model_id": "Qwen/Qwen2-0.5B-Instruct-GGUF", - "model_file_name_template": "qwen2-0_5b-instruct-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-0.5B-Instruct-GGUF", + "model_file_name_template": "qwen2-0_5b-instruct-{quantization}.gguf" + }, + "modelscope": { + "model_id": "qwen/Qwen2-0.5B-Instruct-GGUF", + "model_file_name_template": "qwen2-0_5b-instruct-{quantization}.gguf" + }, + "csghub": { + "model_id": "qwen/Qwen2-0.5B-Instruct-GGUF", + "model_file_name_template": "qwen2-0_5b-instruct-{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -2168,8 +3145,16 @@ "q8_0", "fp16" ], - "model_id": "Qwen/Qwen2-1.5B-Instruct-GGUF", - "model_file_name_template": "qwen2-1_5b-instruct-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-1.5B-Instruct-GGUF", + "model_file_name_template": "qwen2-1_5b-instruct-{quantization}.gguf" + }, + "modelscope": { + "model_id": "qwen/Qwen2-1.5B-Instruct-GGUF", + "model_file_name_template": "qwen2-1_5b-instruct-{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -2185,8 +3170,16 @@ "q8_0", "fp16" ], - "model_id": "Qwen/Qwen2-7B-Instruct-GGUF", - "model_file_name_template": "qwen2-7b-instruct-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-7B-Instruct-GGUF", + "model_file_name_template": "qwen2-7b-instruct-{quantization}.gguf" + }, + "modelscope": { + "model_id": "qwen/Qwen2-7B-Instruct-GGUF", + "model_file_name_template": "qwen2-7b-instruct-{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -2202,8 +3195,6 @@ "q8_0", "fp16" ], - "model_id": "Qwen/Qwen2-72B-Instruct-GGUF", - "model_file_name_template": "qwen2-72b-instruct-{quantization}.gguf", "model_file_name_split_template": "qwen2-72b-instruct-{quantization}-{part}.gguf", "quantization_parts": { "q5_0": [ @@ -2228,6 +3219,16 @@ "00003-of-00004", "00004-of-00004" ] + }, + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-72B-Instruct-GGUF", + "model_file_name_template": "qwen2-72b-instruct-{quantization}.gguf" + }, + "modelscope": { + "model_id": "qwen/Qwen2-72B-Instruct-GGUF", + "model_file_name_template": "qwen2-72b-instruct-{quantization}.gguf" + } } } ], @@ -2265,7 +3266,14 @@ "8-bit", "none" ], - "model_id": "Qwen/Qwen2-57B-A14B-Instruct" + "model_hubs": { + 
"huggingface": { + "model_id": "Qwen/Qwen2-57B-A14B-Instruct" + }, + "modelscope": { + "model_id": "qwen/Qwen2-57B-A14B-Instruct" + } + } }, { "model_format": "gptq", @@ -2273,7 +3281,14 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/Qwen2-57B-A14B-Instruct-GPTQ-Int4" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-57B-A14B-Instruct-GPTQ-Int4" + }, + "modelscope": { + "model_id": "qwen/Qwen2-57B-A14B-Instruct-GPTQ-Int4" + } + } }, { "model_format": "ggufv2", @@ -2288,8 +3303,6 @@ "q8_0", "fp16" ], - "model_id": "Qwen/Qwen2-57B-A14B-Instruct-GGUF", - "model_file_name_template": "qwen2-57b-a14b-instruct-{quantization}.gguf", "model_file_name_split_template": "qwen2-57b-a14b-instruct-{quantization}-{part}.gguf", "quantization_parts": { "q8_0": [ @@ -2301,6 +3314,16 @@ "00002-of-00003", "00003-of-00003" ] + }, + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-57B-A14B-Instruct-GGUF", + "model_file_name_template": "qwen2-57b-a14b-instruct-{quantization}.gguf" + }, + "modelscope": { + "model_id": "qwen/Qwen2-57B-A14B-Instruct-GGUF", + "model_file_name_template": "qwen2-57b-a14b-instruct-{quantization}.gguf" + } } } ], @@ -2334,8 +3357,12 @@ "quantizations": [ "none" ], - "model_id": "openai-community/gpt2", - "model_revision": "607a30d783dfa663caf39e06633721c8d4cfcd7e" + "model_hubs": { + "huggingface": { + "model_id": "openai-community/gpt2", + "model_revision": "607a30d783dfa663caf39e06633721c8d4cfcd7e" + } + } } ] }, @@ -2359,8 +3386,16 @@ "8-bit", "none" ], - "model_id": "WizardLMTeam/WizardMath-7B-V1.0", - "model_revision": "825a586f260d6c583b8aa9ceab6cdfaa3d9a4ddc" + "model_hubs": { + "huggingface": { + "model_id": "WizardLMTeam/WizardMath-7B-V1.0", + "model_revision": "825a586f260d6c583b8aa9ceab6cdfaa3d9a4ddc" + }, + "modelscope": { + "model_id": "Xorbits/WizardMath-7B-V1.0", + "model_revision": "v1.0.0" + } + } }, { "model_format": "pytorch", @@ -2370,8 +3405,12 @@ "8-bit", "none" ], - "model_id": "WizardLMTeam/WizardMath-70B-V1.0", - "model_revision": "4dd9f3fcd8c056561d67ec59ae011f7c146aebd2" + "model_hubs": { + "huggingface": { + "model_id": "WizardLMTeam/WizardMath-70B-V1.0", + "model_revision": "4dd9f3fcd8c056561d67ec59ae011f7c146aebd2" + } + } } ], "chat_template": "{% for item in messages %}{% if loop.first and item['role'] == 'system' %}{{ item['content'] + '\n\n### ' }}{% elif loop.first %}{{ 'Below is an instruction that describes a task. Write a response that appropriately completes the request.\n\n### ' }}{% endif %}{% if item['role'] == 'user' %}{{ 'Instruction: ' + item['content'] + '\n\n### ' }}{% elif item['role'] == 'assistant' %}{{ 'Response: ' + item['content'] + '\n\n### ' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ 'Response: Let\\'s think step by step.' 
}}{% endif %}", @@ -2402,8 +3441,16 @@ "8-bit", "none" ], - "model_id": "TheBloke/CodeLlama-7B-fp16", - "model_revision": "ce09049eb9140a19cf78051cb5d849607b6fa8ec" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/CodeLlama-7B-fp16", + "model_revision": "ce09049eb9140a19cf78051cb5d849607b6fa8ec" + }, + "modelscope": { + "model_id": "AI-ModelScope/CodeLlama-7b-hf", + "model_revision": "v1.0.2" + } + } }, { "model_format": "pytorch", @@ -2413,8 +3460,16 @@ "8-bit", "none" ], - "model_id": "TheBloke/CodeLlama-13B-fp16", - "model_revision": "d67ca1183da991d0d97927bdaaf35599556dfd76" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/CodeLlama-13B-fp16", + "model_revision": "d67ca1183da991d0d97927bdaaf35599556dfd76" + }, + "modelscope": { + "model_id": "AI-ModelScope/CodeLlama-13b-hf", + "model_revision": "v1.0.1" + } + } }, { "model_format": "pytorch", @@ -2424,8 +3479,16 @@ "8-bit", "none" ], - "model_id": "TheBloke/CodeLlama-34B-fp16", - "model_revision": "f91d0cf7fc338cdc726f9c72d5ea15fe51bb16e9" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/CodeLlama-34B-fp16", + "model_revision": "f91d0cf7fc338cdc726f9c72d5ea15fe51bb16e9" + }, + "modelscope": { + "model_id": "AI-ModelScope/CodeLlama-34b-hf", + "model_revision": "v1.0.1" + } + } }, { "model_format": "ggufv2", @@ -2444,8 +3507,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/CodeLlama-7B-GGUF", - "model_file_name_template": "codellama-7b.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/CodeLlama-7B-GGUF", + "model_file_name_template": "codellama-7b.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -2464,8 +3531,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/CodeLlama-13B-GGUF", - "model_file_name_template": "codellama-13b.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/CodeLlama-13B-GGUF", + "model_file_name_template": "codellama-13b.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -2484,8 +3555,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/CodeLlama-34B-GGUF", - "model_file_name_template": "codellama-34b.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/CodeLlama-34B-GGUF", + "model_file_name_template": "codellama-34b.{quantization}.gguf" + } + } } ] }, @@ -2509,8 +3584,16 @@ "8-bit", "none" ], - "model_id": "TheBloke/CodeLlama-7B-Python-fp16", - "model_revision": "d51c51e625bc24b9a7a0616e82681b4859e2cfe4" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/CodeLlama-7B-Python-fp16", + "model_revision": "d51c51e625bc24b9a7a0616e82681b4859e2cfe4" + }, + "modelscope": { + "model_id": "Xorbits/CodeLlama-7B-Python-fp16", + "model_revision": "v1.0.0" + } + } }, { "model_format": "pytorch", @@ -2520,8 +3603,16 @@ "8-bit", "none" ], - "model_id": "TheBloke/CodeLlama-13B-Python-fp16", - "model_revision": "442282f4207442b828953a72c51a919c332cba5c" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/CodeLlama-13B-Python-fp16", + "model_revision": "442282f4207442b828953a72c51a919c332cba5c" + }, + "modelscope": { + "model_id": "AI-ModelScope/CodeLlama-13b-Python-hf", + "model_revision": "v1.0.1" + } + } }, { "model_format": "pytorch", @@ -2531,8 +3622,12 @@ "8-bit", "none" ], - "model_id": "TheBloke/CodeLlama-34B-Python-fp16", - "model_revision": "875f9d97fb6c9619d8867887dd1d80918ff0f593" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/CodeLlama-34B-Python-fp16", + "model_revision": "875f9d97fb6c9619d8867887dd1d80918ff0f593" + } + } }, { "model_format": 
"ggufv2", @@ -2551,8 +3646,17 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/CodeLlama-7B-Python-GGUF", - "model_file_name_template": "codellama-7b-python.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/CodeLlama-7B-Python-GGUF", + "model_file_name_template": "codellama-7b-python.{quantization}.gguf" + }, + "modelscope": { + "model_id": "Xorbits/CodeLlama-7B-Python-GGUF", + "model_revision": "v1.0.0", + "model_file_name_template": "codellama-7b-python.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -2571,8 +3675,16 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/CodeLlama-13B-Python-GGUF", - "model_file_name_template": "codellama-13b-python.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/CodeLlama-13B-Python-GGUF", + "model_file_name_template": "codellama-13b-python.{quantization}.gguf" + }, + "modelscope": { + "model_id": "Xorbits/CodeLlama-13B-Python-GGUF", + "model_file_name_template": "codellama-13b-python.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -2591,8 +3703,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/CodeLlama-34B-Python-GGUF", - "model_file_name_template": "codellama-34b-python.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/CodeLlama-34B-Python-GGUF", + "model_file_name_template": "codellama-34b-python.{quantization}.gguf" + } + } } ] }, @@ -2616,8 +3732,16 @@ "8-bit", "none" ], - "model_id": "codellama/CodeLlama-7b-Instruct-hf", - "model_revision": "6114dd1e16f69e0765ccbd7a64d33d04b265fbd2" + "model_hubs": { + "huggingface": { + "model_id": "codellama/CodeLlama-7b-Instruct-hf", + "model_revision": "6114dd1e16f69e0765ccbd7a64d33d04b265fbd2" + }, + "modelscope": { + "model_id": "AI-ModelScope/CodeLlama-7b-Instruct-hf", + "model_revision": "v1.0.1" + } + } }, { "model_format": "pytorch", @@ -2627,8 +3751,16 @@ "8-bit", "none" ], - "model_id": "codellama/CodeLlama-13b-Instruct-hf", - "model_revision": "ff0983bc4267bb98ead4fb5168fe2f049b442787" + "model_hubs": { + "huggingface": { + "model_id": "codellama/CodeLlama-13b-Instruct-hf", + "model_revision": "ff0983bc4267bb98ead4fb5168fe2f049b442787" + }, + "modelscope": { + "model_id": "AI-ModelScope/CodeLlama-13b-Instruct-hf", + "model_revision": "v1.0.1" + } + } }, { "model_format": "pytorch", @@ -2638,8 +3770,16 @@ "8-bit", "none" ], - "model_id": "codellama/CodeLlama-34b-Instruct-hf", - "model_revision": "38a1e15d8524a1f0a7760a7acf8242b81ae4eb87" + "model_hubs": { + "huggingface": { + "model_id": "codellama/CodeLlama-34b-Instruct-hf", + "model_revision": "38a1e15d8524a1f0a7760a7acf8242b81ae4eb87" + }, + "modelscope": { + "model_id": "AI-ModelScope/CodeLlama-34b-Instruct-hf", + "model_revision": "v1.0.2" + } + } }, { "model_format": "ggufv2", @@ -2658,8 +3798,17 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/CodeLlama-7B-Instruct-GGUF", - "model_file_name_template": "codellama-7b-instruct.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/CodeLlama-7B-Instruct-GGUF", + "model_file_name_template": "codellama-7b-instruct.{quantization}.gguf" + }, + "modelscope": { + "model_id": "Xorbits/CodeLlama-7B-Instruct-GGUF", + "model_revision": "v0.0.1", + "model_file_name_template": "codellama-7b-instruct.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -2678,8 +3827,17 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/CodeLlama-13B-Instruct-GGUF", - "model_file_name_template": "codellama-13b-instruct.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": 
"TheBloke/CodeLlama-13B-Instruct-GGUF", + "model_file_name_template": "codellama-13b-instruct.{quantization}.gguf" + }, + "modelscope": { + "model_id": "Xorbits/CodeLlama-13B-Instruct-GGUF", + "model_revision": "v0.0.1", + "model_file_name_template": "codellama-13b-instruct.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -2698,13 +3856,22 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/CodeLlama-34B-Instruct-GGUF", - "model_file_name_template": "codellama-34b-instruct.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/CodeLlama-34B-Instruct-GGUF", + "model_file_name_template": "codellama-34b-instruct.{quantization}.gguf" + }, + "modelscope": { + "model_id": "Xorbits/CodeLlama-34B-Instruct-GGUF", + "model_revision": "v0.1.0", + "model_file_name_template": "codellama-34b-instruct.{quantization}.gguf" + } + } } ], "chat_template": "{% if messages[0]['role'] == 'system' %}{% set system_message = '<>\n' + messages[0]['content'] | trim + '\n<>\n\n' %}{% set messages = messages[1:] %}{% else %}{% set system_message = '' %}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if loop.index0 == 0 %}{% set content = system_message + message['content'] %}{% else %}{% set content = message['content'] %}{% endif %}{% if message['role'] == 'user' %}{{ '' + '[INST] ' + content | trim + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ ' ' + content | trim + ' ' + '' }}{% endif %}{% endfor %}", "stop_token_ids": [ - 2 + 2 ], "stop": [ "" @@ -2731,8 +3898,16 @@ "8-bit", "none" ], - "model_id": "baichuan-inc/Baichuan2-7B-Chat", - "model_revision": "2ce891951e000c36c65442608a0b95fd09b405dc" + "model_hubs": { + "huggingface": { + "model_id": "baichuan-inc/Baichuan2-7B-Chat", + "model_revision": "2ce891951e000c36c65442608a0b95fd09b405dc" + }, + "modelscope": { + "model_id": "baichuan-inc/Baichuan2-7B-Chat", + "model_revision": "v1.0.4" + } + } }, { "model_format": "pytorch", @@ -2742,8 +3917,16 @@ "8-bit", "none" ], - "model_id": "baichuan-inc/Baichuan2-13B-Chat", - "model_revision": "a56c793eb7a721ab6c270f779024e0375e8afd4a" + "model_hubs": { + "huggingface": { + "model_id": "baichuan-inc/Baichuan2-13B-Chat", + "model_revision": "a56c793eb7a721ab6c270f779024e0375e8afd4a" + }, + "modelscope": { + "model_id": "baichuan-inc/Baichuan2-13B-Chat", + "model_revision": "v1.0.3" + } + } } ], "chat_template": "{{ (messages|selectattr('role', 'equalto', 'system')|list|last).content|trim if (messages|selectattr('role', 'equalto', 'system')|list) else '' }}\n\n{% for message in messages %}\n{% if message['role'] == 'user' %}\n\n{{ message['content']|trim -}}\n{% if not loop.last %}\n\n\n{% endif %}\n{% elif message['role'] == 'assistant' %}\n\n{{ message['content']|trim -}}\n{% if not loop.last %}\n\n\n{% endif %}\n{% endif %}\n{% endfor %}\n{% if add_generation_prompt and messages[-1]['role'] != 'assistant' %}\n\n{% endif %}", @@ -2774,8 +3957,16 @@ "8-bit", "none" ], - "model_id": "baichuan-inc/Baichuan2-7B-Base", - "model_revision": "f2cc3a689c5eba7dc7fd3757d0175d312d167604" + "model_hubs": { + "huggingface": { + "model_id": "baichuan-inc/Baichuan2-7B-Base", + "model_revision": "f2cc3a689c5eba7dc7fd3757d0175d312d167604" + }, + "modelscope": { + "model_id": "baichuan-inc/Baichuan2-7B-Base", + "model_revision": "v1.0.2" + } + } }, { "model_format": "pytorch", @@ -2785,8 +3976,16 @@ "8-bit", "none" ], - "model_id": 
"baichuan-inc/Baichuan2-13B-Base", - "model_revision": "fa88072fee36e36282287410e00897df2f59e09b" + "model_hubs": { + "huggingface": { + "model_id": "baichuan-inc/Baichuan2-13B-Base", + "model_revision": "fa88072fee36e36282287410e00897df2f59e09b" + }, + "modelscope": { + "model_id": "baichuan-inc/Baichuan2-13B-Base", + "model_revision": "v1.0.3" + } + } } ] }, @@ -2810,8 +4009,16 @@ "8-bit", "none" ], - "model_id": "mistralai/Mistral-7B-v0.1", - "model_revision": "ae9d75c6b4eb39515def78c685fb4d71d49fc2cf" + "model_hubs": { + "huggingface": { + "model_id": "mistralai/Mistral-7B-v0.1", + "model_revision": "ae9d75c6b4eb39515def78c685fb4d71d49fc2cf" + }, + "modelscope": { + "model_id": "Xorbits/Mistral-7B-v0.1", + "model_revision": "v1.0.0" + } + } }, { "model_format": "ggufv2", @@ -2830,8 +4037,17 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/Mistral-7B-v0.1-GGUF", - "model_file_name_template": "mistral-7b-v0.1.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Mistral-7B-v0.1-GGUF", + "model_file_name_template": "mistral-7b-v0.1.{quantization}.gguf" + }, + "modelscope": { + "model_id": "Xorbits/Mistral-7B-v0.1-GGUF", + "model_revision": "v1.0.0", + "model_file_name_template": "mistral-7b-v0.1.{quantization}.gguf" + } + } } ] }, @@ -2855,8 +4071,16 @@ "8-bit", "none" ], - "model_id": "mistralai/Mistral-7B-Instruct-v0.1", - "model_revision": "54766df6d50e4d3d7ccd66758e5341ba105a6d36" + "model_hubs": { + "huggingface": { + "model_id": "mistralai/Mistral-7B-Instruct-v0.1", + "model_revision": "54766df6d50e4d3d7ccd66758e5341ba105a6d36" + }, + "modelscope": { + "model_id": "Xorbits/Mistral-7B-Instruct-v0.1", + "model_revision": "v1.0.0" + } + } }, { "model_format": "awq", @@ -2864,7 +4088,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Mistral-7B-Instruct-v0.1-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Mistral-7B-Instruct-v0.1-AWQ" + } + } }, { "model_format": "gptq", @@ -2872,7 +4100,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Mistral-7B-Instruct-v0.1-GPTQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Mistral-7B-Instruct-v0.1-GPTQ" + } + } }, { "model_format": "ggufv2", @@ -2891,8 +4123,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/Mistral-7B-Instruct-v0.1-GGUF", - "model_file_name_template": "mistral-7b-instruct-v0.1.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Mistral-7B-Instruct-v0.1-GGUF", + "model_file_name_template": "mistral-7b-instruct-v0.1.{quantization}.gguf" + } + } } ], "chat_template": "{%- if messages[0]['role'] == 'system' %}\n {%- set system_message = messages[0]['content'] %}\n {%- set loop_messages = messages[1:] %}\n{%- else %}\n {%- set loop_messages = messages %}\n{%- endif %}\n\n{{- '' }}\n{%- for message in loop_messages %}\n {%- if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}\n {{- raise_exception('After the optional system message, conversation roles must alternate user/assistant/user/assistant/...') }}\n {%- endif %}\n {%- if message['role'] == 'user' %}\n {%- if loop.first and system_message is defined %}\n {{- ' [INST] ' + system_message + '\n\n' + message['content'] + ' [/INST]' }}\n {%- else %}\n {{- ' [INST] ' + message['content'] + ' [/INST]' }}\n {%- endif %}\n {%- elif message['role'] == 'assistant' %}\n {{- ' ' + message['content'] + ''}}\n {%- else %}\n {{- raise_exception('Only user and assistant roles are supported, with the exception of an initial optional system message!') }}\n {%- endif %}\n{%- endfor %}\n", @@ 
-2923,8 +4159,15 @@ "8-bit", "none" ], - "model_id": "mistralai/Mistral-7B-Instruct-v0.2", - "model_revision": "b70aa86578567ba3301b21c8a27bea4e8f6d6d61" + "model_hubs": { + "huggingface": { + "model_id": "mistralai/Mistral-7B-Instruct-v0.2", + "model_revision": "b70aa86578567ba3301b21c8a27bea4e8f6d6d61" + }, + "modelscope": { + "model_id": "AI-ModelScope/Mistral-7B-Instruct-v0.2" + } + } }, { "model_format": "gptq", @@ -2932,7 +4175,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Mistral-7B-Instruct-v0.2-GPTQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Mistral-7B-Instruct-v0.2-GPTQ" + } + } }, { "model_format": "awq", @@ -2940,7 +4187,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Mistral-7B-Instruct-v0.2-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Mistral-7B-Instruct-v0.2-AWQ" + } + } }, { "model_format": "ggufv2", @@ -2959,8 +4210,16 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/Mistral-7B-Instruct-v0.2-GGUF", - "model_file_name_template": "mistral-7b-instruct-v0.2.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Mistral-7B-Instruct-v0.2-GGUF", + "model_file_name_template": "mistral-7b-instruct-v0.2.{quantization}.gguf" + }, + "modelscope": { + "model_id": "Xorbits/Mistral-7B-Instruct-v0.2-GGUF", + "model_file_name_template": "mistral-7b-instruct-v0.2.{quantization}.gguf" + } + } } ], "chat_template": "{%- if messages[0]['role'] == 'system' %}\n {%- set system_message = messages[0]['content'] %}\n {%- set loop_messages = messages[1:] %}\n{%- else %}\n {%- set loop_messages = messages %}\n{%- endif %}\n\n{{- '<s>' }}\n{%- for message in loop_messages %}\n {%- if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}\n {{- raise_exception('After the optional system message, conversation roles must alternate user/assistant/user/assistant/...') }}\n {%- endif %}\n {%- if message['role'] == 'user' %}\n {%- if loop.first and system_message is defined %}\n {{- ' [INST] ' + system_message + '\n\n' + message['content'] + ' [/INST]' }}\n {%- else %}\n {{- ' [INST] ' + message['content'] + ' [/INST]' }}\n {%- endif %}\n {%- elif message['role'] == 'assistant' %}\n {{- ' ' + message['content'] + '</s>'}}\n {%- else %}\n {{- raise_exception('Only user and assistant roles are supported, with the exception of an initial optional system message!') }}\n {%- endif %}\n{%- endfor %}\n", @@ -2991,8 +4250,12 @@ "8-bit", "none" ], - "model_id": "mistralai/Mistral-7B-Instruct-v0.3", - "model_revision": "83e9aa141f2e28c82232fea5325f54edf17c43de" + "model_hubs": { + "huggingface": { + "model_id": "mistralai/Mistral-7B-Instruct-v0.3", + "model_revision": "83e9aa141f2e28c82232fea5325f54edf17c43de" + } + } }, { "model_format": "gptq", @@ -3000,7 +4263,11 @@ "quantizations": [ "Int4" ], - "model_id": "neuralmagic/Mistral-7B-Instruct-v0.3-GPTQ-4bit" + "model_hubs": { + "huggingface": { + "model_id": "neuralmagic/Mistral-7B-Instruct-v0.3-GPTQ-4bit" + } + } }, { "model_format": "awq", @@ -3008,7 +4275,11 @@ "quantizations": [ "Int4" ], - "model_id": "solidrust/Mistral-7B-Instruct-v0.3-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "solidrust/Mistral-7B-Instruct-v0.3-AWQ" + } + } }, { "model_format": "ggufv2", @@ -3026,8 +4297,12 @@ "Q8_0", "fp16" ], - "model_id": "MaziyarPanahi/Mistral-7B-Instruct-v0.3-GGUF", - "model_file_name_template": "Mistral-7B-Instruct-v0.3.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "MaziyarPanahi/Mistral-7B-Instruct-v0.3-GGUF", + "model_file_name_template": 
"Mistral-7B-Instruct-v0.3.{quantization}.gguf" + } + } } ], "chat_template": "{%- if messages[0][\"role\"] == \"system\" %}\n {%- set system_message = messages[0][\"content\"] %}\n {%- set loop_messages = messages[1:] %}\n{%- else %}\n {%- set loop_messages = messages %}\n{%- endif %}\n{%- if not tools is defined %}\n {%- set tools = none %}\n{%- endif %}\n{%- set user_messages = loop_messages | selectattr(\"role\", \"equalto\", \"user\") | list %}\n\n{#- This block checks for alternating user/assistant messages, skipping tool calling messages #}\n{%- set ns = namespace() %}\n{%- set ns.index = 0 %}\n{%- for message in loop_messages %}\n {%- if not (message.role == \"tool\" or message.role == \"tool_results\" or (message.tool_calls is defined and message.tool_calls is not none)) %}\n {%- if (message[\"role\"] == \"user\") != (ns.index % 2 == 0) %}\n {{- raise_exception(\"After the optional system message, conversation roles must alternate user/assistant/user/assistant/...\") }}\n {%- endif %}\n {%- set ns.index = ns.index + 1 %}\n {%- endif %}\n{%- endfor %}\n\n{{- '' }}\n{%- for message in loop_messages %}\n {%- if message[\"role\"] == \"user\" %}\n {%- if tools is not none and (message == user_messages[-1]) %}\n {{- \"[AVAILABLE_TOOLS] [\" }}\n {%- for tool in tools %}\n {%- set tool = tool.function %}\n {{- '{\"type\": \"function\", \"function\": {' }}\n {%- for key, val in tool.items() if key != \"return\" %}\n {%- if val is string %}\n {{- '\"' + key + '\": \"' + val + '\"' }}\n {%- else %}\n {{- '\"' + key + '\": ' + val|tojson }}\n {%- endif %}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- endif %}\n {%- endfor %}\n {{- \"}}\" }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- else %}\n {{- \"]\" }}\n {%- endif %}\n {%- endfor %}\n {{- \"[/AVAILABLE_TOOLS]\" }}\n {%- endif %}\n {%- if loop.last and system_message is defined %}\n {{- \"[INST] \" + system_message + \"\n\n\" + message[\"content\"] + \"[/INST]\" }}\n {%- else %}\n {{- \"[INST] \" + message[\"content\"] + \"[/INST]\" }}\n {%- endif %}\n {%- elif message.tool_calls is defined and message.tool_calls is not none %}\n {{- \"[TOOL_CALLS] [\" }}\n {%- for tool_call in message.tool_calls %}\n {%- set out = tool_call.function|tojson %}\n {{- out[:-1] }}\n {%- if not tool_call.id is defined or tool_call.id|length != 9 %}\n {{- raise_exception(\"Tool call IDs should be alphanumeric strings with length 9!\") }}\n {%- endif %}\n {{- ', \"id\": \"' + tool_call.id + '\"}' }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- else %}\n {{- \"]\" + '' }}\n {%- endif %}\n {%- endfor %}\n {%- elif message[\"role\"] == \"assistant\" %}\n {{- \" \" + message[\"content\"]|trim + ''}}\n {%- elif message[\"role\"] == \"tool_results\" or message[\"role\"] == \"tool\" %}\n {%- if message.content is defined and message.content.content is defined %}\n {%- set content = message.content.content %}\n {%- else %}\n {%- set content = message.content %}\n {%- endif %}\n {{- '[TOOL_RESULTS] {\"content\": ' + content|string + \", \" }}\n {%- if not message.tool_call_id is defined or message.tool_call_id|length != 9 %}\n {{- raise_exception(\"Tool call IDs should be alphanumeric strings with length 9!\") }}\n {%- endif %}\n {{- '\"call_id\": \"' + message.tool_call_id + '\"}[/TOOL_RESULTS]' }}\n {%- else %}\n {{- raise_exception(\"Only user and assistant roles are supported, with the exception of an initial optional system message!\") }}\n {%- endif %}\n{%- endfor %}\n", @@ -3064,8 +4339,15 @@ "quantizations": [ "none" ], - "model_id": 
"mistralai/Mistral-Nemo-Instruct-2407", - "model_revision": "05b1e4f3e189ec1b5189fb3c973d4cf3369c27af" + "model_hubs": { + "huggingface": { + "model_id": "mistralai/Mistral-Nemo-Instruct-2407", + "model_revision": "05b1e4f3e189ec1b5189fb3c973d4cf3369c27af" + }, + "modelscope": { + "model_id": "AI-ModelScope/Mistral-Nemo-Instruct-2407" + } + } }, { "model_format": "pytorch", @@ -3073,8 +4355,12 @@ "quantizations": [ "4-bit" ], - "model_id": "unsloth/Mistral-Nemo-Instruct-2407-bnb-4bit", - "model_revision": "1d85adc9e0fff0b8e4479a037bd75fe1346333ca" + "model_hubs": { + "huggingface": { + "model_id": "unsloth/Mistral-Nemo-Instruct-2407-bnb-4bit", + "model_revision": "1d85adc9e0fff0b8e4479a037bd75fe1346333ca" + } + } }, { "model_format": "pytorch", @@ -3082,8 +4368,12 @@ "quantizations": [ "8-bit" ], - "model_id": "afrizalha/Mistral-Nemo-Instruct-2407-bnb-8bit", - "model_revision": "1d2dacf18a486c745219317d1507441406bc7e25" + "model_hubs": { + "huggingface": { + "model_id": "afrizalha/Mistral-Nemo-Instruct-2407-bnb-8bit", + "model_revision": "1d2dacf18a486c745219317d1507441406bc7e25" + } + } }, { "model_format": "gptq", @@ -3091,7 +4381,14 @@ "quantizations": [ "Int4" ], - "model_id": "ModelCloud/Mistral-Nemo-Instruct-2407-gptq-4bit" + "model_hubs": { + "huggingface": { + "model_id": "ModelCloud/Mistral-Nemo-Instruct-2407-gptq-4bit" + }, + "modelscope": { + "model_id": "LLM-Research/Mistral-Nemo-Instruct-2407-gptq-4bit" + } + } }, { "model_format": "awq", @@ -3099,7 +4396,11 @@ "quantizations": [ "Int4" ], - "model_id": "casperhansen/mistral-nemo-instruct-2407-awq" + "model_hubs": { + "huggingface": { + "model_id": "casperhansen/mistral-nemo-instruct-2407-awq" + } + } }, { "model_format": "ggufv2", @@ -3117,8 +4418,12 @@ "Q8_0", "fp16" ], - "model_id": "MaziyarPanahi/Mistral-Nemo-Instruct-2407-GGUF", - "model_file_name_template": "Mistral-Nemo-Instruct-2407.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "MaziyarPanahi/Mistral-Nemo-Instruct-2407-GGUF", + "model_file_name_template": "Mistral-Nemo-Instruct-2407.{quantization}.gguf" + } + } }, { "model_format": "mlx", @@ -3126,7 +4431,11 @@ "quantizations": [ "none" ], - "model_id": "mlx-community/Mistral-Nemo-Instruct-2407-bf16" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Mistral-Nemo-Instruct-2407-bf16" + } + } }, { "model_format": "mlx", @@ -3134,7 +4443,11 @@ "quantizations": [ "4-bit" ], - "model_id": "mlx-community/Mistral-Nemo-Instruct-2407-4bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Mistral-Nemo-Instruct-2407-4bit" + } + } }, { "model_format": "mlx", @@ -3142,7 +4455,11 @@ "quantizations": [ "8-bit" ], - "model_id": "mlx-community/Mistral-Nemo-Instruct-2407-8bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Mistral-Nemo-Instruct-2407-8bit" + } + } } ], "chat_template": "{%- if messages[0][\"role\"] == \"system\" %}\n {%- set system_message = messages[0][\"content\"] %}\n {%- set loop_messages = messages[1:] %}\n{%- else %}\n {%- set loop_messages = messages %}\n{%- endif %}\n{%- if not tools is defined %}\n {%- set tools = none %}\n{%- endif %}\n{%- set user_messages = loop_messages | selectattr(\"role\", \"equalto\", \"user\") | list %}\n\n{#- This block checks for alternating user/assistant messages, skipping tool calling messages #}\n{%- set ns = namespace() %}\n{%- set ns.index = 0 %}\n{%- for message in loop_messages %}\n {%- if not (message.role == \"tool\" or message.role == \"tool_results\" or (message.tool_calls is defined and 
message.tool_calls is not none)) %}\n {%- if (message[\"role\"] == \"user\") != (ns.index % 2 == 0) %}\n {{- raise_exception(\"After the optional system message, conversation roles must alternate user/assistant/user/assistant/...\") }}\n {%- endif %}\n {%- set ns.index = ns.index + 1 %}\n {%- endif %}\n{%- endfor %}\n\n{{- '' }}\n{%- for message in loop_messages %}\n {%- if message[\"role\"] == \"user\" %}\n {%- if tools is not none and (message == user_messages[-1]) %}\n {{- \"[AVAILABLE_TOOLS][\" }}\n {%- for tool in tools %}\n {%- set tool = tool.function %}\n {{- '{\"type\": \"function\", \"function\": {' }}\n {%- for key, val in tool.items() if key != \"return\" %}\n {%- if val is string %}\n {{- '\"' + key + '\": \"' + val + '\"' }}\n {%- else %}\n {{- '\"' + key + '\": ' + val|tojson }}\n {%- endif %}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- endif %}\n {%- endfor %}\n {{- \"}}\" }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- else %}\n {{- \"]\" }}\n {%- endif %}\n {%- endfor %}\n {{- \"[/AVAILABLE_TOOLS]\" }}\n {%- endif %}\n {%- if loop.last and system_message is defined %}\n {{- \"[INST]\" + system_message + \"\n\n\" + message[\"content\"] + \"[/INST]\" }}\n {%- else %}\n {{- \"[INST]\" + message[\"content\"] + \"[/INST]\" }}\n {%- endif %}\n {%- elif (message.tool_calls is defined and message.tool_calls is not none) %}\n {{- \"[TOOL_CALLS][\" }}\n {%- for tool_call in message.tool_calls %}\n {%- set out = tool_call.function|tojson %}\n {{- out[:-1] }}\n {%- if not tool_call.id is defined or tool_call.id|length != 9 %}\n {{- raise_exception(\"Tool call IDs should be alphanumeric strings with length 9!\") }}\n {%- endif %}\n {{- ', \"id\": \"' + tool_call.id + '\"}' }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- else %}\n {{- \"]\" + '' }}\n {%- endif %}\n {%- endfor %}\n {%- elif message[\"role\"] == \"assistant\" %}\n {{- message[\"content\"] + ''}}\n {%- elif message[\"role\"] == \"tool_results\" or message[\"role\"] == \"tool\" %}\n {%- if message.content is defined and message.content.content is defined %}\n {%- set content = message.content.content %}\n {%- else %}\n {%- set content = message.content %}\n {%- endif %}\n {{- '[TOOL_RESULTS]{\"content\": ' + content|string + \", \" }}\n {%- if not message.tool_call_id is defined or message.tool_call_id|length != 9 %}\n {{- raise_exception(\"Tool call IDs should be alphanumeric strings with length 9!\") }}\n {%- endif %}\n {{- '\"call_id\": \"' + message.tool_call_id + '\"}[/TOOL_RESULTS]' }}\n {%- else %}\n {{- raise_exception(\"Only user and assistant roles are supported, with the exception of an initial optional system message!\") }}\n {%- endif %}\n{%- endfor %}\n", @@ -3180,7 +4497,14 @@ "quantizations": [ "none" ], - "model_id": "mistralai/Mistral-Large-Instruct-2407" + "model_hubs": { + "huggingface": { + "model_id": "mistralai/Mistral-Large-Instruct-2407" + }, + "modelscope": { + "model_id": "LLM-Research/Mistral-Large-Instruct-2407-bnb-4bit" + } + } }, { "model_format": "pytorch", @@ -3188,7 +4512,11 @@ "quantizations": [ "4-bit" ], - "model_id": "unsloth/Mistral-Large-Instruct-2407-bnb-4bit" + "model_hubs": { + "huggingface": { + "model_id": "unsloth/Mistral-Large-Instruct-2407-bnb-4bit" + } + } }, { "model_format": "gptq", @@ -3196,7 +4524,11 @@ "quantizations": [ "Int4" ], - "model_id": "ModelCloud/Mistral-Large-Instruct-2407-gptq-4bit" + "model_hubs": { + "huggingface": { + "model_id": "ModelCloud/Mistral-Large-Instruct-2407-gptq-4bit" + } + } }, { "model_format": "awq", @@ -3204,7 +4536,11 @@ 
"quantizations": [ "Int4" ], - "model_id": "TechxGenus/Mistral-Large-Instruct-2407-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "TechxGenus/Mistral-Large-Instruct-2407-AWQ" + } + } }, { "model_format": "ggufv2", @@ -3217,8 +4553,6 @@ "Q4_K_S", "Q4_K_M" ], - "model_id": "MaziyarPanahi/Mistral-Large-Instruct-2407-GGUF", - "model_file_name_template": "Mistral-Large-Instruct-2407.{quantization}.gguf", "model_file_name_split_template": "Mixtral-8x22B-Instruct-v0.1.{quantization}-{part}.gguf", "quantization_parts": { "Q3_K_L": [ @@ -3266,6 +4600,12 @@ "00006-of-00007", "00007-of-00007" ] + }, + "model_hubs": { + "huggingface": { + "model_id": "MaziyarPanahi/Mistral-Large-Instruct-2407-GGUF", + "model_file_name_template": "Mistral-Large-Instruct-2407.{quantization}.gguf" + } } }, { @@ -3274,7 +4614,11 @@ "quantizations": [ "none" ], - "model_id": "mlx-community/Mistral-Large-Instruct-2407-bf16" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Mistral-Large-Instruct-2407-bf16" + } + } }, { "model_format": "mlx", @@ -3282,7 +4626,11 @@ "quantizations": [ "4-bit" ], - "model_id": "mlx-community/Mistral-Large-Instruct-2407-4bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Mistral-Large-Instruct-2407-4bit" + } + } }, { "model_format": "mlx", @@ -3290,7 +4638,11 @@ "quantizations": [ "8-bit" ], - "model_id": "mlx-community/Mistral-Large-Instruct-2407-8bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Mistral-Large-Instruct-2407-8bit" + } + } } ], "chat_template": "{%- if messages[0][\"role\"] == \"system\" %}\n {%- set system_message = messages[0][\"content\"] %}\n {%- set loop_messages = messages[1:] %}\n{%- else %}\n {%- set loop_messages = messages %}\n{%- endif %}\n{%- if not tools is defined %}\n {%- set tools = none %}\n{%- endif %}\n{%- set user_messages = loop_messages | selectattr(\"role\", \"equalto\", \"user\") | list %}\n\n{#- This block checks for alternating user/assistant messages, skipping tool calling messages #}\n{%- set ns = namespace() %}\n{%- set ns.index = 0 %}\n{%- for message in loop_messages %}\n {%- if not (message.role == \"tool\" or message.role == \"tool_results\" or (message.tool_calls is defined and message.tool_calls is not none)) %}\n {%- if (message[\"role\"] == \"user\") != (ns.index % 2 == 0) %}\n {{- raise_exception(\"After the optional system message, conversation roles must alternate user/assistant/user/assistant/...\") }}\n {%- endif %}\n {%- set ns.index = ns.index + 1 %}\n {%- endif %}\n{%- endfor %}\n\n{{- '' }}\n{%- for message in loop_messages %}\n {%- if message[\"role\"] == \"user\" %}\n {%- if tools is not none and (message == user_messages[-1]) %}\n {{- \"[AVAILABLE_TOOLS][\" }}\n {%- for tool in tools %}\n {%- set tool = tool.function %}\n {{- '{\"type\": \"function\", \"function\": {' }}\n {%- for key, val in tool.items() if key != \"return\" %}\n {%- if val is string %}\n {{- '\"' + key + '\": \"' + val + '\"' }}\n {%- else %}\n {{- '\"' + key + '\": ' + val|tojson }}\n {%- endif %}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- endif %}\n {%- endfor %}\n {{- \"}}\" }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- else %}\n {{- \"]\" }}\n {%- endif %}\n {%- endfor %}\n {{- \"[/AVAILABLE_TOOLS]\" }}\n {%- endif %}\n {%- if loop.last and system_message is defined %}\n {{- \"[INST]\" + system_message + \"\n\n\" + message[\"content\"] + \"[/INST]\" }}\n {%- else %}\n {{- \"[INST]\" + message[\"content\"] + \"[/INST]\" }}\n {%- endif %}\n {%- elif (message.tool_calls is defined and 
message.tool_calls is not none) %}\n {{- \"[TOOL_CALLS][\" }}\n {%- for tool_call in message.tool_calls %}\n {%- set out = tool_call.function|tojson %}\n {{- out[:-1] }}\n {%- if not tool_call.id is defined or tool_call.id|length != 9 %}\n {{- raise_exception(\"Tool call IDs should be alphanumeric strings with length 9!\") }}\n {%- endif %}\n {{- ', \"id\": \"' + tool_call.id + '\"}' }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- else %}\n {{- \"]\" + '' }}\n {%- endif %}\n {%- endfor %}\n {%- elif message[\"role\"] == \"assistant\" %}\n {{- message[\"content\"] + ''}}\n {%- elif message[\"role\"] == \"tool_results\" or message[\"role\"] == \"tool\" %}\n {%- if message.content is defined and message.content.content is defined %}\n {%- set content = message.content.content %}\n {%- else %}\n {%- set content = message.content %}\n {%- endif %}\n {{- '[TOOL_RESULTS]{\"content\": ' + content|string + \", \" }}\n {%- if not message.tool_call_id is defined or message.tool_call_id|length != 9 %}\n {{- raise_exception(\"Tool call IDs should be alphanumeric strings with length 9!\") }}\n {%- endif %}\n {{- '\"call_id\": \"' + message.tool_call_id + '\"}[/TOOL_RESULTS]' }}\n {%- else %}\n {{- raise_exception(\"Only user and assistant roles are supported, with the exception of an initial optional system message!\") }}\n {%- endif %}\n{%- endfor %}\n", @@ -3321,8 +4673,12 @@ "8-bit", "none" ], - "model_id": "mistralai/Mistral-7B-Instruct-v0.2", - "model_revision": "9552e7b1d9b2d5bbd87a5aa7221817285dbb6366" + "model_hubs": { + "huggingface": { + "model_id": "mistralai/Mistral-7B-Instruct-v0.2", + "model_revision": "9552e7b1d9b2d5bbd87a5aa7221817285dbb6366" + } + } }, { "model_format": "ggufv2", @@ -3339,8 +4695,12 @@ "Q6_K", "Q8_0" ], - "model_id": "bartowski/Codestral-22B-v0.1-GGUF", - "model_file_name_template": "Codestral-22B-v0.1-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "bartowski/Codestral-22B-v0.1-GGUF", + "model_file_name_template": "Codestral-22B-v0.1-{quantization}.gguf" + } + } }, { "model_format": "mlx", @@ -3348,8 +4708,12 @@ "quantizations": [ "4-bit" ], - "model_id": "mlx-community/Codestral-22B-v0.1-4bit", - "model_revision": "544626b38eb1c9524f0fa570ec7b29550c26b78d" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Codestral-22B-v0.1-4bit", + "model_revision": "544626b38eb1c9524f0fa570ec7b29550c26b78d" + } + } }, { "model_format": "mlx", @@ -3357,8 +4721,12 @@ "quantizations": [ "8-bit" ], - "model_id": "mlx-community/Codestral-22B-v0.1-8bit", - "model_revision": "0399a53970663950d57010e61a2796af524a1588" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Codestral-22B-v0.1-8bit", + "model_revision": "0399a53970663950d57010e61a2796af524a1588" + } + } } ] }, @@ -3382,8 +4750,12 @@ "8-bit", "none" ], - "model_id": "teknium/OpenHermes-2.5-Mistral-7B", - "model_revision": "91ed666be78da7556f3d79abbb26fff0ee26cb54" + "model_hubs": { + "huggingface": { + "model_id": "teknium/OpenHermes-2.5-Mistral-7B", + "model_revision": "91ed666be78da7556f3d79abbb26fff0ee26cb54" + } + } }, { "model_format": "ggufv2", @@ -3402,8 +4774,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/OpenHermes-2.5-Mistral-7B-GGUF", - "model_file_name_template": "openhermes-2.5-mistral-7b.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/OpenHermes-2.5-Mistral-7B-GGUF", + "model_file_name_template": "openhermes-2.5-mistral-7b.{quantization}.gguf" + } + } } ], "chat_template": "{% for message in messages %}{{'<|im_start|>' + 
message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", @@ -3443,8 +4819,17 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/TinyLlama-1.1B-Chat-v0.3-GGUF", - "model_file_name_template": "tinyllama-1.1b-chat-v0.3.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/TinyLlama-1.1B-Chat-v0.3-GGUF", + "model_file_name_template": "tinyllama-1.1b-chat-v0.3.{quantization}.gguf" + }, + "modelscope": { + "model_id": "Xorbits/TinyLlama-1.1B-step-50K-105b-GGUF", + "model_revision": "v0.0.1", + "model_file_name_template": "ggml-model-{quantization}.gguf" + } + } } ] }, @@ -3472,8 +4857,16 @@ "8-bit", "none" ], - "model_id": "mistralai/Mixtral-8x7B-v0.1", - "model_revision": "58301445dc1378584211722b7ebf8743ec4e192b" + "model_hubs": { + "huggingface": { + "model_id": "mistralai/Mixtral-8x7B-v0.1", + "model_revision": "58301445dc1378584211722b7ebf8743ec4e192b" + }, + "modelscope": { + "model_id": "AI-ModelScope/Mixtral-8x7B-v0.1", + "model_revision": "master" + } + } }, { "model_format": "gptq", @@ -3481,7 +4874,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Mixtral-8x7B-v0.1-GPTQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Mixtral-8x7B-v0.1-GPTQ" + } + } }, { "model_format": "ggufv2", @@ -3496,8 +4893,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/Mixtral-8x7B-v0.1-GGUF", - "model_file_name_template": "mixtral-8x7b-v0.1.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Mixtral-8x7B-v0.1-GGUF", + "model_file_name_template": "mixtral-8x7b-v0.1.{quantization}.gguf" + } + } } ] }, @@ -3525,8 +4926,16 @@ "8-bit", "none" ], - "model_id": "mistralai/Mixtral-8x7B-Instruct-v0.1", - "model_revision": "125c431e2ff41a156b9f9076f744d2f35dd6e67a" + "model_hubs": { + "huggingface": { + "model_id": "mistralai/Mixtral-8x7B-Instruct-v0.1", + "model_revision": "125c431e2ff41a156b9f9076f744d2f35dd6e67a" + }, + "modelscope": { + "model_id": "AI-ModelScope/Mixtral-8x7B-Instruct-v0.1", + "model_revision": "master" + } + } }, { "model_format": "awq", @@ -3534,7 +4943,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Mixtral-8x7B-Instruct-v0.1-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Mixtral-8x7B-Instruct-v0.1-AWQ" + } + } }, { "model_format": "gptq", @@ -3542,7 +4955,11 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/Mixtral-8x7B-Instruct-v0.1-GPTQ" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Mixtral-8x7B-Instruct-v0.1-GPTQ" + } + } }, { "model_format": "ggufv2", @@ -3557,8 +4974,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/Mixtral-8x7B-Instruct-v0.1-GGUF", - "model_file_name_template": "mixtral-8x7b-instruct-v0.1.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Mixtral-8x7B-Instruct-v0.1-GGUF", + "model_file_name_template": "mixtral-8x7b-instruct-v0.1.{quantization}.gguf" + } + } } ], "chat_template": "{%- if messages[0]['role'] == 'system' %}\n {%- set system_message = messages[0]['content'] %}\n {%- set loop_messages = messages[1:] %}\n{%- else %}\n {%- set loop_messages = messages %}\n{%- endif %}\n\n{{- '' }}\n{%- for message in loop_messages %}\n {%- if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}\n {{- raise_exception('After the optional system message, conversation roles must alternate user/assistant/user/assistant/...') }}\n {%- endif %}\n {%- if message['role'] == 'user' %}\n {%- if loop.first and system_message is defined %}\n 
{{- ' [INST] ' + system_message + '\n\n' + message['content'] + ' [/INST]' }}\n {%- else %}\n {{- ' [INST] ' + message['content'] + ' [/INST]' }}\n {%- endif %}\n {%- elif message['role'] == 'assistant' %}\n {{- ' ' + message['content'] + ''}}\n {%- else %}\n {{- raise_exception('Only user and assistant roles are supported, with the exception of an initial optional system message!') }}\n {%- endif %}\n{%- endfor %}\n", @@ -3593,8 +5014,12 @@ "8-bit", "none" ], - "model_id": "mistralai/Mixtral-8x22B-Instruct-v0.1", - "model_revision": "ebb919ac9e9f7f9a900644621bae7963bc593f4f" + "model_hubs": { + "huggingface": { + "model_id": "mistralai/Mixtral-8x22B-Instruct-v0.1", + "model_revision": "ebb919ac9e9f7f9a900644621bae7963bc593f4f" + } + } }, { "model_format": "awq", @@ -3602,7 +5027,11 @@ "quantizations": [ "Int4" ], - "model_id": "MaziyarPanahi/Mixtral-8x22B-Instruct-v0.1-AWQ" + "model_hubs": { + "huggingface": { + "model_id": "MaziyarPanahi/Mixtral-8x22B-Instruct-v0.1-AWQ" + } + } }, { "model_format": "gptq", @@ -3610,7 +5039,11 @@ "quantizations": [ "Int4" ], - "model_id": "jarrelscy/Mixtral-8x22B-Instruct-v0.1-GPTQ-4bit" + "model_hubs": { + "huggingface": { + "model_id": "jarrelscy/Mixtral-8x22B-Instruct-v0.1-GPTQ-4bit" + } + } }, { "model_format": "ggufv2", @@ -3628,8 +5061,6 @@ "Q8_0", "fp16" ], - "model_id": "MaziyarPanahi/Mixtral-8x22B-Instruct-v0.1-GGUF", - "model_file_name_template": "Mixtral-8x22B-Instruct-{quantization}.gguf", "model_file_name_split_template": "Mixtral-8x22B-Instruct-v0.1.{quantization}-{part}.gguf", "quantization_parts": { "Q2_K": [ @@ -3691,6 +5122,12 @@ "00006-of-00007", "00007-of-00007" ] + }, + "model_hubs": { + "huggingface": { + "model_id": "MaziyarPanahi/Mixtral-8x22B-Instruct-v0.1-GGUF", + "model_file_name_template": "Mixtral-8x22B-Instruct-{quantization}.gguf" + } } } ], @@ -3732,8 +5169,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/Yi-34B-GGUF", - "model_file_name_template": "yi-34b.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Yi-34B-GGUF", + "model_file_name_template": "yi-34b.{quantization}.gguf" + } + } }, { "model_format": "pytorch", @@ -3743,8 +5184,16 @@ "8-bit", "none" ], - "model_id": "01-ai/Yi-6B", - "model_revision": "25beebcb1166b9f49458459eb7b68130b9f9cf4d" + "model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-6B", + "model_revision": "25beebcb1166b9f49458459eb7b68130b9f9cf4d" + }, + "modelscope": { + "model_id": "01ai/Yi-6B", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -3754,8 +5203,16 @@ "8-bit", "none" ], - "model_id": "01-ai/Yi-9B", - "model_revision": "f70a5ff8b2e51c5d5b20e649d7b5f4238ffe6d5b" + "model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-9B", + "model_revision": "f70a5ff8b2e51c5d5b20e649d7b5f4238ffe6d5b" + }, + "modelscope": { + "model_id": "01ai/Yi-9B", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -3765,8 +5222,16 @@ "8-bit", "none" ], - "model_id": "01-ai/Yi-34B", - "model_revision": "168c48e05e1429779a896c7ef0d2e01b85e6bd8d" + "model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-34B", + "model_revision": "168c48e05e1429779a896c7ef0d2e01b85e6bd8d" + }, + "modelscope": { + "model_id": "01ai/Yi-34B", + "model_revision": "master" + } + } } ] }, @@ -3791,8 +5256,16 @@ "8-bit", "none" ], - "model_id": "01-ai/Yi-6B-200K", - "model_revision": "70649e36d43f91dff1357b576e6713cac03c1d4c" + "model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-6B-200K", + "model_revision": "70649e36d43f91dff1357b576e6713cac03c1d4c" + }, 
+ "modelscope": { + "model_id": "01ai/Yi-6B-200K", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -3802,8 +5275,16 @@ "8-bit", "none" ], - "model_id": "01-ai/Yi-34B-200K", - "model_revision": "591ae83b8f9c269700ef27f9dbd548934d800302" + "model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-34B-200K", + "model_revision": "591ae83b8f9c269700ef27f9dbd548934d800302" + }, + "modelscope": { + "model_id": "01ai/Yi-34B-200K", + "model_revision": "master" + } + } } ] }, @@ -3826,7 +5307,15 @@ "quantizations": [ "8bits" ], - "model_id": "01-ai/Yi-34B-Chat-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-34B-Chat-{quantization}" + }, + "modelscope": { + "model_id": "01ai/Yi-34B-Chat-{quantization}", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -3836,8 +5325,16 @@ "8-bit", "none" ], - "model_id": "01-ai/Yi-6B-Chat", - "model_revision": "1c20c960895e4c3877cf478bc2df074221b81d7b" + "model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-6B-Chat", + "model_revision": "1c20c960895e4c3877cf478bc2df074221b81d7b" + }, + "modelscope": { + "model_id": "01ai/Yi-6B-Chat", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -3847,8 +5344,16 @@ "8-bit", "none" ], - "model_id": "01-ai/Yi-34B-Chat", - "model_revision": "a99ec35331cbfc9da596af7d4538fe2efecff03c" + "model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-34B-Chat", + "model_revision": "a99ec35331cbfc9da596af7d4538fe2efecff03c" + }, + "modelscope": { + "model_id": "01ai/Yi-34B-Chat", + "model_revision": "master" + } + } }, { "model_format": "ggufv2", @@ -3867,8 +5372,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/Yi-34B-Chat-GGUF", - "model_file_name_template": "yi-34b-chat.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/Yi-34B-Chat-GGUF", + "model_file_name_template": "yi-34b-chat.{quantization}.gguf" + } + } } ], "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", @@ -3906,8 +5415,16 @@ "8-bit", "none" ], - "model_id": "01-ai/Yi-1.5-6B", - "model_revision": "741a657c42d2081f777ce4c6c5572090f8b8c886" + "model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-1.5-6B", + "model_revision": "741a657c42d2081f777ce4c6c5572090f8b8c886" + }, + "modelscope": { + "model_id": "01ai/Yi-1.5-6B", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -3917,8 +5434,16 @@ "8-bit", "none" ], - "model_id": "01-ai/Yi-1.5-9B", - "model_revision": "9a6839c5b9db3dbb245fb98a072bfabc242621f2" + "model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-1.5-9B", + "model_revision": "9a6839c5b9db3dbb245fb98a072bfabc242621f2" + }, + "modelscope": { + "model_id": "01ai/Yi-1.5-9B", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -3928,8 +5453,16 @@ "8-bit", "none" ], - "model_id": "01-ai/Yi-1.5-34B", - "model_revision": "4f83007957ec3eec76d87df19ad061eb0f57b5c5" + "model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-1.5-34B", + "model_revision": "4f83007957ec3eec76d87df19ad061eb0f57b5c5" + }, + "modelscope": { + "model_id": "01ai/Yi-1.5-34B", + "model_revision": "master" + } + } } ] }, @@ -3954,8 +5487,16 @@ "8-bit", "none" ], - "model_id": "01-ai/Yi-1.5-6B-Chat", - "model_revision": "d68dab90947a3c869e28c9cb2806996af99a6080" + 
"model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-1.5-6B-Chat", + "model_revision": "d68dab90947a3c869e28c9cb2806996af99a6080" + }, + "modelscope": { + "model_id": "01ai/Yi-1.5-6B-Chat", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -3965,8 +5506,16 @@ "8-bit", "none" ], - "model_id": "01-ai/Yi-1.5-9B-Chat", - "model_revision": "1dc6e2b8dcfc12b95bede8dec67e6b6332ac64c6" + "model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-1.5-9B-Chat", + "model_revision": "1dc6e2b8dcfc12b95bede8dec67e6b6332ac64c6" + }, + "modelscope": { + "model_id": "01ai/Yi-1.5-9B-Chat", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -3976,8 +5525,16 @@ "8-bit", "none" ], - "model_id": "01-ai/Yi-1.5-34B-Chat", - "model_revision": "fa695ee438bfcd0ec2b378fa1c7e0dea1b40393e" + "model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-1.5-34B-Chat", + "model_revision": "fa695ee438bfcd0ec2b378fa1c7e0dea1b40393e" + }, + "modelscope": { + "model_id": "01ai/Yi-1.5-34B-Chat", + "model_revision": "master" + } + } }, { "model_format": "ggufv2", @@ -3990,8 +5547,12 @@ "Q8_0", "f32" ], - "model_id": "lmstudio-community/Yi-1.5-6B-Chat-GGUF", - "model_file_name_template": "Yi-1.5-6B-Chat-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "lmstudio-community/Yi-1.5-6B-Chat-GGUF", + "model_file_name_template": "Yi-1.5-6B-Chat-{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -4004,8 +5565,12 @@ "Q8_0", "f32" ], - "model_id": "lmstudio-community/Yi-1.5-9B-Chat-GGUF", - "model_file_name_template": "Yi-1.5-9B-Chat-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "lmstudio-community/Yi-1.5-9B-Chat-GGUF", + "model_file_name_template": "Yi-1.5-9B-Chat-{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -4018,8 +5583,12 @@ "Q6_K", "Q8_0" ], - "model_id": "lmstudio-community/Yi-1.5-34B-Chat-GGUF", - "model_file_name_template": "Yi-1.5-34B-Chat-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "lmstudio-community/Yi-1.5-34B-Chat-GGUF", + "model_file_name_template": "Yi-1.5-34B-Chat-{quantization}.gguf" + } + } }, { "model_format": "gptq", @@ -4027,8 +5596,16 @@ "quantizations": [ "Int4" ], - "model_id": "modelscope/Yi-1.5-6B-Chat-GPTQ", - "model_revision": "2ad3a602e64d1c79e28e6e92beced2935047367c" + "model_hubs": { + "huggingface": { + "model_id": "modelscope/Yi-1.5-6B-Chat-GPTQ", + "model_revision": "2ad3a602e64d1c79e28e6e92beced2935047367c" + }, + "modelscope": { + "model_id": "AI-ModelScope/Yi-1.5-6B-Chat-GPTQ", + "model_revision": "master" + } + } }, { "model_format": "gptq", @@ -4036,8 +5613,16 @@ "quantizations": [ "Int4" ], - "model_id": "modelscope/Yi-1.5-9B-Chat-GPTQ", - "model_revision": "76f47d16982923f7b6674c4e23ddac7c3b1d2e03" + "model_hubs": { + "huggingface": { + "model_id": "modelscope/Yi-1.5-9B-Chat-GPTQ", + "model_revision": "76f47d16982923f7b6674c4e23ddac7c3b1d2e03" + }, + "modelscope": { + "model_id": "AI-ModelScope/Yi-1.5-9B-Chat-GPTQ", + "model_revision": "master" + } + } }, { "model_format": "gptq", @@ -4045,8 +5630,16 @@ "quantizations": [ "Int4" ], - "model_id": "modelscope/Yi-1.5-34B-Chat-GPTQ", - "model_revision": "173fb4036265b2dac1d6296a8e2fd2f652c19968" + "model_hubs": { + "huggingface": { + "model_id": "modelscope/Yi-1.5-34B-Chat-GPTQ", + "model_revision": "173fb4036265b2dac1d6296a8e2fd2f652c19968" + }, + "modelscope": { + "model_id": "AI-ModelScope/Yi-1.5-34B-Chat-GPTQ", + "model_revision": "master" + } + } }, { "model_format": "awq", @@ -4054,8 +5647,16 @@ 
"quantizations": [ "Int4" ], - "model_id": "modelscope/Yi-1.5-6B-Chat-AWQ", - "model_revision": "23bf37f1666874e15e239422de0d3948d8735fa9" + "model_hubs": { + "huggingface": { + "model_id": "modelscope/Yi-1.5-6B-Chat-AWQ", + "model_revision": "23bf37f1666874e15e239422de0d3948d8735fa9" + }, + "modelscope": { + "model_id": "AI-ModelScope/Yi-1.5-6B-Chat-AWQ", + "model_revision": "master" + } + } }, { "model_format": "awq", @@ -4063,8 +5664,16 @@ "quantizations": [ "Int4" ], - "model_id": "modelscope/Yi-1.5-9B-Chat-AWQ", - "model_revision": "2605f388332672789eae1f422644add2901b433f" + "model_hubs": { + "huggingface": { + "model_id": "modelscope/Yi-1.5-9B-Chat-AWQ", + "model_revision": "2605f388332672789eae1f422644add2901b433f" + }, + "modelscope": { + "model_id": "AI-ModelScope/Yi-1.5-9B-Chat-AWQ", + "model_revision": "master" + } + } }, { "model_format": "awq", @@ -4072,18 +5681,29 @@ "quantizations": [ "Int4" ], - "model_id": "modelscope/Yi-1.5-34B-Chat-AWQ", - "model_revision": "26234fea6ac49d456f32f8017289021fb1087a04" - } - , + "model_hubs": { + "huggingface": { + "model_id": "modelscope/Yi-1.5-34B-Chat-AWQ", + "model_revision": "26234fea6ac49d456f32f8017289021fb1087a04" + }, + "modelscope": { + "model_id": "AI-ModelScope/Yi-1.5-34B-Chat-AWQ", + "model_revision": "master" + } + } + }, { "model_format": "mlx", "model_size_in_billions": 6, "quantizations": [ "4-bit" ], - "model_id": "mlx-community/Yi-1.5-6B-Chat-4bit", - "model_revision": "0177c9a12b869d6bc73f772b5a1981a7c966adb6" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Yi-1.5-6B-Chat-4bit", + "model_revision": "0177c9a12b869d6bc73f772b5a1981a7c966adb6" + } + } }, { "model_format": "mlx", @@ -4091,8 +5711,12 @@ "quantizations": [ "8-bit" ], - "model_id": "mlx-community/Yi-1.5-6B-Chat-8bit", - "model_revision": "7756e65d1bf1e2e6e97aef6bc9484307225f536b" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Yi-1.5-6B-Chat-8bit", + "model_revision": "7756e65d1bf1e2e6e97aef6bc9484307225f536b" + } + } }, { "model_format": "mlx", @@ -4100,8 +5724,12 @@ "quantizations": [ "4-bit" ], - "model_id": "mlx-community/Yi-1.5-9B-Chat-4bit", - "model_revision": "e15f886479c44e7d90f0ac13ace69b2319b71c2f" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Yi-1.5-9B-Chat-4bit", + "model_revision": "e15f886479c44e7d90f0ac13ace69b2319b71c2f" + } + } }, { "model_format": "mlx", @@ -4109,8 +5737,12 @@ "quantizations": [ "8-bit" ], - "model_id": "mlx-community/Yi-1.5-9B-Chat-8bit", - "model_revision": "c1f742fcf3683edbe2d2c2fd1ad7ac2bb6c5ca36" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Yi-1.5-9B-Chat-8bit", + "model_revision": "c1f742fcf3683edbe2d2c2fd1ad7ac2bb6c5ca36" + } + } }, { "model_format": "mlx", @@ -4118,8 +5750,12 @@ "quantizations": [ "4-bit" ], - "model_id": "mlx-community/Yi-1.5-34B-Chat-4bit", - "model_revision": "945e3b306ef37c46ab444fdc857d1f3ea7247374" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Yi-1.5-34B-Chat-4bit", + "model_revision": "945e3b306ef37c46ab444fdc857d1f3ea7247374" + } + } }, { "model_format": "mlx", @@ -4127,8 +5763,12 @@ "quantizations": [ "8-bit" ], - "model_id": "mlx-community/Yi-1.5-34B-Chat-8bit", - "model_revision": "3c12761a2c6663f216caab6dff84b0dd29b472ac" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/Yi-1.5-34B-Chat-8bit", + "model_revision": "3c12761a2c6663f216caab6dff84b0dd29b472ac" + } + } } ], "chat_template": "{% if messages[0]['role'] == 'system' %}{% set system_message = messages[0]['content'] %}{% 
endif %}{% if system_message is defined %}{{ system_message }}{% endif %}{% for message in messages %}{% set content = message['content'] %}{% if message['role'] == 'user' %}{{ '<|im_start|>user\n' + content + '<|im_end|>\n<|im_start|>assistant\n' }}{% elif message['role'] == 'assistant' %}{{ content + '<|im_end|>' + '\n' }}{% endif %}{% endfor %}", @@ -4166,8 +5806,16 @@ "8-bit", "none" ], - "model_id": "01-ai/Yi-1.5-9B-Chat-16K", - "model_revision": "551220fb24d69b6bfec5defceeb160395ce5da8d" + "model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-1.5-9B-Chat-16K", + "model_revision": "551220fb24d69b6bfec5defceeb160395ce5da8d" + }, + "modelscope": { + "model_id": "01ai/Yi-1.5-9B-Chat-16K", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -4177,8 +5825,16 @@ "8-bit", "none" ], - "model_id": "01-ai/Yi-1.5-34B-Chat-16K", - "model_revision": "dfdbc67be750972bfcc1ac7ffd7fe48689c856fd" + "model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-1.5-34B-Chat-16K", + "model_revision": "dfdbc67be750972bfcc1ac7ffd7fe48689c856fd" + }, + "modelscope": { + "model_id": "01ai/Yi-1.5-34B-Chat-16K", + "model_revision": "master" + } + } }, { "model_format": "ggufv2", @@ -4199,8 +5855,12 @@ "Q6_K", "Q8_0" ], - "model_id": "QuantFactory/Yi-1.5-9B-Chat-16K-GGUF", - "model_file_name_template": "Yi-1.5-9B-Chat-16K.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "QuantFactory/Yi-1.5-9B-Chat-16K-GGUF", + "model_file_name_template": "Yi-1.5-9B-Chat-16K.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -4217,8 +5877,12 @@ "Q6_K", "Q8_0" ], - "model_id": "bartowski/Yi-1.5-34B-Chat-16K-GGUF", - "model_file_name_template": "Yi-1.5-34B-Chat-16K-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "bartowski/Yi-1.5-34B-Chat-16K-GGUF", + "model_file_name_template": "Yi-1.5-34B-Chat-16K-{quantization}.gguf" + } + } } ], "chat_template": "{% if messages[0]['role'] == 'system' %}{% set system_message = messages[0]['content'] %}{% endif %}{% if system_message is defined %}{{ system_message }}{% endif %}{% for message in messages %}{% set content = message['content'] %}{% if message['role'] == 'user' %}{{ '<|im_start|>user\n' + content + '<|im_end|>\n<|im_start|>assistant\n' }}{% elif message['role'] == 'assistant' %}{{ content + '<|im_end|>' + '\n' }}{% endif %}{% endfor %}", @@ -4254,8 +5918,16 @@ "8-bit", "none" ], - "model_id": "WizardLMTeam/WizardCoder-Python-13B-V1.0", - "model_revision": "5ac6748b1f5a4c282107ddc7d3b69fdc4a686d75" + "model_hubs": { + "huggingface": { + "model_id": "WizardLMTeam/WizardCoder-Python-13B-V1.0", + "model_revision": "5ac6748b1f5a4c282107ddc7d3b69fdc4a686d75" + }, + "modelscope": { + "model_id": "AI-ModelScope/WizardCoder-Python-13B-V1.0", + "model_revision": "v1.0.0" + } + } }, { "model_format": "pytorch", @@ -4265,8 +5937,16 @@ "8-bit", "none" ], - "model_id": "WizardLMTeam/WizardCoder-Python-34B-V1.0", - "model_revision": "897fc6d9e12136c68c441b2350d015902c144b20" + "model_hubs": { + "huggingface": { + "model_id": "WizardLMTeam/WizardCoder-Python-34B-V1.0", + "model_revision": "897fc6d9e12136c68c441b2350d015902c144b20" + }, + "modelscope": { + "model_id": "AI-ModelScope/WizardCoder-Python-34B-V1.0", + "model_revision": "v1.0.0" + } + } }, { "model_format": "ggufv2", @@ -4285,8 +5965,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/WizardCoder-Python-7B-V1.0-GGUF", - "model_file_name_template": "wizardcoder-python-7b-v1.0.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": 
"TheBloke/WizardCoder-Python-7B-V1.0-GGUF", + "model_file_name_template": "wizardcoder-python-7b-v1.0.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -4305,8 +5989,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/WizardCoder-Python-13B-V1.0-GGUF", - "model_file_name_template": "wizardcoder-python-13b-v1.0.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/WizardCoder-Python-13B-V1.0-GGUF", + "model_file_name_template": "wizardcoder-python-13b-v1.0.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -4325,8 +6013,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/WizardCoder-Python-34B-V1.0-GGUF", - "model_file_name_template": "wizardcoder-python-34b-v1.0.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/WizardCoder-Python-34B-V1.0-GGUF", + "model_file_name_template": "wizardcoder-python-34b-v1.0.{quantization}.gguf" + } + } } ], "chat_template": "{% for item in messages %}{% if loop.first and item['role'] == 'system' %}{{ item['content'] + '\n\n### ' }}{% elif loop.first %}{{ 'Below is an instruction that describes a task. Write a response that appropriately completes the request.\n\n### ' }}{% endif %}{% if item['role'] == 'user' %}{{ 'Instruction: ' + item['content'] + '\n\n### ' }}{% elif item['role'] == 'assistant' %}{{ 'Response: ' + item['content'] + '\n\n### ' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ 'Response: Let\\'s think step by step.' }}{% endif %}", @@ -4355,8 +6047,12 @@ "quantizations": [ "none" ], - "model_id": "gorilla-llm/gorilla-openfunctions-v2", - "model_revision": "0f91d705e64b77fb55e35a7eab5d03bf965c9b5c" + "model_hubs": { + "huggingface": { + "model_id": "gorilla-llm/gorilla-openfunctions-v2", + "model_revision": "0f91d705e64b77fb55e35a7eab5d03bf965c9b5c" + } + } }, { "model_format": "ggufv2", @@ -4373,8 +6069,12 @@ "Q5_K_S", "Q6_K" ], - "model_id": "gorilla-llm//gorilla-openfunctions-v2-GGUF", - "model_file_name_template": "gorilla-openfunctions-v2.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "gorilla-llm//gorilla-openfunctions-v2-GGUF", + "model_file_name_template": "gorilla-openfunctions-v2.{quantization}.gguf" + } + } } ], "chat_template": "{% if not add_generation_prompt is defined %}\n{% set add_generation_prompt = false %}\n{% endif %}\n{%- set ns = namespace(found=false) -%}\n{%- for message in messages -%}\n {%- if message['role'] == 'system' -%}\n {%- set ns.found = true -%}\n {%- endif -%}\n{%- endfor -%}\n{{'<|begin▁of▁sentence|>'}}{%- if not ns.found -%}\n{{'You are an AI programming assistant, utilizing the Gorilla LLM model, developed by Gorilla LLM, and you only answer questions related to computer science. 
For politically sensitive questions, security and privacy issues, and other non-computer science questions, you will refuse to answer\n'}}\n{%- endif %}\n{%- for message in messages %}\n {%- if message['role'] == 'system' %}\n{{ message['content'] }}\n {%- else %}\n {%- if message['role'] == 'user' %}\n{{'### Instruction:\n' + message['content'] + '\n'}}\n {%- else %}\n{{'### Response:\n' + message['content'] + '\n<|EOT|>\n'}}\n {%- endif %}\n {%- endif %}\n{%- endfor %}\n{% if add_generation_prompt %}\n{{'### Response:'}}\n{% endif %}", @@ -4407,8 +6107,15 @@ "quantizations": [ "none" ], - "model_id": "deepseek-ai/deepseek-vl-1.3b-chat", - "model_revision": "8f13a8e00dbdc381d614a9d29d61b07e8fe91b3f" + "model_hubs": { + "huggingface": { + "model_id": "deepseek-ai/deepseek-vl-1.3b-chat", + "model_revision": "8f13a8e00dbdc381d614a9d29d61b07e8fe91b3f" + }, + "modelscope": { + "model_id": "deepseek-ai/deepseek-vl-1.3b-chat" + } + } }, { "model_format": "pytorch", @@ -4416,8 +6123,15 @@ "quantizations": [ "none" ], - "model_id": "deepseek-ai/deepseek-vl-7b-chat", - "model_revision": "6f16f00805f45b5249f709ce21820122eeb43556" + "model_hubs": { + "huggingface": { + "model_id": "deepseek-ai/deepseek-vl-7b-chat", + "model_revision": "6f16f00805f45b5249f709ce21820122eeb43556" + }, + "modelscope": { + "model_id": "deepseek-ai/deepseek-vl-7b-chat" + } + } } ], "chat_template": "", @@ -4449,8 +6163,15 @@ "8-bit", "none" ], - "model_id": "deepseek-ai/deepseek-llm-7b-base", - "model_revision": "7683fea62db869066ddaff6a41d032262c490d4f" + "model_hubs": { + "huggingface": { + "model_id": "deepseek-ai/deepseek-llm-7b-base", + "model_revision": "7683fea62db869066ddaff6a41d032262c490d4f" + }, + "modelscope": { + "model_id": "deepseek-ai/deepseek-llm-7b-base" + } + } }, { "model_format": "pytorch", @@ -4460,8 +6181,15 @@ "8-bit", "none" ], - "model_id": "deepseek-ai/deepseek-llm-67b-base", - "model_revision": "c3f813a1121c95488a20132d3a4da89f4a46452f" + "model_hubs": { + "huggingface": { + "model_id": "deepseek-ai/deepseek-llm-67b-base", + "model_revision": "c3f813a1121c95488a20132d3a4da89f4a46452f" + }, + "modelscope": { + "model_id": "deepseek-ai/deepseek-llm-67b-base" + } + } }, { "model_format": "ggufv2", @@ -4480,8 +6208,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/deepseek-llm-7B-chat-GGUF", - "model_file_name_template": "deepseek-llm-7b-chat.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-llm-7B-chat-GGUF", + "model_file_name_template": "deepseek-llm-7b-chat.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -4500,8 +6232,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/deepseek-llm-67b-chat-GGUF", - "model_file_name_template": "deepseek-llm-67b-chat.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-llm-67b-chat-GGUF", + "model_file_name_template": "deepseek-llm-67b-chat.{quantization}.gguf" + } + } } ] }, @@ -4526,8 +6262,15 @@ "8-bit", "none" ], - "model_id": "deepseek-ai/deepseek-llm-7b-chat", - "model_revision": "afbda8b347ec881666061fa67447046fc5164ec8" + "model_hubs": { + "huggingface": { + "model_id": "deepseek-ai/deepseek-llm-7b-chat", + "model_revision": "afbda8b347ec881666061fa67447046fc5164ec8" + }, + "modelscope": { + "model_id": "deepseek-ai/deepseek-llm-7b-chat" + } + } }, { "model_format": "pytorch", @@ -4537,8 +6280,15 @@ "8-bit", "none" ], - "model_id": "deepseek-ai/deepseek-llm-67b-chat", - "model_revision": "79648bef7658bb824e4630740f6e1484c1b0620b" + "model_hubs": { + "huggingface": { + 
"model_id": "deepseek-ai/deepseek-llm-67b-chat", + "model_revision": "79648bef7658bb824e4630740f6e1484c1b0620b" + }, + "modelscope": { + "model_id": "deepseek-ai/deepseek-llm-67b-chat" + } + } }, { "model_format": "ggufv2", @@ -4557,8 +6307,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/deepseek-llm-7B-chat-GGUF", - "model_file_name_template": "deepseek-llm-7b-chat.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-llm-7B-chat-GGUF", + "model_file_name_template": "deepseek-llm-7b-chat.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -4577,8 +6331,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/deepseek-llm-67b-chat-GGUF", - "model_file_name_template": "deepseek-llm-67b-chat.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-llm-67b-chat-GGUF", + "model_file_name_template": "deepseek-llm-67b-chat.{quantization}.gguf" + } + } } ], "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{{ '<|begin▁of▁sentence|>' }}{% for message in messages %}{% if message['role'] == 'user' %}{{ 'User: ' + message['content'] + '\n\n' }}{% elif message['role'] == 'assistant' %}{{ 'Assistant: ' + message['content'] + '<|end▁of▁sentence|>' }}{% elif message['role'] == 'system' %}{{ message['content'] + '\n\n' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ 'Assistant:' }}{% endif %}", @@ -4610,8 +6368,15 @@ "8-bit", "none" ], - "model_id": "deepseek-ai/deepseek-coder-1.3b-base", - "model_revision": "c919139c3a9b4070729c8b2cca4847ab29ca8d94" + "model_hubs": { + "huggingface": { + "model_id": "deepseek-ai/deepseek-coder-1.3b-base", + "model_revision": "c919139c3a9b4070729c8b2cca4847ab29ca8d94" + }, + "modelscope": { + "model_id": "deepseek-ai/deepseek-coder-1.3b-base" + } + } }, { "model_format": "pytorch", @@ -4621,8 +6386,15 @@ "8-bit", "none" ], - "model_id": "deepseek-ai/deepseek-coder-6.7b-base", - "model_revision": "ce2207a8bfef3ee92bd7dd4cc31c52cfa0046912" + "model_hubs": { + "huggingface": { + "model_id": "deepseek-ai/deepseek-coder-6.7b-base", + "model_revision": "ce2207a8bfef3ee92bd7dd4cc31c52cfa0046912" + }, + "modelscope": { + "model_id": "deepseek-ai/deepseek-coder-6.7b-base" + } + } }, { "model_format": "pytorch", @@ -4632,8 +6404,12 @@ "8-bit", "none" ], - "model_id": "deepseek-ai/deepseek-coder-7b-base-v1.5", - "model_revision": "98f0904cee2237e235f10408ae12292037b21dac" + "model_hubs": { + "huggingface": { + "model_id": "deepseek-ai/deepseek-coder-7b-base-v1.5", + "model_revision": "98f0904cee2237e235f10408ae12292037b21dac" + } + } }, { "model_format": "pytorch", @@ -4643,8 +6419,15 @@ "8-bit", "none" ], - "model_id": "deepseek-ai/deepseek-coder-33b-base", - "model_revision": "45c85cadf3720ef3e85a492e24fd4b8c5d21d8ac" + "model_hubs": { + "huggingface": { + "model_id": "deepseek-ai/deepseek-coder-33b-base", + "model_revision": "45c85cadf3720ef3e85a492e24fd4b8c5d21d8ac" + }, + "modelscope": { + "model_id": "deepseek-ai/deepseek-coder-33b-base" + } + } }, { "model_format": "ggufv2", @@ -4663,8 +6446,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/deepseek-coder-1.3b-base-GGUF", - "model_file_name_template": "deepseek-coder-1.3b-base.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-1.3b-base-GGUF", + "model_file_name_template": "deepseek-coder-1.3b-base.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -4683,8 +6470,12 @@ "Q6_K", "Q8_0" ], - "model_id": 
"TheBloke/deepseek-coder-6.7B-base-GGUF", - "model_file_name_template": "deepseek-coder-6.7b-base.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-6.7B-base-GGUF", + "model_file_name_template": "deepseek-coder-6.7b-base.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -4702,8 +6493,12 @@ "Q6_K", "Q8_0" ], - "model_id": "dagbs/deepseek-coder-7b-base-v1.5-GGUF", - "model_file_name_template": "deepseek-coder-7b-base-v1.5.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "dagbs/deepseek-coder-7b-base-v1.5-GGUF", + "model_file_name_template": "deepseek-coder-7b-base-v1.5.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -4722,8 +6517,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/deepseek-coder-33B-base-GGUF", - "model_file_name_template": "deepseek-coder-33b-base.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-33B-base-GGUF", + "model_file_name_template": "deepseek-coder-33b-base.{quantization}.gguf" + } + } }, { "model_format": "gptq", @@ -4731,8 +6530,12 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/deepseek-coder-1.3b-base-GPTQ", - "model_revision": "a5bf3b76d70cda53327311a631b1003024d5de29" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-1.3b-base-GPTQ", + "model_revision": "a5bf3b76d70cda53327311a631b1003024d5de29" + } + } }, { "model_format": "gptq", @@ -4740,8 +6543,12 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/deepseek-coder-6.7B-base-GPTQ", - "model_revision": "6476ea3d6e623a1313d363dbc6e172773e031bb1" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-6.7B-base-GPTQ", + "model_revision": "6476ea3d6e623a1313d363dbc6e172773e031bb1" + } + } }, { "model_format": "gptq", @@ -4749,8 +6556,12 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/deepseek-coder-33B-base-GPTQ", - "model_revision": "f527d7325e463a5cb091d044e4f2b15902674a70" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-33B-base-GPTQ", + "model_revision": "f527d7325e463a5cb091d044e4f2b15902674a70" + } + } }, { "model_format": "awq", @@ -4758,8 +6569,12 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/deepseek-coder-1.3b-base-AWQ", - "model_revision": "ffb66f1a2a194401b4f29025edcd261d7f0a08a7" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-1.3b-base-AWQ", + "model_revision": "ffb66f1a2a194401b4f29025edcd261d7f0a08a7" + } + } }, { "model_format": "awq", @@ -4767,8 +6582,12 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/deepseek-coder-6.7B-base-AWQ", - "model_revision": "e3d4bdf39712665f5e9d5c05c9df6f20fe1e2d5a" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-6.7B-base-AWQ", + "model_revision": "e3d4bdf39712665f5e9d5c05c9df6f20fe1e2d5a" + } + } }, { "model_format": "awq", @@ -4776,8 +6595,12 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/deepseek-coder-33B-base-AWQ", - "model_revision": "c7edb2d5868d61a5dcf2591933a8992c8cbe3ef4" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-33B-base-AWQ", + "model_revision": "c7edb2d5868d61a5dcf2591933a8992c8cbe3ef4" + } + } } ] }, @@ -4802,8 +6625,15 @@ "8-bit", "none" ], - "model_id": "deepseek-ai/deepseek-coder-1.3b-instruct", - "model_revision": "2df081ceaca101a867fef2844e44f4d6a4857039" + "model_hubs": { + "huggingface": { + "model_id": "deepseek-ai/deepseek-coder-1.3b-instruct", + "model_revision": 
"2df081ceaca101a867fef2844e44f4d6a4857039" + }, + "modelscope": { + "model_id": "deepseek-ai/deepseek-coder-1.3b-instruct" + } + } }, { "model_format": "pytorch", @@ -4813,8 +6643,15 @@ "8-bit", "none" ], - "model_id": "deepseek-ai/deepseek-coder-6.7b-instruct", - "model_revision": "cbb77d7448ea3168d884758817e7f895e3828d1c" + "model_hubs": { + "huggingface": { + "model_id": "deepseek-ai/deepseek-coder-6.7b-instruct", + "model_revision": "cbb77d7448ea3168d884758817e7f895e3828d1c" + }, + "modelscope": { + "model_id": "deepseek-ai/deepseek-coder-6.7b-instruct" + } + } }, { "model_format": "pytorch", @@ -4824,8 +6661,12 @@ "8-bit", "none" ], - "model_id": "deepseek-ai/deepseek-coder-7b-instruct-v1.5", - "model_revision": "2a050a4c59d687a85324d32e147517992117ed30" + "model_hubs": { + "huggingface": { + "model_id": "deepseek-ai/deepseek-coder-7b-instruct-v1.5", + "model_revision": "2a050a4c59d687a85324d32e147517992117ed30" + } + } }, { "model_format": "pytorch", @@ -4835,8 +6676,15 @@ "8-bit", "none" ], - "model_id": "deepseek-ai/deepseek-coder-33b-instruct", - "model_revision": "ea15d17db84d1fc94ac5cba8e6fa97764c9549d3" + "model_hubs": { + "huggingface": { + "model_id": "deepseek-ai/deepseek-coder-33b-instruct", + "model_revision": "ea15d17db84d1fc94ac5cba8e6fa97764c9549d3" + }, + "modelscope": { + "model_id": "deepseek-ai/deepseek-coder-33b-instruct" + } + } }, { "model_format": "ggufv2", @@ -4855,8 +6703,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/deepseek-coder-1.3b-instruct-GGUF", - "model_file_name_template": "deepseek-coder-1.3b-instruct.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-1.3b-instruct-GGUF", + "model_file_name_template": "deepseek-coder-1.3b-instruct.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -4875,8 +6727,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/deepseek-coder-6.7B-instruct-GGUF", - "model_file_name_template": "deepseek-coder-6.7b-instruct.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-6.7B-instruct-GGUF", + "model_file_name_template": "deepseek-coder-6.7b-instruct.{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -4894,8 +6750,12 @@ "Q6_K", "Q8_0" ], - "model_id": "LoneStriker/deepseek-coder-7b-instruct-v1.5-GGUF", - "model_file_name_template": "deepseek-coder-7b-instruct-v1.5-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "LoneStriker/deepseek-coder-7b-instruct-v1.5-GGUF", + "model_file_name_template": "deepseek-coder-7b-instruct-v1.5-{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -4914,8 +6774,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/deepseek-coder-33B-instruct-GGUF", - "model_file_name_template": "deepseek-coder-33b-instruct.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-33B-instruct-GGUF", + "model_file_name_template": "deepseek-coder-33b-instruct.{quantization}.gguf" + } + } }, { "model_format": "gptq", @@ -4923,8 +6787,12 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/deepseek-coder-1.3b-instruct-GPTQ", - "model_revision": "9c002e9af6cbdf3bd9244e2d7264b6a35d1dcacf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-1.3b-instruct-GPTQ", + "model_revision": "9c002e9af6cbdf3bd9244e2d7264b6a35d1dcacf" + } + } }, { "model_format": "gptq", @@ -4932,8 +6800,12 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/deepseek-coder-6.7B-instruct-GPTQ", - "model_revision": 
"13ccea6e3a43dcfdcb655d92097610018b431a17" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-6.7B-instruct-GPTQ", + "model_revision": "13ccea6e3a43dcfdcb655d92097610018b431a17" + } + } }, { "model_format": "gptq", @@ -4941,8 +6813,12 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/deepseek-coder-33B-instruct-GPTQ", - "model_revision": "08372729d98dfc248f9531a412fe69e14e607027" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-33B-instruct-GPTQ", + "model_revision": "08372729d98dfc248f9531a412fe69e14e607027" + } + } }, { "model_format": "awq", @@ -4950,8 +6826,12 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/deepseek-coder-1.3b-instruct-AWQ", - "model_revision": "a2a484da6e4146d055316a9a63cf5b13955715a4" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-1.3b-instruct-AWQ", + "model_revision": "a2a484da6e4146d055316a9a63cf5b13955715a4" + } + } }, { "model_format": "awq", @@ -4959,8 +6839,12 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/deepseek-coder-6.7B-instruct-AWQ", - "model_revision": "502ae3e19e57ae78dc30a791ba33c565da72dc62" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-6.7B-instruct-AWQ", + "model_revision": "502ae3e19e57ae78dc30a791ba33c565da72dc62" + } + } }, { "model_format": "awq", @@ -4968,8 +6852,12 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/deepseek-coder-33B-instruct-AWQ", - "model_revision": "c40b499bac2712cd3c445cf1b05d2c6558ab0d29" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/deepseek-coder-33B-instruct-AWQ", + "model_revision": "c40b499bac2712cd3c445cf1b05d2c6558ab0d29" + } + } } ], "chat_template": "{% if not add_generation_prompt is defined %}\n{% set add_generation_prompt = false %}\n{% endif %}\n{%- set ns = namespace(found=false) -%}\n{%- for message in messages -%}\n {%- if message['role'] == 'system' -%}\n {%- set ns.found = true -%}\n {%- endif -%}\n{%- endfor -%}\n{{'<|begin▁of▁sentence|>'}}{%- if not ns.found -%}\n{{'You are an AI programming assistant, utilizing the Deepseek Coder model, developed by Deepseek Company, and you only answer questions related to computer science. 
For politically sensitive questions, security and privacy issues, and other non-computer science questions, you will refuse to answer\n'}}\n{%- endif %}\n{%- for message in messages %}\n {%- if message['role'] == 'system' %}\n{{ message['content'] }}\n {%- else %}\n {%- if message['role'] == 'user' %}\n{{'### Instruction:\n' + message['content'] + '\n'}}\n {%- else %}\n{{'### Response:\n' + message['content'] + '\n<|EOT|>\n'}}\n {%- endif %}\n {%- endif %}\n{%- endfor %}\n{% if add_generation_prompt %}\n{{'### Response:'}}\n{% endif %}", @@ -5000,8 +6888,16 @@ "8-bit", "none" ], - "model_id": "skywork/Skywork-13B-base", - "model_revision": "bc35915066fbbf15b77a1a4a74e9b574ab167816" + "model_hubs": { + "huggingface": { + "model_id": "skywork/Skywork-13B-base", + "model_revision": "bc35915066fbbf15b77a1a4a74e9b574ab167816" + }, + "modelscope": { + "model_id": "skywork/Skywork-13B-base", + "model_revision": "master" + } + } } ] }, @@ -5025,8 +6921,16 @@ "8-bit", "none" ], - "model_id": "skywork/Skywork-13B-Math", - "model_revision": "70d1740208c8ba39f9ba250b22117ec25311ab33" + "model_hubs": { + "huggingface": { + "model_id": "skywork/Skywork-13B-Math", + "model_revision": "70d1740208c8ba39f9ba250b22117ec25311ab33" + }, + "modelscope": { + "model_id": "skywork/Skywork-13B-Math", + "model_revision": "master" + } + } } ] }, @@ -5049,8 +6953,16 @@ "quantizations": [ "none" ], - "model_id": "internlm/internlm2-chat-7b", - "model_revision": "2292b86b21cb856642782cebed0a453997453b1f" + "model_hubs": { + "huggingface": { + "model_id": "internlm/internlm2-chat-7b", + "model_revision": "2292b86b21cb856642782cebed0a453997453b1f" + }, + "modelscope": { + "model_id": "Shanghai_AI_Laboratory/internlm2-chat-7b", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -5058,8 +6970,16 @@ "quantizations": [ "none" ], - "model_id": "internlm/internlm2-chat-20b", - "model_revision": "b666125047cd98c5a7c85ca28720b44a06aed124" + "model_hubs": { + "huggingface": { + "model_id": "internlm/internlm2-chat-20b", + "model_revision": "b666125047cd98c5a7c85ca28720b44a06aed124" + }, + "modelscope": { + "model_id": "Shanghai_AI_Laboratory/internlm2-chat-20b", + "model_revision": "master" + } + } } ], "chat_template": "{{ '' }}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", @@ -5091,8 +7011,15 @@ "quantizations": [ "none" ], - "model_id": "internlm/internlm2_5-1_8b-chat", - "model_revision": "4426f00b854561fa60d555d2b628064b56bcb758" + "model_hubs": { + "huggingface": { + "model_id": "internlm/internlm2_5-1_8b-chat", + "model_revision": "4426f00b854561fa60d555d2b628064b56bcb758" + }, + "modelscope": { + "model_id": "Shanghai_AI_Laboratory/internlm2_5-1_8b-chat" + } + } }, { "model_format": "pytorch", @@ -5100,8 +7027,15 @@ "quantizations": [ "none" ], - "model_id": "internlm/internlm2_5-7b-chat", - "model_revision": "9dc8536a922ab4954726aad1b37fa199004a291a" + "model_hubs": { + "huggingface": { + "model_id": "internlm/internlm2_5-7b-chat", + "model_revision": "9dc8536a922ab4954726aad1b37fa199004a291a" + }, + "modelscope": { + "model_id": "Shanghai_AI_Laboratory/internlm2_5-7b-chat" + } + } }, { "model_format": "pytorch", @@ -5109,8 +7043,15 @@ "quantizations": [ "none" ], - "model_id": "internlm/internlm2_5-20b-chat", - "model_revision": "ef17bde929761255fee76d95e2c25969ccd93b0d" + "model_hubs": { + "huggingface": { + "model_id": 
"internlm/internlm2_5-20b-chat", + "model_revision": "ef17bde929761255fee76d95e2c25969ccd93b0d" + }, + "modelscope": { + "model_id": "Shanghai_AI_Laboratory/internlm2_5-20b-chat" + } + } }, { "model_format": "gptq", @@ -5118,8 +7059,12 @@ "quantizations": [ "Int4" ], - "model_id": "ModelCloud/internlm-2.5-7b-chat-gptq-4bit", - "model_revision": "2e2dda735c326544921a4035bbeb6c6e316a8254" + "model_hubs": { + "huggingface": { + "model_id": "ModelCloud/internlm-2.5-7b-chat-gptq-4bit", + "model_revision": "2e2dda735c326544921a4035bbeb6c6e316a8254" + } + } }, { "model_format": "ggufv2", @@ -5135,8 +7080,12 @@ "q8_0", "fp16" ], - "model_id": "internlm/internlm2_5-1_8b-chat-gguf", - "model_file_name_template": "internlm2_5-1_8b-chat-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "internlm/internlm2_5-1_8b-chat-gguf", + "model_file_name_template": "internlm2_5-1_8b-chat-{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -5152,8 +7101,16 @@ "q8_0", "fp16" ], - "model_id": "internlm/internlm2_5-7b-chat-gguf", - "model_file_name_template": "internlm2_5-7b-chat-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "internlm/internlm2_5-7b-chat-gguf", + "model_file_name_template": "internlm2_5-7b-chat-{quantization}.gguf" + }, + "modelscope": { + "model_id": "Shanghai_AI_Laboratory/internlm2_5-7b-chat-gguf", + "model_file_name_template": "internlm2_5-7b-chat-{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -5169,8 +7126,12 @@ "q8_0", "fp16" ], - "model_id": "internlm/internlm2_5-20b-chat-gguf", - "model_file_name_template": "internlm2_5-20b-chat-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "internlm/internlm2_5-20b-chat-gguf", + "model_file_name_template": "internlm2_5-20b-chat-{quantization}.gguf" + } + } }, { "model_format": "mlx", @@ -5178,8 +7139,12 @@ "quantizations": [ "4-bit" ], - "model_id": "mlx-community/internlm2_5-7b-chat-4bit", - "model_revision": "d12097a867721978142a6048399f470a3d18beee" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/internlm2_5-7b-chat-4bit", + "model_revision": "d12097a867721978142a6048399f470a3d18beee" + } + } }, { "model_format": "mlx", @@ -5187,8 +7152,12 @@ "quantizations": [ "8-bit" ], - "model_id": "mlx-community/internlm2_5-7b-chat-8bit", - "model_revision": "0ec94d61d30ab161b49c69f9bf92ec2b9986d234" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/internlm2_5-7b-chat-8bit", + "model_revision": "0ec94d61d30ab161b49c69f9bf92ec2b9986d234" + } + } } ], "chat_template": "{{ '' }}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", @@ -5220,8 +7189,15 @@ "quantizations": [ "none" ], - "model_id": "internlm/internlm2_5-7b-chat-1m", - "model_revision": "8d1a709a04d71440ef3df6ebbe204672f411c8b6" + "model_hubs": { + "huggingface": { + "model_id": "internlm/internlm2_5-7b-chat-1m", + "model_revision": "8d1a709a04d71440ef3df6ebbe204672f411c8b6" + }, + "modelscope": { + "model_id": "Shanghai_AI_Laboratory/internlm2_5-7b-chat-1m" + } + } }, { "model_format": "gptq", @@ -5229,8 +7205,12 @@ "quantizations": [ "Int4" ], - "model_id": "ModelCloud/internlm-2.5-7b-chat-1m-gptq-4bit", - "model_revision": "022e59cb30f03b271d56178478acb038b2b9b58c" + "model_hubs": { + "huggingface": { + "model_id": "ModelCloud/internlm-2.5-7b-chat-1m-gptq-4bit", + "model_revision": "022e59cb30f03b271d56178478acb038b2b9b58c" + 
} + } }, { "model_format": "ggufv2", @@ -5246,8 +7226,12 @@ "q8_0", "fp16" ], - "model_id": "internlm/internlm2_5-7b-chat-1m-gguf", - "model_file_name_template": "internlm2_5-7b-chat-1m-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "internlm/internlm2_5-7b-chat-1m-gguf", + "model_file_name_template": "internlm2_5-7b-chat-1m-{quantization}.gguf" + } + } } ], "chat_template": "{{ '' }}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", @@ -5261,36 +7245,52 @@ ] }, { - "version":1, - "context_length":2048, - "model_name":"OmniLMM", - "model_lang":[ + "version": 1, + "context_length": 2048, + "model_name": "OmniLMM", + "model_lang": [ "en", "zh" ], - "model_ability":[ + "model_ability": [ "chat", "vision" ], - "model_description":"OmniLMM is a family of open-source large multimodal models (LMMs) adept at vision & language modeling.", - "model_specs":[ + "model_description": "OmniLMM is a family of open-source large multimodal models (LMMs) adept at vision & language modeling.", + "model_specs": [ { - "model_format":"pytorch", - "model_size_in_billions":3, - "quantizations":[ + "model_format": "pytorch", + "model_size_in_billions": 3, + "quantizations": [ "none" ], - "model_id":"openbmb/MiniCPM-V", - "model_revision":"bec7d1cd1c9e804c064ec291163e40624825eaaa" + "model_hubs": { + "huggingface": { + "model_id": "openbmb/MiniCPM-V", + "model_revision": "bec7d1cd1c9e804c064ec291163e40624825eaaa" + }, + "modelscope": { + "model_id": "OpenBMB/MiniCPM-V", + "model_revision": "master" + } + } }, { - "model_format":"pytorch", - "model_size_in_billions":12, - "quantizations":[ + "model_format": "pytorch", + "model_size_in_billions": 12, + "quantizations": [ "none" ], - "model_id":"openbmb/OmniLMM-12B", - "model_revision":"ef62bae5af34be653b9801037cd613e05ab24fdc" + "model_hubs": { + "huggingface": { + "model_id": "openbmb/OmniLMM-12B", + "model_revision": "ef62bae5af34be653b9801037cd613e05ab24fdc" + }, + "modelscope": { + "model_id": "OpenBMB/OmniLMM-12B", + "model_revision": "master" + } + } } ], "chat_template": "", @@ -5302,36 +7302,48 @@ ] }, { - "version":1, - "context_length":8192, - "model_name":"MiniCPM-Llama3-V-2_5", - "model_lang":[ + "version": 1, + "context_length": 8192, + "model_name": "MiniCPM-Llama3-V-2_5", + "model_lang": [ "en", "zh" ], - "model_ability":[ + "model_ability": [ "chat", "vision" ], - "model_description":"MiniCPM-Llama3-V 2.5 is the latest model in the MiniCPM-V series. The model is built on SigLip-400M and Llama3-8B-Instruct with a total of 8B parameters.", - "model_specs":[ + "model_description": "MiniCPM-Llama3-V 2.5 is the latest model in the MiniCPM-V series. 
The model is built on SigLip-400M and Llama3-8B-Instruct with a total of 8B parameters.", + "model_specs": [ { - "model_format":"pytorch", - "model_size_in_billions":8, - "quantizations":[ + "model_format": "pytorch", + "model_size_in_billions": 8, + "quantizations": [ "none" ], - "model_id":"openbmb/MiniCPM-Llama3-V-2_5", - "model_revision":"285a637ba8a30a0660dfcccad16f9a864f75abfd" + "model_hubs": { + "huggingface": { + "model_id": "openbmb/MiniCPM-Llama3-V-2_5", + "model_revision": "285a637ba8a30a0660dfcccad16f9a864f75abfd" + }, + "modelscope": { + "model_id": "OpenBMB/MiniCPM-Llama3-V-2_5", + "model_revision": "master" + } + } }, { - "model_format":"pytorch", - "model_size_in_billions":8, - "quantizations":[ + "model_format": "pytorch", + "model_size_in_billions": 8, + "quantizations": [ "int4" ], - "model_id":"openbmb/MiniCPM-Llama3-V-2_5-{quantization}", - "model_revision":"f92aff28552de35de3be204e8fe292dd4824e544" + "model_hubs": { + "huggingface": { + "model_id": "openbmb/MiniCPM-Llama3-V-2_5-{quantization}", + "model_revision": "f92aff28552de35de3be204e8fe292dd4824e544" + } + } } ], "chat_template": "{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = '<|begin_of_text|>' + content %}{% endif %}{{ content }}{% endfor %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}", @@ -5343,36 +7355,48 @@ ] }, { - "version":1, - "context_length":32768, - "model_name":"MiniCPM-V-2.6", - "model_lang":[ + "version": 1, + "context_length": 32768, + "model_name": "MiniCPM-V-2.6", + "model_lang": [ "en", "zh" ], - "model_ability":[ + "model_ability": [ "chat", "vision" ], - "model_description":"MiniCPM-V 2.6 is the latest model in the MiniCPM-V series. The model is built on SigLip-400M and Qwen2-7B with a total of 8B parameters.", - "model_specs":[ + "model_description": "MiniCPM-V 2.6 is the latest model in the MiniCPM-V series. 
The model is built on SigLip-400M and Qwen2-7B with a total of 8B parameters.", + "model_specs": [ { - "model_format":"pytorch", - "model_size_in_billions":8, - "quantizations":[ + "model_format": "pytorch", + "model_size_in_billions": 8, + "quantizations": [ "none" ], - "model_id":"openbmb/MiniCPM-V-2_6", - "model_revision":"3f7a8da1b7a8b928b5ee229fae33cf43fd64cf31" + "model_hubs": { + "huggingface": { + "model_id": "openbmb/MiniCPM-V-2_6", + "model_revision": "3f7a8da1b7a8b928b5ee229fae33cf43fd64cf31" + }, + "modelscope": { + "model_id": "OpenBMB/MiniCPM-V-2_6", + "model_revision": "master" + } + } }, { - "model_format":"pytorch", - "model_size_in_billions":8, - "quantizations":[ + "model_format": "pytorch", + "model_size_in_billions": 8, + "quantizations": [ "4-bit" ], - "model_id":"openbmb/MiniCPM-V-2_6-int4", - "model_revision":"051e2df6505f1fc4305f2c9bd42ed90db8bf4874" + "model_hubs": { + "huggingface": { + "model_id": "openbmb/MiniCPM-V-2_6-int4", + "model_revision": "051e2df6505f1fc4305f2c9bd42ed90db8bf4874" + } + } } ], "chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", @@ -5405,8 +7429,16 @@ "quantizations": [ "none" ], - "model_id": "Qwen/Qwen-VL-Chat", - "model_revision": "6665c780ade5ff3f08853b4262dcb9c8f9598d42" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen-VL-Chat", + "model_revision": "6665c780ade5ff3f08853b4262dcb9c8f9598d42" + }, + "modelscope": { + "model_id": "Qwen/Qwen-VL-Chat", + "model_revision": "master" + } + } }, { "model_format": "gptq", @@ -5414,8 +7446,16 @@ "quantizations": [ "Int4" ], - "model_id": "Qwen/Qwen-VL-Chat-{quantization}", - "model_revision": "5d3a5aa033ed2c502300d426c81cc5b13bcd1409" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen-VL-Chat-{quantization}", + "model_revision": "5d3a5aa033ed2c502300d426c81cc5b13bcd1409" + }, + "modelscope": { + "model_id": "Qwen/Qwen-VL-Chat-{quantization}", + "model_revision": "master" + } + } } ], "chat_template": "", @@ -5451,8 +7491,15 @@ "4-bit", "8-bit" ], - "model_id": "OrionStarAI/Orion-14B-Chat", - "model_revision": "ea6fb9b7e1917f3693935accbeb0bfecfd6552a7" + "model_hubs": { + "huggingface": { + "model_id": "OrionStarAI/Orion-14B-Chat", + "model_revision": "ea6fb9b7e1917f3693935accbeb0bfecfd6552a7" + }, + "modelscope": { + "model_id": "OrionStarAI/Orion-14B-Chat" + } + } }, { "model_format": "awq", @@ -5460,7 +7507,14 @@ "quantizations": [ "Int4" ], - "model_id": "OrionStarAI/Orion-14B-Chat-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "OrionStarAI/Orion-14B-Chat-{quantization}" + }, + "modelscope": { + "model_id": "OrionStarAI/Orion-14B-Chat-{quantization}" + } + } } ], "chat_template": "{% for message in messages %}{% if loop.first %}{{ '' }}{% endif %}{% if message['role'] == 'user' %}{{ 'Human: ' + message['content'] + '\n\nAssistant: ' + '' }}{% elif message['role'] == 'assistant' %}{{ message['content'] + '' }}{% endif %}{% endfor %}", @@ -5496,8 +7550,15 @@ "4-bit", "8-bit" ], - "model_id": "OrionStarAI/Orion-14B-Chat-RAG", - "model_revision": "eba2e20808407fb431a76b90d5d506e04a0325f2" + "model_hubs": { + "huggingface": { + "model_id": "OrionStarAI/Orion-14B-Chat-RAG", + "model_revision": "eba2e20808407fb431a76b90d5d506e04a0325f2" + }, 
"modelscope": { + "model_id": "OrionStarAI/Orion-14B-Chat-RAG" + } + } } ], "chat_template": "{% for message in messages %}{% if loop.first %}{{ '' }}{% endif %}{% if message['role'] == 'user' %}{{ 'Human: ' + message['content'] + '\n\nAssistant: ' + '' }}{% elif message['role'] == 'assistant' %}{{ message['content'] + '' }}{% endif %}{% endfor %}", @@ -5532,8 +7593,15 @@ "quantizations": [ "none" ], - "model_id": "01-ai/Yi-VL-6B", - "model_revision": "897c938da1ec860330e2ba2d425ab3004495ba38" + "model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-VL-6B", + "model_revision": "897c938da1ec860330e2ba2d425ab3004495ba38" + }, + "modelscope": { + "model_id": "01ai/Yi-VL-6B" + } + } }, { "model_format": "pytorch", @@ -5541,8 +7609,15 @@ "quantizations": [ "none" ], - "model_id": "01-ai/Yi-VL-34B", - "model_revision": "ea29a9a430f27893e780366dae81d4ca5ebab561" + "model_hubs": { + "huggingface": { + "model_id": "01-ai/Yi-VL-34B", + "model_revision": "ea29a9a430f27893e780366dae81d4ca5ebab561" + }, + "modelscope": { + "model_id": "01ai/Yi-VL-34B" + } + } } ], "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", @@ -5579,7 +7654,14 @@ "4-bit", "8-bit" ], - "model_id": "google/gemma-2b-it" + "model_hubs": { + "huggingface": { + "model_id": "google/gemma-2b-it" + }, + "modelscope": { + "model_id": "AI-ModelScope/gemma-2b-it" + } + } }, { "model_format": "pytorch", @@ -5589,7 +7671,14 @@ "4-bit", "8-bit" ], - "model_id": "google/gemma-7b-it" + "model_hubs": { + "huggingface": { + "model_id": "google/gemma-7b-it" + }, + "modelscope": { + "model_id": "AI-ModelScope/gemma-7b-it" + } + } } ], "chat_template": "{{ '' }}{% if messages[0]['role'] == 'system' %}{{ raise_exception('System role not supported') }}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if (message['role'] == 'assistant') %}{% set role = 'model' %}{% else %}{% set role = message['role'] %}{% endif %}{{ '' + role + '\n' + message['content'] | trim + '\n' }}{% endfor %}{% if add_generation_prompt %}{{'model\n'}}{% endif %}", @@ -5624,7 +7713,14 @@ "4-bit", "8-bit" ], - "model_id": "google/gemma-2-2b-it" + "model_hubs": { + "huggingface": { + "model_id": "google/gemma-2-2b-it" + }, + "modelscope": { + "model_id": "LLM-Research/gemma-2-2b-it" + } + } }, { "model_format": "pytorch", @@ -5634,7 +7730,14 @@ "4-bit", "8-bit" ], - "model_id": "google/gemma-2-9b-it" + "model_hubs": { + "huggingface": { + "model_id": "google/gemma-2-9b-it" + }, + "modelscope": { + "model_id": "AI-ModelScope/gemma-2-9b-it" + } + } }, { "model_format": "pytorch", @@ -5644,7 +7747,14 @@ "4-bit", "8-bit" ], - "model_id": "google/gemma-2-27b-it" + "model_hubs": { + "huggingface": { + "model_id": "google/gemma-2-27b-it" + }, + "modelscope": { + "model_id": "AI-ModelScope/gemma-2-27b-it" + } + } }, { "model_format": "ggufv2", @@ -5660,8 +7770,12 @@ "Q8_0", "f32" ], - "model_id": "bartowski/gemma-2-2b-it-GGUF", - "model_file_name_template": "gemma-2-2b-it-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "bartowski/gemma-2-2b-it-GGUF", + "model_file_name_template": "gemma-2-2b-it-{quantization}.gguf" + } + } }, { "model_format": 
"ggufv2", @@ -5683,8 +7797,16 @@ "Q8_0", "f32" ], - "model_id": "bartowski/gemma-2-9b-it-GGUF", - "model_file_name_template": "gemma-2-9b-it-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "bartowski/gemma-2-9b-it-GGUF", + "model_file_name_template": "gemma-2-9b-it-{quantization}.gguf" + }, + "modelscope": { + "model_id": "LLM-Research/gemma-2-9b-it-GGUF", + "model_file_name_template": "gemma-2-9b-it-{quantization}.gguf" + } + } }, { "model_format": "ggufv2", @@ -5706,8 +7828,12 @@ "Q8_0", "f32" ], - "model_id": "bartowski/gemma-2-27b-it-GGUF", - "model_file_name_template": "gemma-2-27b-it-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "bartowski/gemma-2-27b-it-GGUF", + "model_file_name_template": "gemma-2-27b-it-{quantization}.gguf" + } + } }, { "model_format": "mlx", @@ -5715,7 +7841,11 @@ "quantizations": [ "4-bit" ], - "model_id": "mlx-community/gemma-2-2b-it-4bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/gemma-2-2b-it-4bit" + } + } }, { "model_format": "mlx", @@ -5723,7 +7853,11 @@ "quantizations": [ "8-bit" ], - "model_id": "mlx-community/gemma-2-2b-it-8bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/gemma-2-2b-it-8bit" + } + } }, { "model_format": "mlx", @@ -5731,7 +7865,11 @@ "quantizations": [ "None" ], - "model_id": "mlx-community/gemma-2-2b-it" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/gemma-2-2b-it" + } + } }, { "model_format": "mlx", @@ -5739,7 +7877,11 @@ "quantizations": [ "4-bit" ], - "model_id": "mlx-community/gemma-2-9b-it-4bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/gemma-2-9b-it-4bit" + } + } }, { "model_format": "mlx", @@ -5747,7 +7889,11 @@ "quantizations": [ "8-bit" ], - "model_id": "mlx-community/gemma-2-9b-it-8bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/gemma-2-9b-it-8bit" + } + } }, { "model_format": "mlx", @@ -5755,7 +7901,11 @@ "quantizations": [ "None" ], - "model_id": "mlx-community/gemma-2-9b-it-fp16" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/gemma-2-9b-it-fp16" + } + } }, { "model_format": "mlx", @@ -5763,7 +7913,11 @@ "quantizations": [ "4-bit" ], - "model_id": "mlx-community/gemma-2-27b-it-4bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/gemma-2-27b-it-4bit" + } + } }, { "model_format": "mlx", @@ -5771,7 +7925,11 @@ "quantizations": [ "8-bit" ], - "model_id": "mlx-community/gemma-2-27b-it-8bit" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/gemma-2-27b-it-8bit" + } + } }, { "model_format": "mlx", @@ -5779,7 +7937,11 @@ "quantizations": [ "None" ], - "model_id": "mlx-community/gemma-2-27b-it-fp16" + "model_hubs": { + "huggingface": { + "model_id": "mlx-community/gemma-2-27b-it-fp16" + } + } } ], "chat_template": "{{ '' }}{% if messages[0]['role'] == 'system' %}{{ raise_exception('System role not supported') }}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if (message['role'] == 'assistant') %}{% set role = 'model' %}{% else %}{% set role = message['role'] %}{% endif %}{{ '' + role + '\n' + message['content'] | trim + '\n' }}{% endfor %}{% if add_generation_prompt %}{{'model\n'}}{% endif %}", @@ -5812,8 +7974,12 @@ "quantizations": [ "none" ], - "model_id": "garage-bAInd/Platypus2-70B-instruct", - "model_revision": "31389b50953688e4e542be53e6d2ab04d5c34e87" + 
"model_hubs": { + "huggingface": { + "model_id": "garage-bAInd/Platypus2-70B-instruct", + "model_revision": "31389b50953688e4e542be53e6d2ab04d5c34e87" + } + } } ] }, @@ -5835,8 +8001,12 @@ "quantizations": [ "none" ], - "model_id": "BAAI/Aquila2-7B", - "model_revision": "9c76e143c6e9621689ca76e078c465b0dee75eb8" + "model_hubs": { + "huggingface": { + "model_id": "BAAI/Aquila2-7B", + "model_revision": "9c76e143c6e9621689ca76e078c465b0dee75eb8" + } + } }, { "model_format": "pytorch", @@ -5844,8 +8014,16 @@ "quantizations": [ "none" ], - "model_id": "BAAI/Aquila2-34B", - "model_revision": "356733caf6221e9dd898cde8ff189a98175526ec" + "model_hubs": { + "huggingface": { + "model_id": "BAAI/Aquila2-34B", + "model_revision": "356733caf6221e9dd898cde8ff189a98175526ec" + }, + "modelscope": { + "model_id": "BAAI/Aquila2-34B", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -5853,8 +8031,16 @@ "quantizations": [ "none" ], - "model_id": "BAAI/Aquila2-70B-Expr", - "model_revision": "32a2897235541b9f5238bbe88f8d76a19993c0ba" + "model_hubs": { + "huggingface": { + "model_id": "BAAI/Aquila2-70B-Expr", + "model_revision": "32a2897235541b9f5238bbe88f8d76a19993c0ba" + }, + "modelscope": { + "model_id": "BAAI/Aquila2-70B-Expr", + "model_revision": "master" + } + } } ] }, @@ -5876,8 +8062,12 @@ "quantizations": [ "none" ], - "model_id": "BAAI/AquilaChat2-7B", - "model_revision": "0d060c4edeb4e0febd81130c17f6868653184fb3" + "model_hubs": { + "huggingface": { + "model_id": "BAAI/AquilaChat2-7B", + "model_revision": "0d060c4edeb4e0febd81130c17f6868653184fb3" + } + } }, { "model_format": "ggufv2", @@ -5896,8 +8086,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/AquilaChat2-34B-GGUF", - "model_file_name_template": "aquilachat2-34b.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/AquilaChat2-34B-GGUF", + "model_file_name_template": "aquilachat2-34b.{quantization}.gguf" + } + } }, { "model_format": "gptq", @@ -5905,8 +8099,16 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/AquilaChat2-34B-GPTQ", - "model_revision": "9a9d21424f7db608be51df769885514ab6e052db" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/AquilaChat2-34B-GPTQ", + "model_revision": "9a9d21424f7db608be51df769885514ab6e052db" + }, + "modelscope": { + "model_id": "BAAI/AquilaChat2-34B-Int4-GPTQ", + "model_revision": "master" + } + } }, { "model_format": "awq", @@ -5914,8 +8116,12 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/AquilaChat2-34B-AWQ", - "model_revision": "ad1dec1c8adb7fa6cb07b7e261aaa04fccf1c4c0" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/AquilaChat2-34B-AWQ", + "model_revision": "ad1dec1c8adb7fa6cb07b7e261aaa04fccf1c4c0" + } + } }, { "model_format": "pytorch", @@ -5923,8 +8129,16 @@ "quantizations": [ "none" ], - "model_id": "BAAI/AquilaChat2-34B", - "model_revision": "b9cd9c7436435ab9cfa5e4f009be2b0354979ca8" + "model_hubs": { + "huggingface": { + "model_id": "BAAI/AquilaChat2-34B", + "model_revision": "b9cd9c7436435ab9cfa5e4f009be2b0354979ca8" + }, + "modelscope": { + "model_id": "BAAI/AquilaChat2-34B", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -5932,8 +8146,16 @@ "quantizations": [ "none" ], - "model_id": "BAAI/AquilaChat2-70B-Expr", - "model_revision": "0df19b6e10f1a19ca663f7cc1141aae10f1825f4" + "model_hubs": { + "huggingface": { + "model_id": "BAAI/AquilaChat2-70B-Expr", + "model_revision": "0df19b6e10f1a19ca663f7cc1141aae10f1825f4" + }, + "modelscope": { + "model_id": "BAAI/AquilaChat2-70B-Expr", + 
"model_revision": "master" + } + } } ], "chat_template": "{% for item in messages %}{% if loop.first and item['role'] == 'system' %}{{ item['content'] + '\n' }}{% endif %}{% if item['role'] == 'user' %}{{ 'USER: ' + item['content'] + '\n' }}{% elif item['role'] == 'assistant' %}{{ 'ASSISTANT: ' + item['content'] + '\n' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ 'ASSISTANT: ' }}{% endif %}", @@ -5964,8 +8186,12 @@ "quantizations": [ "none" ], - "model_id": "BAAI/AquilaChat2-7B-16K", - "model_revision": "fb46d48479d05086ccf6952f19018322fcbb54cd" + "model_hubs": { + "huggingface": { + "model_id": "BAAI/AquilaChat2-7B-16K", + "model_revision": "fb46d48479d05086ccf6952f19018322fcbb54cd" + } + } }, { "model_format": "ggufv2", @@ -5984,8 +8210,12 @@ "Q6_K", "Q8_0" ], - "model_id": "TheBloke/AquilaChat2-34B-16K-GGUF", - "model_file_name_template": "aquilachat2-34b-16k.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/AquilaChat2-34B-16K-GGUF", + "model_file_name_template": "aquilachat2-34b-16k.{quantization}.gguf" + } + } }, { "model_format": "gptq", @@ -5993,8 +8223,12 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/AquilaChat2-34B-16K-GPTQ", - "model_revision": "0afa1c2a55a4ee1a6f0dba81d9ec296dc7936b91" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/AquilaChat2-34B-16K-GPTQ", + "model_revision": "0afa1c2a55a4ee1a6f0dba81d9ec296dc7936b91" + } + } }, { "model_format": "awq", @@ -6002,8 +8236,12 @@ "quantizations": [ "Int4" ], - "model_id": "TheBloke/AquilaChat2-34B-16K-AWQ", - "model_revision": "db7403ca492416903c84a7a38b11cb5506de48b1" + "model_hubs": { + "huggingface": { + "model_id": "TheBloke/AquilaChat2-34B-16K-AWQ", + "model_revision": "db7403ca492416903c84a7a38b11cb5506de48b1" + } + } }, { "model_format": "pytorch", @@ -6011,8 +8249,16 @@ "quantizations": [ "none" ], - "model_id": "BAAI/AquilaChat2-34B-16K", - "model_revision": "a06fd164c7170714924d2881c61c8348425ebc94" + "model_hubs": { + "huggingface": { + "model_id": "BAAI/AquilaChat2-34B-16K", + "model_revision": "a06fd164c7170714924d2881c61c8348425ebc94" + }, + "modelscope": { + "model_id": "BAAI/AquilaChat2-34B-16K", + "model_revision": "master" + } + } } ], "chat_template": "{% for item in messages %}{% if loop.first and item['role'] == 'system' %}{{ item['content'] + '\n' }}{% endif %}{% if item['role'] == 'user' %}{{ 'USER: ' + item['content'] + '\n' }}{% elif item['role'] == 'assistant' %}{{ 'ASSISTANT: ' + item['content'] + '\n' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ 'ASSISTANT: ' }}{% endif %}", @@ -6043,8 +8289,16 @@ "quantizations": [ "none" ], - "model_id": "openbmb/MiniCPM-2B-sft-bf16", - "model_revision": "fe1d74027ebdd81cef5f815fa3a2d432a6b5de2a" + "model_hubs": { + "huggingface": { + "model_id": "openbmb/MiniCPM-2B-sft-bf16", + "model_revision": "fe1d74027ebdd81cef5f815fa3a2d432a6b5de2a" + }, + "modelscope": { + "model_id": "OpenBMB/miniCPM-bf16", + "model_revision": "master" + } + } } ], "chat_template": "{% for message in messages %}{% if message['role'] == 'user' %}{{'<用户>' + message['content'].strip() + ''}}{% else %}{{message['content'].strip()}}{% endif %}{% endfor %}", @@ -6075,8 +8329,16 @@ "quantizations": [ "none" ], - "model_id": "openbmb/MiniCPM-2B-sft-fp32", - "model_revision": "35b90dd57d977b6e5bc4907986fa5b77aa15a82e" + "model_hubs": { + "huggingface": { + "model_id": "openbmb/MiniCPM-2B-sft-fp32", + "model_revision": "35b90dd57d977b6e5bc4907986fa5b77aa15a82e" + }, + "modelscope": { + "model_id": 
"OpenBMB/MiniCPM-2B-sft-fp32", + "model_revision": "master" + } + } } ], "chat_template": "{% for message in messages %}{% if message['role'] == 'user' %}{{'<用户>' + message['content'].strip() + ''}}{% else %}{{message['content'].strip()}}{% endif %}{% endfor %}", @@ -6107,8 +8369,16 @@ "quantizations": [ "none" ], - "model_id": "openbmb/MiniCPM-2B-dpo-bf16", - "model_revision": "f4a3ba49f3f18695945c2a7c12400d4da99da498" + "model_hubs": { + "huggingface": { + "model_id": "openbmb/MiniCPM-2B-dpo-bf16", + "model_revision": "f4a3ba49f3f18695945c2a7c12400d4da99da498" + }, + "modelscope": { + "model_id": "OpenBMB/MiniCPM-2B-dpo-bf16", + "model_revision": "master" + } + } } ], "chat_template": "{% for message in messages %}{% if message['role'] == 'user' %}{{'<用户>' + message['content'].strip() + ''}}{% else %}{{message['content'].strip()}}{% endif %}{% endfor %}", @@ -6139,8 +8409,16 @@ "quantizations": [ "none" ], - "model_id": "openbmb/MiniCPM-2B-dpo-fp16", - "model_revision": "e7a50289e4f839674cf8d4a5a2ce032ccacf64ac" + "model_hubs": { + "huggingface": { + "model_id": "openbmb/MiniCPM-2B-dpo-fp16", + "model_revision": "e7a50289e4f839674cf8d4a5a2ce032ccacf64ac" + }, + "modelscope": { + "model_id": "OpenBMB/MiniCPM-2B-dpo-fp16", + "model_revision": "master" + } + } } ], "chat_template": "{% for message in messages %}{% if message['role'] == 'user' %}{{'<用户>' + message['content'].strip() + ''}}{% else %}{{message['content'].strip()}}{% endif %}{% endfor %}", @@ -6171,8 +8449,16 @@ "quantizations": [ "none" ], - "model_id": "openbmb/MiniCPM-2B-dpo-fp32", - "model_revision": "b560a1593779b735a84a6daf72fba96ae38da288" + "model_hubs": { + "huggingface": { + "model_id": "openbmb/MiniCPM-2B-dpo-fp32", + "model_revision": "b560a1593779b735a84a6daf72fba96ae38da288" + }, + "modelscope": { + "model_id": "OpenBMB/MiniCPM-2B-dpo-fp32", + "model_revision": "master" + } + } } ], "chat_template": "{% for message in messages %}{% if message['role'] == 'user' %}{{'<用户>' + message['content'].strip() + ''}}{% else %}{{message['content'].strip()}}{% endif %}{% endfor %}", @@ -6212,8 +8498,12 @@ "quantizations": [ "none" ], - "model_id": "SeaLLMs/SeaLLM-7B-v2", - "model_revision": "f1bd48e0d75365c24a3c5ad006b2d0a0c9dca30f" + "model_hubs": { + "huggingface": { + "model_id": "SeaLLMs/SeaLLM-7B-v2", + "model_revision": "f1bd48e0d75365c24a3c5ad006b2d0a0c9dca30f" + } + } }, { "model_format": "ggufv2", @@ -6222,8 +8512,12 @@ "Q4_0", "Q8_0" ], - "model_id": "SeaLLMs/SeaLLM-7B-v2-gguf", - "model_file_name_template": "SeaLLM-7B-v2.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "SeaLLMs/SeaLLM-7B-v2-gguf", + "model_file_name_template": "SeaLLM-7B-v2.{quantization}.gguf" + } + } } ] }, @@ -6254,8 +8548,12 @@ "quantizations": [ "none" ], - "model_id": "SeaLLMs/SeaLLM-7B-v2.5", - "model_revision": "c54a8eb8e2d58c5a680bfbbe3a7ae71753bb644b" + "model_hubs": { + "huggingface": { + "model_id": "SeaLLMs/SeaLLM-7B-v2.5", + "model_revision": "c54a8eb8e2d58c5a680bfbbe3a7ae71753bb644b" + } + } }, { "model_format": "ggufv2", @@ -6264,8 +8562,12 @@ "Q4_K_M", "Q8_0" ], - "model_id": "SeaLLMs/SeaLLM-7B-v2.5-GGUF", - "model_file_name_template": "SeaLLM-7B-v2.5.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "SeaLLMs/SeaLLM-7B-v2.5-GGUF", + "model_file_name_template": "SeaLLM-7B-v2.5.{quantization}.gguf" + } + } } ] }, @@ -6296,8 +8598,16 @@ "quantizations": [ "none" ], - "model_id": "CohereForAI/c4ai-command-r-v01", - "model_revision": "16881ccde1c68bbc7041280e6a66637bc46bfe88" + "model_hubs": { 
+ "huggingface": { + "model_id": "CohereForAI/c4ai-command-r-v01", + "model_revision": "16881ccde1c68bbc7041280e6a66637bc46bfe88" + }, + "modelscope": { + "model_id": "mirror013/c4ai-command-r-v01-4bit", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -6305,8 +8615,12 @@ "quantizations": [ "4-bit" ], - "model_id": "CohereForAI/c4ai-command-r-v01-4bit", - "model_revision": "f2e87936a146643c9dd143422dcafb9cb1552611" + "model_hubs": { + "huggingface": { + "model_id": "CohereForAI/c4ai-command-r-v01-4bit", + "model_revision": "f2e87936a146643c9dd143422dcafb9cb1552611" + } + } }, { "model_format": "ggufv2", @@ -6325,8 +8639,17 @@ "Q6_K", "Q8_0" ], - "model_id": "andrewcanis/c4ai-command-r-v01-GGUF", - "model_file_name_template": "c4ai-command-r-v01-{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "andrewcanis/c4ai-command-r-v01-GGUF", + "model_file_name_template": "c4ai-command-r-v01-{quantization}.gguf" + }, + "modelscope": { + "model_id": "mirror013/C4AI-Command-R-v01-GGUF", + "model_revision": "master", + "model_file_name_template": "c4ai-command-r-v01-{quantization}.gguf" + } + } }, { "model_format": "pytorch", @@ -6334,8 +8657,16 @@ "quantizations": [ "none" ], - "model_id": "CohereForAI/c4ai-command-r-plus", - "model_revision": "ba7f1d954c9d1609013677d87e4142ab95c34e62" + "model_hubs": { + "huggingface": { + "model_id": "CohereForAI/c4ai-command-r-plus", + "model_revision": "ba7f1d954c9d1609013677d87e4142ab95c34e62" + }, + "modelscope": { + "model_id": "AI-ModelScope/c4ai-command-r-plus", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -6343,8 +8674,12 @@ "quantizations": [ "4-bit" ], - "model_id": "CohereForAI/c4ai-command-r-plus-4bit", - "model_revision": "bb63b5b7005ecedb30b0cfd0d5953b02a5817f7b" + "model_hubs": { + "huggingface": { + "model_id": "CohereForAI/c4ai-command-r-plus-4bit", + "model_revision": "bb63b5b7005ecedb30b0cfd0d5953b02a5817f7b" + } + } }, { "model_format": "gptq", @@ -6352,8 +8687,12 @@ "quantizations": [ "Int4" ], - "model_id": "alpindale/c4ai-command-r-plus-GPTQ", - "model_revision": "35febfc08f723ac0df32480eb4af349a7d08656e" + "model_hubs": { + "huggingface": { + "model_id": "alpindale/c4ai-command-r-plus-GPTQ", + "model_revision": "35febfc08f723ac0df32480eb4af349a7d08656e" + } + } } ], "chat_template": "{{ '' }}{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% elif false == true %}{% set loop_messages = messages %}{% set system_message = 'You are Command-R, a brilliant, sophisticated, AI-assistant trained to assist human users by providing thorough responses. You are trained by Cohere.' 
%}{% else %}{% set loop_messages = messages %}{% set system_message = false %}{% endif %}{% if system_message != false %}{{ '<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|>' + system_message + '<|END_OF_TURN_TOKEN|>' }}{% endif %}{% for message in loop_messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% set content = message['content'] %}{% if message['role'] == 'user' %}{{ '<|START_OF_TURN_TOKEN|><|USER_TOKEN|>' + content.strip() + '<|END_OF_TURN_TOKEN|>' }}{% elif message['role'] == 'assistant' %}{{ '<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|>' + content.strip() + '<|END_OF_TURN_TOKEN|>' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|>' }}{% endif %}", @@ -6387,8 +8726,12 @@ "8-bit", "none" ], - "model_id": "berkeley-nest/Starling-LM-7B-alpha", - "model_revision": "1dddf3b95bc1391f6307299eb1c162c194bde9bd" + "model_hubs": { + "huggingface": { + "model_id": "berkeley-nest/Starling-LM-7B-alpha", + "model_revision": "1dddf3b95bc1391f6307299eb1c162c194bde9bd" + } + } } ], "chat_template": "{% for message in messages %}{{ 'GPT4 Correct ' + message['role'].title() + ': ' + message['content'] + '<|end_of_turn|>'}}{% endfor %}{% if add_generation_prompt %}{{ 'GPT4 Correct Assistant:' }}{% endif %}", @@ -6406,48 +8749,64 @@ "context_length": 32768, "model_name": "internvl-chat", "model_lang": [ - "en", - "zh" + "en", + "zh" ], "model_ability": [ - "chat", - "vision" + "chat", + "vision" ], "model_description": "InternVL 1.5 is an open-source multimodal large language model (MLLM) to bridge the capability gap between open-source and proprietary commercial models in multimodal understanding. ", "model_specs": [ { - "model_format": "pytorch", - "model_size_in_billions": 2, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "OpenGVLab/Mini-InternVL-Chat-2B-V1-5", - "model_revision": "ecbbd21dcf38caa74d925967b997167b0c7b3f47" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 4, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "OpenGVLab/Mini-InternVL-Chat-4B-V1-5", - "model_revision": "ce1559ddf9d87f5130aa5233b0e93b95e4e4161a" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 26, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "OpenGVLab/InternVL-Chat-V1-5", - "model_revision": "9db32d9127cac0c85961e169d75da57a18a847b1" + "model_format": "pytorch", + "model_size_in_billions": 2, + "quantizations": [ + "4-bit", + "8-bit", + "none" + ], + "model_hubs": { + "huggingface": { + "model_id": "OpenGVLab/Mini-InternVL-Chat-2B-V1-5", + "model_revision": "ecbbd21dcf38caa74d925967b997167b0c7b3f47" + } } + }, + { + "model_format": "pytorch", + "model_size_in_billions": 4, + "quantizations": [ + "4-bit", + "8-bit", + "none" + ], + "model_hubs": { + "huggingface": { + "model_id": "OpenGVLab/Mini-InternVL-Chat-4B-V1-5", + "model_revision": "ce1559ddf9d87f5130aa5233b0e93b95e4e4161a" + } + } + }, + { + "model_format": "pytorch", + "model_size_in_billions": 26, + "quantizations": [ + "4-bit", + "8-bit", + "none" + ], + "model_hubs": { + "huggingface": { + "model_id": "OpenGVLab/InternVL-Chat-V1-5", + "model_revision": "9db32d9127cac0c85961e169d75da57a18a847b1" + }, + "modelscope": { + "model_id": "OpenGVLab/InternVL-Chat-V1-5", + "model_revision": "master" + } + } + } ], "chat_template": "{{ '<s>' }}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + 
message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", "stop_token_ids": [ @@ -6466,137 +8825,233 @@ "context_length": 32768, "model_name": "internvl2", "model_lang": [ - "en", - "zh" + "en", + "zh" ], "model_ability": [ - "chat", - "vision" + "chat", + "vision" ], "model_description": "InternVL 2 is an open-source multimodal large language model (MLLM) to bridge the capability gap between open-source and proprietary commercial models in multimodal understanding. ", "model_specs": [ { - "model_format": "pytorch", - "model_size_in_billions": 1, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "OpenGVLab/InternVL2-1B", - "model_revision": "a9fc14aea824b6ea1d44f8778cad6b35512c4ce1" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 2, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "OpenGVLab/InternVL2-2B", - "model_revision": "422ad7c6335917bfb514958233955512338485a6" - }, - { - "model_format": "awq", - "model_size_in_billions": 2, - "quantizations": [ - "Int4" - ], - "model_id": "OpenGVLab/InternVL2-2B-AWQ", - "model_revision": "701bc3fc098a8a3b686b3b4135cfb77202be89e0" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 4, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "OpenGVLab/InternVL2-4B", - "model_revision": "b50544dafada6c41e80bfde2f57cc9b0140fc21c" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 8, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "OpenGVLab/InternVL2-8B", - "model_revision": "3bfd3664dea4f3da628785f5125d30f889701253" - }, - { - "model_format": "awq", - "model_size_in_billions": 8, - "quantizations": [ - "Int4" - ], - "model_id": "OpenGVLab/InternVL2-8B-AWQ", - "model_revision": "9f1a4756b7ae18eb26d8a22b618dfc283e8193b3" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 26, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "OpenGVLab/InternVL2-26B", - "model_revision": "b9f3c7e6d575b0115e076a3ffc46fd20b7586899" - }, - { - "model_format": "awq", - "model_size_in_billions": 26, - "quantizations": [ - "Int4" - ], - "model_id": "OpenGVLab/InternVL2-26B-AWQ", - "model_revision": "469e0019ffd251e22ff6501a5c2321964e86ef0d" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 40, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "OpenGVLab/InternVL2-40B", - "model_revision": "725a12063bb855c966e30a0617d0ccd9e870d772" - }, - { - "model_format": "awq", - "model_size_in_billions": 40, - "quantizations": [ - "Int4" - ], - "model_id": "OpenGVLab/InternVL2-40B-AWQ", - "model_revision": "d92e140f6dfe8ea9679924c6a31898f42c4e1846" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 76, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "OpenGVLab/InternVL2-Llama3-76B", - "model_revision": "cf7914905f78e9e3560ddbd6f5dfc39becac494f" - }, - { - "model_format": "awq", - "model_size_in_billions": 76, - "quantizations": [ - "Int4" - ], - "model_id": "OpenGVLab/InternVL2-Llama3-76B-AWQ", - "model_revision": "1bc796bf80f2ebc7d6a14c15f55217a4600d50a4" + "model_format": "pytorch", + "model_size_in_billions": 1, + "quantizations": [ + "4-bit", + "8-bit", + "none" + ], + "model_hubs": { + "huggingface": { + "model_id": "OpenGVLab/InternVL2-1B", + "model_revision": "a9fc14aea824b6ea1d44f8778cad6b35512c4ce1" + }, + "modelscope": { + "model_id": "OpenGVLab/InternVL2-1B", + 
"model_revision": "master" + } + } + }, + { + "model_format": "pytorch", + "model_size_in_billions": 2, + "quantizations": [ + "4-bit", + "8-bit", + "none" + ], + "model_hubs": { + "huggingface": { + "model_id": "OpenGVLab/InternVL2-2B", + "model_revision": "422ad7c6335917bfb514958233955512338485a6" + }, + "modelscope": { + "model_id": "OpenGVLab/InternVL2-2B", + "model_revision": "master" + } + } + }, + { + "model_format": "awq", + "model_size_in_billions": 2, + "quantizations": [ + "Int4" + ], + "model_hubs": { + "huggingface": { + "model_id": "OpenGVLab/InternVL2-2B-AWQ", + "model_revision": "701bc3fc098a8a3b686b3b4135cfb77202be89e0" + }, + "modelscope": { + "model_id": "OpenGVLab/InternVL2-2B-AWQ", + "model_revision": "master" + } } + }, + { + "model_format": "pytorch", + "model_size_in_billions": 4, + "quantizations": [ + "4-bit", + "8-bit", + "none" + ], + "model_hubs": { + "huggingface": { + "model_id": "OpenGVLab/InternVL2-4B", + "model_revision": "b50544dafada6c41e80bfde2f57cc9b0140fc21c" + }, + "modelscope": { + "model_id": "OpenGVLab/InternVL2-4B", + "model_revision": "master" + } + } + }, + { + "model_format": "pytorch", + "model_size_in_billions": 8, + "quantizations": [ + "4-bit", + "8-bit", + "none" + ], + "model_hubs": { + "huggingface": { + "model_id": "OpenGVLab/InternVL2-8B", + "model_revision": "3bfd3664dea4f3da628785f5125d30f889701253" + }, + "modelscope": { + "model_id": "OpenGVLab/InternVL2-8B", + "model_revision": "master" + } + } + }, + { + "model_format": "awq", + "model_size_in_billions": 8, + "quantizations": [ + "Int4" + ], + "model_hubs": { + "huggingface": { + "model_id": "OpenGVLab/InternVL2-8B-AWQ", + "model_revision": "9f1a4756b7ae18eb26d8a22b618dfc283e8193b3" + }, + "modelscope": { + "model_id": "OpenGVLab/InternVL2-8B-AWQ", + "model_revision": "master" + } + } + }, + { + "model_format": "pytorch", + "model_size_in_billions": 26, + "quantizations": [ + "4-bit", + "8-bit", + "none" + ], + "model_hubs": { + "huggingface": { + "model_id": "OpenGVLab/InternVL2-26B", + "model_revision": "b9f3c7e6d575b0115e076a3ffc46fd20b7586899" + }, + "modelscope": { + "model_id": "OpenGVLab/InternVL2-26B", + "model_revision": "master" + } + } + }, + { + "model_format": "awq", + "model_size_in_billions": 26, + "quantizations": [ + "Int4" + ], + "model_hubs": { + "huggingface": { + "model_id": "OpenGVLab/InternVL2-26B-AWQ", + "model_revision": "469e0019ffd251e22ff6501a5c2321964e86ef0d" + }, + "modelscope": { + "model_id": "OpenGVLab/InternVL2-26B-AWQ", + "model_revision": "master" + } + } + }, + { + "model_format": "pytorch", + "model_size_in_billions": 40, + "quantizations": [ + "4-bit", + "8-bit", + "none" + ], + "model_hubs": { + "huggingface": { + "model_id": "OpenGVLab/InternVL2-40B", + "model_revision": "725a12063bb855c966e30a0617d0ccd9e870d772" + }, + "modelscope": { + "model_id": "OpenGVLab/InternVL2-40B", + "model_revision": "master" + } + } + }, + { + "model_format": "awq", + "model_size_in_billions": 40, + "quantizations": [ + "Int4" + ], + "model_hubs": { + "huggingface": { + "model_id": "OpenGVLab/InternVL2-40B-AWQ", + "model_revision": "d92e140f6dfe8ea9679924c6a31898f42c4e1846" + }, + "modelscope": { + "model_id": "OpenGVLab/InternVL2-40B-AWQ", + "model_revision": "master" + } + } + }, + { + "model_format": "pytorch", + "model_size_in_billions": 76, + "quantizations": [ + "4-bit", + "8-bit", + "none" + ], + "model_hubs": { + "huggingface": { + "model_id": "OpenGVLab/InternVL2-Llama3-76B", + "model_revision": "cf7914905f78e9e3560ddbd6f5dfc39becac494f" + }, + 
"modelscope": { + "model_id": "OpenGVLab/InternVL2-Llama3-76B", + "model_revision": "master" + } + } + }, + { + "model_format": "awq", + "model_size_in_billions": 76, + "quantizations": [ + "Int4" + ], + "model_hubs": { + "huggingface": { + "model_id": "OpenGVLab/InternVL2-Llama3-76B-AWQ", + "model_revision": "1bc796bf80f2ebc7d6a14c15f55217a4600d50a4" + }, + "modelscope": { + "model_id": "OpenGVLab/InternVL2-Llama3-76B-AWQ", + "model_revision": "master" + } + } + } ], "chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", "stop_token_ids": [], @@ -6607,12 +9062,12 @@ "context_length": 8192, "model_name": "cogvlm2", "model_lang": [ - "en", - "zh" + "en", + "zh" ], "model_ability": [ - "chat", - "vision" + "chat", + "vision" ], "model_description": "CogVLM2 have achieved good results in many lists compared to the previous generation of CogVLM open source models. Its excellent performance can compete with some non-open source models.", "model_specs": [ @@ -6622,8 +9077,16 @@ "quantizations": [ "none" ], - "model_id": "THUDM/cogvlm2-llama3-chinese-chat-19B", - "model_revision": "d88b352bce5ee58a289b1ac8328553eb31efa2ef" + "model_hubs": { + "huggingface": { + "model_id": "THUDM/cogvlm2-llama3-chinese-chat-19B", + "model_revision": "d88b352bce5ee58a289b1ac8328553eb31efa2ef" + }, + "modelscope": { + "model_id": "ZhipuAI/cogvlm2-llama3-chinese-chat-19B-{quantization}", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -6631,8 +9094,12 @@ "quantizations": [ "int4" ], - "model_id": "THUDM/cogvlm2-llama3-chinese-chat-19B-{quantization}", - "model_revision": "7863e362174f4718c2fe9cba4befd0b580a3194f" + "model_hubs": { + "huggingface": { + "model_id": "THUDM/cogvlm2-llama3-chinese-chat-19B-{quantization}", + "model_revision": "7863e362174f4718c2fe9cba4befd0b580a3194f" + } + } } ], "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = '<|begin_of_text|>' + content %}{% endif %}{{ content }}{% endfor %}{% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}{% else %}{{ '<|end_of_text|>' }}{% endif %}", @@ -6650,12 +9117,12 @@ "context_length": 8192, "model_name": "cogvlm2-video-llama3-chat", "model_lang": [ - "en", - "zh" + "en", + "zh" ], "model_ability": [ - "chat", - "vision" + "chat", + "vision" ], "model_description": "CogVLM2-Video achieves state-of-the-art performance on multiple video question answering tasks.", "model_specs": [ @@ -6667,8 +9134,16 @@ "8-bit", "none" ], - "model_id": "THUDM/cogvlm2-video-llama3-chat", - "model_revision": "f375ead7d8202ebe2c3d09f1068abdddeb2929fa" + "model_hubs": { + "huggingface": { + "model_id": "THUDM/cogvlm2-video-llama3-chat", + "model_revision": "f375ead7d8202ebe2c3d09f1068abdddeb2929fa" + }, + "modelscope": { + "model_id": "ZhipuAI/cogvlm2-video-llama3-chat", + "model_revision": "master" + } + } } ], "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set 
loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = '<|begin_of_text|>' + content %}{% endif %}{{ content }}{% endfor %}{% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}{% else %}{{ '<|end_of_text|>' }}{% endif %}", @@ -6702,7 +9177,15 @@ "8-bit", "none" ], - "model_id": "Tele-AI/telechat-7B" + "model_hubs": { + "huggingface": { + "model_id": "Tele-AI/telechat-7B" + }, + "modelscope": { + "model_id": "TeleAI/telechat-7B", + "model_revision": "master" + } + } }, { "model_format": "gptq", @@ -6711,7 +9194,15 @@ "int4", "int8" ], - "model_id": "Tele-AI/telechat-7B-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "Tele-AI/telechat-7B-{quantization}" + }, + "modelscope": { + "model_id": "TeleAI/telechat-7B-{quantization}", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -6721,7 +9212,15 @@ "8-bit", "none" ], - "model_id": "Tele-AI/TeleChat-12B" + "model_hubs": { + "huggingface": { + "model_id": "Tele-AI/TeleChat-12B" + }, + "modelscope": { + "model_id": "TeleAI/TeleChat-12B", + "model_revision": "master" + } + } }, { "model_format": "gptq", @@ -6730,7 +9229,15 @@ "int4", "int8" ], - "model_id": "Tele-AI/TeleChat-12B-{quantization}" + "model_hubs": { + "huggingface": { + "model_id": "Tele-AI/TeleChat-12B-{quantization}" + }, + "modelscope": { + "model_id": "TeleAI/TeleChat-12B-{quantization}", + "model_revision": "master" + } + } }, { "model_format": "pytorch", @@ -6740,7 +9247,15 @@ "8-bit", "none" ], - "model_id": "Tele-AI/TeleChat-52B" + "model_hubs": { + "huggingface": { + "model_id": "Tele-AI/TeleChat-52B" + }, + "modelscope": { + "model_id": "TeleAI/TeleChat-52B", + "model_revision": "master" + } + } } ], "chat_template": "{{ (messages|selectattr('role', 'equalto', 'system')|list|last).content|trim if (messages|selectattr('role', 'equalto', 'system')|list) else '' }}{%- for message in messages -%}{%- if message['role'] == 'user' -%}{{- '<_user>' + message['content'] +'<_bot>' -}}{%- elif message['role'] == 'assistant' -%}{{- message['content'] + '<_end>' -}}{%- endif -%}{%- endfor -%}", @@ -6771,8 +9286,15 @@ "quantizations": [ "none" ], - "model_id": "opencsg/csg-wukong-1B-chat-v0.1", - "model_revision": "2443c903d46074af0856e2ba11398dcd01d35536" + "model_hubs": { + "huggingface": { + "model_id": "opencsg/csg-wukong-1B-chat-v0.1", + "model_revision": "2443c903d46074af0856e2ba11398dcd01d35536" + }, + "csghub": { + "model_id": "OpenCSG/csg-wukong-1B-chat-v0.1" + } + } }, { "model_format": "ggufv2", @@ -6794,8 +9316,12 @@ "Q6_K", "Q8_0" ], - "model_id": "RichardErkhov/opencsg_-_csg-wukong-1B-chat-v0.1-gguf", - "model_file_name_template": "csg-wukong-1B-chat-v0.1.{quantization}.gguf" + "model_hubs": { + "huggingface": { + "model_id": "RichardErkhov/opencsg_-_csg-wukong-1B-chat-v0.1-gguf", + "model_file_name_template": "csg-wukong-1B-chat-v0.1.{quantization}.gguf" + } + } } ], "chat_template": "{% for item in messages %}{% if loop.first and item['role'] == 'system' %}{{ item['content'] + '\n' }}{% elif loop.first %}{{ '<|system|>\nYou are a creative super artificial intelligence assistant, possessing all the knowledge of humankind. Your name is csg-wukong, developed by OpenCSG. You need to understand and infer the true intentions of users based on the topics discussed in the chat history, and respond to user questions correctly as required. 
You enjoy responding to users with accurate and insightful answers. Please pay attention to the appropriate style and format when replying, try to avoid repetitive words and sentences, and keep your responses as concise and profound as possible. You carefully consider the context of the discussion when replying to users. When the user says \"continue,\" please proceed with the continuation of the previous assistant\\'s response.\n' }}{% endif %}{% if item['role'] == 'user' %}{{ '<|user|>\n' + item['content'] + '\n' }}{% elif item['role'] == 'assistant' %}{{ '<|assistant|>\n' + item['content'] + '\n' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% endif %}", @@ -6807,42 +9333,58 @@ ] }, { - "version":1, - "context_length":32768, - "model_name":"qwen2-vl-instruct", - "model_lang":[ + "version": 1, + "context_length": 32768, + "model_name": "qwen2-vl-instruct", + "model_lang": [ "en", "zh" ], - "model_ability":[ + "model_ability": [ "chat", "vision" ], - "model_description":"Qwen2-VL: To See the World More Clearly.Qwen2-VL is the latest version of the vision language models in the Qwen model familities.", - "model_specs":[ + "model_description": "Qwen2-VL: To See the World More Clearly.Qwen2-VL is the latest version of the vision language models in the Qwen model familities.", + "model_specs": [ { - "model_format":"pytorch", - "model_size_in_billions":2, - "quantizations":[ + "model_format": "pytorch", + "model_size_in_billions": 2, + "quantizations": [ "none" ], - "model_id":"Qwen/Qwen2-VL-2B-Instruct", - "model_revision":"096da3b96240e3d66d35be0e5ccbe282eea8d6b1" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-VL-2B-Instruct", + "model_revision": "096da3b96240e3d66d35be0e5ccbe282eea8d6b1" + }, + "modelscope": { + "model_id": "qwen/Qwen2-VL-2B-Instruct", + "model_revision": "master" + } + } }, { - "model_format":"pytorch", - "model_size_in_billions":7, - "quantizations":[ + "model_format": "pytorch", + "model_size_in_billions": 7, + "quantizations": [ "none" ], - "model_id":"Qwen/Qwen2-VL-7B-Instruct", - "model_revision":"6010982c1010c3b222fa98afc81575f124aa9bd6" + "model_hubs": { + "huggingface": { + "model_id": "Qwen/Qwen2-VL-7B-Instruct", + "model_revision": "6010982c1010c3b222fa98afc81575f124aa9bd6" + }, + "modelscope": { + "model_id": "qwen/Qwen2-VL-7B-Instruct", + "model_revision": "master" + } + } } ], - "prompt_style":{ - "style_name":"QWEN", - "system_prompt":"You are a helpful assistant", - "roles":[ + "prompt_style": { + "style_name": "QWEN", + "system_prompt": "You are a helpful assistant", + "roles": [ "user", "assistant" ], @@ -6852,4 +9394,4 @@ ] } } -] +] \ No newline at end of file diff --git a/xinference/model/llm/llm_family_csghub.json b/xinference/model/llm/llm_family_csghub.json deleted file mode 100644 index d607b580b7..0000000000 --- a/xinference/model/llm/llm_family_csghub.json +++ /dev/null @@ -1,88 +0,0 @@ -[ - { - "version": 1, - "context_length": 32768, - "model_name": "qwen2-instruct", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat", - "tools" - ], - "model_description": "Qwen2 is the new series of Qwen large language models", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": "0_5", - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "Qwen/Qwen2-0.5B-Instruct", - "model_hub": "csghub" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": "0_5", - "quantizations": [ - "q2_k", - "q3_k_m", - "q4_0", - "q4_k_m", - "q5_0", - "q5_k_m", - 
"q6_k", - "q8_0", - "fp16" - ], - "model_id": "qwen/Qwen2-0.5B-Instruct-GGUF", - "model_file_name_template": "qwen2-0_5b-instruct-{quantization}.gguf", - "model_hub": "csghub" - } - ], - "chat_template": "{%- macro json_to_python_type(json_spec) %}\n {%- set basic_type_map = {\n \"string\": \"str\",\n \"number\": \"float\",\n \"integer\": \"int\",\n \"boolean\": \"bool\"\n} %}\n {%- if basic_type_map[json_spec.type] is defined %}\n {{- basic_type_map[json_spec.type] }}\n {%- elif json_spec.type == \"array\" %}\n {{- \"list[\" + json_to_python_type(json_spec|items) + \"]\" }}\n {%- elif json_spec.type == \"object\" %}\n {%- if json_spec.additionalProperties is defined %}\n {{- \"dict[str, \" + json_to_python_type(json_spec.additionalProperties) + ']' }}\n {%- else %}\n {{- \"dict\" }}\n {%- endif %}\n {%- elif json_spec.type is iterable %}\n {{- \"Union[\" }}\n {%- for t in json_spec.type %}\n {{- json_to_python_type({\"type\": t}) }}\n {%- if not loop.last %}\n {{- \",\" }}\n {%- endif %}\n {%- endfor %}\n {{- \"]\" }}\n {%- else %}\n {{- \"Any\" }}\n {%- endif %}\n{%- endmacro %}\n\n{%- if tools %}\n {{- '<|im_start|>system\n' }}\n {%- if messages[0]['role'] == 'system' %}\n {{- messages[0]['content'] + '\n\n' }}\n {%- endif %}\n {{- '# Tools\n\n' }}\n {{- \"You are a function calling AI model. You are provided with function signatures within XML tags. You may call one or more functions to assist with the user query. Don't make assumptions about what values to plug into functions. Here are the available tools: \" }}\n {%- for tool in tools %}\n {%- if tool.function is defined %}\n {%- set tool = tool.function %}\n {%- endif %}\n {{- '{\"type\": \"function\", \"function\": ' }}\n {{- '{\"name\": ' + tool.name + '\", ' }}\n {{- '\"description\": \"' + tool.name + '(' }}\n {%- for param_name, param_fields in tool.parameters.properties|items %}\n {{- param_name + \": \" + json_to_python_type(param_fields) }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- endif %}\n {%- endfor %}\n {{- \")\" }}\n {%- if tool.return is defined %}\n {{- \" -> \" + json_to_python_type(tool.return) }}\n {%- endif %}\n {{- \" - \" + tool.description + \"\n\n\" }}\n {%- for param_name, param_fields in tool.parameters.properties|items %}\n {%- if loop.first %}\n {{- \" Args:\n\" }}\n {%- endif %}\n {{- \" \" + param_name + \"(\" + json_to_python_type(param_fields) + \"): \" + param_fields.description|trim }}\n {%- endfor %}\n {%- if tool.return is defined and tool.return.description is defined %}\n {{- \"\n Returns:\n \" + tool.return.description }}\n {%- endif %}\n {{- '\"' }}\n {{- ', \"parameters\": ' }}\n {%- if tool.parameters.properties | length == 0 %}\n {{- \"{}\" }}\n {%- else %}\n {{- tool.parameters|tojson }}\n {%- endif %}\n {{- \"}\" }}\n {%- if not loop.last %}\n {{- \"\n\" }}\n {%- endif %}\n {%- endfor %}\n {{- \" \" }}\n {{- 'Use the following pydantic model json schema for each tool call you will make: {\"properties\": {\"arguments\": {\"title\": \"Arguments\", \"type\": \"object\"}, \"name\": {\"title\": \"Name\", \"type\": \"string\"}}, \"required\": [\"arguments\", \"name\"], \"title\": \"FunctionCall\", \"type\": \"object\"}\n' }}\n {{- \"For each function call return a json object with function name and arguments within XML tags as follows:\n\" }}\n {{- \"\n\" }}\n {{- '{\"name\": , \"arguments\": }\n' }}\n {{- '<|im_end|>\n' }}\n{%- else %}\n {%- if messages[0]['role'] != 'system' %}\n {{- '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}\n {%- else %}\n {{- 
'<|im_start|>system\n' + messages[0]['content'] + '<|im_end|>\n' }}\n {%- endif %}\n{%- endif %}\n{%- for message in messages %}\n {%- if message.role == \"user\" or (message.role == \"system\" and not loop.first) or (message.role == \"assistant\" and message.tool_calls is not defined) %}\n {{- '<|im_start|>' + message.role + '\n' + message.content + '<|im_end|>' + '\n' }}\n {%- elif message.role == \"assistant\" %}\n {{- '<|im_start|>' + message.role + '\n\n' }}\n {%- for tool_call in message.tool_calls %}\n {%- if tool_call.function is defined %}\n {%- set tool_call = tool_call.function %}\n {%- endif %}\n {{- '{' }}\n {{- '\"name\": \"' }}\n {{- tool_call.name }}\n {%- if tool_call.arguments is defined %}\n {{- ', ' }}\n {{- '\"arguments\": ' }}\n {{- tool_call.arguments|tojson }}\n {%- endif %}\n {{- '\"}' }}\n {{- '\n' }}\n {%- endfor %}\n {{- '<|im_end|>\n' }}\n {%- elif message.role == \"tool\" %}\n {%- if not message.name is defined %}\n {{- raise_exception(\"Tool response dicts require a 'name' key indicating the name of the called function!\") }}\n {%- endif %}\n {{- '<|im_start|>user\n\n' }}\n {{- '{\"name\": \"' }}\n {{- message.name }}\n {{- '\", \"content\": ' }}\n {{- message.content|tojson + '}' }}\n {{- '\n<|im_end|>\n' }}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|im_start|>assistant\n' }}\n{%- endif %}", - "stop_token_ids": [ - 151643, - 151644, - 151645 - ], - "stop": [ - "<|endoftext|>", - "<|im_start|>", - "<|im_end|>" - ] - }, - { - "version": 1, - "context_length": 32768, - "model_name": "csg-wukong-chat-v0.1", - "model_lang": [ - "en" - ], - "model_ability": [ - "chat" - ], - "model_description": "csg-wukong-1B is a 1 billion-parameter small language model(SLM) pretrained on 1T tokens.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 1, - "quantizations": [ - "none" - ], - "model_id": "OpenCSG/csg-wukong-1B-chat-v0.1", - "model_hub": "csghub" - } - ], - "chat_template": "{% for item in messages %}{% if loop.first and item['role'] == 'system' %}{{ item['content'] + '\n' }}{% elif loop.first %}{{ '<|system|>\nYou are a creative super artificial intelligence assistant, possessing all the knowledge of humankind. Your name is csg-wukong, developed by OpenCSG. You need to understand and infer the true intentions of users based on the topics discussed in the chat history, and respond to user questions correctly as required. You enjoy responding to users with accurate and insightful answers. Please pay attention to the appropriate style and format when replying, try to avoid repetitive words and sentences, and keep your responses as concise and profound as possible. You carefully consider the context of the discussion when replying to users. 
When the user says \"continue,\" please proceed with the continuation of the previous assistant\\'s response.\n' }}{% endif %}{% if item['role'] == 'user' %}{{ '<|user|>\n' + item['content'] + '\n' }}{% elif item['role'] == 'assistant' %}{{ '<|assistant|>\n' + item['content'] + '\n' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% endif %}", - "stop_token_ids": [ - 2 - ], - "stop": [ - "" - ] - } -] diff --git a/xinference/model/llm/llm_family_modelscope.json b/xinference/model/llm/llm_family_modelscope.json deleted file mode 100644 index f6ac13e06c..0000000000 --- a/xinference/model/llm/llm_family_modelscope.json +++ /dev/null @@ -1,4556 +0,0 @@ -[ - { - "version": 1, - "context_length": 4096, - "model_name": "llama-2-chat", - "model_lang": [ - "en" - ], - "model_ability": [ - "chat" - ], - "model_description": "Llama-2-Chat is a fine-tuned version of the Llama-2 LLM, specializing in chatting.", - "model_specs": [ - { - "model_format": "ggufv2", - "model_size_in_billions": 7, - "quantizations": [ - "Q4_K_M" - ], - "model_id": "Xorbits/Llama-2-7b-Chat-GGUF", - "model_file_name_template": "llama-2-7b-chat.{quantization}.gguf", - "model_hub": "modelscope", - "model_revision": "v0.0.1" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 13, - "quantizations": [ - "Q4_K_M" - ], - "model_id": "Xorbits/Llama-2-13b-Chat-GGUF", - "model_file_name_template": "llama-2-13b-chat.{quantization}.gguf", - "model_hub": "modelscope", - "model_revision": "v0.0.1" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "modelscope/Llama-2-7b-chat-ms", - "model_hub": "modelscope", - "model_revision": "v1.0.5" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 13, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "modelscope/Llama-2-13b-chat-ms", - "model_hub": "modelscope", - "model_revision": "v1.0.2" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 70, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "modelscope/Llama-2-70b-chat-ms", - "model_hub": "modelscope", - "model_revision": "v1.0.1" - } - ], - "chat_template": "{% if messages[0]['role'] == 'system' %}{% set system_message = '<>\n' + messages[0]['content'] | trim + '\n<>\n\n' %}{% set messages = messages[1:] %}{% else %}{% set system_message = '' %}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if loop.index0 == 0 %}{% set content = system_message + message['content'] %}{% else %}{% set content = message['content'] %}{% endif %}{% if message['role'] == 'user' %}{{ '' + '[INST] ' + content | trim + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ ' ' + content | trim + ' ' + '' }}{% endif %}{% endfor %}", - "stop_token_ids": [ - 2 - ], - "stop": [] - }, - { - "version": 1, - "context_length": 8192, - "model_name": "llama-3", - "model_lang": [ - "en" - ], - "model_ability": [ - "generate" - ], - "model_description": "Llama 3 is an auto-regressive language model that uses an optimized transformer architecture", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 8, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "LLM-Research/Meta-Llama-3-8B", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 
70, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "LLM-Research/Meta-Llama-3-70B", - "model_hub": "modelscope" - } - ] - }, - { - "version": 1, - "context_length": 8192, - "model_name": "llama-3-instruct", - "model_lang": [ - "en" - ], - "model_ability": [ - "chat" - ], - "model_description": "The Llama 3 instruction tuned models are optimized for dialogue use cases and outperform many of the available open source chat models on common industry benchmarks..", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 8, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "LLM-Research/Meta-Llama-3-8B-Instruct", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 70, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "LLM-Research/Meta-Llama-3-70B-Instruct", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": 8, - "quantizations": [ - "Int4", - "Int8" - ], - "model_id": "swift/Meta-Llama-3-8B-Instruct-GPTQ-{quantization}", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": 70, - "quantizations": [ - "Int4", - "Int8" - ], - "model_id": "swift/Meta-Llama-3-70B-Instruct-GPTQ-{quantization}", - "model_hub": "modelscope" - } - ], - "chat_template": "{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = '<|begin_of_text|>' + content %}{% endif %}{{ content }}{% endfor %}{% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}{% endif %}", - "stop_token_ids": [ - 128001, - 128009 - ], - "stop": [ - "<|end_of_text|>", - "<|eot_id|>" - ] - }, - { - "version": 1, - "context_length": 131072, - "model_name": "llama-3.1", - "model_lang": [ - "en", - "de", - "fr", - "it", - "pt", - "hi", - "es", - "th" - ], - "model_ability": [ - "generate" - ], - "model_description": "Llama 3.1 is an auto-regressive language model that uses an optimized transformer architecture", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 8, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "LLM-Research/Meta-Llama-3.1-8B", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 70, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "LLM-Research/Meta-Llama-3.1-70B", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 405, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "LLM-Research/Meta-Llama-3.1-405B", - "model_hub": "modelscope" - } - ] - }, - { - "version": 1, - "context_length": 131072, - "model_name": "llama-3.1-instruct", - "model_lang": [ - "en", - "de", - "fr", - "it", - "pt", - "hi", - "es", - "th" - ], - "model_ability": [ - "chat" - ], - "model_description": "The Llama 3.1 instruction tuned models are optimized for dialogue use cases and outperform many of the available open source chat models on common industry benchmarks..", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 8, - "quantizations": [ - "none" - ], - "model_id": "LLM-Research/Meta-Llama-3.1-8B-Instruct", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": 8, - "quantizations": [ - "Int4" - ], - 
"model_id": "LLM-Research/Meta-Llama-3.1-8B-Instruct-GPTQ-INT4", - "model_hub": "modelscope" - }, - { - "model_format": "awq", - "model_size_in_billions": 8, - "quantizations": [ - "Int4" - ], - "model_id": "LLM-Research/Meta-Llama-3.1-8B-Instruct-AWQ-INT4", - "model_hub": "modelscope" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 8, - "quantizations": [ - "Q3_K_L", - "Q4_K_M", - "Q5_K_M", - "Q6_K", - "Q8_0" - ], - "model_id": "LLM-Research/Meta-Llama-3.1-8B-Instruct-GGUF", - "model_file_name_template": "Meta-Llama-3.1-8B-Instruct-{quantization}.gguf", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 70, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "LLM-Research/Meta-Llama-3.1-70B-Instruct", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": 70, - "quantizations": [ - "Int4" - ], - "model_id": "LLM-Research/Meta-Llama-3.1-70B-Instruct-GPTQ-INT4", - "model_hub": "modelscope" - }, - { - "model_format": "awq", - "model_size_in_billions": 70, - "quantizations": [ - "Int4" - ], - "model_id": "LLM-Research/Meta-Llama-3.1-70B-Instruct-AWQ-INT4", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 405, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "LLM-Research/Meta-Llama-3.1-405B-Instruct", - "model_hub": "modelscope" - }, - { - "model_format": "awq", - "model_size_in_billions": 405, - "quantizations": [ - "Int4" - ], - "model_id": "LLM-Research/Meta-Llama-3.1-405B-Instruct-AWQ-INT4", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": 405, - "quantizations": [ - "Int4" - ], - "model_id": "LLM-Research/Meta-Llama-3.1-405B-Instruct-GPTQ-INT4", - "model_hub": "modelscope" - } - ], - "chat_template": "{{- '<|begin_of_text|>' }}\n{%- if custom_tools is defined %}\n {%- set tools = custom_tools %}\n{%- endif %}\n{%- if not tools_in_user_message is defined %}\n {%- set tools_in_user_message = true %}\n{%- endif %}\n{%- if not date_string is defined %}\n {%- set date_string = \"26 Jul 2024\" %}\n{%- endif %}\n{%- if not tools is defined %}\n {%- set tools = none %}\n{%- endif %}\n\n{#- This block extracts the system message, so we can slot it into the right place. #}\n{%- if messages[0]['role'] == 'system' %}\n {%- set system_message = messages[0]['content']|trim %}\n {%- set messages = messages[1:] %}\n{%- else %}\n {%- set system_message = \"\" %}\n{%- endif %}\n\n{#- System message + builtin tools #}\n{{- \"<|start_header_id|>system<|end_header_id|>\n\n\" }}\n{%- if builtin_tools is defined or tools is not none %}\n {{- \"Environment: ipython\n\" }}\n{%- endif %}\n{%- if builtin_tools is defined %}\n {{- \"Tools: \" + builtin_tools | reject('equalto', 'code_interpreter') | join(\", \") + \"\n\n\"}}\n{%- endif %}\n{{- \"Cutting Knowledge Date: December 2023\n\" }}\n{{- \"Today Date: \" + date_string + \"\n\n\" }}\n{%- if tools is not none and not tools_in_user_message %}\n {{- \"You have access to the following functions. To call a function, please respond with JSON for a function call.\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' 
}}\n {{- \"Do not use variables.\n\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\n\n\" }}\n {%- endfor %}\n{%- endif %}\n{{- system_message }}\n{{- \"<|eot_id|>\" }}\n\n{#- Custom tools are passed in a user message with some extra guidance #}\n{%- if tools_in_user_message and not tools is none %}\n {#- Extract the first user message so we can plug it in here #}\n {%- if messages | length != 0 %}\n {%- set first_user_message = messages[0]['content']|trim %}\n {%- set messages = messages[1:] %}\n {%- else %}\n {{- raise_exception(\"Cannot put tools in the first user message when there's no first user message!\") }}\n{%- endif %}\n {{- '<|start_header_id|>user<|end_header_id|>\n\n' -}}\n {{- \"Given the following functions, please respond with a JSON for a function call \" }}\n {{- \"with its proper arguments that best answers the given prompt.\n\n\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' }}\n {{- \"Do not use variables.\n\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\n\n\" }}\n {%- endfor %}\n {{- first_user_message + \"<|eot_id|>\"}}\n{%- endif %}\n\n{%- for message in messages %}\n {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}\n {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' }}\n {%- elif 'tool_calls' in message %}\n {%- if not message.tool_calls|length == 1 %}\n {{- raise_exception(\"This model only supports single tool-calls at once!\") }}\n {%- endif %}\n {%- set tool_call = message.tool_calls[0].function %}\n {%- if builtin_tools is defined and tool_call.name in builtin_tools %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}}\n {{- \"<|python_tag|>\" + tool_call.name + \".call(\" }}\n {%- for arg_name, arg_val in tool_call.arguments | items %}\n {{- arg_name + '=\"' + arg_val + '\"' }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- endif %}\n {%- endfor %}\n {{- \")\" }}\n {%- else %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' -}}\n {{- '{\"name\": \"' + tool_call.name + '\", ' }}\n {{- '\"parameters\": ' }}\n {{- tool_call.arguments | tojson }}\n {{- \"}\" }}\n {%- endif %}\n {%- if builtin_tools is defined %}\n {#- This means we're in ipython mode #}\n {{- \"<|eom_id|>\" }}\n {%- else %}\n {{- \"<|eot_id|>\" }}\n {%- endif %}\n {%- elif message.role == \"tool\" or message.role == \"ipython\" %}\n {{- \"<|start_header_id|>ipython<|end_header_id|>\n\n\" }}\n {%- if message.content is mapping or message.content is iterable %}\n {{- message.content | tojson }}\n {%- else %}\n {{- message.content }}\n {%- endif %}\n {{- \"<|eot_id|>\" }}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\n\n' }}\n{%- endif %}\n", - "stop_token_ids": [ - 128001, - 128009 - ], - "stop": [ - "<|end_of_text|>", - "<|eot_id|>" - ] - }, - { - "version": 1, - "context_length": 2048, - "model_name": "tiny-llama", - "model_lang": [ - "en" - ], - "model_ability": [ - "generate" - ], - "model_description": "The TinyLlama project aims to pretrain a 1.1B Llama model on 3 trillion tokens.", - "model_specs": [ - { - "model_format": "ggufv2", - "model_size_in_billions": 1, - "quantizations": [ - "Q2_K" - ], - "model_id": "Xorbits/TinyLlama-1.1B-step-50K-105b-GGUF", - "model_hub": "modelscope", - "model_revision": "v0.0.1", - "model_file_name_template": "ggml-model-{quantization}.gguf" - } - 
] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "baichuan-2-chat", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "Baichuan2-chat is a fine-tuned version of the Baichuan LLM, specializing in chatting.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "baichuan-inc/Baichuan2-7B-Chat", - "model_hub": "modelscope", - "model_revision": "v1.0.4" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 13, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "baichuan-inc/Baichuan2-13B-Chat", - "model_hub": "modelscope", - "model_revision": "v1.0.3" - } - ], - "chat_template": "{{ (messages|selectattr('role', 'equalto', 'system')|list|last).content|trim if (messages|selectattr('role', 'equalto', 'system')|list) else '' }}\n\n{% for message in messages %}\n{% if message['role'] == 'user' %}\n\n{{ message['content']|trim -}}\n{% if not loop.last %}\n\n\n{% endif %}\n{% elif message['role'] == 'assistant' %}\n\n{{ message['content']|trim -}}\n{% if not loop.last %}\n\n\n{% endif %}\n{% endif %}\n{% endfor %}\n{% if add_generation_prompt and messages[-1]['role'] != 'assistant' %}\n\n{% endif %}", - "stop_token_ids": [ - 2, - 195 - ], - "stop": [] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "baichuan-2", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "generate" - ], - "model_description": "Baichuan2 is an open-source Transformer based LLM that is trained on both Chinese and English data.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "baichuan-inc/Baichuan2-7B-Base", - "model_revision": "v1.0.2", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 13, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "baichuan-inc/Baichuan2-13B-Base", - "model_revision": "v1.0.3", - "model_hub": "modelscope" - } - ] - }, - { - "version": 1, - "context_length": 131072, - "model_name": "glm4-chat", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat", - "tools" - ], - "model_description": "GLM4 is the open source version of the latest generation of pre-trained models in the GLM-4 series launched by Zhipu AI.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 9, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "ZhipuAI/glm-4-9b-chat", - "model_revision": "master" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 9, - "quantizations": [ - "Q2_K", - "IQ3_XS", - "IQ3_S", - "IQ3_M", - "Q3_K_S", - "Q3_K_L", - "Q3_K", - "IQ4_XS", - "IQ4_NL", - "Q4_K_S", - "Q4_K", - "Q5_K_S", - "Q5_K", - "Q6_K", - "Q8_0", - "BF16", - "FP16" - ], - "model_file_name_template": "glm-4-9b-chat.{quantization}.gguf", - "model_hub": "modelscope", - "model_id": "LLM-Research/glm-4-9b-chat-GGUF", - "model_revision": "master" - } - ], - "chat_template": "[gMASK]{% for item in messages %}{% if item['tools'] is defined %}<|system|>\n你是一个名为 ChatGLM 的人工智能助手。你是基于智谱AI训练的语言模型 GLM-4 模型开发的,你的任务是针对用户的问题和要求提供适当的答复和支持。\n\n# 可用工具{% set tools = item['tools'] %}{% for tool in tools %}{% if tool['type'] == 'function' %}\n\n## {{ tool['function']['name'] }}\n\n{{ tool['function'] | tojson(indent=4) }}\n在调用上述函数时,请使用 Json 格式表示调用的参数。{% elif tool['type'] == 
'python' %}\n\n## python\n\n当你向 `python` 发送包含 Python 代码的消息时,该代码将会在一个有状态的 Jupyter notebook 环境中执行。\n`python` 返回代码执行的输出,或在执行 60 秒后返回超时。\n`/mnt/data` 将会持久化存储你的文件。在此会话中,`python` 无法访问互联网。不要使用 `python` 进行任何网络请求或者在线 API 调用,这些在线内容的访问将不会成功。{% elif tool['type'] == 'simple_browser' %}\n\n## simple_browser\n\n你可以使用 `simple_browser` 工具。该工具支持以下函数:\n`search(query: str, recency_days: int)`:使用搜索引擎进行查询并显示结果,可以使用 `recency_days` 参数控制搜索内容的时效性。\n`mclick(ids: list[int])`:获取一系列指定 id 的页面内容。每次调用时,须选择3-10个页面。选择多个角度的页面,同时尽可能选择可信任的信息来源。考虑到部分页面是无法加载的,你也可以多打开一些可能有用的页面而不用担心内容过多。\n`open_url(url: str)`:打开指定的 URL。\n\n使用 `【{引用 id}†{引用文本}】` 来引用内容。\n\n操作步骤:1. 使用 `search` 来获得信息列表; 2. 使用 `mclick` 来获取指定 ID 页面的内容; 3. 根据获得的内容进行回复。在回复中应当引用信息来源。\n 如果用户提供了 URL,也可以用 `open_url` 直接打开页面。\n如果初次搜索结果没有找到合适的信息,也可以再次使用 `search` 进行搜索。{% elif tool['type'] == 'cogview' %}\n\n## cogview\n\n如果用户的请求中包含了对图像的描述,你可以使用 `cogview` 来生成图像并展示给用户。你需要向 `cogview` 发送图像描述,规则:\n- 发送给 `cogview` 的消息必须使用英语。用户的中文描述必须完全翻译为英语。\n- 应当尽可能详细地描述图像生成的需求,需求描述约 100 英文单词。\n- 保持用户原始描述的意图。不要虚构内容或者没见过的人物。\n- 如无特殊说明,所在地为中国,持有中国立场并遵循中国社会主义价值观。{% endif %}{% endfor %}{% endif %}{% if item['content'] %}<|{{ item['role'] }}|>{{ item['metadata'] }}\n{{ item['content'] }}{% endif %}{% endfor %}{% if add_generation_prompt %}<|assistant|>{% endif %}", - "stop_token_ids": [ - 151329, - 151336, - 151338 - ], - "stop": [ - "<|endoftext|>", - "<|user|>", - "<|observation|>" - ] - }, - { - "version": 1, - "context_length": 1048576, - "model_name": "glm4-chat-1m", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat", - "tools" - ], - "model_description": "GLM4 is the open source version of the latest generation of pre-trained models in the GLM-4 series launched by Zhipu AI.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 9, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "ZhipuAI/glm-4-9b-chat-1m", - "model_revision": "master" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 9, - "quantizations": [ - "Q2_K", - "IQ3_XS", - "IQ3_S", - "IQ3_M", - "Q3_K_S", - "Q3_K_L", - "Q3_K", - "IQ4_XS", - "IQ4_NL", - "Q4_K_S", - "Q4_K", - "Q5_K_S", - "Q5_K", - "Q6_K", - "Q8_0", - "BF16", - "FP16" - ], - "model_file_name_template": "glm-4-9b-chat-1m.{quantization}.gguf", - "model_hub": "modelscope", - "model_id": "LLM-Research/glm-4-9b-chat-1m-GGUF", - "model_revision": "master" - } - ], - "chat_template": "[gMASK]{% for item in messages %}{% if item['tools'] is defined %}<|system|>\n你是一个名为 GLM-4 的人工智能助手。你是基于智谱AI训练的语言模型 GLM-4 模型开发的,你的任务是针对用户的问题和要求提供适当的答复和支持。\n\n# 可用工具{% set tools = item['tools'] %}{% for tool in tools %}{% if tool['type'] == 'function' %}\n\n## {{ tool['function']['name'] }}\n\n{{ tool['function'] | tojson(indent=4) }}\n在调用上述函数时,请使用 Json 格式表示调用的参数。{% elif tool['type'] == 'python' %}\n\n## python\n\n当你向 `python` 发送包含 Python 代码的消息时,该代码将会在一个有状态的 Jupyter notebook 环境中执行。\n`python` 返回代码执行的输出,或在执行 60 秒后返回超时。\n`/mnt/data` 将会持久化存储你的文件。在此会话中,`python` 无法访问互联网。不要使用 `python` 进行任何网络请求或者在线 API 调用,这些在线内容的访问将不会成功。{% elif tool['type'] == 'simple_browser' %}\n\n## simple_browser\n\n你可以使用 `simple_browser` 工具。该工具支持以下函数:\n`search(query: str, recency_days: int)`:使用搜索引擎进行查询并显示结果,可以使用 `recency_days` 参数控制搜索内容的时效性。\n`mclick(ids: list[int])`:获取一系列指定 id 的页面内容。每次调用时,须选择3-10个页面。选择多个角度的页面,同时尽可能选择可信任的信息来源。考虑到部分页面是无法加载的,你也可以多打开一些可能有用的页面而不用担心内容过多。\n`open_url(url: str)`:打开指定的 URL。\n\n使用 `【{引用 id}†{引用文本}】` 来引用内容。\n\n操作步骤:1. 使用 `search` 来获得信息列表; 2. 使用 `mclick` 来获取指定 ID 页面的内容; 3. 
根据获得的内容进行回复。在回复中应当引用信息来源。\n 如果用户提供了 URL,也可以用 `open_url` 直接打开页面。\n如果初次搜索结果没有找到合适的信息,也可以再次使用 `search` 进行搜索。{% elif tool['type'] == 'cogview' %}\n\n## cogview\n\n如果用户的请求中包含了对图像的描述,你可以使用 `cogview` 来生成图像并展示给用户。你需要向 `cogview` 发送图像描述,规则:\n- 发送给 `cogview` 的消息必须使用英语。用户的中文描述必须完全翻译为英语。\n- 应当尽可能详细地描述图像生成的需求,需求描述约 100 英文单词。\n- 保持用户原始描述的意图。不要虚构内容或者没见过的人物。\n- 如无特殊说明,所在地为中国,持有中国立场并遵循中国社会主义价值观。{% endif %}{% endfor %}{% endif %}{% if item['content'] %}<|{{ item['role'] }}|>{{ item['metadata'] }}\n{{ item['content'] }}{% endif %}{% endfor %}{% if add_generation_prompt %}<|assistant|>{% endif %}", - "stop_token_ids": [ - 151329, - 151336, - 151338 - ], - "stop": [ - "<|endoftext|>", - "<|user|>", - "<|observation|>" - ] - }, - { - "version": 1, - "context_length": 8192, - "model_name": "glm-4v", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat", - "vision" - ], - "model_description": "GLM4 is the open source version of the latest generation of pre-trained models in the GLM-4 series launched by Zhipu AI.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 9, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "ZhipuAI/glm-4v-9b", - "model_revision": "master" - } - ], - "chat_template": "", - "stop_token_ids": [ - 151329, - 151336, - 151338 - ], - "stop": [ - "<|endoftext|>", - "<|user|>", - "<|observation|>" - ] - }, - { - "version": 1, - "context_length": 131072, - "model_name": "codegeex4", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "the open-source version of the latest CodeGeeX4 model series", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 9, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "ZhipuAI/codegeex4-all-9b", - "model_hub": "modelscope", - "model_revision": "master" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 9, - "quantizations": [ - "IQ2_M", - "IQ3_M", - "Q4_K_M", - "Q5_K_M", - "Q6_K_L", - "Q8_0" - ], - "model_file_name_template": "codegeex4-all-9b-{quantization}.gguf", - "model_id": "ZhipuAI/codegeex4-all-9b-GGUF", - "model_hub": "modelscope" - } - ], - "chat_template": "{% for item in messages %}{% if loop.first and item['role'] == 'system' %}{{ '<|system|>\n' + item['content'] }}{% elif loop.first %}{{ '<|system|>\n你是一位智能编程助手,你叫CodeGeeX。你会为用户回答关于编程、代码、计算机方面的任何问题,并提供格式规范、可以执行、准确安全的代码,并在必要时提供详细的解释。' }}{% endif %}{% if item['role'] == 'user' %}{{ '<|user|>\n' + item['content'] }}{% elif item['role'] == 'assistant' %}{{ '<|assistant|>\n' + item['content'] }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% endif %}", - "stop_token_ids": [ - 151329, - 151336, - 151338 - ], - "stop": [ - "<|endoftext|>", - "<|user|>", - "<|observation|>" - ] - }, - { - "version": 1, - "context_length": 2048, - "model_name": "xverse-chat", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "XVERSE-7B is a multilingual large language model, independently developed by Shenzhen Yuanxiang Technology.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "xverse/XVERSE-7B-Chat", - "model_revision": "master" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 13, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "xverse/XVERSE-13B-Chat", 
- "model_revision": "master" - } - ], - "chat_template": "{% for item in messages %}{% if loop.first and item['role'] == 'system' %}{{ '<|system|> \n' + item['content'] }}{% endif %}{% if item['role'] == 'user' %}{{ '<|user|> \n' + item['content'] }}{% elif item['role'] == 'assistant' %}{{ '<|assistant|> \n' + item['content'] }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>' }}{% endif %}", - "stop_token_ids": [ - 3 - ], - "stop": [ - "<|endoftext|>" - ] - }, - { - "version": 1, - "context_length": 2048, - "model_name": "xverse", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "generate" - ], - "model_description": "XVERSE is a multilingual large language model, independently developed by Shenzhen Yuanxiang Technology.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "xverse/XVERSE-7B", - "model_hub": "modelscope", - "model_revision": "master" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 13, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "xverse/XVERSE-13B", - "model_hub": "modelscope", - "model_revision": "master" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 65, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "xverse/XVERSE-65B", - "model_hub": "modelscope", - "model_revision": "master" - } - ] - }, - { - "version": 1, - "context_length": 32768, - "model_name": "internlm2.5-chat", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "InternLM2.5 series of the InternLM model.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": "1_8", - "quantizations": [ - "none" - ], - "model_id": "Shanghai_AI_Laboratory/internlm2_5-1_8b-chat", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "none" - ], - "model_id": "Shanghai_AI_Laboratory/internlm2_5-7b-chat", - "model_hub": "modelscope" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 7, - "quantizations": [ - "q2_k", - "q3_k_m", - "q4_0", - "q4_k_m", - "q5_0", - "q5_k_m", - "q6_k", - "q8_0", - "fp16" - ], - "model_id": "Shanghai_AI_Laboratory/internlm2_5-7b-chat-gguf", - "model_file_name_template": "internlm2_5-7b-chat-{quantization}.gguf", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 20, - "quantizations": [ - "none" - ], - "model_id": "Shanghai_AI_Laboratory/internlm2_5-20b-chat", - "model_hub": "modelscope" - } - ], - "chat_template": "{{ '' }}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", - "stop_token_ids": [ - 2, - 92542 - ], - "stop": [ - "", - "<|im_end|>" - ] - }, - { - "version": 1, - "context_length": 262144, - "model_name": "internlm2.5-chat-1m", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "InternLM2.5 series of the InternLM model supports 1M long-context", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "none" - ], - "model_id": "Shanghai_AI_Laboratory/internlm2_5-7b-chat-1m", - "model_hub": "modelscope" - } - ], - "chat_template": "{{ '' }}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + 
'<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", - "stop_token_ids": [ - 2, - 92542 - ], - "stop": [ - "", - "<|im_end|>" - ] - }, - { - "version": 1, - "context_length": 100000, - "model_name": "wizardcoder-python-v1.0", - "model_lang": [ - "en" - ], - "model_ability": [ - "chat" - ], - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 13, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "AI-ModelScope/WizardCoder-Python-13B-V1.0", - "model_revision": "v1.0.0" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 34, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "AI-ModelScope/WizardCoder-Python-34B-V1.0", - "model_revision": "v1.0.0" - } - ], - "chat_template": "{% for item in messages %}{% if loop.first and item['role'] == 'system' %}{{ item['content'] + '\n\n### ' }}{% elif loop.first %}{{ 'Below is an instruction that describes a task. Write a response that appropriately completes the request.\n\n### ' }}{% endif %}{% if item['role'] == 'user' %}{{ 'Instruction: ' + item['content'] + '\n\n### ' }}{% elif item['role'] == 'assistant' %}{{ 'Response: ' + item['content'] + '\n\n### ' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ 'Response: Let\\'s think step by step.' }}{% endif %}", - "stop_token_ids": [ - 2 - ], - "stop": [ - "" - ] - }, - { - "version": 1, - "context_length": 100000, - "model_name": "code-llama", - "model_lang": [ - "en" - ], - "model_ability": [ - "generate" - ], - "model_description": "Code-Llama is an open-source LLM trained by fine-tuning LLaMA2 for generating and discussing code.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "AI-ModelScope/CodeLlama-7b-hf", - "model_revision": "v1.0.2" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 13, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "AI-ModelScope/CodeLlama-13b-hf", - "model_revision": "v1.0.1" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 34, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "AI-ModelScope/CodeLlama-34b-hf", - "model_revision": "v1.0.1" - } - ] - }, - { - "version": 1, - "context_length": 8194, - "model_name": "codeshell", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "generate" - ], - "model_description": "CodeShell is a multi-language code LLM developed by the Knowledge Computing Lab of Peking University. 
", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "none" - ], - "model_id": "WisdomShell/CodeShell-7B", - "model_revision": "master", - "model_hub": "modelscope" - } - ] - }, - { - "version": 1, - "context_length": 8194, - "model_name": "codeshell-chat", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "CodeShell is a multi-language code LLM developed by the Knowledge Computing Lab of Peking University.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "none" - ], - "model_id": "WisdomShell/CodeShell-7B-Chat", - "model_revision": "master", - "model_hub": "modelscope" - } - ], - "chat_template": "{% for item in messages %}{% if item['role'] == 'user' %}{{ '## human: ' + item['content'] + '||' }}{% elif item['role'] == 'assistant' %}{{ '## assistant: ' + item['content'] + '||' }}{% endif %}{% endfor %}{{ '## assistant: ' }}", - "stop_token_ids": [ - 70000 - ], - "stop": [ - "<|endoftext|>", - "|||", - "||" - ] - }, - { - "version": 1, - "context_length": 100000, - "model_name": "code-llama-instruct", - "model_description": "Code-Llama-Instruct is an instruct-tuned version of the Code-Llama LLM.", - "model_lang": [ - "en" - ], - "model_ability": [ - "chat" - ], - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "AI-ModelScope/CodeLlama-7b-Instruct-hf", - "model_revision": "v1.0.1" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 13, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "AI-ModelScope/CodeLlama-13b-Instruct-hf", - "model_revision": "v1.0.1" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 34, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "AI-ModelScope/CodeLlama-34b-Instruct-hf", - "model_revision": "v1.0.2" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 7, - "quantizations": [ - "Q4_K_M" - ], - "model_hub": "modelscope", - "model_id": "Xorbits/CodeLlama-7B-Instruct-GGUF", - "model_file_name_template": "codellama-7b-instruct.{quantization}.gguf", - "model_revision": "v0.0.1" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 13, - "quantizations": [ - "Q4_K_M" - ], - "model_hub": "modelscope", - "model_id": "Xorbits/CodeLlama-13B-Instruct-GGUF", - "model_file_name_template": "codellama-13b-instruct.{quantization}.gguf", - "model_revision": "v0.0.1" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 34, - "quantizations": [ - "Q4_K_M" - ], - "model_hub": "modelscope", - "model_id": "Xorbits/CodeLlama-34B-Instruct-GGUF", - "model_file_name_template": "codellama-34b-instruct.{quantization}.gguf", - "model_revision": "v0.1.0" - } - ], - "chat_template": "{% if messages[0]['role'] == 'system' %}{% set system_message = '<>\n' + messages[0]['content'] | trim + '\n<>\n\n' %}{% set messages = messages[1:] %}{% else %}{% set system_message = '' %}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if loop.index0 == 0 %}{% set content = system_message + message['content'] %}{% else %}{% set content = message['content'] %}{% endif %}{% if message['role'] == 'user' %}{{ 
'' + '[INST] ' + content | trim + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ ' ' + content | trim + ' ' + '' }}{% endif %}{% endfor %}", - "stop_token_ids": [ - 2 - ], - "stop": [ - "" - ] - }, - { - "version": 1, - "context_length": 8192, - "model_name": "mistral-v0.1", - "model_lang": [ - "en" - ], - "model_ability": [ - "generate" - ], - "model_description": "Mistral-7B is a unmoderated Transformer based LLM claiming to outperform Llama2 on all benchmarks.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "Xorbits/Mistral-7B-v0.1", - "model_revision": "v1.0.0" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 7, - "quantizations": [ - "Q2_K", - "Q3_K_S", - "Q3_K_M", - "Q3_K_L", - "Q4_0", - "Q4_K_S", - "Q4_K_M", - "Q5_0", - "Q5_K_S", - "Q5_K_M", - "Q6_K", - "Q8_0" - ], - "model_hub": "modelscope", - "model_id": "Xorbits/Mistral-7B-v0.1-GGUF", - "model_file_name_template": "mistral-7b-v0.1.{quantization}.gguf", - "model_revision": "v1.0.0" - } - ] - }, - { - "version": 1, - "context_length": 100000, - "model_name": "code-llama-python", - "model_lang": [ - "en" - ], - "model_ability": [ - "generate" - ], - "model_description": "Code-Llama-Python is a fine-tuned version of the Code-Llama LLM, specializing in Python.", - "model_specs": [ - { - "model_format": "ggufv2", - "model_size_in_billions": 7, - "quantizations": [ - "Q2_K", - "Q3_K_L", - "Q3_K_M", - "Q3_K_S", - "Q4_0", - "Q4_K_M", - "Q4_K_S", - "Q5_0", - "Q5_K_M", - "Q5_K_S", - "Q6_K", - "Q8_0" - ], - "model_id": "Xorbits/CodeLlama-7B-Python-GGUF", - "model_hub": "modelscope", - "model_revision": "v1.0.0", - "model_file_name_template": "codellama-7b-python.{quantization}.gguf" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 13, - "quantizations": [ - "Q2_K", - "Q3_K_L", - "Q3_K_M", - "Q3_K_S", - "Q4_0", - "Q4_K_M", - "Q4_K_S", - "Q5_0", - "Q5_K_M", - "Q5_K_S", - "Q6_K", - "Q8_0" - ], - "model_hub": "modelscope", - "model_id": "Xorbits/CodeLlama-13B-Python-GGUF", - "model_file_name_template": "codellama-13b-python.{quantization}.gguf" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 13, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "Xorbits/CodeLlama-13B-Python-fp16", - "model_revision": "v1.0.0" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "Xorbits/CodeLlama-7B-Python-fp16", - "model_revision": "v1.0.0" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 13, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "AI-ModelScope/CodeLlama-13b-Python-hf", - "model_revision": "v1.0.1" - } - ] - }, - { - "version": 1, - "context_length": 32768, - "model_name": "mixtral-v0.1", - "model_lang": [ - "en", - "fr", - "it", - "de", - "es" - ], - "model_ability": [ - "generate" - ], - "model_description": "The Mixtral-8x7B Large Language Model (LLM) is a pretrained generative Sparse Mixture of Experts.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": "46_7", - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "AI-ModelScope/Mixtral-8x7B-v0.1", - "model_revision": "master" - } - ] - }, - { - "version": 1, - "context_length": 32768, - 
"model_name": "mixtral-instruct-v0.1", - "model_lang": [ - "en", - "fr", - "it", - "de", - "es" - ], - "model_ability": [ - "chat" - ], - "model_description": "Mistral-8x7B-Instruct is a fine-tuned version of the Mistral-8x7B LLM, specializing in chatting.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": "46_7", - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "AI-ModelScope/Mixtral-8x7B-Instruct-v0.1", - "model_revision": "master" - } - ], - "chat_template": "{%- if messages[0]['role'] == 'system' %}\n {%- set system_message = messages[0]['content'] %}\n {%- set loop_messages = messages[1:] %}\n{%- else %}\n {%- set loop_messages = messages %}\n{%- endif %}\n\n{{- '' }}\n{%- for message in loop_messages %}\n {%- if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}\n {{- raise_exception('After the optional system message, conversation roles must alternate user/assistant/user/assistant/...') }}\n {%- endif %}\n {%- if message['role'] == 'user' %}\n {%- if loop.first and system_message is defined %}\n {{- ' [INST] ' + system_message + '\n\n' + message['content'] + ' [/INST]' }}\n {%- else %}\n {{- ' [INST] ' + message['content'] + ' [/INST]' }}\n {%- endif %}\n {%- elif message['role'] == 'assistant' %}\n {{- ' ' + message['content'] + ''}}\n {%- else %}\n {{- raise_exception('Only user and assistant roles are supported, with the exception of an initial optional system message!') }}\n {%- endif %}\n{%- endfor %}\n", - "stop_token_ids": [ - 2 - ], - "stop": [ - "" - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "Yi", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "generate" - ], - "model_description": "The Yi series models are large language models trained from scratch by developers at 01.AI.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 6, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-6B", - "model_revision": "master" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 9, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-9B", - "model_revision": "master" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 34, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-34B", - "model_revision": "master" - } - ] - }, - { - "version": 1, - "context_length": 262144, - "model_name": "Yi-200k", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "generate" - ], - "model_description": "The Yi series models are large language models trained from scratch by developers at 01.AI. The first public release contains two bilingual (English/Chinese) base models with the parameter sizes of 6B and 34B. 
Both of them are trained with 4K sequence length and can be extended to 32K during inference time.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 6, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-6B-200K", - "model_revision": "master" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 34, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-34B-200K", - "model_revision": "master" - } - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "Yi-chat", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "The Yi series models are large language models trained from scratch by developers at 01.AI.", - "model_specs": [ - { - "model_format": "gptq", - "model_size_in_billions": 34, - "quantizations": [ - "8bits" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-34B-Chat-{quantization}", - "model_revision": "master" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 6, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-6B-Chat", - "model_revision": "master" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 34, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-34B-Chat", - "model_revision": "master" - } - ], - "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", - "stop_token_ids": [ - 2, - 6, - 7, - 8 - ], - "stop": [ - "<|endoftext|>", - "<|im_start|>", - "<|im_end|>", - "<|im_sep|>" - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "Yi-1.5", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "generate" - ], - "model_description": "Yi-1.5 is an upgraded version of Yi. It is continuously pre-trained on Yi with a high-quality corpus of 500B tokens and fine-tuned on 3M diverse fine-tuning samples.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 6, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-1.5-6B", - "model_revision": "master" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 9, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-1.5-9B", - "model_revision": "master" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 34, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-1.5-34B", - "model_revision": "master" - } - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "Yi-1.5-chat", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "Yi-1.5 is an upgraded version of Yi. 
It is continuously pre-trained on Yi with a high-quality corpus of 500B tokens and fine-tuned on 3M diverse fine-tuning samples.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 6, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-1.5-6B-Chat", - "model_revision": "master" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 9, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-1.5-9B-Chat", - "model_revision": "master" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 34, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-1.5-34B-Chat", - "model_revision": "master" - }, - { - "model_format": "gptq", - "model_size_in_billions": 6, - "quantizations": [ - "Int4" - ], - "model_id": "AI-ModelScope/Yi-1.5-6B-Chat-GPTQ", - "model_hub": "modelscope", - "model_revision": "master" - }, - { - "model_format": "gptq", - "model_size_in_billions": 9, - "quantizations": [ - "Int4" - ], - "model_id": "AI-ModelScope/Yi-1.5-9B-Chat-GPTQ", - "model_hub": "modelscope", - "model_revision": "master" - }, - { - "model_format": "gptq", - "model_size_in_billions": 34, - "quantizations": [ - "Int4" - ], - "model_id": "AI-ModelScope/Yi-1.5-34B-Chat-GPTQ", - "model_hub": "modelscope", - "model_revision": "master" - }, - { - "model_format": "awq", - "model_size_in_billions": 6, - "quantizations": [ - "Int4" - ], - "model_id": "AI-ModelScope/Yi-1.5-6B-Chat-AWQ", - "model_hub": "modelscope", - "model_revision": "master" - }, - { - "model_format": "awq", - "model_size_in_billions": 9, - "quantizations": [ - "Int4" - ], - "model_id": "AI-ModelScope/Yi-1.5-9B-Chat-AWQ", - "model_hub": "modelscope", - "model_revision": "master" - }, - { - "model_format": "awq", - "model_size_in_billions": 34, - "quantizations": [ - "Int4" - ], - "model_id": "AI-ModelScope/Yi-1.5-34B-Chat-AWQ", - "model_hub": "modelscope", - "model_revision": "master" - } - ], - "chat_template": "{% if messages[0]['role'] == 'system' %}{% set system_message = messages[0]['content'] %}{% endif %}{% if system_message is defined %}{{ system_message }}{% endif %}{% for message in messages %}{% set content = message['content'] %}{% if message['role'] == 'user' %}{{ '<|im_start|>user\n' + content + '<|im_end|>\n<|im_start|>assistant\n' }}{% elif message['role'] == 'assistant' %}{{ content + '<|im_end|>' + '\n' }}{% endif %}{% endfor %}", - "stop_token_ids": [ - 2, - 6, - 7, - 8 - ], - "stop": [ - "<|endoftext|>", - "<|im_start|>", - "<|im_end|>", - "<|im_sep|>" - ] - }, - { - "version": 1, - "context_length": 16384, - "model_name": "Yi-1.5-chat-16k", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "Yi-1.5 is an upgraded version of Yi. 
It is continuously pre-trained on Yi with a high-quality corpus of 500B tokens and fine-tuned on 3M diverse fine-tuning samples.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 9, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-1.5-9B-Chat-16K", - "model_revision": "master" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 34, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-1.5-34B-Chat-16K", - "model_revision": "master" - } - ], - "chat_template": "{% if messages[0]['role'] == 'system' %}{% set system_message = messages[0]['content'] %}{% endif %}{% if system_message is defined %}{{ system_message }}{% endif %}{% for message in messages %}{% set content = message['content'] %}{% if message['role'] == 'user' %}{{ '<|im_start|>user\n' + content + '<|im_end|>\n<|im_start|>assistant\n' }}{% elif message['role'] == 'assistant' %}{{ content + '<|im_end|>' + '\n' }}{% endif %}{% endfor %}", - "stop_token_ids": [ - 2, - 6, - 7, - 8 - ], - "stop": [ - "<|endoftext|>", - "<|im_start|>", - "<|im_end|>", - "<|im_sep|>" - ] - }, - { - "version": 1, - "context_length": 2048, - "model_name": "wizardmath-v1.0", - "model_lang": [ - "en" - ], - "model_ability": [ - "chat" - ], - "model_description": "WizardMath is an open-source LLM trained by fine-tuning Llama2 with Evol-Instruct, specializing in math.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "Xorbits/WizardMath-7B-V1.0", - "model_revision": "v1.0.0" - } - ], - "chat_template": "{% for item in messages %}{% if loop.first and item['role'] == 'system' %}{{ item['content'] + '\n\n### ' }}{% elif loop.first %}{{ 'Below is an instruction that describes a task. Write a response that appropriately completes the request.\n\n### ' }}{% endif %}{% if item['role'] == 'user' %}{{ 'Instruction: ' + item['content'] + '\n\n### ' }}{% elif item['role'] == 'assistant' %}{{ 'Response: ' + item['content'] + '\n\n### ' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ 'Response: Let\\'s think step by step.' 
}}{% endif %}", - "stop_token_ids": [ - 2 - ], - "stop": [ - "" - ] - }, - { - "version": 1, - "context_length": 8192, - "model_name": "mistral-instruct-v0.1", - "model_lang": [ - "en" - ], - "model_ability": [ - "chat" - ], - "model_description": "Mistral-7B-Instruct is a fine-tuned version of the Mistral-7B LLM on public datasets, specializing in chatting.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "Xorbits/Mistral-7B-Instruct-v0.1", - "model_revision": "v1.0.0" - } - ], - "chat_template": "{%- if messages[0]['role'] == 'system' %}\n {%- set system_message = messages[0]['content'] %}\n {%- set loop_messages = messages[1:] %}\n{%- else %}\n {%- set loop_messages = messages %}\n{%- endif %}\n\n{{- '' }}\n{%- for message in loop_messages %}\n {%- if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}\n {{- raise_exception('After the optional system message, conversation roles must alternate user/assistant/user/assistant/...') }}\n {%- endif %}\n {%- if message['role'] == 'user' %}\n {%- if loop.first and system_message is defined %}\n {{- ' [INST] ' + system_message + '\n\n' + message['content'] + ' [/INST]' }}\n {%- else %}\n {{- ' [INST] ' + message['content'] + ' [/INST]' }}\n {%- endif %}\n {%- elif message['role'] == 'assistant' %}\n {{- ' ' + message['content'] + ''}}\n {%- else %}\n {{- raise_exception('Only user and assistant roles are supported, with the exception of an initial optional system message!') }}\n {%- endif %}\n{%- endfor %}\n", - "stop_token_ids": [ - 2 - ], - "stop": [ - "" - ] - }, - { - "version": 1, - "context_length": 8192, - "model_name": "mistral-instruct-v0.2", - "model_lang": [ - "en" - ], - "model_ability": [ - "chat" - ], - "model_description": "The Mistral-7B-Instruct-v0.2 Large Language Model (LLM) is an improved instruct fine-tuned version of Mistral-7B-Instruct-v0.1.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "AI-ModelScope/Mistral-7B-Instruct-v0.2" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 7, - "quantizations": [ - "Q4_K_M" - ], - "model_hub": "modelscope", - "model_id": "Xorbits/Mistral-7B-Instruct-v0.2-GGUF", - "model_file_name_template": "mistral-7b-instruct-v0.2.{quantization}.gguf" - } - ], - "chat_template": "{%- if messages[0]['role'] == 'system' %}\n {%- set system_message = messages[0]['content'] %}\n {%- set loop_messages = messages[1:] %}\n{%- else %}\n {%- set loop_messages = messages %}\n{%- endif %}\n\n{{- '' }}\n{%- for message in loop_messages %}\n {%- if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}\n {{- raise_exception('After the optional system message, conversation roles must alternate user/assistant/user/assistant/...') }}\n {%- endif %}\n {%- if message['role'] == 'user' %}\n {%- if loop.first and system_message is defined %}\n {{- ' [INST] ' + system_message + '\n\n' + message['content'] + ' [/INST]' }}\n {%- else %}\n {{- ' [INST] ' + message['content'] + ' [/INST]' }}\n {%- endif %}\n {%- elif message['role'] == 'assistant' %}\n {{- ' ' + message['content'] + ''}}\n {%- else %}\n {{- raise_exception('Only user and assistant roles are supported, with the exception of an initial optional system message!') }}\n {%- endif %}\n{%- endfor %}\n", - "stop_token_ids": [ - 2 - ], - "stop": [ - "" - ] - }, - { - 
"version": 1, - "context_length": 1024000, - "model_name": "mistral-nemo-instruct", - "model_lang": [ - "en", - "fr", - "de", - "es", - "it", - "pt", - "zh", - "ru", - "ja" - ], - "model_ability": [ - "chat" - ], - "model_description": "The Mistral-Nemo-Instruct-2407 Large Language Model (LLM) is an instruct fine-tuned version of the Mistral-Nemo-Base-2407", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 12, - "quantizations": [ - "none" - ], - "model_id": "AI-ModelScope/Mistral-Nemo-Instruct-2407", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": 12, - "quantizations": [ - "Int4" - ], - "model_id": "LLM-Research/Mistral-Nemo-Instruct-2407-gptq-4bit", - "model_hub": "modelscope" - } - ], - "chat_template": "{%- if messages[0][\"role\"] == \"system\" %}\n {%- set system_message = messages[0][\"content\"] %}\n {%- set loop_messages = messages[1:] %}\n{%- else %}\n {%- set loop_messages = messages %}\n{%- endif %}\n{%- if not tools is defined %}\n {%- set tools = none %}\n{%- endif %}\n{%- set user_messages = loop_messages | selectattr(\"role\", \"equalto\", \"user\") | list %}\n\n{#- This block checks for alternating user/assistant messages, skipping tool calling messages #}\n{%- set ns = namespace() %}\n{%- set ns.index = 0 %}\n{%- for message in loop_messages %}\n {%- if not (message.role == \"tool\" or message.role == \"tool_results\" or (message.tool_calls is defined and message.tool_calls is not none)) %}\n {%- if (message[\"role\"] == \"user\") != (ns.index % 2 == 0) %}\n {{- raise_exception(\"After the optional system message, conversation roles must alternate user/assistant/user/assistant/...\") }}\n {%- endif %}\n {%- set ns.index = ns.index + 1 %}\n {%- endif %}\n{%- endfor %}\n\n{{- '' }}\n{%- for message in loop_messages %}\n {%- if message[\"role\"] == \"user\" %}\n {%- if tools is not none and (message == user_messages[-1]) %}\n {{- \"[AVAILABLE_TOOLS][\" }}\n {%- for tool in tools %}\n {%- set tool = tool.function %}\n {{- '{\"type\": \"function\", \"function\": {' }}\n {%- for key, val in tool.items() if key != \"return\" %}\n {%- if val is string %}\n {{- '\"' + key + '\": \"' + val + '\"' }}\n {%- else %}\n {{- '\"' + key + '\": ' + val|tojson }}\n {%- endif %}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- endif %}\n {%- endfor %}\n {{- \"}}\" }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- else %}\n {{- \"]\" }}\n {%- endif %}\n {%- endfor %}\n {{- \"[/AVAILABLE_TOOLS]\" }}\n {%- endif %}\n {%- if loop.last and system_message is defined %}\n {{- \"[INST]\" + system_message + \"\n\n\" + message[\"content\"] + \"[/INST]\" }}\n {%- else %}\n {{- \"[INST]\" + message[\"content\"] + \"[/INST]\" }}\n {%- endif %}\n {%- elif (message.tool_calls is defined and message.tool_calls is not none) %}\n {{- \"[TOOL_CALLS][\" }}\n {%- for tool_call in message.tool_calls %}\n {%- set out = tool_call.function|tojson %}\n {{- out[:-1] }}\n {%- if not tool_call.id is defined or tool_call.id|length != 9 %}\n {{- raise_exception(\"Tool call IDs should be alphanumeric strings with length 9!\") }}\n {%- endif %}\n {{- ', \"id\": \"' + tool_call.id + '\"}' }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- else %}\n {{- \"]\" + '' }}\n {%- endif %}\n {%- endfor %}\n {%- elif message[\"role\"] == \"assistant\" %}\n {{- message[\"content\"] + ''}}\n {%- elif message[\"role\"] == \"tool_results\" or message[\"role\"] == \"tool\" %}\n {%- if message.content is defined and message.content.content is defined %}\n {%- set 
content = message.content.content %}\n {%- else %}\n {%- set content = message.content %}\n {%- endif %}\n {{- '[TOOL_RESULTS]{\"content\": ' + content|string + \", \" }}\n {%- if not message.tool_call_id is defined or message.tool_call_id|length != 9 %}\n {{- raise_exception(\"Tool call IDs should be alphanumeric strings with length 9!\") }}\n {%- endif %}\n {{- '\"call_id\": \"' + message.tool_call_id + '\"}[/TOOL_RESULTS]' }}\n {%- else %}\n {{- raise_exception(\"Only user and assistant roles are supported, with the exception of an initial optional system message!\") }}\n {%- endif %}\n{%- endfor %}\n", - "stop_token_ids": [ - 2 - ], - "stop": [ - "" - ] - }, - { - "version": 1, - "context_length": 131072, - "model_name": "mistral-large-instruct", - "model_lang": [ - "en", - "fr", - "de", - "es", - "it", - "pt", - "zh", - "ru", - "ja", - "ko" - ], - "model_ability": [ - "chat" - ], - "model_description": "Mistral-Large-Instruct-2407 is an advanced dense Large Language Model (LLM) of 123B parameters with state-of-the-art reasoning, knowledge and coding capabilities.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 123, - "quantizations": [ - "none" - ], - "model_id": "LLM-Research/Mistral-Large-Instruct-2407", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 123, - "quantizations": [ - "4-bit" - ], - "model_id": "LLM-Research/Mistral-Large-Instruct-2407-bnb-4bit", - "model_hub": "modelscope" - } - ], - "chat_template": "{%- if messages[0][\"role\"] == \"system\" %}\n {%- set system_message = messages[0][\"content\"] %}\n {%- set loop_messages = messages[1:] %}\n{%- else %}\n {%- set loop_messages = messages %}\n{%- endif %}\n{%- if not tools is defined %}\n {%- set tools = none %}\n{%- endif %}\n{%- set user_messages = loop_messages | selectattr(\"role\", \"equalto\", \"user\") | list %}\n\n{#- This block checks for alternating user/assistant messages, skipping tool calling messages #}\n{%- set ns = namespace() %}\n{%- set ns.index = 0 %}\n{%- for message in loop_messages %}\n {%- if not (message.role == \"tool\" or message.role == \"tool_results\" or (message.tool_calls is defined and message.tool_calls is not none)) %}\n {%- if (message[\"role\"] == \"user\") != (ns.index % 2 == 0) %}\n {{- raise_exception(\"After the optional system message, conversation roles must alternate user/assistant/user/assistant/...\") }}\n {%- endif %}\n {%- set ns.index = ns.index + 1 %}\n {%- endif %}\n{%- endfor %}\n\n{{- '' }}\n{%- for message in loop_messages %}\n {%- if message[\"role\"] == \"user\" %}\n {%- if tools is not none and (message == user_messages[-1]) %}\n {{- \"[AVAILABLE_TOOLS][\" }}\n {%- for tool in tools %}\n {%- set tool = tool.function %}\n {{- '{\"type\": \"function\", \"function\": {' }}\n {%- for key, val in tool.items() if key != \"return\" %}\n {%- if val is string %}\n {{- '\"' + key + '\": \"' + val + '\"' }}\n {%- else %}\n {{- '\"' + key + '\": ' + val|tojson }}\n {%- endif %}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- endif %}\n {%- endfor %}\n {{- \"}}\" }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- else %}\n {{- \"]\" }}\n {%- endif %}\n {%- endfor %}\n {{- \"[/AVAILABLE_TOOLS]\" }}\n {%- endif %}\n {%- if loop.last and system_message is defined %}\n {{- \"[INST]\" + system_message + \"\n\n\" + message[\"content\"] + \"[/INST]\" }}\n {%- else %}\n {{- \"[INST]\" + message[\"content\"] + \"[/INST]\" }}\n {%- endif %}\n {%- elif (message.tool_calls is defined and message.tool_calls is 
not none) %}\n {{- \"[TOOL_CALLS][\" }}\n {%- for tool_call in message.tool_calls %}\n {%- set out = tool_call.function|tojson %}\n {{- out[:-1] }}\n {%- if not tool_call.id is defined or tool_call.id|length != 9 %}\n {{- raise_exception(\"Tool call IDs should be alphanumeric strings with length 9!\") }}\n {%- endif %}\n {{- ', \"id\": \"' + tool_call.id + '\"}' }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- else %}\n {{- \"]\" + '' }}\n {%- endif %}\n {%- endfor %}\n {%- elif message[\"role\"] == \"assistant\" %}\n {{- message[\"content\"] + ''}}\n {%- elif message[\"role\"] == \"tool_results\" or message[\"role\"] == \"tool\" %}\n {%- if message.content is defined and message.content.content is defined %}\n {%- set content = message.content.content %}\n {%- else %}\n {%- set content = message.content %}\n {%- endif %}\n {{- '[TOOL_RESULTS]{\"content\": ' + content|string + \", \" }}\n {%- if not message.tool_call_id is defined or message.tool_call_id|length != 9 %}\n {{- raise_exception(\"Tool call IDs should be alphanumeric strings with length 9!\") }}\n {%- endif %}\n {{- '\"call_id\": \"' + message.tool_call_id + '\"}[/TOOL_RESULTS]' }}\n {%- else %}\n {{- raise_exception(\"Only user and assistant roles are supported, with the exception of an initial optional system message!\") }}\n {%- endif %}\n{%- endfor %}\n", - "stop_token_ids": [ - 2 - ], - "stop": [ - "" - ] - }, - { - "version": 1, - "context_length": 32768, - "model_name": "qwen-chat", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "Qwen-chat is a fine-tuned version of the Qwen LLM trained with alignment techniques, specializing in chatting.", - "model_specs": [ - { - "model_format": "ggufv2", - "model_size_in_billions": 7, - "quantizations": [ - "Q4_K_M" - ], - "model_hub": "modelscope", - "model_id": "Xorbits/Qwen-7B-Chat-GGUF", - "model_file_name_template": "Qwen-7B-Chat.{quantization}.gguf", - "model_revision": "v0.0.1" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 14, - "quantizations": [ - "Q4_K_M" - ], - "model_hub": "modelscope", - "model_id": "Xorbits/Qwen-14B-Chat-GGUF", - "model_file_name_template": "Qwen-14B-Chat.{quantization}.gguf", - "model_revision": "v0.0.1" - }, - { - "model_format": "pytorch", - "model_size_in_billions": "1_8", - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "qwen/Qwen-1_8B-Chat", - "model_revision": "v1.0.0" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "qwen/Qwen-7B-Chat", - "model_revision": "v1.1.9" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 72, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "qwen/Qwen-72B-Chat", - "model_revision": "master" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 14, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "qwen/Qwen-14B-Chat", - "model_hub": "modelscope", - "model_revision": "v1.0.7" - }, - { - "model_format": "gptq", - "model_size_in_billions": "1_8", - "quantizations": [ - "Int4", - "Int8" - ], - "model_id": "qwen/Qwen-1_8B-Chat-{quantization}", - "model_hub": "modelscope", - "model_revision": "master" - }, - { - "model_format": "gptq", - "model_size_in_billions": 7, - "quantizations": [ - "Int4", - "Int8" - ], - "model_id": "qwen/Qwen-7B-Chat-{quantization}", - "model_hub": "modelscope", - 
"model_revision": "v1.1.7" - }, - { - "model_format": "gptq", - "model_size_in_billions": 14, - "quantizations": [ - "Int4", - "Int8" - ], - "model_id": "qwen/Qwen-14B-Chat-{quantization}", - "model_hub": "modelscope", - "model_revision": "v1.0.7" - }, - { - "model_format": "gptq", - "model_size_in_billions": 72, - "quantizations": [ - "Int4", - "Int8" - ], - "model_id": "qwen/Qwen-72B-Chat-{quantization}", - "model_hub": "modelscope", - "model_revision": "master" - } - ], - "chat_template": "{% for item in messages %}{% if loop.first and item['role'] == 'system' %}{{ '<|im_start|>system\n' + item['content'] + '<|im_end|>\n' }}{% elif loop.first %}{{ '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}{% endif %}{% if item['role'] == 'user' %}{{ '<|im_start|>user\n' + item['content'] + '<|im_end|>' }}{% elif item['role'] == 'assistant' %}{{ '<|im_start|>assistant\n' + item['content'] + '<|im_end|>' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", - "stop_token_ids": [ - 151643, - 151644, - 151645 - ], - "stop": [ - "<|endoftext|>", - "<|im_start|>", - "<|im_end|>" - ] - }, - { - "version": 1, - "context_length": 32768, - "model_name": "qwen1.5-chat", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat", - "tools" - ], - "model_description": "Qwen1.5 is the beta version of Qwen2, a transformer-based decoder-only language model pretrained on a large amount of data.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": "0_5", - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "qwen/Qwen1.5-0.5B-Chat", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": "1_8", - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "qwen/Qwen1.5-1.8B-Chat", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 4, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "qwen/Qwen1.5-4B-Chat", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "qwen/Qwen1.5-7B-Chat", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 14, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "qwen/Qwen1.5-14B-Chat", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 32, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "qwen/Qwen1.5-32B-Chat", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 72, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "qwen/Qwen1.5-72B-Chat", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 110, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "qwen/Qwen1.5-110B-Chat", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": "0_5", - "quantizations": [ - "Int4", - "Int8" - ], - "model_id": "qwen/Qwen1.5-0.5B-Chat-GPTQ-{quantization}", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": "1_8", - "quantizations": [ - "Int4", - "Int8" - ], - "model_id": "qwen/Qwen1.5-1.8B-Chat-GPTQ-{quantization}", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": 4, - "quantizations": [ - "Int4", - "Int8" - 
], - "model_id": "qwen/Qwen1.5-4B-Chat-GPTQ-{quantization}", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": 7, - "quantizations": [ - "Int4", - "Int8" - ], - "model_id": "qwen/Qwen1.5-7B-Chat-GPTQ-{quantization}", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": 14, - "quantizations": [ - "Int4", - "Int8" - ], - "model_id": "qwen/Qwen1.5-14B-Chat-GPTQ-{quantization}", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": 32, - "quantizations": [ - "Int4" - ], - "model_id": "qwen/Qwen1.5-32B-Chat-GPTQ-{quantization}", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": 72, - "quantizations": [ - "Int4", - "Int8" - ], - "model_id": "qwen/Qwen1.5-72B-Chat-GPTQ-{quantization}", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": 110, - "quantizations": [ - "Int4" - ], - "model_id": "qwen/Qwen1.5-110B-Chat-GPTQ-Int4", - "model_hub": "modelscope" - }, - { - "model_format": "awq", - "model_size_in_billions": "0_5", - "quantizations": [ - "Int4" - ], - "model_id": "qwen/Qwen1.5-0.5B-Chat-AWQ", - "model_hub": "modelscope" - }, - { - "model_format": "awq", - "model_size_in_billions": "1_8", - "quantizations": [ - "Int4" - ], - "model_id": "qwen/Qwen1.5-1.8B-Chat-AWQ", - "model_hub": "modelscope" - }, - { - "model_format": "awq", - "model_size_in_billions": 4, - "quantizations": [ - "Int4" - ], - "model_id": "qwen/Qwen1.5-4B-Chat-AWQ", - "model_hub": "modelscope" - }, - { - "model_format": "awq", - "model_size_in_billions": 7, - "quantizations": [ - "Int4" - ], - "model_id": "qwen/Qwen1.5-7B-Chat-AWQ", - "model_hub": "modelscope" - }, - { - "model_format": "awq", - "model_size_in_billions": 14, - "quantizations": [ - "Int4" - ], - "model_id": "qwen/Qwen1.5-14B-Chat-AWQ", - "model_hub": "modelscope" - }, - { - "model_format": "awq", - "model_size_in_billions": 32, - "quantizations": [ - "Int4" - ], - "model_id": "qwen/Qwen1.5-32B-Chat-AWQ", - "model_hub": "modelscope" - }, - { - "model_format": "awq", - "model_size_in_billions": 72, - "quantizations": [ - "Int4" - ], - "model_id": "qwen/Qwen1.5-72B-Chat-AWQ", - "model_hub": "modelscope" - }, - { - "model_format": "awq", - "model_size_in_billions": 110, - "quantizations": [ - "Int4" - ], - "model_id": "qwen/Qwen1.5-110B-Chat-AWQ", - "model_hub": "modelscope" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": "0_5", - "quantizations": [ - "q2_k", - "q3_k_m", - "q4_0", - "q4_k_m", - "q5_0", - "q5_k_m", - "q6_k", - "q8_0" - ], - "model_id": "qwen/Qwen1.5-0.5B-Chat-GGUF", - "model_hub": "modelscope", - "model_file_name_template": "qwen1_5-0_5b-chat-{quantization}.gguf" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": "1_8", - "quantizations": [ - "q2_k", - "q3_k_m", - "q4_0", - "q4_k_m", - "q5_0", - "q5_k_m", - "q6_k", - "q8_0" - ], - "model_id": "qwen/Qwen1.5-1.8B-Chat-GGUF", - "model_hub": "modelscope", - "model_file_name_template": "qwen1_5-1_8b-chat-{quantization}.gguf" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 4, - "quantizations": [ - "q2_k", - "q3_k_m", - "q4_0", - "q4_k_m", - "q5_0", - "q5_k_m", - "q6_k", - "q8_0" - ], - "model_id": "qwen/Qwen1.5-4B-Chat-GGUF", - "model_hub": "modelscope", - "model_file_name_template": "qwen1_5-4b-chat-{quantization}.gguf" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 7, - "quantizations": [ - "q2_k", - "q3_k_m", - "q4_0", - "q4_k_m", - "q5_0", - 
"q5_k_m", - "q6_k", - "q8_0" - ], - "model_id": "qwen/Qwen1.5-7B-Chat-GGUF", - "model_hub": "modelscope", - "model_file_name_template": "qwen1_5-7b-chat-{quantization}.gguf" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 14, - "quantizations": [ - "q2_k", - "q3_k_m", - "q4_0", - "q4_k_m", - "q5_0", - "q5_k_m", - "q6_k", - "q8_0" - ], - "model_id": "qwen/Qwen1.5-14B-Chat-GGUF", - "model_hub": "modelscope", - "model_file_name_template": "qwen1_5-14b-chat-{quantization}.gguf" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 32, - "quantizations": [ - "q2_k", - "q3_k_m", - "q4_0", - "q4_k_m", - "q5_0", - "q5_k_m", - "q6_k", - "q8_0" - ], - "model_id": "qwen/Qwen1.5-32B-Chat-GGUF", - "model_hub": "modelscope", - "model_file_name_template": "qwen1_5-32b-chat-{quantization}.gguf" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 72, - "quantizations": [ - "q2_k", - "q3_k_m", - "q4_k_m" - ], - "model_id": "qwen/Qwen1.5-72B-Chat-GGUF", - "model_hub": "modelscope", - "model_file_name_template": "qwen1_5-72b-chat-{quantization}.gguf", - "model_file_name_split_template": "qwen1_5-72b-chat-{quantization}.gguf.{part}", - "quantization_parts": { - "q4_k_m": [ - "a", - "b" - ] - } - } - ], - "chat_template": "{%- macro json_to_python_type(json_spec) %}\n {%- set basic_type_map = {\n \"string\": \"str\",\n \"number\": \"float\",\n \"integer\": \"int\",\n \"boolean\": \"bool\"\n} %}\n {%- if basic_type_map[json_spec.type] is defined %}\n {{- basic_type_map[json_spec.type] }}\n {%- elif json_spec.type == \"array\" %}\n {{- \"list[\" + json_to_python_type(json_spec|items) + \"]\" }}\n {%- elif json_spec.type == \"object\" %}\n {%- if json_spec.additionalProperties is defined %}\n {{- \"dict[str, \" + json_to_python_type(json_spec.additionalProperties) + ']' }}\n {%- else %}\n {{- \"dict\" }}\n {%- endif %}\n {%- elif json_spec.type is iterable %}\n {{- \"Union[\" }}\n {%- for t in json_spec.type %}\n {{- json_to_python_type({\"type\": t}) }}\n {%- if not loop.last %}\n {{- \",\" }}\n {%- endif %}\n {%- endfor %}\n {{- \"]\" }}\n {%- else %}\n {{- \"Any\" }}\n {%- endif %}\n{%- endmacro %}\n\n{%- if tools %}\n {{- '<|im_start|>system\n' }}\n {%- if messages[0]['role'] == 'system' %}\n {{- messages[0]['content'] + '\n\n' }}\n {%- endif %}\n {{- '# Tools\n\n' }}\n {{- \"You are a function calling AI model. You are provided with function signatures within XML tags. You may call one or more functions to assist with the user query. Don't make assumptions about what values to plug into functions. 
Here are the available tools: \" }}\n {%- for tool in tools %}\n {%- if tool.function is defined %}\n {%- set tool = tool.function %}\n {%- endif %}\n {{- '{\"type\": \"function\", \"function\": ' }}\n {{- '{\"name\": ' + tool.name + '\", ' }}\n {{- '\"description\": \"' + tool.name + '(' }}\n {%- for param_name, param_fields in tool.parameters.properties|items %}\n {{- param_name + \": \" + json_to_python_type(param_fields) }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- endif %}\n {%- endfor %}\n {{- \")\" }}\n {%- if tool.return is defined %}\n {{- \" -> \" + json_to_python_type(tool.return) }}\n {%- endif %}\n {{- \" - \" + tool.description + \"\n\n\" }}\n {%- for param_name, param_fields in tool.parameters.properties|items %}\n {%- if loop.first %}\n {{- \" Args:\n\" }}\n {%- endif %}\n {{- \" \" + param_name + \"(\" + json_to_python_type(param_fields) + \"): \" + param_fields.description|trim }}\n {%- endfor %}\n {%- if tool.return is defined and tool.return.description is defined %}\n {{- \"\n Returns:\n \" + tool.return.description }}\n {%- endif %}\n {{- '\"' }}\n {{- ', \"parameters\": ' }}\n {%- if tool.parameters.properties | length == 0 %}\n {{- \"{}\" }}\n {%- else %}\n {{- tool.parameters|tojson }}\n {%- endif %}\n {{- \"}\" }}\n {%- if not loop.last %}\n {{- \"\n\" }}\n {%- endif %}\n {%- endfor %}\n {{- \" \" }}\n {{- 'Use the following pydantic model json schema for each tool call you will make: {\"properties\": {\"arguments\": {\"title\": \"Arguments\", \"type\": \"object\"}, \"name\": {\"title\": \"Name\", \"type\": \"string\"}}, \"required\": [\"arguments\", \"name\"], \"title\": \"FunctionCall\", \"type\": \"object\"}\n' }}\n {{- \"For each function call return a json object with function name and arguments within XML tags as follows:\n\" }}\n {{- \"\n\" }}\n {{- '{\"name\": , \"arguments\": }\n' }}\n {{- '<|im_end|>\n' }}\n{%- else %}\n {%- if messages[0]['role'] != 'system' %}\n {{- '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}\n {%- else %}\n {{- '<|im_start|>system\n' + messages[0]['content'] + '<|im_end|>\n' }}\n {%- endif %}\n{%- endif %}\n{%- for message in messages %}\n {%- if message.role == \"user\" or (message.role == \"system\" and not loop.first) or (message.role == \"assistant\" and message.tool_calls is not defined) %}\n {{- '<|im_start|>' + message.role + '\n' + message.content + '<|im_end|>' + '\n' }}\n {%- elif message.role == \"assistant\" %}\n {{- '<|im_start|>' + message.role + '\n\n' }}\n {%- for tool_call in message.tool_calls %}\n {%- if tool_call.function is defined %}\n {%- set tool_call = tool_call.function %}\n {%- endif %}\n {{- '{' }}\n {{- '\"name\": \"' }}\n {{- tool_call.name }}\n {%- if tool_call.arguments is defined %}\n {{- ', ' }}\n {{- '\"arguments\": ' }}\n {{- tool_call.arguments|tojson }}\n {%- endif %}\n {{- '\"}' }}\n {{- '\n' }}\n {%- endfor %}\n {{- '<|im_end|>\n' }}\n {%- elif message.role == \"tool\" %}\n {%- if not message.name is defined %}\n {{- raise_exception(\"Tool response dicts require a 'name' key indicating the name of the called function!\") }}\n {%- endif %}\n {{- '<|im_start|>user\n\n' }}\n {{- '{\"name\": \"' }}\n {{- message.name }}\n {{- '\", \"content\": ' }}\n {{- message.content|tojson + '}' }}\n {{- '\n<|im_end|>\n' }}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|im_start|>assistant\n' }}\n{%- endif %}", - "stop_token_ids": [ - 151643, - 151644, - 151645 - ], - "stop": [ - "<|endoftext|>", - "<|im_start|>", - "<|im_end|>" - ] - }, - { - "version": 1, - 
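The "model_file_name_split_template" and "quantization_parts" fields in the GGUF specs above describe how multi-part downloads are named: single-file quantizations expand "model_file_name_template", while quantizations listed under "quantization_parts" expand the split template once per part. A minimal sketch of that expansion, assuming an already-parsed spec dict (the helper name and the spec literal are illustrative, not xinference's actual resolver):

# Sketch only: expand a GGUF spec's file-name templates into concrete names.
def gguf_file_names(spec, quantization):
    parts = spec.get("quantization_parts", {}).get(quantization)
    if parts is None:
        # Single-file quantization: one name from the plain template.
        return [spec["model_file_name_template"].format(quantization=quantization)]
    # Split quantization: one file name per listed part.
    template = spec["model_file_name_split_template"]
    return [template.format(quantization=quantization, part=part) for part in parts]

spec = {
    "model_file_name_template": "qwen1_5-72b-chat-{quantization}.gguf",
    "model_file_name_split_template": "qwen1_5-72b-chat-{quantization}.gguf.{part}",
    "quantization_parts": {"q4_k_m": ["a", "b"]},
}
print(gguf_file_names(spec, "q2_k"))    # ['qwen1_5-72b-chat-q2_k.gguf']
print(gguf_file_names(spec, "q4_k_m"))  # ['qwen1_5-72b-chat-q4_k_m.gguf.a', 'qwen1_5-72b-chat-q4_k_m.gguf.b']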
"context_length": 32768, - "model_name": "qwen1.5-moe-chat", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat", - "tools" - ], - "model_description": "Qwen1.5-MoE is a transformer-based MoE decoder-only language model pretrained on a large amount of data.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": "2_7", - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "qwen/Qwen1.5-MoE-A2.7B-Chat", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": "2_7", - "quantizations": [ - "Int4" - ], - "model_id": "qwen/Qwen1.5-MoE-A2.7B-Chat-GPTQ-Int4", - "model_hub": "modelscope" - } - ], - "chat_template": "{%- macro json_to_python_type(json_spec) %}\n {%- set basic_type_map = {\n \"string\": \"str\",\n \"number\": \"float\",\n \"integer\": \"int\",\n \"boolean\": \"bool\"\n} %}\n {%- if basic_type_map[json_spec.type] is defined %}\n {{- basic_type_map[json_spec.type] }}\n {%- elif json_spec.type == \"array\" %}\n {{- \"list[\" + json_to_python_type(json_spec|items) + \"]\" }}\n {%- elif json_spec.type == \"object\" %}\n {%- if json_spec.additionalProperties is defined %}\n {{- \"dict[str, \" + json_to_python_type(json_spec.additionalProperties) + ']' }}\n {%- else %}\n {{- \"dict\" }}\n {%- endif %}\n {%- elif json_spec.type is iterable %}\n {{- \"Union[\" }}\n {%- for t in json_spec.type %}\n {{- json_to_python_type({\"type\": t}) }}\n {%- if not loop.last %}\n {{- \",\" }}\n {%- endif %}\n {%- endfor %}\n {{- \"]\" }}\n {%- else %}\n {{- \"Any\" }}\n {%- endif %}\n{%- endmacro %}\n\n{%- if tools %}\n {{- '<|im_start|>system\n' }}\n {%- if messages[0]['role'] == 'system' %}\n {{- messages[0]['content'] + '\n\n' }}\n {%- endif %}\n {{- '# Tools\n\n' }}\n {{- \"You are a function calling AI model. You are provided with function signatures within XML tags. You may call one or more functions to assist with the user query. Don't make assumptions about what values to plug into functions. 
Here are the available tools: \" }}\n {%- for tool in tools %}\n {%- if tool.function is defined %}\n {%- set tool = tool.function %}\n {%- endif %}\n {{- '{\"type\": \"function\", \"function\": ' }}\n {{- '{\"name\": ' + tool.name + '\", ' }}\n {{- '\"description\": \"' + tool.name + '(' }}\n {%- for param_name, param_fields in tool.parameters.properties|items %}\n {{- param_name + \": \" + json_to_python_type(param_fields) }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- endif %}\n {%- endfor %}\n {{- \")\" }}\n {%- if tool.return is defined %}\n {{- \" -> \" + json_to_python_type(tool.return) }}\n {%- endif %}\n {{- \" - \" + tool.description + \"\n\n\" }}\n {%- for param_name, param_fields in tool.parameters.properties|items %}\n {%- if loop.first %}\n {{- \" Args:\n\" }}\n {%- endif %}\n {{- \" \" + param_name + \"(\" + json_to_python_type(param_fields) + \"): \" + param_fields.description|trim }}\n {%- endfor %}\n {%- if tool.return is defined and tool.return.description is defined %}\n {{- \"\n Returns:\n \" + tool.return.description }}\n {%- endif %}\n {{- '\"' }}\n {{- ', \"parameters\": ' }}\n {%- if tool.parameters.properties | length == 0 %}\n {{- \"{}\" }}\n {%- else %}\n {{- tool.parameters|tojson }}\n {%- endif %}\n {{- \"}\" }}\n {%- if not loop.last %}\n {{- \"\n\" }}\n {%- endif %}\n {%- endfor %}\n {{- \" \" }}\n {{- 'Use the following pydantic model json schema for each tool call you will make: {\"properties\": {\"arguments\": {\"title\": \"Arguments\", \"type\": \"object\"}, \"name\": {\"title\": \"Name\", \"type\": \"string\"}}, \"required\": [\"arguments\", \"name\"], \"title\": \"FunctionCall\", \"type\": \"object\"}\n' }}\n {{- \"For each function call return a json object with function name and arguments within XML tags as follows:\n\" }}\n {{- \"\n\" }}\n {{- '{\"name\": , \"arguments\": }\n' }}\n {{- '<|im_end|>\n' }}\n{%- else %}\n {%- if messages[0]['role'] != 'system' %}\n {{- '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}\n {%- else %}\n {{- '<|im_start|>system\n' + messages[0]['content'] + '<|im_end|>\n' }}\n {%- endif %}\n{%- endif %}\n{%- for message in messages %}\n {%- if message.role == \"user\" or (message.role == \"system\" and not loop.first) or (message.role == \"assistant\" and message.tool_calls is not defined) %}\n {{- '<|im_start|>' + message.role + '\n' + message.content + '<|im_end|>' + '\n' }}\n {%- elif message.role == \"assistant\" %}\n {{- '<|im_start|>' + message.role + '\n\n' }}\n {%- for tool_call in message.tool_calls %}\n {%- if tool_call.function is defined %}\n {%- set tool_call = tool_call.function %}\n {%- endif %}\n {{- '{' }}\n {{- '\"name\": \"' }}\n {{- tool_call.name }}\n {%- if tool_call.arguments is defined %}\n {{- ', ' }}\n {{- '\"arguments\": ' }}\n {{- tool_call.arguments|tojson }}\n {%- endif %}\n {{- '\"}' }}\n {{- '\n' }}\n {%- endfor %}\n {{- '<|im_end|>\n' }}\n {%- elif message.role == \"tool\" %}\n {%- if not message.name is defined %}\n {{- raise_exception(\"Tool response dicts require a 'name' key indicating the name of the called function!\") }}\n {%- endif %}\n {{- '<|im_start|>user\n\n' }}\n {{- '{\"name\": \"' }}\n {{- message.name }}\n {{- '\", \"content\": ' }}\n {{- message.content|tojson + '}' }}\n {{- '\n<|im_end|>\n' }}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|im_start|>assistant\n' }}\n{%- endif %}", - "stop_token_ids": [ - 151643, - 151644, - 151645 - ], - "stop": [ - "<|endoftext|>", - "<|im_start|>", - "<|im_end|>" - ] - }, - { - "version": 1, - 
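Each chat family above pairs a Jinja2 "chat_template" with matching "stop"/"stop_token_ids" fields. As a rough illustration of what such a template produces when rendered with plain jinja2 (using the simple ChatML-style template carried by entries such as codeqwen1.5-chat below; a sketch, not xinference's own rendering path):

# Sketch only: render a ChatML-style chat_template with plain Jinja2.
from jinja2 import Template

chat_template = (
    "{% for message in messages %}"
    "{% if loop.first and messages[0]['role'] != 'system' %}"
    "{{ '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}"
    "{% endif %}"
    "{{ '<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>\n' }}"
    "{% endfor %}"
    "{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}"
)

messages = [{"role": "user", "content": "Say hi."}]
print(Template(chat_template).render(messages=messages, add_generation_prompt=True))
# Prints the turns delimited by <|im_start|>/<|im_end|>, ending with an open
# assistant turn; the family's "stop" strings (e.g. <|im_end|>) mark where the
# generated assistant turn should be cut off.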
"context_length": 65536, - "model_name": "codeqwen1.5", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "generate" - ], - "model_description": "CodeQwen1.5 is the Code-Specific version of Qwen1.5. It is a transformer-based decoder-only language model pretrained on a large amount of data of codes.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "qwen/CodeQwen1.5-7B", - "model_hub": "modelscope" - } - ] - }, - { - "version": 1, - "context_length": 65536, - "model_name": "codeqwen1.5-chat", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "CodeQwen1.5 is the Code-Specific version of Qwen1.5. It is a transformer-based decoder-only language model pretrained on a large amount of data of codes.", - "model_specs": [ - { - "model_format": "ggufv2", - "model_size_in_billions": 7, - "quantizations": [ - "q2_k", - "q3_k_m", - "q4_0", - "q4_k_m", - "q5_0", - "q5_k_m", - "q6_k", - "q8_0" - ], - "model_id": "qwen/CodeQwen1.5-7B-Chat-GGUF", - "model_hub": "modelscope", - "model_file_name_template": "codeqwen-1_5-7b-chat-{quantization}.gguf" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "qwen/CodeQwen1.5-7B-Chat", - "model_hub": "modelscope" - }, - { - "model_format": "awq", - "model_size_in_billions": 7, - "quantizations": [ - "Int4" - ], - "model_id": "qwen/CodeQwen1.5-7B-Chat-AWQ", - "model_hub": "modelscope" - } - ], - "chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", - "stop_token_ids": [ - 151643, - 151644, - 151645 - ], - "stop": [ - "<|endoftext|>", - "<|im_start|>", - "<|im_end|>" - ] - }, - { - "version": 1, - "context_length": 32768, - "model_name": "qwen2-instruct", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat", - "tools" - ], - "model_description": "Qwen2 is the new series of Qwen large language models", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": "0_5", - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "qwen/Qwen2-0.5B-Instruct", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": "1_5", - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "qwen/Qwen2-1.5B-Instruct", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "qwen/Qwen2-7B-Instruct", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 72, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "qwen/Qwen2-72B-Instruct", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": "0_5", - "quantizations": [ - "Int4", - "Int8" - ], - "model_id": "qwen/Qwen2-0.5B-Instruct-GPTQ-{quantization}", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": "1_5", - "quantizations": [ - "Int4", - "Int8" - ], - "model_id": "qwen/Qwen2-1.5B-Instruct-GPTQ-{quantization}", - "model_hub": "modelscope" - }, - { - 
"model_format": "gptq", - "model_size_in_billions": 7, - "quantizations": [ - "Int4", - "Int8" - ], - "model_id": "qwen/Qwen2-7B-Instruct-GPTQ-{quantization}", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": 72, - "quantizations": [ - "Int4", - "Int8" - ], - "model_id": "qwen/Qwen2-72B-Instruct-GPTQ-{quantization}", - "model_hub": "modelscope" - }, - { - "model_format": "awq", - "model_size_in_billions": "0_5", - "quantizations": [ - "Int4" - ], - "model_id": "qwen/Qwen2-0.5B-Instruct-AWQ", - "model_hub": "modelscope" - }, - { - "model_format": "awq", - "model_size_in_billions": "1_5", - "quantizations": [ - "Int4" - ], - "model_id": "qwen/Qwen2-1.5B-Instruct-AWQ", - "model_hub": "modelscope" - }, - { - "model_format": "awq", - "model_size_in_billions": 7, - "quantizations": [ - "Int4" - ], - "model_id": "qwen/Qwen2-7B-Instruct-AWQ", - "model_hub": "modelscope" - }, - { - "model_format": "awq", - "model_size_in_billions": 72, - "quantizations": [ - "Int4" - ], - "model_id": "qwen/Qwen2-72B-Instruct-AWQ", - "model_hub": "modelscope" - }, - { - "model_format": "fp8", - "model_size_in_billions": 7, - "quantizations": [ - "fp8" - ], - "model_id": "liuzhenghua/Qwen2-7B-FP8-Instruct", - "model_hub": "modelscope" - }, - { - "model_format": "fp8", - "model_size_in_billions": 72, - "quantizations": [ - "fp8" - ], - "model_id": "liuzhenghua/Qwen2-72B-FP8-Instruct", - "model_hub": "modelscope" - }, - { - "model_format": "mlx", - "model_size_in_billions": "0_5", - "quantizations": [ - "4-bit" - ], - "model_id": "qwen/Qwen2-0.5B-Instruct-MLX", - "model_hub": "modelscope" - }, - { - "model_format": "mlx", - "model_size_in_billions": "1_5", - "quantizations": [ - "4-bit" - ], - "model_id": "qwen/Qwen2-1.5B-Instruct-MLX", - "model_hub": "modelscope" - }, - { - "model_format": "mlx", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit" - ], - "model_id": "qwen/Qwen2-7B-Instruct-MLX", - "model_hub": "modelscope" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": "0_5", - "quantizations": [ - "q2_k", - "q3_k_m", - "q4_0", - "q4_k_m", - "q5_0", - "q5_k_m", - "q6_k", - "q8_0", - "fp16" - ], - "model_id": "qwen/Qwen2-0.5B-Instruct-GGUF", - "model_file_name_template": "qwen2-0_5b-instruct-{quantization}.gguf", - "model_hub": "modelscope" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": "1_5", - "quantizations": [ - "q2_k", - "q3_k_m", - "q4_0", - "q4_k_m", - "q5_0", - "q5_k_m", - "q6_k", - "q8_0", - "fp16" - ], - "model_id": "qwen/Qwen2-1.5B-Instruct-GGUF", - "model_file_name_template": "qwen2-1_5b-instruct-{quantization}.gguf", - "model_hub": "modelscope" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 7, - "quantizations": [ - "q2_k", - "q3_k_m", - "q4_0", - "q4_k_m", - "q5_0", - "q5_k_m", - "q6_k", - "q8_0", - "fp16" - ], - "model_id": "qwen/Qwen2-7B-Instruct-GGUF", - "model_file_name_template": "qwen2-7b-instruct-{quantization}.gguf", - "model_hub": "modelscope" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 72, - "quantizations": [ - "q2_k", - "q3_k_m", - "q4_0", - "q4_k_m", - "q5_0", - "q5_k_m", - "q6_k", - "q8_0", - "fp16" - ], - "model_id": "qwen/Qwen2-72B-Instruct-GGUF", - "model_hub": "modelscope", - "model_file_name_template": "qwen2-72b-instruct-{quantization}.gguf", - "model_file_name_split_template": "qwen2-72b-instruct-{quantization}-{part}.gguf", - "quantization_parts": { - "q5_0": [ - "00001-of-00002", - "00002-of-00002" - ], - "q5_k_m": [ - "00001-of-00002", - "00002-of-00002" - 
], - "q6_k": [ - "00001-of-00002", - "00002-of-00002" - ], - "q8_0": [ - "00001-of-00002", - "00002-of-00002" - ], - "fp16": [ - "00001-of-00004", - "00002-of-00004", - "00003-of-00004", - "00004-of-00004" - ] - } - } - ], - "chat_template": "{%- macro json_to_python_type(json_spec) %}\n {%- set basic_type_map = {\n \"string\": \"str\",\n \"number\": \"float\",\n \"integer\": \"int\",\n \"boolean\": \"bool\"\n} %}\n {%- if basic_type_map[json_spec.type] is defined %}\n {{- basic_type_map[json_spec.type] }}\n {%- elif json_spec.type == \"array\" %}\n {{- \"list[\" + json_to_python_type(json_spec|items) + \"]\" }}\n {%- elif json_spec.type == \"object\" %}\n {%- if json_spec.additionalProperties is defined %}\n {{- \"dict[str, \" + json_to_python_type(json_spec.additionalProperties) + ']' }}\n {%- else %}\n {{- \"dict\" }}\n {%- endif %}\n {%- elif json_spec.type is iterable %}\n {{- \"Union[\" }}\n {%- for t in json_spec.type %}\n {{- json_to_python_type({\"type\": t}) }}\n {%- if not loop.last %}\n {{- \",\" }}\n {%- endif %}\n {%- endfor %}\n {{- \"]\" }}\n {%- else %}\n {{- \"Any\" }}\n {%- endif %}\n{%- endmacro %}\n\n{%- if tools %}\n {{- '<|im_start|>system\n' }}\n {%- if messages[0]['role'] == 'system' %}\n {{- messages[0]['content'] + '\n\n' }}\n {%- endif %}\n {{- '# Tools\n\n' }}\n {{- \"You are a function calling AI model. You are provided with function signatures within XML tags. You may call one or more functions to assist with the user query. Don't make assumptions about what values to plug into functions. Here are the available tools: \" }}\n {%- for tool in tools %}\n {%- if tool.function is defined %}\n {%- set tool = tool.function %}\n {%- endif %}\n {{- '{\"type\": \"function\", \"function\": ' }}\n {{- '{\"name\": ' + tool.name + '\", ' }}\n {{- '\"description\": \"' + tool.name + '(' }}\n {%- for param_name, param_fields in tool.parameters.properties|items %}\n {{- param_name + \": \" + json_to_python_type(param_fields) }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- endif %}\n {%- endfor %}\n {{- \")\" }}\n {%- if tool.return is defined %}\n {{- \" -> \" + json_to_python_type(tool.return) }}\n {%- endif %}\n {{- \" - \" + tool.description + \"\n\n\" }}\n {%- for param_name, param_fields in tool.parameters.properties|items %}\n {%- if loop.first %}\n {{- \" Args:\n\" }}\n {%- endif %}\n {{- \" \" + param_name + \"(\" + json_to_python_type(param_fields) + \"): \" + param_fields.description|trim }}\n {%- endfor %}\n {%- if tool.return is defined and tool.return.description is defined %}\n {{- \"\n Returns:\n \" + tool.return.description }}\n {%- endif %}\n {{- '\"' }}\n {{- ', \"parameters\": ' }}\n {%- if tool.parameters.properties | length == 0 %}\n {{- \"{}\" }}\n {%- else %}\n {{- tool.parameters|tojson }}\n {%- endif %}\n {{- \"}\" }}\n {%- if not loop.last %}\n {{- \"\n\" }}\n {%- endif %}\n {%- endfor %}\n {{- \" \" }}\n {{- 'Use the following pydantic model json schema for each tool call you will make: {\"properties\": {\"arguments\": {\"title\": \"Arguments\", \"type\": \"object\"}, \"name\": {\"title\": \"Name\", \"type\": \"string\"}}, \"required\": [\"arguments\", \"name\"], \"title\": \"FunctionCall\", \"type\": \"object\"}\n' }}\n {{- \"For each function call return a json object with function name and arguments within XML tags as follows:\n\" }}\n {{- \"\n\" }}\n {{- '{\"name\": , \"arguments\": }\n' }}\n {{- '<|im_end|>\n' }}\n{%- else %}\n {%- if messages[0]['role'] != 'system' %}\n {{- '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' 
}}\n {%- else %}\n {{- '<|im_start|>system\n' + messages[0]['content'] + '<|im_end|>\n' }}\n {%- endif %}\n{%- endif %}\n{%- for message in messages %}\n {%- if message.role == \"user\" or (message.role == \"system\" and not loop.first) or (message.role == \"assistant\" and message.tool_calls is not defined) %}\n {{- '<|im_start|>' + message.role + '\n' + message.content + '<|im_end|>' + '\n' }}\n {%- elif message.role == \"assistant\" %}\n {{- '<|im_start|>' + message.role + '\n\n' }}\n {%- for tool_call in message.tool_calls %}\n {%- if tool_call.function is defined %}\n {%- set tool_call = tool_call.function %}\n {%- endif %}\n {{- '{' }}\n {{- '\"name\": \"' }}\n {{- tool_call.name }}\n {%- if tool_call.arguments is defined %}\n {{- ', ' }}\n {{- '\"arguments\": ' }}\n {{- tool_call.arguments|tojson }}\n {%- endif %}\n {{- '\"}' }}\n {{- '\n' }}\n {%- endfor %}\n {{- '<|im_end|>\n' }}\n {%- elif message.role == \"tool\" %}\n {%- if not message.name is defined %}\n {{- raise_exception(\"Tool response dicts require a 'name' key indicating the name of the called function!\") }}\n {%- endif %}\n {{- '<|im_start|>user\n\n' }}\n {{- '{\"name\": \"' }}\n {{- message.name }}\n {{- '\", \"content\": ' }}\n {{- message.content|tojson + '}' }}\n {{- '\n<|im_end|>\n' }}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|im_start|>assistant\n' }}\n{%- endif %}", - "stop_token_ids": [ - 151643, - 151644, - 151645 - ], - "stop": [ - "<|endoftext|>", - "<|im_start|>", - "<|im_end|>" - ] - }, - { - "version": 1, - "context_length": 32768, - "model_name": "qwen2-moe-instruct", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat", - "tools" - ], - "model_description": "Qwen2 is the new series of Qwen large language models. ", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 14, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "qwen/Qwen2-57B-A14B-Instruct", - "model_hub": "modelscope" - }, - { - "model_format": "gptq", - "model_size_in_billions": 14, - "quantizations": [ - "Int4" - ], - "model_id": "qwen/Qwen2-57B-A14B-Instruct-GPTQ-Int4", - "model_hub": "modelscope" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 14, - "quantizations": [ - "q3_k_m", - "q4_0", - "q4_k_m", - "q5_0", - "q5_k_m", - "q6_k", - "q8_0", - "fp16" - ], - "model_id": "qwen/Qwen2-57B-A14B-Instruct-GGUF", - "model_hub": "modelscope", - "model_file_name_template": "qwen2-57b-a14b-instruct-{quantization}.gguf", - "model_file_name_split_template": "qwen2-57b-a14b-instruct-{quantization}-{part}.gguf", - "quantization_parts": { - "q8_0": [ - "00001-of-00002", - "00002-of-00002" - ], - "fp16": [ - "00001-of-00003", - "00002-of-00003", - "00003-of-00003" - ] - } - } - ], - "chat_template": "{%- macro json_to_python_type(json_spec) %}\n {%- set basic_type_map = {\n \"string\": \"str\",\n \"number\": \"float\",\n \"integer\": \"int\",\n \"boolean\": \"bool\"\n} %}\n {%- if basic_type_map[json_spec.type] is defined %}\n {{- basic_type_map[json_spec.type] }}\n {%- elif json_spec.type == \"array\" %}\n {{- \"list[\" + json_to_python_type(json_spec|items) + \"]\" }}\n {%- elif json_spec.type == \"object\" %}\n {%- if json_spec.additionalProperties is defined %}\n {{- \"dict[str, \" + json_to_python_type(json_spec.additionalProperties) + ']' }}\n {%- else %}\n {{- \"dict\" }}\n {%- endif %}\n {%- elif json_spec.type is iterable %}\n {{- \"Union[\" }}\n {%- for t in json_spec.type %}\n {{- json_to_python_type({\"type\": t}) }}\n {%- if not 
loop.last %}\n {{- \",\" }}\n {%- endif %}\n {%- endfor %}\n {{- \"]\" }}\n {%- else %}\n {{- \"Any\" }}\n {%- endif %}\n{%- endmacro %}\n\n{%- if tools %}\n {{- '<|im_start|>system\n' }}\n {%- if messages[0]['role'] == 'system' %}\n {{- messages[0]['content'] + '\n\n' }}\n {%- endif %}\n {{- '# Tools\n\n' }}\n {{- \"You are a function calling AI model. You are provided with function signatures within XML tags. You may call one or more functions to assist with the user query. Don't make assumptions about what values to plug into functions. Here are the available tools: \" }}\n {%- for tool in tools %}\n {%- if tool.function is defined %}\n {%- set tool = tool.function %}\n {%- endif %}\n {{- '{\"type\": \"function\", \"function\": ' }}\n {{- '{\"name\": ' + tool.name + '\", ' }}\n {{- '\"description\": \"' + tool.name + '(' }}\n {%- for param_name, param_fields in tool.parameters.properties|items %}\n {{- param_name + \": \" + json_to_python_type(param_fields) }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- endif %}\n {%- endfor %}\n {{- \")\" }}\n {%- if tool.return is defined %}\n {{- \" -> \" + json_to_python_type(tool.return) }}\n {%- endif %}\n {{- \" - \" + tool.description + \"\n\n\" }}\n {%- for param_name, param_fields in tool.parameters.properties|items %}\n {%- if loop.first %}\n {{- \" Args:\n\" }}\n {%- endif %}\n {{- \" \" + param_name + \"(\" + json_to_python_type(param_fields) + \"): \" + param_fields.description|trim }}\n {%- endfor %}\n {%- if tool.return is defined and tool.return.description is defined %}\n {{- \"\n Returns:\n \" + tool.return.description }}\n {%- endif %}\n {{- '\"' }}\n {{- ', \"parameters\": ' }}\n {%- if tool.parameters.properties | length == 0 %}\n {{- \"{}\" }}\n {%- else %}\n {{- tool.parameters|tojson }}\n {%- endif %}\n {{- \"}\" }}\n {%- if not loop.last %}\n {{- \"\n\" }}\n {%- endif %}\n {%- endfor %}\n {{- \" \" }}\n {{- 'Use the following pydantic model json schema for each tool call you will make: {\"properties\": {\"arguments\": {\"title\": \"Arguments\", \"type\": \"object\"}, \"name\": {\"title\": \"Name\", \"type\": \"string\"}}, \"required\": [\"arguments\", \"name\"], \"title\": \"FunctionCall\", \"type\": \"object\"}\n' }}\n {{- \"For each function call return a json object with function name and arguments within XML tags as follows:\n\" }}\n {{- \"\n\" }}\n {{- '{\"name\": , \"arguments\": }\n' }}\n {{- '<|im_end|>\n' }}\n{%- else %}\n {%- if messages[0]['role'] != 'system' %}\n {{- '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}\n {%- else %}\n {{- '<|im_start|>system\n' + messages[0]['content'] + '<|im_end|>\n' }}\n {%- endif %}\n{%- endif %}\n{%- for message in messages %}\n {%- if message.role == \"user\" or (message.role == \"system\" and not loop.first) or (message.role == \"assistant\" and message.tool_calls is not defined) %}\n {{- '<|im_start|>' + message.role + '\n' + message.content + '<|im_end|>' + '\n' }}\n {%- elif message.role == \"assistant\" %}\n {{- '<|im_start|>' + message.role + '\n\n' }}\n {%- for tool_call in message.tool_calls %}\n {%- if tool_call.function is defined %}\n {%- set tool_call = tool_call.function %}\n {%- endif %}\n {{- '{' }}\n {{- '\"name\": \"' }}\n {{- tool_call.name }}\n {%- if tool_call.arguments is defined %}\n {{- ', ' }}\n {{- '\"arguments\": ' }}\n {{- tool_call.arguments|tojson }}\n {%- endif %}\n {{- '\"}' }}\n {{- '\n' }}\n {%- endfor %}\n {{- '<|im_end|>\n' }}\n {%- elif message.role == \"tool\" %}\n {%- if not message.name is defined %}\n {{- 
raise_exception(\"Tool response dicts require a 'name' key indicating the name of the called function!\") }}\n {%- endif %}\n {{- '<|im_start|>user\n\n' }}\n {{- '{\"name\": \"' }}\n {{- message.name }}\n {{- '\", \"content\": ' }}\n {{- message.content|tojson + '}' }}\n {{- '\n<|im_end|>\n' }}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|im_start|>assistant\n' }}\n{%- endif %}", - "stop_token_ids": [ - 151643, - 151644, - 151645 - ], - "stop": [ - "<|endoftext|>", - "<|im_start|>", - "<|im_end|>" - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "deepseek-vl-chat", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat", - "vision" - ], - "model_description": "DeepSeek-VL possesses general multimodal understanding capabilities, capable of processing logical diagrams, web pages, formula recognition, scientific literature, natural images, and embodied intelligence in complex scenarios.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": "1_3", - "quantizations": [ - "none" - ], - "model_id": "deepseek-ai/deepseek-vl-1.3b-chat", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "none" - ], - "model_id": "deepseek-ai/deepseek-vl-7b-chat", - "model_hub": "modelscope" - } - ], - "chat_template": "", - "stop_token_ids": [ - 100001 - ], - "stop": [ - "<|end▁of▁sentence|>" - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "deepseek", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "generate" - ], - "model_description": "DDeepSeek LLM, trained from scratch on a vast dataset of 2 trillion tokens in both English and Chinese. ", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "deepseek-ai/deepseek-llm-7b-base", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 67, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "deepseek-ai/deepseek-llm-67b-base", - "model_hub": "modelscope" - } - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "deepseek-chat", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "DeepSeek LLM is an advanced language model comprising 67 billion parameters. 
It has been trained from scratch on a vast dataset of 2 trillion tokens in both English and Chinese.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "deepseek-ai/deepseek-llm-7b-chat", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 67, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "deepseek-ai/deepseek-llm-67b-chat", - "model_hub": "modelscope" - } - ], - "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{{ '<|begin▁of▁sentence|>' }}{% for message in messages %}{% if message['role'] == 'user' %}{{ 'User: ' + message['content'] + '\n\n' }}{% elif message['role'] == 'assistant' %}{{ 'Assistant: ' + message['content'] + '<|end▁of▁sentence|>' }}{% elif message['role'] == 'system' %}{{ message['content'] + '\n\n' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ 'Assistant:' }}{% endif %}", - "stop_token_ids": [ - 100001 - ], - "stop": [ - "<|end▁of▁sentence|>" - ] - }, - { - "version": 1, - "context_length": 16384, - "model_name": "deepseek-coder", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "generate" - ], - "model_description": "Deepseek Coder is composed of a series of code language models, each trained from scratch on 2T tokens, with a composition of 87% code and 13% natural language in both English and Chinese.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": "1_3", - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "deepseek-ai/deepseek-coder-1.3b-base", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": "6_7", - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "deepseek-ai/deepseek-coder-6.7b-base", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 33, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "deepseek-ai/deepseek-coder-33b-base", - "model_hub": "modelscope" - } - ] - }, - { - "version": 1, - "context_length": 16384, - "model_name": "deepseek-coder-instruct", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "deepseek-coder-instruct is a model initialized from deepseek-coder-base and fine-tuned on 2B tokens of instruction data.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": "1_3", - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "deepseek-ai/deepseek-coder-1.3b-instruct", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": "6_7", - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "deepseek-ai/deepseek-coder-6.7b-instruct", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 33, - "quantizations": [ - "4-bit", - "8-bit", - "none" - ], - "model_id": "deepseek-ai/deepseek-coder-33b-instruct", - "model_hub": "modelscope" - } - ], - "chat_template": "{% if not add_generation_prompt is defined %}\n{% set add_generation_prompt = false %}\n{% endif %}\n{%- set ns = namespace(found=false) -%}\n{%- for message in messages -%}\n {%- if message['role'] == 'system' -%}\n {%- set ns.found = true -%}\n {%- endif -%}\n{%- endfor -%}\n{{'<|begin▁of▁sentence|>'}}{%- if not ns.found -%}\n{{'You are an AI programming assistant, utilizing the Deepseek 
Coder model, developed by Deepseek Company, and you only answer questions related to computer science. For politically sensitive questions, security and privacy issues, and other non-computer science questions, you will refuse to answer\n'}}\n{%- endif %}\n{%- for message in messages %}\n {%- if message['role'] == 'system' %}\n{{ message['content'] }}\n {%- else %}\n {%- if message['role'] == 'user' %}\n{{'### Instruction:\n' + message['content'] + '\n'}}\n {%- else %}\n{{'### Response:\n' + message['content'] + '\n<|EOT|>\n'}}\n {%- endif %}\n {%- endif %}\n{%- endfor %}\n{% if add_generation_prompt %}\n{{'### Response:'}}\n{% endif %}", - "stop_token_ids": [ - 32021 - ], - "stop": [ - "<|EOT|>" - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "Skywork", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "generate" - ], - "model_description": "Skywork is a series of large models developed by the Kunlun Group · Skywork team.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 13, - "quantizations": [ - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "skywork/Skywork-13B-base", - "model_revision": "master" - } - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "Skywork-Math", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "generate" - ], - "model_description": "Skywork is a series of large models developed by the Kunlun Group · Skywork team.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 13, - "quantizations": [ - "8-bit", - "none" - ], - "model_hub": "modelscope", - "model_id": "skywork/Skywork-13B-Math", - "model_revision": "master" - } - ] - }, - { - "version": 1, - "context_length": 204800, - "model_name": "internlm2-chat", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "The second generation of the InternLM model, InternLM2.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "none" - ], - "model_id": "Shanghai_AI_Laboratory/internlm2-chat-7b", - "model_hub": "modelscope", - "model_revision": "master" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 20, - "quantizations": [ - "none" - ], - "model_id": "Shanghai_AI_Laboratory/internlm2-chat-20b", - "model_hub": "modelscope", - "model_revision": "master" - } - ], - "chat_template": "{{ '' }}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", - "stop_token_ids": [ - 2, - 92542 - ], - "stop": [ - "", - "<|im_end|>" - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "qwen-vl-chat", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat", - "vision" - ], - "model_description": "Qwen-VL-Chat supports more flexible interaction, such as multiple image inputs, multi-round question answering, and creative capabilities.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "none" - ], - "model_hub": "modelscope", - "model_id": "Qwen/Qwen-VL-Chat", - "model_revision": "master" - }, - { - "model_format": "gptq", - "model_size_in_billions": 7, - "quantizations": [ - "Int4" - ], - "model_hub": "modelscope", - "model_id": "Qwen/Qwen-VL-Chat-{quantization}", - "model_revision": "master" - } - ], - "chat_template": "", - "stop_token_ids": [ - 151643, - 
151644, - 151645 - ], - "stop": [ - "<|endoftext|>", - "<|im_start|>", - "<|im_end|>" - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "orion-chat", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "Orion-14B series models are open-source multilingual large language models trained from scratch by OrionStarAI.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 14, - "quantizations": [ - "none", - "4-bit", - "8-bit" - ], - "model_id": "OrionStarAI/Orion-14B-Chat", - "model_hub": "modelscope" - }, - { - "model_format": "awq", - "model_size_in_billions": 14, - "quantizations": [ - "Int4" - ], - "model_hub": "modelscope", - "model_id": "OrionStarAI/Orion-14B-Chat-{quantization}" - } - ], - "chat_template": "{% for message in messages %}{% if loop.first %}{{ '' }}{% endif %}{% if message['role'] == 'user' %}{{ 'Human: ' + message['content'] + '\n\nAssistant: ' + '' }}{% elif message['role'] == 'assistant' %}{{ message['content'] + '' }}{% endif %}{% endfor %}", - "stop_token_ids": [ - 1, - 2, - 0 - ], - "stop": [ - "", - "", - "" - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "orion-chat-rag", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "Orion-14B series models are open-source multilingual large language models trained from scratch by OrionStarAI.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 14, - "quantizations": [ - "none", - "4-bit", - "8-bit" - ], - "model_hub": "modelscope", - "model_id": "OrionStarAI/Orion-14B-Chat-RAG" - } - ], - "chat_template": "{% for message in messages %}{% if loop.first %}{{ '' }}{% endif %}{% if message['role'] == 'user' %}{{ 'Human: ' + message['content'] + '\n\nAssistant: ' + '' }}{% elif message['role'] == 'assistant' %}{{ message['content'] + '' }}{% endif %}{% endfor %}", - "stop_token_ids": [ - 1, - 2, - 0 - ], - "stop": [ - "", - "", - "" - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "yi-vl-chat", - "model_lang": [ - "en", - "zh" - ], - "model_ability": [ - "chat", - "vision" - ], - "model_description": "Yi Vision Language (Yi-VL) model is the open-source, multimodal version of the Yi Large Language Model (LLM) series, enabling content comprehension, recognition, and multi-round conversations about images.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 6, - "quantizations": [ - "none" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-VL-6B" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 34, - "quantizations": [ - "none" - ], - "model_hub": "modelscope", - "model_id": "01ai/Yi-VL-34B" - } - ], - "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", - "stop_token_ids": [ - 2, - 6, - 7, - 8 - ], - "stop": [ - "<|endoftext|>", - "<|im_start|>", - "<|im_end|>", - "<|im_sep|>" - ] - }, - { - "version": 1, - "context_length": 8192, - "model_name": "gemma-it", - "model_lang": [ - "en" - ], - "model_ability": [ - "chat" - ], - "model_description": "Gemma is a family of lightweight, state-of-the-art open models from Google, built from the same research and technology used to create the Gemini models.", - "model_specs": 
[ - { - "model_format": "pytorch", - "model_size_in_billions": 2, - "quantizations": [ - "none", - "4-bit", - "8-bit" - ], - "model_hub": "modelscope", - "model_id": "AI-ModelScope/gemma-2b-it" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 7, - "quantizations": [ - "none", - "4-bit", - "8-bit" - ], - "model_hub": "modelscope", - "model_id": "AI-ModelScope/gemma-7b-it" - } - ], - "chat_template": "{{ '' }}{% if messages[0]['role'] == 'system' %}{{ raise_exception('System role not supported') }}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if (message['role'] == 'assistant') %}{% set role = 'model' %}{% else %}{% set role = message['role'] %}{% endif %}{{ '' + role + '\n' + message['content'] | trim + '\n' }}{% endfor %}{% if add_generation_prompt %}{{'model\n'}}{% endif %}", - "stop_token_ids": [ - 1, - 106, - 107 - ], - "stop": [ - "", - "", - "" - ] - }, - { - "version": 1, - "context_length": 8192, - "model_name": "gemma-2-it", - "model_lang": [ - "en" - ], - "model_ability": [ - "chat" - ], - "model_description": "Gemma is a family of lightweight, state-of-the-art open models from Google, built from the same research and technology used to create the Gemini models.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 2, - "quantizations": [ - "none", - "4-bit", - "8-bit" - ], - "model_id": "LLM-Research/gemma-2-2b-it", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 9, - "quantizations": [ - "none", - "4-bit", - "8-bit" - ], - "model_id": "AI-ModelScope/gemma-2-9b-it", - "model_hub": "modelscope" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 27, - "quantizations": [ - "none", - "4-bit", - "8-bit" - ], - "model_id": "AI-ModelScope/gemma-2-27b-it", - "model_hub": "modelscope" - }, - { - "model_format": "ggufv2", - "model_size_in_billions": 9, - "quantizations": [ - "Q2_K", - "Q3_K_L", - "Q3_K_M", - "Q3_K_S", - "Q4_K_L", - "Q4_K_M", - "Q4_K_S", - "Q5_K_L", - "Q5_K_M", - "Q5_K_S", - "Q6_K", - "Q6_K_L", - "Q8_0", - "f32" - ], - "model_id": "LLM-Research/gemma-2-9b-it-GGUF", - "model_file_name_template": "gemma-2-9b-it-{quantization}.gguf", - "model_hub": "modelscope" - } - ], - "chat_template": "{{ '' }}{% if messages[0]['role'] == 'system' %}{{ raise_exception('System role not supported') }}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if (message['role'] == 'assistant') %}{% set role = 'model' %}{% else %}{% set role = message['role'] %}{% endif %}{{ '' + role + '\n' + message['content'] | trim + '\n' }}{% endfor %}{% if add_generation_prompt %}{{'model\n'}}{% endif %}", - "stop_token_ids": [ - 1, - 106, - 107 - ], - "stop": [ - "", - "", - "" - ] - }, - { - "version":1, - "context_length":2048, - "model_name":"OmniLMM", - "model_lang":[ - "en", - "zh" - ], - "model_ability":[ - "chat", - "vision" - ], - "model_description":"OmniLMM is a family of open-source large multimodal models (LMMs) adept at vision & language modeling.", - "model_specs":[ - { - "model_format":"pytorch", - "model_size_in_billions":3, - "quantizations":[ - "none" - ], - "model_id":"OpenBMB/MiniCPM-V", - "model_hub":"modelscope", - "model_revision":"master" - }, - { - 
"model_format":"pytorch", - "model_size_in_billions":12, - "quantizations":[ - "none" - ], - "model_id":"OpenBMB/OmniLMM-12B", - "model_hub":"modelscope", - "model_revision":"master" - } - ], - "chat_template": "", - "stop_token_ids": [ - 2 - ], - "stop": [ - "" - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "minicpm-2b-sft-bf16", - "model_lang": [ - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "MiniCPM is an End-Size LLM developed by ModelBest Inc. and TsinghuaNLP, with only 2.4B parameters excluding embeddings.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 2, - "quantizations": [ - "none" - ], - "model_hub": "modelscope", - "model_id": "OpenBMB/miniCPM-bf16", - "model_revision": "master" - } - ], - "chat_template": "{% for message in messages %}{% if message['role'] == 'user' %}{{'<用户>' + message['content'].strip() + ''}}{% else %}{{message['content'].strip()}}{% endif %}{% endfor %}", - "stop_token_ids": [ - 1, - 2 - ], - "stop": [ - "", - "" - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "minicpm-2b-sft-fp32", - "model_lang": [ - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "MiniCPM is an End-Size LLM developed by ModelBest Inc. and TsinghuaNLP, with only 2.4B parameters excluding embeddings.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 2, - "quantizations": [ - "none" - ], - "model_hub": "modelscope", - "model_id": "OpenBMB/MiniCPM-2B-sft-fp32", - "model_revision": "master" - } - ], - "chat_template": "{% for message in messages %}{% if message['role'] == 'user' %}{{'<用户>' + message['content'].strip() + ''}}{% else %}{{message['content'].strip()}}{% endif %}{% endfor %}", - "stop_token_ids": [ - 1, - 2 - ], - "stop": [ - "", - "" - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "minicpm-2b-dpo-bf16", - "model_lang": [ - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "MiniCPM is an End-Size LLM developed by ModelBest Inc. and TsinghuaNLP, with only 2.4B parameters excluding embeddings.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 2, - "quantizations": [ - "none" - ], - "model_hub": "modelscope", - "model_id": "OpenBMB/MiniCPM-2B-dpo-bf16", - "model_revision": "master" - } - ], - "chat_template": "{% for message in messages %}{% if message['role'] == 'user' %}{{'<用户>' + message['content'].strip() + ''}}{% else %}{{message['content'].strip()}}{% endif %}{% endfor %}", - "stop_token_ids": [ - 1, - 2 - ], - "stop": [ - "", - "" - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "minicpm-2b-dpo-fp16", - "model_lang": [ - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "MiniCPM is an End-Size LLM developed by ModelBest Inc. 
and TsinghuaNLP, with only 2.4B parameters excluding embeddings.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 2, - "quantizations": [ - "none" - ], - "model_hub": "modelscope", - "model_id": "OpenBMB/MiniCPM-2B-dpo-fp16", - "model_revision": "master" - } - ], - "chat_template": "{% for message in messages %}{% if message['role'] == 'user' %}{{'<用户>' + message['content'].strip() + ''}}{% else %}{{message['content'].strip()}}{% endif %}{% endfor %}", - "stop_token_ids": [ - 1, - 2 - ], - "stop": [ - "", - "" - ] - }, - { - "version": 1, - "context_length": 4096, - "model_name": "minicpm-2b-dpo-fp32", - "model_lang": [ - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "MiniCPM is an End-Size LLM developed by ModelBest Inc. and TsinghuaNLP, with only 2.4B parameters excluding embeddings.", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 2, - "quantizations": [ - "none" - ], - "model_hub": "modelscope", - "model_id": "OpenBMB/MiniCPM-2B-dpo-fp32", - "model_revision": "master" - } - ], - "chat_template": "{% for message in messages %}{% if message['role'] == 'user' %}{{'<用户>' + message['content'].strip() + ''}}{% else %}{{message['content'].strip()}}{% endif %}{% endfor %}", - "stop_token_ids": [ - 1, - 2 - ], - "stop": [ - "", - "" - ] - }, - { - "version":1, - "context_length":8192, - "model_name":"MiniCPM-Llama3-V-2_5", - "model_lang":[ - "en", - "zh" - ], - "model_ability":[ - "chat", - "vision" - ], - "model_description":"MiniCPM-Llama3-V 2.5 is the latest model in the MiniCPM-V series. The model is built on SigLip-400M and Llama3-8B-Instruct with a total of 8B parameters.", - "model_specs":[ - { - "model_format":"pytorch", - "model_size_in_billions":8, - "quantizations":[ - "none" - ], - "model_hub": "modelscope", - "model_id":"OpenBMB/MiniCPM-Llama3-V-2_5", - "model_revision":"master" - }, - { - "model_format":"pytorch", - "model_size_in_billions":8, - "quantizations":[ - "int4" - ], - "model_hub": "modelscope", - "model_id":"OpenBMB/MiniCPM-Llama3-V-2_5-{quantization}", - "model_revision":"master" - } - ], - "chat_template": "{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = '<|begin_of_text|>' + content %}{% endif %}{{ content }}{% endfor %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}", - "stop_token_ids": [ - 128001 - ], - "stop": [ - "<|end_of_text|>" - ] - }, - { - "version":1, - "context_length":32768, - "model_name":"MiniCPM-V-2.6", - "model_lang":[ - "en", - "zh" - ], - "model_ability":[ - "chat", - "vision" - ], - "model_description":"MiniCPM-V 2.6 is the latest model in the MiniCPM-V series. 
The model is built on SigLip-400M and Qwen2-7B with a total of 8B parameters.", - "model_specs":[ - { - "model_format":"pytorch", - "model_size_in_billions":8, - "quantizations":[ - "none" - ], - "model_hub": "modelscope", - "model_id":"OpenBMB/MiniCPM-V-2_6", - "model_revision":"master" - }, - { - "model_format":"pytorch", - "model_size_in_billions":8, - "quantizations":[ - "4-bit" - ], - "model_hub": "modelscope", - "model_id":"OpenBMB/MiniCPM-V-2_6-int4", - "model_revision":"master" - } - ], - "chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}", - "stop_token_ids": [ - 151645, - 151643 - ], - "stop": [ - "<|im_end|>", - "<|endoftext|>" - ] - }, - { - "version": 1, - "context_length": 2048, - "model_name": "aquila2", - "model_lang": [ - "zh" - ], - "model_ability": [ - "generate" - ], - "model_description": "Aquila2 series models are the base language models", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 34, - "quantizations": [ - "none" - ], - "model_hub": "modelscope", - "model_id": "BAAI/Aquila2-34B", - "model_revision": "master" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 70, - "quantizations": [ - "none" - ], - "model_hub": "modelscope", - "model_id": "BAAI/Aquila2-70B-Expr", - "model_revision": "master" - } - ] - }, - { - "version": 1, - "context_length": 2048, - "model_name": "aquila2-chat", - "model_lang": [ - "zh" - ], - "model_ability": [ - "chat" - ], - "model_description": "Aquila2-chat series models are the chat models", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 34, - "quantizations": [ - "none" - ], - "model_hub": "modelscope", - "model_id": "BAAI/AquilaChat2-34B", - "model_revision": "master" - }, - { - "model_format": "gptq", - "model_size_in_billions": 34, - "quantizations": [ - "Int4" - ], - "model_hub": "modelscope", - "model_id": "BAAI/AquilaChat2-34B-Int4-GPTQ", - "model_revision": "master" - }, - { - "model_format": "pytorch", - "model_size_in_billions": 70, - "quantizations": [ - "none" - ], - "model_hub": "modelscope", - "model_id": "BAAI/AquilaChat2-70B-Expr", - "model_revision": "master" - } - ], - "chat_template": "{% for item in messages %}{% if loop.first and item['role'] == 'system' %}{{ item['content'] + '\n' }}{% endif %}{% if item['role'] == 'user' %}{{ 'USER: ' + item['content'] + '\n' }}{% elif item['role'] == 'assistant' %}{{ 'ASSISTANT: ' + item['content'] + '\n' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ 'ASSISTANT: ' }}{% endif %}", - "stop_token_ids": [ - 100006, - 100007 - ], - "stop": [ - "[CLS]", - "" - ] - }, - { - "version": 1, - "context_length": 16384, - "model_name": "aquila2-chat-16k", - "model_lang": [ - "zh" - ], - "model_ability": [ - "generate" - ], - "model_description": "AquilaChat2-16k series models are the long-text chat models", - "model_specs": [ - { - "model_format": "pytorch", - "model_size_in_billions": 34, - "quantizations": [ - "none" - ], - "model_hub": "modelscope", - "model_id": "BAAI/AquilaChat2-34B-16K", - "model_revision": "master" - } - ], - "chat_template": "{% for item in messages %}{% if loop.first and item['role'] == 'system' %}{{ item['content'] + '\n' }}{% endif %}{% if item['role'] == 'user' %}{{ 'USER: ' + 
item['content'] + '\n' }}{% elif item['role'] == 'assistant' %}{{ 'ASSISTANT: ' + item['content'] + '\n' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ 'ASSISTANT: ' }}{% endif %}",
-        "stop_token_ids": [
-            100006,
-            100007
-        ],
-        "stop": [
-            "[CLS]",
-            "</s>"
-        ]
-    },
-    {
-        "version": 1,
-        "context_length": 131072,
-        "model_name": "c4ai-command-r-v01",
-        "model_lang": [
-            "en",
-            "fr",
-            "de",
-            "es",
-            "it",
-            "pt",
-            "ja",
-            "ko",
-            "zh",
-            "ar"
-        ],
-        "model_ability": [
-            "chat"
-        ],
-        "model_description": "C4AI Command-R is a research release of a 35 billion parameter highly performant generative model.",
-        "model_specs": [
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 35,
-                "quantizations": [
-                    "none"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "AI-ModelScope/c4ai-command-r-v01",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 35,
-                "quantizations": [
-                    "4-bit"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "mirror013/c4ai-command-r-v01-4bit",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "ggufv2",
-                "model_size_in_billions": 35,
-                "quantizations": [
-                    "Q2_K",
-                    "Q3_K_M",
-                    "Q4_K_M",
-                    "Q5_K_M"
-                ],
-                "model_id": "mirror013/C4AI-Command-R-v01-GGUF",
-                "model_file_name_template": "c4ai-command-r-v01-{quantization}.gguf",
-                "model_hub": "modelscope",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 104,
-                "quantizations": [
-                    "none"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "AI-ModelScope/c4ai-command-r-plus",
-                "model_revision": "master"
-            }
-        ],
-        "chat_template": "{{ '' }}{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% elif false == true %}{% set loop_messages = messages %}{% set system_message = 'You are Command-R, a brilliant, sophisticated, AI-assistant trained to assist human users by providing thorough responses. You are trained by Cohere.' %}{% else %}{% set loop_messages = messages %}{% set system_message = false %}{% endif %}{% if system_message != false %}{{ '<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|>' + system_message + '<|END_OF_TURN_TOKEN|>' }}{% endif %}{% for message in loop_messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% set content = message['content'] %}{% if message['role'] == 'user' %}{{ '<|START_OF_TURN_TOKEN|><|USER_TOKEN|>' + content.strip() + '<|END_OF_TURN_TOKEN|>' }}{% elif message['role'] == 'assistant' %}{{ '<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|>' + content.strip() + '<|END_OF_TURN_TOKEN|>' }}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|>' }}{% endif %}",
-        "stop_token_ids": [
-            6,
-            255001
-        ],
-        "stop": [
-            "<EOS_TOKEN>",
-            "<|END_OF_TURN_TOKEN|>"
-        ]
-    },
-    {
-        "version": 1,
-        "context_length": 128000,
-        "model_name": "phi-3-mini-128k-instruct",
-        "model_lang": [
-            "en"
-        ],
-        "model_ability": [
-            "chat"
-        ],
-        "model_description": "The Phi-3-Mini-128K-Instruct is a 3.8 billion-parameter, lightweight, state-of-the-art open model trained using the Phi-3 datasets.",
-        "model_specs": [
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 4,
-                "quantizations": [
-                    "4-bit",
-                    "8-bit",
-                    "none"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "LLM-Research/Phi-3-mini-128k-instruct",
-                "model_revision": "master"
-            }
-        ],
-        "chat_template": "{% for message in messages %}{% if message['role'] == 'system' %}{{'<|system|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'user' %}{{'<|user|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'assistant' %}{{'<|assistant|>\n' + message['content'] + '<|end|>\n'}}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% else %}{{ '<|endoftext|>' }}{% endif %}",
-        "stop_token_ids": [
-            32000,
-            32001,
-            32007
-        ],
-        "stop": [
-            "<|endoftext|>",
-            "<|assistant|>",
-            "<|end|>"
-        ]
-    },
-    {
-        "version": 1,
-        "context_length": 4096,
-        "model_name": "phi-3-mini-4k-instruct",
-        "model_lang": [
-            "en"
-        ],
-        "model_ability": [
-            "chat"
-        ],
-        "model_description": "The Phi-3-Mini-4k-Instruct is a 3.8 billion-parameter, lightweight, state-of-the-art open model trained using the Phi-3 datasets.",
-        "model_specs": [
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 4,
-                "quantizations": [
-                    "4-bit",
-                    "8-bit",
-                    "none"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "LLM-Research/Phi-3-mini-4k-instruct",
-                "model_revision": "master"
-            }
-        ],
-        "chat_template": "{% for message in messages %}{% if message['role'] == 'system' %}{{'<|system|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'user' %}{{'<|user|>\n' + message['content'] + '<|end|>\n'}}{% elif message['role'] == 'assistant' %}{{'<|assistant|>\n' + message['content'] + '<|end|>\n'}}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% else %}{{ '<|endoftext|>' }}{% endif %}",
-        "stop_token_ids": [
-            32000,
-            32001,
-            32007
-        ],
-        "stop": [
-            "<|endoftext|>",
-            "<|assistant|>",
-            "<|end|>"
-        ]
-    },
-    {
-        "version": 1,
-        "context_length": 32768,
-        "model_name": "internvl-chat",
-        "model_lang": [
-            "en",
-            "zh"
-        ],
-        "model_ability": [
-            "chat",
-            "vision"
-        ],
-        "model_description": "InternVL 1.5 is an open-source multimodal large language model (MLLM) that aims to bridge the capability gap between open-source and proprietary commercial models in multimodal understanding.",
-        "model_specs": [
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 26,
-                "quantizations": [
-                    "4-bit",
-                    "8-bit",
-                    "none"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "OpenGVLab/InternVL-Chat-V1-5",
-                "model_revision": "master"
-            }
-        ],
-        "chat_template": "{{ '' }}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
-        "stop_token_ids": [
-            2,
-            92542,
-            92543
-        ],
-        "stop": [
-            "</s>",
-            "<|im_end|>",
-            "<|im_start|>"
-        ]
-    },
-    {
-        "version": 1,
-        "context_length": 32768,
-        "model_name": "internvl2",
-        "model_lang": [
-            "en",
-            "zh"
-        ],
-        "model_ability": [
-            "chat",
-            "vision"
-        ],
-        "model_description": "InternVL 2 is an open-source multimodal large language model (MLLM) that aims to bridge the capability gap between open-source and proprietary commercial models in multimodal understanding.",
-        "model_specs": [
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 1,
-                "quantizations": [
-                    "4-bit",
-                    "8-bit",
-                    "none"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "OpenGVLab/InternVL2-1B",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 2,
-                "quantizations": [
-                    "4-bit",
-                    "8-bit",
-                    "none"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "OpenGVLab/InternVL2-2B",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "awq",
-                "model_size_in_billions": 2,
-                "quantizations": [
-                    "Int4"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "OpenGVLab/InternVL2-2B-AWQ",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 4,
-                "quantizations": [
-                    "4-bit",
-                    "8-bit",
-                    "none"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "OpenGVLab/InternVL2-4B",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 8,
-                "quantizations": [
-                    "4-bit",
-                    "8-bit",
-                    "none"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "OpenGVLab/InternVL2-8B",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "awq",
-                "model_size_in_billions": 8,
-                "quantizations": [
-                    "Int4"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "OpenGVLab/InternVL2-8B-AWQ",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 26,
-                "quantizations": [
-                    "4-bit",
-                    "8-bit",
-                    "none"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "OpenGVLab/InternVL2-26B",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "awq",
-                "model_size_in_billions": 26,
-                "quantizations": [
-                    "Int4"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "OpenGVLab/InternVL2-26B-AWQ",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 40,
-                "quantizations": [
-                    "4-bit",
-                    "8-bit",
-                    "none"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "OpenGVLab/InternVL2-40B",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "awq",
-                "model_size_in_billions": 40,
-                "quantizations": [
-                    "Int4"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "OpenGVLab/InternVL2-40B-AWQ",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 76,
-                "quantizations": [
-                    "4-bit",
-                    "8-bit",
-                    "none"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "OpenGVLab/InternVL2-Llama3-76B",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "awq",
-                "model_size_in_billions": 76,
-                "quantizations": [
-                    "Int4"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "OpenGVLab/InternVL2-Llama3-76B-AWQ",
-                "model_revision": "master"
-            }
-        ],
-        "chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
-        "stop_token_ids": [
-            151643,
-            151644,
-            151645
-        ],
-        "stop": [
-            "<|endoftext|>",
-            "<|im_start|>",
-            "<|im_end|>"
-        ]
-    },
-    {
-        "version": 1,
-        "context_length": 8192,
-        "model_name": "cogvlm2",
-        "model_lang": [
-            "en",
-            "zh"
-        ],
-        "model_ability": [
-            "chat",
-            "vision"
-        ],
-        "model_description": "Compared with the previous generation of open-source CogVLM models, CogVLM2 achieves good results on many benchmarks, and its performance is competitive with some closed-source models.",
-        "model_specs": [
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 20,
-                "quantizations": [
-                    "none"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "ZhipuAI/cogvlm2-llama3-chinese-chat-19B",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 20,
-                "quantizations": [
-                    "int4"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "ZhipuAI/cogvlm2-llama3-chinese-chat-19B-{quantization}",
-                "model_revision": "master"
-            }
-        ],
-        "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = '<|begin_of_text|>' + content %}{% endif %}{{ content }}{% endfor %}{% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}{% else %}{{ '<|end_of_text|>' }}{% endif %}",
-        "stop_token_ids": [
-            128001,
-            128009
-        ],
-        "stop": [
-            "<|end_of_text|>",
-            "<|eot_id|>"
-        ]
-    },
-    {
-        "version": 1,
-        "context_length": 8192,
-        "model_name": "cogvlm2-video-llama3-chat",
-        "model_lang": [
-            "en",
-            "zh"
-        ],
-        "model_ability": [
-            "chat",
-            "vision"
-        ],
-        "model_description": "CogVLM2-Video achieves state-of-the-art performance on multiple video question answering tasks.",
-        "model_specs": [
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 12,
-                "quantizations": [
-                    "4-bit",
-                    "8-bit",
-                    "none"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "ZhipuAI/cogvlm2-video-llama3-chat",
-                "model_revision": "master"
-            }
-        ],
-        "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = '<|begin_of_text|>' + content %}{% endif %}{{ content }}{% endfor %}{% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}{% else %}{{ '<|end_of_text|>' }}{% endif %}",
-        "stop_token_ids": [
-            128001,
-            128009
-        ],
-        "stop": [
-            "<|end_of_text|>",
-            "<|eot_id|>"
-        ]
-    },
-    {
-        "version": 1,
-        "context_length": 8192,
-        "model_name": "telechat",
-        "model_lang": [
-            "en",
-            "zh"
-        ],
-        "model_ability": [
-            "chat"
-        ],
-        "model_description": "TeleChat is a large language model developed and trained by China Telecom Artificial Intelligence Technology Co., LTD. The 7B and 12B model bases are trained on 1.5 trillion and 3 trillion tokens of high-quality Chinese corpus, respectively.",
-        "model_specs": [
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 7,
-                "quantizations": [
-                    "4-bit",
-                    "8-bit",
-                    "none"
-                ],
-                "model_id": "TeleAI/telechat-7B",
-                "model_hub": "modelscope",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "gptq",
-                "model_size_in_billions": 7,
-                "quantizations": [
-                    "int4",
-                    "int8"
-                ],
-                "model_id": "TeleAI/telechat-7B-{quantization}",
-                "model_hub": "modelscope",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 12,
-                "quantizations": [
-                    "4-bit",
-                    "8-bit",
-                    "none"
-                ],
-                "model_id": "TeleAI/TeleChat-12B",
-                "model_hub": "modelscope",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "gptq",
-                "model_size_in_billions": 12,
-                "quantizations": [
-                    "int4",
-                    "int8"
-                ],
-                "model_id": "TeleAI/TeleChat-12B-{quantization}",
-                "model_hub": "modelscope",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 52,
-                "quantizations": [
-                    "4-bit",
-                    "8-bit",
-                    "none"
-                ],
-                "model_id": "TeleAI/TeleChat-52B",
-                "model_hub": "modelscope",
-                "model_revision": "master"
-            }
-        ],
-        "chat_template": "{{ (messages|selectattr('role', 'equalto', 'system')|list|last).content|trim if (messages|selectattr('role', 'equalto', 'system')|list) else '' }}{%- for message in messages -%}{%- if message['role'] == 'user' -%}{{- '<_user>' + message['content'] +'<_bot>' -}}{%- elif message['role'] == 'assistant' -%}{{- message['content'] + '<_end>' -}}{%- endif -%}{%- endfor -%}",
-        "stop": [
-            "<_end>",
-            "<_start>"
-        ],
-        "stop_token_ids": [
-            160133,
-            160132
-        ]
-    },
-    {
-        "version": 1,
-        "context_length": 32768,
-        "model_name": "qwen2-vl-instruct",
-        "model_lang": [
-            "en",
-            "zh"
-        ],
-        "model_ability": [
-            "chat",
-            "vision"
-        ],
-        "model_description": "Qwen2-VL: To See the World More Clearly. Qwen2-VL is the latest version of the vision-language models in the Qwen model family.",
-        "model_specs": [
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 2,
-                "quantizations": [
-                    "none"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "qwen/Qwen2-VL-2B-Instruct",
-                "model_revision": "master"
-            },
-            {
-                "model_format": "pytorch",
-                "model_size_in_billions": 7,
-                "quantizations": [
-                    "none"
-                ],
-                "model_hub": "modelscope",
-                "model_id": "qwen/Qwen2-VL-7B-Instruct",
-                "model_revision": "master"
-            }
-        ],
-        "prompt_style": {
-            "style_name": "QWEN",
-            "system_prompt": "You are a helpful assistant",
-            "roles": [
-                "user",
-                "assistant"
-            ]
-        }
-    }
-]
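
Note on the deleted "chat_template" fields: each one is an ordinary Jinja2 template rendered against a "messages" list plus an "add_generation_prompt" flag. A minimal sketch of how one of them expands, using plain jinja2 (not part of this diff; the sample messages are invented for illustration, and Xinference's actual renderer adds extras such as a raise_exception helper):

# Render the Phi-3 chat template deleted above. The template string is copied
# verbatim from the removed JSON; the messages below are purely illustrative.
from jinja2 import Template

CHAT_TEMPLATE = (
    "{% for message in messages %}"
    "{% if message['role'] == 'system' %}{{'<|system|>\n' + message['content'] + '<|end|>\n'}}"
    "{% elif message['role'] == 'user' %}{{'<|user|>\n' + message['content'] + '<|end|>\n'}}"
    "{% elif message['role'] == 'assistant' %}{{'<|assistant|>\n' + message['content'] + '<|end|>\n'}}"
    "{% endif %}{% endfor %}"
    "{% if add_generation_prompt %}{{ '<|assistant|>\n' }}{% else %}{{ '<|endoftext|>' }}{% endif %}"
)

messages = [
    {"role": "system", "content": "You are a helpful assistant."},
    {"role": "user", "content": "What is the capital of France?"},
]

# add_generation_prompt=True appends the '<|assistant|>' header so the model
# continues from there; generation is then cut at any of the spec's "stop"
# strings ("<|endoftext|>", "<|assistant|>", "<|end|>").
prompt = Template(CHAT_TEMPLATE).render(messages=messages, add_generation_prompt=True)
print(prompt)
# <|system|>
# You are a helpful assistant.<|end|>
# <|user|>
# What is the capital of France?<|end|>
# <|assistant|>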