AutoGuess tests (#1650)

* whitespace * AutoGuess remove dot suffix in names * .gitignore update * test: added autoguess test suite * github workflow to run autoguess test when appropriate * git clone unavailable tokenizer configs rather than committing to repo * fix link to included tokenizer configs * skip storing downloaded tokenizer configs * typo * minor fixes * clean-up * limit workflow to trigger from experimental branch --------- Co-authored-by: Concedo <39025047+LostRuins@users.noreply.github.com>
2025-09-07 07:39:13 +00:00 · 2025-07-25 20:21:00 +09:00 · 2025-07-25 20:21:00 +09:00 · ff8f156fa0
commit ff8f156fa0
parent b87864144b
4 changed files with 144 additions and 7 deletions
--- a/.github/workflows/test-autoguess.yaml
+++ b/.github/workflows/test-autoguess.yaml
@ -0,0 +1,30 @@
+name: AutoGuess Tests
+
+# Runs the AutoGuess regression test on pull requests that target the
+# experimental branch, but only when a file that can change its outcome is
+# touched: the adapter list, the test script, or this workflow itself.
+on:
+  pull_request:
+    branches:
+      - concedo_experimental
+    paths:
+      - 'kcpp_adapters/AutoGuess.json'
+      - 'tests/test_autoguess.py'
+      - '.github/workflows/test-autoguess.yaml'
+
+jobs:
+  test-autoguess:
+    runs-on: ubuntu-latest
+
+    steps:
+    - name: Checkout code
+      uses: actions/checkout@v4
+
+    - name: Set up Python
+      uses: actions/setup-python@v4
+      with:
+        # tests/test_autoguess.py uses `X | Y` annotations that are evaluated
+        # at runtime, so it needs Python 3.10 or newer.
+        python-version: '3.x'
+
+    - name: Install dependencies
+      run: |
+        python -m pip install --upgrade pip
+        pip install requests
+        # Tokenizer configs the test reads from disk instead of downloading
+        git clone https://github.com/kallewoof/gated-tokenizers.git tests/gated-tokenizers
+
+    - name: Run AutoGuess tests
+      run: python tests/test_autoguess.py
--- a/.gitignore
+++ b/.gitignore
@ -142,6 +142,7 @@ rocblas.dll
 hipblas.dll
 koboldcpp_hipblas.so
 koboldcpp_hipblas.dll
+.tokenizer_configs

 bin/
 conda/
--- a/kcpp_adapters/AutoGuess.json
+++ b/kcpp_adapters/AutoGuess.json
@ -12,7 +12,7 @@
    }
 }, {
    "search": ["<|im_start|>assistant", "<|im_end|>", "You are provided with function signatures within <tools>"],
-    "name": "ChatML (Qwen 2.5 based).",
+    "name": "ChatML (Qwen 2.5 based)",
    "adapter": {
        "system_start": "<|im_start|>system\n",
        "system_end": "<|im_end|>\n",
@ -25,7 +25,7 @@
    }
 }, {
    "search": ["<|im_user|>user<|im_middle|>", "<|im_assistant|>assistant<|im_middle|>", "<|im_end|>"],
-    "name": "ChatML (Kimi).",
+    "name": "ChatML (Kimi)",
    "adapter": {
        "system_start": "<|im_system|>system<|im_middle|>",
        "system_end": "<|im_end|>",
@ -36,7 +36,7 @@
    }
 }, {
    "search": ["System role not supported", "<start_of_turn>"],
-    "name": "Google Gemma 2.",
+    "name": "Google Gemma 2",
    "adapter": {
        "system_start": "<start_of_turn>user\n",
        "system_end": "<end_of_turn>\n",
@ -47,7 +47,7 @@
    }
 }, {
    "search": ["<start_of_image>", "<start_of_turn>", "<end_of_turn>"],
-    "name": "Google Gemma 3.",
+    "name": "Google Gemma 3",
    "adapter": {
        "system_start": "<start_of_turn>user\n",
        "system_end": "<end_of_turn>\n",
@ -58,7 +58,7 @@
    }
 }, {
    "search": ["<image_soft_token>", "<start_of_turn>model", "<end_of_turn>"],
-    "name": "Google Gemma 3n.",
+    "name": "Google Gemma 3n",
    "adapter": {
        "system_start": "<start_of_turn>user\n",
        "system_end": "<end_of_turn>\n",
@ -69,7 +69,7 @@
    }
 },{
    "search": ["<|start_header_id|>assistant<|end_header_id|>"],
-    "name": "Llama 3.x.",
+    "name": "Llama 3.x",
    "adapter": {
        "system_start": "<|start_header_id|>system<|end_header_id|>\n\n",
        "system_end": "<|eot_id|>",
@ -212,7 +212,7 @@
    }
 }, {
    "search": ["<|im_start|>assistant", "<|im_end|>"],
-    "name": "ChatML (Generic).",
+    "name": "ChatML (Generic)",
    "adapter": {
        "system_start": "<|im_start|>system\n",
        "system_end": "<|im_end|>\n",
--- a/tests/test_autoguess.py
+++ b/tests/test_autoguess.py
@ -0,0 +1,106 @@
+"""
+Test that the AutoGuess feature picks the correct model for every template.
+Also checks that every template is being tested so that when new AutoGuess additions are made, this test fails unless an accompanying test is included.
+"""
+import os
+import sys
+import requests
+import json
+
+
+# Map an AutoGuess name to a HuggingFace model ID
+# THIS LIST MUST BE UPDATED WHEN A NEW MODEL IS ADDED
+AUTOGUESS_MAPPING = {
+    "ChatML (Phi 4)": "microsoft/phi-4",
+    "ChatML (Qwen 2.5 based)": "Qwen/Qwen2.5-0.5B-Instruct",
+    "ChatML (Kimi)": "moonshotai/Kimi-K2-Instruct",
+    "Google Gemma 2": "Efficient-Large-Model/gemma-2-2b-it",
+    "Google Gemma 3": "scb10x/typhoon2.1-gemma3-12b",
+    "Google Gemma 3n": "lmstudio-community/gemma-3n-E4B-it-MLX-bf16",
+    "Llama 3.x": "Steelskull/L3.3-Shakudo-70b",
+    "Llama 4": "meta-llama/Llama-4-Scout-17B-16E-Instruct",
+    "Mistral V7 (with system prompt)": "Doctor-Shotgun/MS3.2-24B-Magnum-Diamond",
+    "Mistral V3": "mistralai/Mistral-7B-Instruct-v0.3",
+    "GLM-4": "THUDM/glm-4-9b-chat-hf",
+    "Phi 3.5": "microsoft/Phi-3.5-mini-instruct",
+    "Phi 4 (mini)": "microsoft/Phi-4-mini-instruct",
+    "Cohere (Aya Expanse 32B based)": "CohereLabs/aya-expanse-32b",
+    "DeepSeek V2.5": "deepseek-ai/DeepSeek-V2.5",
+    "Jamba": "ai21labs/Jamba-tiny-dev",
+    "Dots": "rednote-hilab/dots.llm1.inst",
+    "RWKV World": "fla-hub/rwkv7-1.5B-world",
+    "Mistral (Generic)": "mistralai/Mistral-Nemo-Instruct-2407",
+    "ChatML (Generic)": "NewEden/Gemma-27B-chatml",
+}
+
+# User may be running this test from ./ or from ../ -- we want to be in ./ (i.e. tests)
+if os.path.exists("tests"):
+    os.chdir("tests")
+
+# Load the adapter list under test. JSON text is UTF-8 by specification, so the
+# encoding is given explicitly instead of relying on the platform's locale default.
+with open("../kcpp_adapters/AutoGuess.json", encoding="utf-8") as f:
+    autoguess = json.load(f)
+
+def get_tokenizer_config_for_huggingface_model_id(huggingface_model_id: str):
+    """Return the parsed tokenizer config for a HuggingFace model ID.
+
+    A local copy at ``gated-tokenizers/tokenizer_configs/<id with '/' -> '_'>.json``
+    (relative to the current working directory) is returned as-is when it
+    exists. Otherwise ``tokenizer_config.json`` and then ``chat_template.json``
+    are requested from huggingface.co, and the first successfully fetched
+    document that contains a ``chat_template`` key is returned.
+
+    Raises:
+        ValueError: no local copy exists and neither remote file produced a
+            document containing ``chat_template``.
+    """
+    fname = f"gated-tokenizers/tokenizer_configs/{huggingface_model_id.replace('/','_')}.json"
+    if os.path.exists(fname):
+        # JSON is UTF-8 by specification; do not depend on the locale default.
+        with open(fname, encoding="utf-8") as f:
+            return json.load(f)
+
+    for filename in ["tokenizer_config.json", "chat_template.json"]:
+        url = f"https://huggingface.co/{huggingface_model_id}/resolve/main/{filename}"
+        # requests applies no timeout by default; without one a stalled
+        # connection would block the whole test run indefinitely.
+        response = requests.get(url, timeout=30)
+        if response.status_code == 200:
+            v = json.loads(response.text)
+            if 'chat_template' in v:
+                return v
+    raise ValueError(f"Failed to fetch tokenizer config for {huggingface_model_id}.")
+
+def match_chat_template_to_adapter(chat_template: str|list) -> tuple[str, str|None]|None:
+    """Find the first AutoGuess entry whose search strings all occur in a chat template.
+
+    Args:
+        chat_template: either the template text itself, or a list of
+            ``{"name": ..., "template": ...}`` dicts. For a list, the entry
+            named ``"default"`` is used if present, otherwise the first entry.
+
+    Returns:
+        ``(adapter_name, sub_template_name)`` for the first matching entry of
+        the module-level ``autoguess`` list, where ``sub_template_name`` is the
+        name of the list entry that was used (``None`` for a plain string
+        template). ``None`` when the template is empty, the list is empty, or
+        no entry matches.
+    """
+    # Additional code in tester not present in application: support for multiple chat templates, and use default if present
+    sub_template: str|None = None
+    if isinstance(chat_template, list):
+        if not chat_template:
+            # Nothing to match against; avoids an IndexError on chat_template[0]
+            return None
+        # Each item is {"name": .., "template": ...}; prefer "default",
+        # otherwise fall back to the first template in the list.
+        chosen = next((t for t in chat_template if t['name'] == "default"), chat_template[0])
+        sub_template = chosen['name']
+        chat_template = chosen['template']
+    if chat_template != "":
+        for entry in autoguess:
+            if all(s in chat_template for s in entry['search']):
+                return entry['name'], sub_template
+    return None
+
+# Number of mismatched or untested adapters; any non-zero total fails the run.
+failures = 0
+# AutoGuess names that have a mapping, used below to detect untested adapters.
+seen = set()
+# Left-justifying format templates sized to the widest name / model ID so the
+# report lines up in columns.
+namefmt = "{name:<%d}" % max(map(len, AUTOGUESS_MAPPING))
+hmifmt = "{huggingface_model_id:<%d}" % max(map(len, AUTOGUESS_MAPPING.values()))
+
+# Pass 1: every mapped model's chat template must resolve to its own adapter name.
+for name, huggingface_model_id in AUTOGUESS_MAPPING.items():
+    seen.add(name)
+    name_col = namefmt.format(name=name)
+    if huggingface_model_id == "***UNKNOWN***":
+        # Placeholder mapping: reported, but neither fetched nor counted as a failure.
+        print(f"{name_col} = {namefmt.format(name='***UNKNOWN***')} : PENDING")
+        continue
+    tokenizer_config = get_tokenizer_config_for_huggingface_model_id(huggingface_model_id)
+    assert 'chat_template' in tokenizer_config
+    # A successful match is a non-empty tuple (always truthy), so `or` only
+    # substitutes the placeholder when the matcher returned None.
+    matched, sub_template = match_chat_template_to_adapter(tokenizer_config['chat_template']) or ("MISSING MAPPING", None)
+    sub_template = f"[{sub_template}]" if sub_template else ""
+    status = "OK     " if name == matched else "FAILURE"
+    print(f"{name_col} = {namefmt.format(name=matched)} : {status} {hmifmt.format(huggingface_model_id=huggingface_model_id)} {sub_template}")
+    if name != matched:
+        failures += 1
+
+# Pass 2: every adapter in AutoGuess.json must have an entry in AUTOGUESS_MAPPING.
+for entry in autoguess:
+    if entry['name'] in seen:
+        continue
+    print(namefmt.format(name=entry['name']) + "   MISSING MAPPING")
+    failures += 1
+
+if failures > 0:
+    print(f"There were {failures} failure(s)!")
+    sys.exit(1)