Test (~180) more models (#54)

* dump ~180 more of most popular chat models * unskip all but 1 test on win32
google · Feb 9, 2025 · a72057e · a72057e
1 parent ff6f9a0
commit a72057e
Showing 1 changed file with 214 additions and 26 deletions.
diff --git a/tests/CMakeLists.txt b/tests/CMakeLists.txt
@@ -60,6 +60,9 @@ if (CMAKE_SYSTEM_NAME STREQUAL "Windows" AND CMAKE_SYSTEM_PROCESSOR STREQUAL "ar
 endif()
 target_link_libraries(test-supported-template PRIVATE nlohmann_json::nlohmann_json)
 
+# https://huggingface.co/models?other=conversational
+# https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?types=fine-tuned%2Cchat
+
 set(MODEL_IDS
     # List of model IDs to test the chat template of.
     # For each of them, the tokenizer_config.json file will be fetched, and the template
@@ -70,63 +73,248 @@ set(MODEL_IDS
     # For Gated models, you'll need to run `huggingface-cli login` (and be granted access) to download their template.
 
     abacusai/Fewshot-Metamath-OrcaVicuna-Mistral
-    bofenghuang/vigogne-2-70b-chat
-    CohereForAI/c4ai-command-r-plus # Gated
-    databricks/dbrx-instruct # Gated
-    google/gemma-2-2b-it # Gated
-    google/gemma-7b-it # Gated
+    allenai/Llama-3.1-Tulu-3-405B
+    allenai/Llama-3.1-Tulu-3-405B-SFT
+    allenai/Llama-3.1-Tulu-3-8B
+    arcee-ai/Virtuoso-Lite
+    arcee-ai/Virtuoso-Medium-v2
+    arcee-ai/Virtuoso-Small-v2
+    AtlaAI/Selene-1-Mini-Llama-3.1-8B
+    avemio/GRAG-NEMO-12B-ORPO-HESSIAN-AI
     BEE-spoke-data/tFINE-900m-instruct-orpo
-    MiniMaxAI/MiniMax-Text-01
+    bespokelabs/Bespoke-Stratos-7B
+    bfuzzy1/acheron-m1a-llama
+    bofenghuang/vigogne-2-70b-chat
+    bytedance-research/UI-TARS-72B-DPO
+    bytedance-research/UI-TARS-7B-DPO
+    bytedance-research/UI-TARS-7B-SFT
+    carsenk/phi3.5_mini_exp_825_uncensored
+    CohereForAI/aya-expanse-8b
+    CohereForAI/c4ai-command-r-plus
+    CohereForAI/c4ai-command-r7b-12-2024
+    cyberagent/DeepSeek-R1-Distill-Qwen-14B-Japanese
+    cyberagent/DeepSeek-R1-Distill-Qwen-32B-Japanese
+    databricks/dbrx-instruct
+    DavieLion/Llama-3.2-1B-SPIN-iter3
+    deepseek-ai/deepseek-coder-33b-instruct
+    deepseek-ai/deepseek-coder-6.7b-instruct
+    deepseek-ai/deepseek-coder-7b-instruct-v1.5
+    deepseek-ai/DeepSeek-Coder-V2-Instruct
+    deepseek-ai/DeepSeek-Coder-V2-Lite-Base
+    deepseek-ai/DeepSeek-Coder-V2-Lite-Instruct
+    deepseek-ai/deepseek-llm-67b-chat
+    deepseek-ai/deepseek-llm-7b-chat
+    deepseek-ai/DeepSeek-R1-Distill-Llama-70B
+    deepseek-ai/DeepSeek-R1-Distill-Llama-8B
+    deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
+    deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
+    deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
+    deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
+    deepseek-ai/DeepSeek-V2-Lite
+    deepseek-ai/DeepSeek-V2.5
+    deepseek-ai/DeepSeek-V3
+    Delta-Vector/Rei-12B
+    dicta-il/dictalm2.0-instruct
+    ehristoforu/Falcon3-8B-Franken-Basestruct
+    EpistemeAI/Mistral-Nemo-Instruct-12B-Philosophy-Math
+    FlofloB/83k_continued_pretraining_Qwen2.5-0.5B-Instruct_Unsloth_merged_16bit
+    FlofloB/test_continued_pretraining_Phi-3-mini-4k-instruct_Unsloth_merged_16bit
+    godlikehhd/alpaca_data_sampled_ifd_new_5200
+    godlikehhd/alpaca_data_score_max_0.7_2600
+    google/gemma-2-27b-it
+    google/gemma-2-2b-it
+    google/gemma-2-2b-jpn-it
+    google/gemma-7b-it
+    HelpingAI/HAI-SER
+    HuggingFaceTB/SmolLM2-1.7B-Instruct
+    HuggingFaceTB/SmolLM2-135M-Instruct
+    HuggingFaceTB/SmolLM2-360M-Instruct
+    huihui-ai/DeepSeek-R1-Distill-Llama-70B-abliterated
+    huihui-ai/DeepSeek-R1-Distill-Llama-8B-abliterated
+    huihui-ai/DeepSeek-R1-Distill-Qwen-14B-abliterated-v2
+    huihui-ai/DeepSeek-R1-Distill-Qwen-32B-abliterated
+    huihui-ai/DeepSeek-R1-Distill-Qwen-7B-abliterated-v2
+    huihui-ai/Qwen2.5-14B-Instruct-1M-abliterated
+    ibm-granite/granite-3.1-8b-instruct
+    Ihor/Text2Graph-R1-Qwen2.5-0.5b
     indischepartij/MiniCPM-3B-OpenHermes-2.5-v2
+    Infinigence/Megrez-3B-Instruct
+    inflatebot/MN-12B-Mag-Mell-R1
+    INSAIT-Institute/BgGPT-Gemma-2-27B-IT-v1.0
+    jinaai/ReaderLM-v2
+    Josephgflowers/TinyLlama_v1.1_math_code-world-test-1
+    kms7530/chemeng_qwen-math-7b_24_1_100_1_nonmath
+    knifeayumu/Cydonia-v1.3-Magnum-v4-22B
+    langgptai/qwen1.5-7b-chat-sa-v0.1
+    LatitudeGames/Wayfarer-12B
+    LGAI-EXAONE/EXAONE-3.5-2.4B-Instruct
+    LGAI-EXAONE/EXAONE-3.5-7.8B-Instruct
+    lightblue/DeepSeek-R1-Distill-Qwen-7B-Japanese
+    Magpie-Align/Llama-3-8B-Magpie-Align-v0.1
+    Magpie-Align/Llama-3.1-8B-Magpie-Align-v0.1
     mattshumer/Reflection-Llama-3.1-70B
+    MaziyarPanahi/calme-3.2-instruct-78b
     meetkai/functionary-medium-v3.1
     meetkai/functionary-medium-v3.2
-    meta-llama/Llama-3.1-8B-Instruct # Gated
-    meta-llama/Llama-3.2-3B-Instruct # Gated
-    meta-llama/Llama-3.3-70B-Instruct # Gated
-    meta-llama/Meta-Llama-3.1-8B-Instruct # Gated
+    meta-llama/Llama-2-7b-chat-hf
+    meta-llama/Llama-3.1-8B-Instruct
+    meta-llama/Llama-3.2-1B-Instruct
+    meta-llama/Llama-3.2-3B-Instruct
+    meta-llama/Llama-3.3-70B-Instruct
+    meta-llama/Meta-Llama-3-8B-Instruct
+    meta-llama/Meta-Llama-3.1-8B-Instruct
     microsoft/Phi-3-medium-4k-instruct
     microsoft/Phi-3-mini-4k-instruct
     microsoft/Phi-3-small-8k-instruct
     microsoft/Phi-3.5-mini-instruct
     microsoft/Phi-3.5-vision-instruct
-    mistralai/Mistral-7B-Instruct-v0.2 # Gated
-    mistralai/Mistral-Large-Instruct-2407 # Gated
-    mistralai/Mistral-Large-Instruct-2411 # Gated
-    mistralai/Mistral-Nemo-Instruct-2407 # Gated
-    mistralai/Mixtral-8x7B-Instruct-v0.1 # Gated
+    microsoft/phi-4
+    migtissera/Tess-3-Mistral-Nemo-12B
+    MiniMaxAI/MiniMax-Text-01
+    MiniMaxAI/MiniMax-VL-01
+    ministral/Ministral-3b-instruct
+    mistralai/Codestral-22B-v0.1
+    mistralai/Mistral-7B-Instruct-v0.1
+    mistralai/Mistral-7B-Instruct-v0.2
+    mistralai/Mistral-7B-Instruct-v0.3
+    mistralai/Mistral-Large-Instruct-2407
+    mistralai/Mistral-Large-Instruct-2411
+    mistralai/Mistral-Nemo-Instruct-2407
+    mistralai/Mistral-Small-24B-Instruct-2501
+    mistralai/Mixtral-8x7B-Instruct-v0.1
+    mkurman/Qwen2.5-14B-DeepSeek-R1-1M
     mlabonne/AlphaMonarch-7B
+    mlx-community/Josiefied-Qwen2.5-0.5B-Instruct-abliterated-v1-float32
+    mlx-community/Qwen2.5-VL-7B-Instruct-8bit
+    mobiuslabsgmbh/DeepSeek-R1-ReDistill-Qwen-1.5B-v1.1
+    NaniDAO/deepseek-r1-qwen-2.5-32B-ablated
+    netcat420/MFANNv0.20
+    netcat420/MFANNv0.24
+    netease-youdao/Confucius-o1-14B
     NexaAIDev/Octopus-v2
     NousResearch/Hermes-2-Pro-Llama-3-8B
     NousResearch/Hermes-2-Pro-Mistral-7B
     NousResearch/Hermes-3-Llama-3.1-70B
+    NovaSky-AI/Sky-T1-32B-Flash
+    NovaSky-AI/Sky-T1-32B-Preview
+    nvidia/AceMath-7B-RM
+    nvidia/Eagle2-1B
+    nvidia/Eagle2-9B
     nvidia/Llama-3.1-Nemotron-70B-Instruct-HF
+    OnlyCheeini/greesychat-turbo
+    onnx-community/DeepSeek-R1-Distill-Qwen-1.5B-ONNX
+    open-thoughts/OpenThinker-7B
     openchat/openchat-3.5-0106
+    Orenguteng/Llama-3.1-8B-Lexi-Uncensored-V2
     OrionStarAI/Orion-14B-Chat
+    pankajmathur/orca_mini_v6_8b
+    PowerInfer/SmallThinker-3B-Preview
+    PrimeIntellect/INTELLECT-1-Instruct
+    princeton-nlp/Mistral-7B-Base-SFT-RDPO
+    princeton-nlp/Mistral-7B-Instruct-DPO
+    princeton-nlp/Mistral-7B-Instruct-RDPO
+    prithivMLmods/Bellatrix-Tiny-1.5B-R1
+    prithivMLmods/Bellatrix-Tiny-1B-R1
+    prithivMLmods/Bellatrix-Tiny-1B-v3
+    prithivMLmods/Bellatrix-Tiny-3B-R1
+    prithivMLmods/Blaze-14B-xElite
+    prithivMLmods/Calcium-Opus-14B-Elite2-R1
+    prithivMLmods/Calme-Ties-78B
+    prithivMLmods/Calme-Ties2-78B
+    prithivMLmods/Calme-Ties3-78B
+    prithivMLmods/ChemQwen2-vL
+    prithivMLmods/GWQ2b
+    prithivMLmods/LatexMind-2B-Codec
+    prithivMLmods/Llama-3.2-6B-AlgoCode
+    prithivMLmods/Megatron-Opus-14B-Exp
+    prithivMLmods/Megatron-Opus-14B-Stock
+    prithivMLmods/Megatron-Opus-7B-Exp
+    prithivMLmods/Omni-Reasoner-Merged
+    prithivMLmods/Omni-Reasoner4-Merged
+    prithivMLmods/Primal-Opus-14B-Optimus-v1
+    prithivMLmods/Qwen-7B-Distill-Reasoner
+    prithivMLmods/Qwen2.5-1.5B-DeepSeek-R1-Instruct
+    prithivMLmods/Qwen2.5-14B-DeepSeek-R1-1M
+    prithivMLmods/Qwen2.5-32B-DeepSeek-R1-Instruct
+    prithivMLmods/Qwen2.5-7B-DeepSeek-R1-1M
+    prithivMLmods/QwQ-Math-IO-500M
+    prithivMLmods/Triangulum-v2-10B
+    qingy2024/Falcon3-2x10B-MoE-Instruct
+    Qwen/QVQ-72B-Preview
+    Qwen/Qwen1.5-7B-Chat
     Qwen/Qwen2-7B-Instruct
+    Qwen/Qwen2-VL-72B-Instruct
     Qwen/Qwen2-VL-7B-Instruct
+    Qwen/Qwen2.5-0.5B
+    Qwen/Qwen2.5-1.5B-Instruct
+    Qwen/Qwen2.5-14B
+    Qwen/Qwen2.5-14B-Instruct-1M
+    Qwen/Qwen2.5-32B
+    Qwen/Qwen2.5-32B-Instruct
+    Qwen/Qwen2.5-3B-Instruct
+    Qwen/Qwen2.5-72B-Instruct
+    Qwen/Qwen2.5-7B
     Qwen/Qwen2.5-7B-Instruct
+    Qwen/Qwen2.5-7B-Instruct-1M
+    Qwen/Qwen2.5-Coder-32B-Instruct
+    Qwen/Qwen2.5-Coder-7B-Instruct
+    Qwen/Qwen2.5-Math-1.5B
     Qwen/Qwen2.5-Math-7B-Instruct
+    Qwen/Qwen2.5-VL-3B-Instruct
+    Qwen/Qwen2.5-VL-72B-Instruct
+    Qwen/Qwen2.5-VL-7B-Instruct
     Qwen/QwQ-32B-Preview
+    rubenroy/Zurich-14B-GCv2-5m
+    rubenroy/Zurich-7B-GCv2-5m
+    RWKV-Red-Team/ARWKV-7B-Preview-0.1
+    SakanaAI/TinySwallow-1.5B
+    SakanaAI/TinySwallow-1.5B-Instruct
+    Sao10K/70B-L3.3-Cirrus-x1
+    SentientAGI/Dobby-Mini-Leashed-Llama-3.1-8B
+    SentientAGI/Dobby-Mini-Unhinged-Llama-3.1-8B
+    silma-ai/SILMA-Kashif-2B-Instruct-v1.0
+    simplescaling/s1-32B
+    sometimesanotion/Lamarck-14B-v0.7
+    sonthenguyen/zephyr-sft-bnb-4bit-DPO-mtbr-180steps
+    Steelskull/L3.3-Damascus-R1
+    Steelskull/L3.3-MS-Nevoria-70b
+    Steelskull/L3.3-Nevoria-R1-70b
+    sthenno/tempesthenno-icy-0130
+    sumink/qwft
+    Tarek07/Progenitor-V1.1-LLaMa-70B
     teknium/OpenHermes-2.5-Mistral-7B
     TheBloke/FusionNet_34Bx2_MoE-AWQ
+    thirdeyeai/elevate360m
+    THUDM/glm-4-9b-chat
+    THUDM/glm-edge-1.5b-chat
+    tiiuae/Falcon3-10B-Instruct
+    TinyLlama/TinyLlama-1.1B-Chat-v1.0
+    UCLA-AGI/Mistral7B-PairRM-SPPO-Iter3
+    unsloth/DeepSeek-R1-Distill-Llama-8B
+    unsloth/DeepSeek-R1-Distill-Llama-8B-unsloth-bnb-4bit
+    unsloth/Mistral-Small-24B-Instruct-2501-unsloth-bnb-4bit
+    upstage/solar-pro-preview-instruct
+    ValiantLabs/Llama3.1-8B-Enigma
+    xwen-team/Xwen-72B-Chat
+    xwen-team/Xwen-7B-Chat
 
     # Broken, TODO:
-    # meetkai/functionary-medium-v3.1      # jinja2 expectation is computed w/ wrong escapes
-    # fireworks-ai/llama-3-firefunction-v2 # https://github.com/google/minja/issues/7
     # ai21labs/AI21-Jamba-1.5-Large        # https://github.com/google/minja/issues/8
+    # Almawave/Velvet-14B
+    # deepseek-ai/DeepSeek-R1
+    # deepseek-ai/DeepSeek-R1-Zero
+    # fireworks-ai/llama-3-firefunction-v2 # https://github.com/google/minja/issues/7
+    # HuggingFaceTB/SmolVLM-256M-Instruct
+    # HuggingFaceTB/SmolVLM-500M-Instruct
+    # HuggingFaceTB/SmolVLM-Instruct
+    # meta-llama/Llama-3.2-11B-Vision-Instruct
+    # unsloth/DeepSeek-R1
 )
 
-if(NOT WIN32)
-    list(APPEND MODEL_IDS
+if(WIN32)
+    list(REMOVE_ITEM MODEL_IDS
         # Needs investigation (https://github.com/google/minja/issues/40)
-        CohereForAI/c4ai-command-r7b-12-2024 # Gated
-        deepseek-ai/deepseek-coder-33b-instruct
-        deepseek-ai/DeepSeek-Coder-V2-Instruct
-        deepseek-ai/DeepSeek-V2.5
-        deepseek-ai/DeepSeek-R1-Distill-Llama-8B
-        deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
-        deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
+        CohereForAI/c4ai-command-r7b-12-2024    
     )
 endif()