ignore Qwen models in tokenizers test until bos issue is fixed

2025-10-23 02:57:14 +03:00 · 2024-09-19 00:18:21 +01:00
parent dee83e4840
commit 68028cc980
1 changed files with 5 additions and 3 deletions
--- a/test/test_tokenizers.py
+++ b/test/test_tokenizers.py
@@ -1,3 +1,5 @@
+import os
+import re
 from transformers import AutoTokenizer, AutoProcessor
 from exo.models import model_base_shards

@@ -22,10 +24,10 @@ def test_tokenizer(name, tokenizer, verbose=False):
    strip_tokens = lambda s: s.lstrip(tokenizer.decode([tokenizer.bos_token_id])).rstrip(tokenizer.decode([tokenizer.eos_token_id]))
    assert text == strip_tokens(decoded) == strip_tokens(reconstructed)

-ignore = ["TriAiExperiments/SFR-Iterative-DPO-LLaMA-3-70B-R", "mlx-community/DeepSeek-Coder-V2-Lite-Instruct-4bit-mlx", "llava-hf/llava-1.5-7b-hf"]
-models = [shard.model_id for shards in model_base_shards.values() for shard in shards.values() if shard.model_id not in ignore]
+ignore = ["TriAiExperiments/SFR-Iterative-DPO-LLaMA-3-70B-R", "mlx-community/DeepSeek-Coder-V2-Lite-Instruct-4bit-mlx", "llava-hf/llava-1.5-7b-hf", "mlx-community/Qwen*"]
+ignore_pattern = re.compile(r"^(" + "|".join(model.replace("*", ".*") for model in ignore) + r")")
+models = [shard.model_id for shards in model_base_shards.values() for shard in shards.values() if not ignore_pattern.match(shard.model_id)]

-import os
 verbose = os.environ.get("VERBOSE", "0").lower() == "1"
 for m in models:
    # TODO: figure out why use_fast=False is giving inconsistent behaviour (no spaces decoding invididual tokens) for Mistral-Large-Instruct-2407-4bit