unsloth/tests/test_get_model_name.py
Avaya Aggarwal f18e9dddf0
feat: Add support for OLMo-3 model (#4678)
* feat: Add support for OLMo-3 model in mapping and tests

* Update unsloth/models/mapper.py

Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>

* Update tests/test_get_model_name.py

Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>

* Fix casing, add Think variants, and align version gate for OLMo-3 PR 4678

Mapper: switch slugs from OLMo-3 to canonical Olmo-3 mixed case, drop the
non-existent unsloth/Olmo-3-7B-Instruct-bnb-4bit dead alias, and add the
already-published Olmo-3-7B-Think and Olmo-3-32B-Think Unsloth mirrors.

Loader: change the olmo3 transformers version gate from Version("4.57.0")
to Version("4.57.0.dev0") so nightly/source builds that already contain
olmo3 are not blocked, matching the OLMo-2, Gemma 3 and Cohere patterns.

* Use canonical Olmo-3 casing and cover Think variants in OLMo-3 tests

Mirrors the mapper.py fixes on pr-4678-code: HuggingFace canonical slugs
for the OLMo-3 family use mixed-case Olmo-3 (not OLMo-3 like OLMo-2), and
Unsloth already hosts Olmo-3-7B-Think and Olmo-3-32B-Think mirrors, so
the resolution matrix now covers all three published Olmo-3 families.

---------

Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>
Co-authored-by: Daniel Han <danielhanchen@gmail.com>
2026-04-15 07:39:11 -07:00

167 lines
6.2 KiB
Python

import unittest
from unittest.mock import patch
from unsloth.models.loader_utils import get_model_name
from unsloth.models import loader_utils
from unsloth.models.mapper import FLOAT_TO_INT_MAPPER, MAP_TO_UNSLOTH_16bit
def _no_remote_mapper():
return {}, {}, {}
class TestGetModelName(unittest.TestCase):
def _assert_mapping(self, model_name, load_in_4bit, expected, should_change):
mapped = get_model_name(model_name, load_in_4bit = load_in_4bit)
self.assertEqual(mapped.lower(), expected.lower())
if should_change:
self.assertNotEqual(mapped.lower(), model_name.lower())
else:
self.assertEqual(mapped.lower(), model_name.lower())
@patch.object(loader_utils, "_get_new_mapper", _no_remote_mapper)
def test_resolution_matrix(self):
cases = [
# Core mappings
("meta-llama/Llama-2-7b-hf", True, "unsloth/llama-2-7b-bnb-4bit", True),
("meta-llama/Llama-2-7b-hf", False, "unsloth/llama-2-7b", True),
(
"mistralai/Ministral-8B-Instruct-2410",
True,
"mistralai/Ministral-8B-Instruct-2410",
False,
),
(
"meta-llama/Llama-3.2-1B-Instruct",
False,
"unsloth/Llama-3.2-1B-Instruct",
True,
),
(
"meta-llama/Llama-2-7b-chat-hf",
True,
"unsloth/llama-2-7b-chat-bnb-4bit",
True,
),
(
"meta-llama/Llama-3.3-70B-Instruct",
True,
"unsloth/llama-3.3-70b-instruct-unsloth-bnb-4bit",
True,
),
("Qwen/Qwen3-8B", True, "unsloth/Qwen3-8B-unsloth-bnb-4bit", True),
("Qwen/Qwen3-8B", False, "unsloth/Qwen3-8B", True),
("Qwen/Qwen3-8B-FP8", False, "unsloth/Qwen3-8B-FP8", True),
("Qwen/Qwen3-8B-FP8", True, "unsloth/Qwen3-8B-unsloth-bnb-4bit", True),
(
"mistralai/Ministral-3-3B-Instruct-2512",
True,
"unsloth/Ministral-3-3B-Instruct-2512-unsloth-bnb-4bit",
True,
),
(
"mistralai/Ministral-3-3B-Instruct-2512",
False,
"unsloth/Ministral-3-3B-Instruct-2512",
True,
),
(
"allenai/Olmo-3-7B-Instruct",
True,
"unsloth/Olmo-3-7B-Instruct-unsloth-bnb-4bit",
True,
),
(
"allenai/Olmo-3-7B-Instruct",
False,
"unsloth/Olmo-3-7B-Instruct",
True,
),
(
"allenai/Olmo-3-7B-Think",
True,
"unsloth/Olmo-3-7B-Think-unsloth-bnb-4bit",
True,
),
(
"allenai/Olmo-3-7B-Think",
False,
"unsloth/Olmo-3-7B-Think",
True,
),
(
"allenai/Olmo-3-32B-Think",
True,
"unsloth/Olmo-3-32B-Think-unsloth-bnb-4bit",
True,
),
(
"allenai/Olmo-3-32B-Think",
False,
"unsloth/Olmo-3-32B-Think",
True,
),
("unsloth/Kimi-K2-Instruct", True, "unsloth/Kimi-K2-Instruct-BF16", True),
("unsloth/Kimi-K2-Instruct", False, "unsloth/Kimi-K2-Instruct", False),
# Fallback-to-original behavior
"nonexistent-user/nonexistent-model-123",
"google/gemma-3-random-prototype-123",
"imdatta0/nanoqwen-fp8",
"imdatta0/nanoqwen-bf16",
# Backward compatibility for legacy 4bit names
("unsloth/llama-2-7b-bnb-4bit", True, "unsloth/llama-2-7b-bnb-4bit", False),
("unsloth/llama-2-7b-bnb-4bit", False, "unsloth/llama-2-7b", True),
("google/gemma-2-9b", True, "unsloth/gemma-2-9b-bnb-4bit", True),
# GPT-OSS behavior
("openai/gpt-oss-20b", False, "unsloth/gpt-oss-20b", True),
("openai/gpt-oss-20b", True, "unsloth/gpt-oss-20b-unsloth-bnb-4bit", True),
("unsloth/gpt-oss-20b", True, "unsloth/gpt-oss-20b-unsloth-bnb-4bit", True),
("unsloth/gpt-oss-20b-bf16", True, "unsloth/gpt-oss-20b-bf16", False),
(
"unsloth/gpt-oss-20b-unsloth-bnb-4bit",
False,
"unsloth/gpt-oss-20b",
True,
),
(
"unsloth/gpt-oss-20b-bnb-4bit",
True,
"unsloth/gpt-oss-20b-bnb-4bit",
False,
),
]
for case in cases:
if isinstance(case, str):
model_name = case
with self.subTest(model_name = model_name, load_in_4bit = True):
self._assert_mapping(model_name, True, model_name, False)
else:
model_name, load_in_4bit, expected, should_change = case
with self.subTest(model_name = model_name, load_in_4bit = load_in_4bit):
self._assert_mapping(
model_name, load_in_4bit, expected, should_change
)
def test_static_mapper_contract(self):
contracts = [
("qwen/qwen3-8b", "unsloth/qwen3-8b-unsloth-bnb-4bit"),
("qwen/qwen3-8b-fp8", "unsloth/qwen3-8b-unsloth-bnb-4bit"),
(
"mistralai/ministral-3-3b-instruct-2512",
"unsloth/ministral-3-3b-instruct-2512-unsloth-bnb-4bit",
),
(
"allenai/olmo-3-7b-instruct",
"unsloth/olmo-3-7b-instruct-unsloth-bnb-4bit",
),
("unsloth/kimi-k2-instruct", "unsloth/kimi-k2-instruct-bf16"),
]
for src, expected in contracts:
with self.subTest(src = src):
self.assertEqual(FLOAT_TO_INT_MAPPER[src], expected)
self.assertEqual(
MAP_TO_UNSLOTH_16bit["qwen/qwen3-8b-fp8"], "unsloth/Qwen3-8B-FP8"
)
if __name__ == "__main__":
unittest.main()