mirror of
https://github.com/unslothai/unsloth
synced 2026-04-21 13:37:39 +00:00
* feat: Add support for OLMo-3 model in mapping and tests
* Update unsloth/models/mapper.py
Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>
* Update tests/test_get_model_name.py
Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>
* Fix casing, add Think variants, and align version gate for OLMo-3 PR 4678
Mapper: switch slugs from OLMo-3 to canonical Olmo-3 mixed case, drop the
non-existent unsloth/Olmo-3-7B-Instruct-bnb-4bit dead alias, and add the
already-published Olmo-3-7B-Think and Olmo-3-32B-Think Unsloth mirrors.
Loader: change the olmo3 transformers version gate from Version("4.57.0")
to Version("4.57.0.dev0") so nightly/source builds that already contain
olmo3 are not blocked, matching the OLMo-2, Gemma 3 and Cohere patterns.
* Use canonical Olmo-3 casing and cover Think variants in OLMo-3 tests
Mirrors the mapper.py fixes on pr-4678-code: HuggingFace canonical slugs
for the OLMo-3 family use mixed-case Olmo-3 (not OLMo-3 like OLMo-2), and
Unsloth already hosts Olmo-3-7B-Think and Olmo-3-32B-Think mirrors, so
the resolution matrix now covers all three published Olmo-3 families.
---------
Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>
Co-authored-by: Daniel Han <danielhanchen@gmail.com>
167 lines
6.2 KiB
Python
167 lines
6.2 KiB
Python
import unittest
|
|
from unittest.mock import patch
|
|
from unsloth.models.loader_utils import get_model_name
|
|
from unsloth.models import loader_utils
|
|
from unsloth.models.mapper import FLOAT_TO_INT_MAPPER, MAP_TO_UNSLOTH_16bit
|
|
|
|
|
|
def _no_remote_mapper():
|
|
return {}, {}, {}
|
|
|
|
|
|
class TestGetModelName(unittest.TestCase):
|
|
def _assert_mapping(self, model_name, load_in_4bit, expected, should_change):
|
|
mapped = get_model_name(model_name, load_in_4bit = load_in_4bit)
|
|
self.assertEqual(mapped.lower(), expected.lower())
|
|
if should_change:
|
|
self.assertNotEqual(mapped.lower(), model_name.lower())
|
|
else:
|
|
self.assertEqual(mapped.lower(), model_name.lower())
|
|
|
|
@patch.object(loader_utils, "_get_new_mapper", _no_remote_mapper)
|
|
def test_resolution_matrix(self):
|
|
cases = [
|
|
# Core mappings
|
|
("meta-llama/Llama-2-7b-hf", True, "unsloth/llama-2-7b-bnb-4bit", True),
|
|
("meta-llama/Llama-2-7b-hf", False, "unsloth/llama-2-7b", True),
|
|
(
|
|
"mistralai/Ministral-8B-Instruct-2410",
|
|
True,
|
|
"mistralai/Ministral-8B-Instruct-2410",
|
|
False,
|
|
),
|
|
(
|
|
"meta-llama/Llama-3.2-1B-Instruct",
|
|
False,
|
|
"unsloth/Llama-3.2-1B-Instruct",
|
|
True,
|
|
),
|
|
(
|
|
"meta-llama/Llama-2-7b-chat-hf",
|
|
True,
|
|
"unsloth/llama-2-7b-chat-bnb-4bit",
|
|
True,
|
|
),
|
|
(
|
|
"meta-llama/Llama-3.3-70B-Instruct",
|
|
True,
|
|
"unsloth/llama-3.3-70b-instruct-unsloth-bnb-4bit",
|
|
True,
|
|
),
|
|
("Qwen/Qwen3-8B", True, "unsloth/Qwen3-8B-unsloth-bnb-4bit", True),
|
|
("Qwen/Qwen3-8B", False, "unsloth/Qwen3-8B", True),
|
|
("Qwen/Qwen3-8B-FP8", False, "unsloth/Qwen3-8B-FP8", True),
|
|
("Qwen/Qwen3-8B-FP8", True, "unsloth/Qwen3-8B-unsloth-bnb-4bit", True),
|
|
(
|
|
"mistralai/Ministral-3-3B-Instruct-2512",
|
|
True,
|
|
"unsloth/Ministral-3-3B-Instruct-2512-unsloth-bnb-4bit",
|
|
True,
|
|
),
|
|
(
|
|
"mistralai/Ministral-3-3B-Instruct-2512",
|
|
False,
|
|
"unsloth/Ministral-3-3B-Instruct-2512",
|
|
True,
|
|
),
|
|
(
|
|
"allenai/Olmo-3-7B-Instruct",
|
|
True,
|
|
"unsloth/Olmo-3-7B-Instruct-unsloth-bnb-4bit",
|
|
True,
|
|
),
|
|
(
|
|
"allenai/Olmo-3-7B-Instruct",
|
|
False,
|
|
"unsloth/Olmo-3-7B-Instruct",
|
|
True,
|
|
),
|
|
(
|
|
"allenai/Olmo-3-7B-Think",
|
|
True,
|
|
"unsloth/Olmo-3-7B-Think-unsloth-bnb-4bit",
|
|
True,
|
|
),
|
|
(
|
|
"allenai/Olmo-3-7B-Think",
|
|
False,
|
|
"unsloth/Olmo-3-7B-Think",
|
|
True,
|
|
),
|
|
(
|
|
"allenai/Olmo-3-32B-Think",
|
|
True,
|
|
"unsloth/Olmo-3-32B-Think-unsloth-bnb-4bit",
|
|
True,
|
|
),
|
|
(
|
|
"allenai/Olmo-3-32B-Think",
|
|
False,
|
|
"unsloth/Olmo-3-32B-Think",
|
|
True,
|
|
),
|
|
("unsloth/Kimi-K2-Instruct", True, "unsloth/Kimi-K2-Instruct-BF16", True),
|
|
("unsloth/Kimi-K2-Instruct", False, "unsloth/Kimi-K2-Instruct", False),
|
|
# Fallback-to-original behavior
|
|
"nonexistent-user/nonexistent-model-123",
|
|
"google/gemma-3-random-prototype-123",
|
|
"imdatta0/nanoqwen-fp8",
|
|
"imdatta0/nanoqwen-bf16",
|
|
# Backward compatibility for legacy 4bit names
|
|
("unsloth/llama-2-7b-bnb-4bit", True, "unsloth/llama-2-7b-bnb-4bit", False),
|
|
("unsloth/llama-2-7b-bnb-4bit", False, "unsloth/llama-2-7b", True),
|
|
("google/gemma-2-9b", True, "unsloth/gemma-2-9b-bnb-4bit", True),
|
|
# GPT-OSS behavior
|
|
("openai/gpt-oss-20b", False, "unsloth/gpt-oss-20b", True),
|
|
("openai/gpt-oss-20b", True, "unsloth/gpt-oss-20b-unsloth-bnb-4bit", True),
|
|
("unsloth/gpt-oss-20b", True, "unsloth/gpt-oss-20b-unsloth-bnb-4bit", True),
|
|
("unsloth/gpt-oss-20b-bf16", True, "unsloth/gpt-oss-20b-bf16", False),
|
|
(
|
|
"unsloth/gpt-oss-20b-unsloth-bnb-4bit",
|
|
False,
|
|
"unsloth/gpt-oss-20b",
|
|
True,
|
|
),
|
|
(
|
|
"unsloth/gpt-oss-20b-bnb-4bit",
|
|
True,
|
|
"unsloth/gpt-oss-20b-bnb-4bit",
|
|
False,
|
|
),
|
|
]
|
|
for case in cases:
|
|
if isinstance(case, str):
|
|
model_name = case
|
|
with self.subTest(model_name = model_name, load_in_4bit = True):
|
|
self._assert_mapping(model_name, True, model_name, False)
|
|
else:
|
|
model_name, load_in_4bit, expected, should_change = case
|
|
with self.subTest(model_name = model_name, load_in_4bit = load_in_4bit):
|
|
self._assert_mapping(
|
|
model_name, load_in_4bit, expected, should_change
|
|
)
|
|
|
|
def test_static_mapper_contract(self):
|
|
contracts = [
|
|
("qwen/qwen3-8b", "unsloth/qwen3-8b-unsloth-bnb-4bit"),
|
|
("qwen/qwen3-8b-fp8", "unsloth/qwen3-8b-unsloth-bnb-4bit"),
|
|
(
|
|
"mistralai/ministral-3-3b-instruct-2512",
|
|
"unsloth/ministral-3-3b-instruct-2512-unsloth-bnb-4bit",
|
|
),
|
|
(
|
|
"allenai/olmo-3-7b-instruct",
|
|
"unsloth/olmo-3-7b-instruct-unsloth-bnb-4bit",
|
|
),
|
|
("unsloth/kimi-k2-instruct", "unsloth/kimi-k2-instruct-bf16"),
|
|
]
|
|
for src, expected in contracts:
|
|
with self.subTest(src = src):
|
|
self.assertEqual(FLOAT_TO_INT_MAPPER[src], expected)
|
|
self.assertEqual(
|
|
MAP_TO_UNSLOTH_16bit["qwen/qwen3-8b-fp8"], "unsloth/Qwen3-8B-FP8"
|
|
)
|
|
|
|
|
|
if __name__ == "__main__":
|
|
unittest.main()
|