# SPDX-License-Identifier: Apache-2.0

import pytest

from vllm.lora.models import LoRAModel
from vllm.lora.peft_helper import PEFTHelper
from vllm.lora.utils import get_adapter_absolute_path
from vllm.model_executor.models.llama import LlamaForCausalLM

# Provide both an absolute path and a Hugging Face LoRA id.
lora_fixture_name = ["sql_lora_files", "sql_lora_huggingface_id"]
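# Both names are pytest fixtures resolved below via request.getfixturevalue():
# one yields a local adapter directory, the other a Hugging Face repo id.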
LLAMA_LORA_MODULES = [
    "qkv_proj", "o_proj", "gate_up_proj", "down_proj", "embed_tokens",
    "lm_head"
]


@pytest.mark.parametrize("lora_fixture_name", lora_fixture_name)
def test_load_checkpoints_from_huggingface(lora_fixture_name, request):
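    # Depending on the parametrized fixture, lora_name is either a local
    # adapter directory or a Hugging Face repo id.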
    lora_name = request.getfixturevalue(lora_fixture_name)
    packed_modules_mapping = LlamaForCausalLM.packed_modules_mapping
    embedding_modules = LlamaForCausalLM.embedding_modules
    embed_padding_modules = LlamaForCausalLM.embedding_padding_modules
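    # Expand packed modules (e.g. "qkv_proj", "gate_up_proj") into their
    # constituent projections so the checkpoint loader sees every expected
    # target module; unpacked modules are kept as-is.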
    expected_lora_modules: list[str] = []
    for module in LLAMA_LORA_MODULES:
        if module in packed_modules_mapping:
            expected_lora_modules.extend(packed_modules_mapping[module])
        else:
            expected_lora_modules.append(module)

    lora_path = get_adapter_absolute_path(lora_name)
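    # get_adapter_absolute_path resolves an existing local path to its absolute
    # form; otherwise the name is treated as a Hugging Face repo id and the
    # adapter is downloaded first.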

    # LoRA loading should work for either an absolute path or a Hugging Face id.
    peft_helper = PEFTHelper.from_local_dir(lora_path, 4096)
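    # The 4096 passed above is the base model's max position embeddings, which
    # PEFTHelper uses when handling long-context (context-length-scaled) LoRAs.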
    lora_model = LoRAModel.from_local_checkpoint(
        lora_path,
        expected_lora_modules,
        peft_helper=peft_helper,
        lora_model_id=1,
        device="cpu",
        embedding_modules=embedding_modules,
        embedding_padding_modules=embed_padding_modules)

    # Assertion to ensure the model loaded correctly.
    assert lora_model is not None, "LoRAModel is not loaded correctly"