# Copyright 2023-present the HuggingFace Inc. team.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import os
import unittest
from contextlib import contextmanager
from functools import lru_cache, wraps
from unittest import mock

import numpy as np
import pytest
import torch
from accelerate.test_utils.testing import get_backend
from datasets import load_dataset

from peft import (
    AdaLoraConfig,
    IA3Config,
    LNTuningConfig,
    LoraConfig,
    PromptLearningConfig,
    VBLoRAConfig,
)
from peft.import_utils import (
    is_aqlm_available,
    is_auto_awq_available,
    is_auto_gptq_available,
    is_eetq_available,
    is_gptqmodel_available,
    is_hqq_available,
    is_optimum_available,
    is_torchao_available,
)


# Globally shared registry used by `hub_online_once` to track how often each model id was accessed.
_HUB_MODEL_ACCESSES = {}


torch_device, device_count, memory_allocated_func = get_backend()


def require_non_cpu(test_case):
    """
    Decorator marking a test that requires a hardware accelerator backend. These tests are skipped when no hardware
    accelerator is available.
    """
    return unittest.skipUnless(torch_device != "cpu", "test requires a hardware accelerator")(test_case)


def require_non_xpu(test_case):
    """
    Decorator marking a test that should be skipped for XPU.
    """
    return unittest.skipUnless(torch_device != "xpu", "test requires a non-XPU")(test_case)


def require_torch_gpu(test_case):
    """
    Decorator marking a test that requires a GPU. Will be skipped when no GPU is available.
    """
    if not torch.cuda.is_available():
        return unittest.skip("test requires GPU")(test_case)
    else:
        return test_case


def require_torch_multi_gpu(test_case):
    """
    Decorator marking a test that requires multiple GPUs. Will be skipped when fewer than 2 GPUs are available.
    """
    if not torch.cuda.is_available() or torch.cuda.device_count() < 2:
        return unittest.skip("test requires multiple GPUs")(test_case)
    else:
        return test_case


def require_torch_multi_accelerator(test_case):
    """
    Decorator marking a test that requires multiple hardware accelerators. These tests are skipped on a machine
    without multiple accelerators.
    """
    return unittest.skipUnless(
        torch_device != "cpu" and device_count > 1, "test requires multiple hardware accelerators"
    )(test_case)


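# Illustrative sketch only (an assumption, not part of the PEFT test suite): the hardware-gating
# decorators above are meant to be stacked on individual test methods. The class, method names, and
# tensor shapes here are hypothetical.
class _ExampleHardwareGatedTests(unittest.TestCase):
    @require_non_cpu
    def test_runs_on_detected_accelerator(self):
        # runs on whatever accelerator `get_backend()` detected (cuda, xpu, mps, ...)
        x = torch.ones(2, 2, device=torch_device)
        assert x.sum().item() == 4.0

    @require_torch_multi_gpu
    def test_runs_on_second_gpu(self):
        # skipped unless at least two CUDA devices are available
        x = torch.ones(2, 2, device="cuda:1")
        assert x.device.index == 1

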
def require_bitsandbytes(test_case):
    """
    Decorator marking a test that requires the bitsandbytes library. Will be skipped when the library is not installed.
    """
    try:
        import bitsandbytes  # noqa: F401

        test_case = pytest.mark.bitsandbytes(test_case)
    except ImportError:
        test_case = pytest.mark.skip(reason="test requires bitsandbytes")(test_case)
    return test_case


def require_auto_gptq(test_case):
    """
    Decorator marking a test that requires auto-gptq. These tests are skipped when auto-gptq isn't installed.
    """
    return unittest.skipUnless(is_gptqmodel_available() or is_auto_gptq_available(), "test requires auto-gptq")(
        test_case
    )


def require_gptqmodel(test_case):
    """
    Decorator marking a test that requires gptqmodel. These tests are skipped when gptqmodel isn't installed.
    """
    return unittest.skipUnless(is_gptqmodel_available(), "test requires gptqmodel")(test_case)


def require_aqlm(test_case):
    """
    Decorator marking a test that requires aqlm. These tests are skipped when aqlm isn't installed.
    """
    return unittest.skipUnless(is_aqlm_available(), "test requires aqlm")(test_case)


def require_hqq(test_case):
    """
    Decorator marking a test that requires hqq. These tests are skipped when hqq isn't installed.
    """
    return unittest.skipUnless(is_hqq_available(), "test requires hqq")(test_case)


def require_auto_awq(test_case):
    """
    Decorator marking a test that requires auto-awq. These tests are skipped when auto-awq isn't installed.
    """
    return unittest.skipUnless(is_auto_awq_available(), "test requires auto-awq")(test_case)


def require_eetq(test_case):
    """
    Decorator marking a test that requires eetq. These tests are skipped when eetq isn't installed.
    """
    return unittest.skipUnless(is_eetq_available(), "test requires eetq")(test_case)


def require_optimum(test_case):
    """
    Decorator marking a test that requires optimum. These tests are skipped when optimum isn't installed.
    """
    return unittest.skipUnless(is_optimum_available(), "test requires optimum")(test_case)


def require_torchao(test_case):
    """
    Decorator marking a test that requires torchao. These tests are skipped when torchao isn't installed.
    """
    return unittest.skipUnless(is_torchao_available(), "test requires torchao")(test_case)


def require_deterministic_for_xpu(test_case):
    """
    Decorator that runs the test with deterministic algorithms enforced on XPU and restores the previous setting
    afterwards. On other devices the test is run unchanged.
    """

    @wraps(test_case)
    def wrapper(*args, **kwargs):
        if torch_device == "xpu":
            original_state = torch.are_deterministic_algorithms_enabled()
            try:
                torch.use_deterministic_algorithms(True)
                return test_case(*args, **kwargs)
            finally:
                torch.use_deterministic_algorithms(original_state)
        else:
            return test_case(*args, **kwargs)

    return wrapper


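# Illustrative sketch only (hypothetical test, not part of the suite): the decorator is applied like
# any other test decorator; on non-XPU devices it is a pass-through.
@require_deterministic_for_xpu
def _example_deterministic_xpu_test():
    x = torch.ones(4, 4, device=torch_device)
    # all-ones matmul: every entry of x @ x equals 4
    assert torch.allclose(x @ x, 4 * torch.ones(4, 4, device=torch_device))

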
@contextmanager
def temp_seed(seed: int):
    """Temporarily set the random seed for NumPy and PyTorch, restoring the previous RNG states on exit."""

    np_state = np.random.get_state()
    np.random.seed(seed)

    torch_state = torch.random.get_rng_state()
    torch.random.manual_seed(seed)

    if torch.cuda.is_available():
        torch_cuda_states = torch.cuda.get_rng_state_all()
        torch.cuda.manual_seed_all(seed)

    try:
        yield
    finally:
        np.random.set_state(np_state)

        torch.random.set_rng_state(torch_state)
        if torch.cuda.is_available():
            torch.cuda.set_rng_state_all(torch_cuda_states)


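# Illustrative sketch only (hypothetical helper): the same seed inside `temp_seed` yields the same
# draw, while the surrounding RNG state is left untouched afterwards.
def _example_temp_seed_usage():
    with temp_seed(0):
        first = torch.randn(3)
    with temp_seed(0):
        second = torch.randn(3)
    assert torch.allclose(first, second)

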
def get_state_dict(model, unwrap_compiled=True):
    """
    Get the state dict of a model. If the model is compiled, unwrap it first.
    """
    if unwrap_compiled:
        model = getattr(model, "_orig_mod", model)
    return model.state_dict()


@lru_cache
def load_dataset_english_quotes():
    # can't use pytest fixtures for now because of unittest style tests
    data = load_dataset("ybelkada/english_quotes_copy")
    return data


@lru_cache
def load_cat_image():
    # can't use pytest fixtures for now because of unittest style tests
    dataset = load_dataset("huggingface/cats-image", trust_remote_code=True)
    image = dataset["test"]["image"][0]
    return image


def set_init_weights_false(config_cls, kwargs):
    # helper function that sets the config kwargs such that the model is *not* initialized as an identity transform
    kwargs = kwargs.copy()

    if issubclass(config_cls, PromptLearningConfig):
        return kwargs
    if config_cls in (LNTuningConfig, VBLoRAConfig):
        return kwargs

    if config_cls in (LoraConfig, AdaLoraConfig):
        kwargs["init_lora_weights"] = False
    elif config_cls == IA3Config:
        kwargs["init_ia3_weights"] = False
    else:
        kwargs["init_weights"] = False
    return kwargs


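# Illustrative sketch only (hypothetical config kwargs): a test that needs the adapter to change the
# base model's output right away would transform its default kwargs like this.
def _example_set_init_weights_false_usage():
    base_kwargs = {"target_modules": ["lin0"], "r": 8}
    kwargs = set_init_weights_false(LoraConfig, base_kwargs)
    # for LoRA configs the relevant flag is `init_lora_weights`
    assert kwargs["init_lora_weights"] is False
    return LoraConfig(**kwargs)

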
@contextmanager
def hub_online_once(model_id: str):
    """Set env[HF_HUB_OFFLINE]=1 (and patch transformers/huggingface_hub to think that it was always that way) for
    model ids that were already accessed once, to avoid contacting the hub twice for the same model id. The global
    variable `_HUB_MODEL_ACCESSES` tracks the number of hits per model id between `hub_online_once` calls.

    The reason for doing a context manager and not patching specific methods (e.g., `from_pretrained`) is that there
    are a lot of places (`PeftConfig.from_pretrained`, `get_peft_state_dict`, `load_adapter`, ...) that possibly
    communicate with the hub to download files / check versions / etc.

    Note that using this context manager can cause problems when used in code sections that access different
    resources. Example:

    ```
    def test_something(model_id, config_kwargs):
        with hub_online_once(model_id):
            model = ...from_pretrained(model_id)
            self.do_something_specific_with_model(model)
    ```
    It is assumed that `do_something_specific_with_model` is an abstract method that is implemented by several tests.
    Imagine the first test simply does `model.generate([1,2,3])`. The second call from another test suite, however,
    uses a tokenizer (`AutoTokenizer.from_pretrained(model_id)`) - this will fail since the first pass was online but
    didn't use the tokenizer and we're now in offline mode and cannot fetch the tokenizer. The recommended workaround
    is to extend the cache key (`model_id` passed to `hub_online_once` in this case) by something in case the
    tokenizer is used, so that these tests don't share a cache pool with the tests that don't use a tokenizer.

    It is best to avoid using this context manager in *yield* fixtures (normal fixtures are fine) as this is
    equivalent to wrapping the whole test in the context manager without explicitly writing it out, leading to
    unexpected `HF_HUB_OFFLINE` behavior in the test body.
    """
    global _HUB_MODEL_ACCESSES
    override = {}

    try:
        if model_id in _HUB_MODEL_ACCESSES:
            override = {"HF_HUB_OFFLINE": "1"}
            _HUB_MODEL_ACCESSES[model_id] += 1
        else:
            _HUB_MODEL_ACCESSES[model_id] = 0

        with (
            # strictly speaking it is not necessary to set the environment variable since most code that's out there
            # is evaluating it at import time and we'd have to reload the modules for it to take effect. It's
            # probably still a good idea to have it if there's some dynamic code that checks it.
            mock.patch.dict(os.environ, override),
            mock.patch("huggingface_hub.constants.HF_HUB_OFFLINE", override.get("HF_HUB_OFFLINE", False) == "1"),
            mock.patch("transformers.utils.hub._is_offline_mode", override.get("HF_HUB_OFFLINE", False) == "1"),
        ):
            yield
    except Exception:
        # in case of an error we have to assume that we didn't access the model properly from the hub
        # for the first time, so the next call cannot be considered cached.
        if _HUB_MODEL_ACCESSES.get(model_id) == 0:
            del _HUB_MODEL_ACCESSES[model_id]
        raise


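# Illustrative sketch only (hypothetical usage; the model id is just an example of a small hub
# checkpoint): the first context for a given id stays online and records the access, later contexts
# for the same id are forced offline and served from the local cache.
def _example_hub_online_once_usage():
    from transformers import AutoModelForCausalLM

    model_id = "hf-internal-testing/tiny-random-OPTForCausalLM"
    with hub_online_once(model_id):
        AutoModelForCausalLM.from_pretrained(model_id)  # may contact the hub
    with hub_online_once(model_id):
        AutoModelForCausalLM.from_pretrained(model_id)  # HF_HUB_OFFLINE patched to "1"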