-
Notifications
You must be signed in to change notification settings - Fork 2.5k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
[
enh
] Add Support for multiple adapters on Transformers-based models (
#3046) * Support adapters on SentenceTransformer * Add transformer model check + add testing * Update ValueError text slightly; use self[0]; slight format changes * Upload stsb-bert-tiny-lora and extend tests --------- Co-authored-by: Carles Onielfa <[email protected]>
- Loading branch information
1 parent
6baee57
commit 7ede83b
Showing
3 changed files
with
214 additions
and
4 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,143 @@ | ||
from __future__ import annotations | ||
|
||
from functools import wraps | ||
|
||
from transformers.integrations.peft import PeftAdapterMixin as PeftAdapterMixinTransformers | ||
|
||
from .models import Transformer | ||
|
||
|
||
def peft_wrapper(func): | ||
"""Wrapper to call the method on the auto_model with a check for PEFT compatibility.""" | ||
|
||
@wraps(func) | ||
def wrapper(self, *args, **kwargs): | ||
self.check_peft_compatible_model() | ||
method = getattr(self[0].auto_model, func.__name__) | ||
return method(*args, **kwargs) | ||
|
||
return wrapper | ||
|
||
|
||
class PeftAdapterMixin: | ||
""" | ||
Wrapper Mixin that adds the functionality to easily load and use adapters on the model. For | ||
more details about adapters check out the documentation of PEFT | ||
library: https://huggingface.co/docs/peft/index | ||
Currently supported PEFT methods follow those supported by transformers library, | ||
you can find more information on: | ||
https://huggingface.co/docs/transformers/main/en/peft#transformers.integrations.PeftAdapterMixin | ||
""" | ||
|
||
def has_peft_compatible_model(self) -> bool: | ||
return isinstance(self[0], Transformer) and isinstance(self[0].auto_model, PeftAdapterMixinTransformers) | ||
|
||
def check_peft_compatible_model(self) -> None: | ||
if not self.has_peft_compatible_model(): | ||
raise ValueError( | ||
"PEFT methods are only supported for Sentence Transformer models that use the Transformer module." | ||
) | ||
|
||
@peft_wrapper | ||
def load_adapter(self, *args, **kwargs) -> None: | ||
""" | ||
Load adapter weights from file or remote Hub folder." If you are not familiar with adapters and PEFT methods, we | ||
invite you to read more about them on PEFT official documentation: https://huggingface.co/docs/peft | ||
Requires peft as a backend to load the adapter weights and the underlying model to be compatible with PEFT. | ||
Args: | ||
*args: | ||
Positional arguments to pass to the underlying AutoModel `load_adapter` function. More information can be found in the transformers documentation | ||
https://huggingface.co/docs/transformers/main/en/peft#transformers.integrations.PeftAdapterMixin.load_adapter | ||
**kwargs: | ||
Keyword arguments to pass to the underlying AutoModel `load_adapter` function. More information can be found in the transformers documentation | ||
https://huggingface.co/docs/transformers/main/en/peft#transformers.integrations.PeftAdapterMixin.load_adapter | ||
""" | ||
... # Implementation handled by the wrapper | ||
|
||
@peft_wrapper | ||
def add_adapter(self, *args, **kwargs) -> None: | ||
""" | ||
Adds a fresh new adapter to the current model for training purposes. If no adapter name is passed, a default | ||
name is assigned to the adapter to follow the convention of PEFT library (in PEFT we use "default" as the | ||
default adapter name). | ||
Requires peft as a backend to load the adapter weights and the underlying model to be compatible with PEFT. | ||
Args: | ||
*args: | ||
Positional arguments to pass to the underlying AutoModel `add_adapter` function. More information can be found in the transformers documentation | ||
https://huggingface.co/docs/transformers/main/en/peft#transformers.integrations.PeftAdapterMixin.add_adapter | ||
**kwargs: | ||
Keyword arguments to pass to the underlying AutoModel `add_adapter` function. More information can be found in the transformers documentation | ||
https://huggingface.co/docs/transformers/main/en/peft#transformers.integrations.PeftAdapterMixin.add_adapter | ||
""" | ||
... # Implementation handled by the wrapper | ||
|
||
@peft_wrapper | ||
def set_adapter(self, *args, **kwargs) -> None: | ||
""" | ||
Sets a specific adapter by forcing the model to use a that adapter and disable the other adapters. | ||
Args: | ||
*args: | ||
Positional arguments to pass to the underlying AutoModel `set_adapter` function. More information can be found in the transformers documentation | ||
https://huggingface.co/docs/transformers/main/en/peft#transformers.integrations.PeftAdapterMixin.set_adapter | ||
**kwargs: | ||
Keyword arguments to pass to the underlying AutoModel `set_adapter` function. More information can be found in the transformers documentation | ||
https://huggingface.co/docs/transformers/main/en/peft#transformers.integrations.PeftAdapterMixin.set_adapter | ||
""" | ||
... # Implementation handled by the wrapper | ||
|
||
@peft_wrapper | ||
def disable_adapters(self) -> None: | ||
""" | ||
Disable all adapters that are attached to the model. This leads to inferring with the base model only. | ||
""" | ||
... # Implementation handled by the wrapper | ||
|
||
@peft_wrapper | ||
def enable_adapters(self) -> None: | ||
""" | ||
Enable adapters that are attached to the model. The model will use `self.active_adapter()` | ||
""" | ||
... # Implementation handled by the wrapper | ||
|
||
@peft_wrapper | ||
def active_adapters(self) -> list[str]: | ||
""" | ||
If you are not familiar with adapters and PEFT methods, we invite you to read more about them on the PEFT | ||
official documentation: https://huggingface.co/docs/peft | ||
Gets the current active adapters of the model. In case of multi-adapter inference (combining multiple adapters | ||
for inference) returns the list of all active adapters so that users can deal with them accordingly. | ||
For previous PEFT versions (that does not support multi-adapter inference), `module.active_adapter` will return | ||
a single string. | ||
""" | ||
... # Implementation handled by the wrapper | ||
|
||
@peft_wrapper | ||
def active_adapter(self) -> str: ... # Implementation handled by the wrapper | ||
|
||
@peft_wrapper | ||
def get_adapter_state_dict(self, *args, **kwargs) -> dict: | ||
""" | ||
If you are not familiar with adapters and PEFT methods, we invite you to read more about them on the PEFT | ||
official documentation: https://huggingface.co/docs/peft | ||
Gets the adapter state dict that should only contain the weights tensors of the specified adapter_name adapter. | ||
If no adapter_name is passed, the active adapter is used. | ||
Args: | ||
*args: | ||
Positional arguments to pass to the underlying AutoModel `get_adapter_state_dict` function. More information can be found in the transformers documentation | ||
https://huggingface.co/docs/transformers/main/en/peft#transformers.integrations.PeftAdapterMixin.get_adapter_state_dict | ||
**kwargs: | ||
Keyword arguments to pass to the underlying AutoModel `get_adapter_state_dict` function. More information can be found in the transformers documentation | ||
https://huggingface.co/docs/transformers/main/en/peft#transformers.integrations.PeftAdapterMixin.get_adapter_state_dict | ||
""" | ||
... # Implementation handled by the wrapper |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters