-
Notifications
You must be signed in to change notification settings - Fork 48
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Install Acceleration Framework into Training Script (#157)
* add acceleration framework Signed-off-by: Yu Chin Fabian Lim <[email protected]> * framework can add callbacks Signed-off-by: Yu Chin Fabian Lim <[email protected]> * add basic acceleration framework unit tests, lint. Signed-off-by: Yu Chin Fabian Lim <[email protected]> * add README, plugin installation tool Signed-off-by: Yu Chin Fabian Lim <[email protected]> * updates to readme Signed-off-by: Yu Chin Fabian Lim <[email protected]> * more readme updates Signed-off-by: Yu Chin Fabian Lim <[email protected]> * update fms-accel dep Signed-off-by: Yu Chin Fabian Lim <[email protected]> * add more tests Signed-off-by: Yu Chin Fabian Lim <[email protected]> * fixes after rebase + linting Signed-off-by: Yu Chin Fabian Lim <[email protected]> * make acceleration framework tests a module and lint,fmt. Signed-off-by: Yu Chin Fabian Lim <[email protected]> * clarify the usages flows Signed-off-by: Yu Chin Fabian Lim <[email protected]> * replace yaml with dataclass args Signed-off-by: Yu Chin Fabian Lim <[email protected]> * fmt + lint Signed-off-by: Yu Chin Fabian Lim <[email protected]> * improve tests Signed-off-by: Yu Chin Fabian Lim <[email protected]> * test fixes Signed-off-by: Yu Chin Fabian Lim <[email protected]> * improve data parsing logic Signed-off-by: Yu Chin Fabian Lim <[email protected]> * add foak test Signed-off-by: Yu Chin Fabian Lim <[email protected]> * fix bug and add bnb test Signed-off-by: Yu Chin Fabian Lim <[email protected]> * add missing peft config test Signed-off-by: Yu Chin Fabian Lim <[email protected]> * update README as per @Ssukriti's suggestions. Signed-off-by: Yu Chin Fabian Lim <[email protected]> * remove test helpers Signed-off-by: Yu Chin Fabian Lim <[email protected]> * fix merge errors and other issues Signed-off-by: Yu Chin Fabian Lim <[email protected]> * add one more check in get_framework and other fixes. Signed-off-by: Yu Chin Fabian Lim <[email protected]> * fix tests Signed-off-by: Yu Chin Fabian Lim <[email protected]> --------- Signed-off-by: Yu Chin Fabian Lim <[email protected]>
- Loading branch information
Showing
14 changed files
with
1,368 additions
and
6 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,13 @@ | ||
# Copyright The FMS HF Tuning Authors | ||
# | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# | ||
# http://www.apache.org/licenses/LICENSE-2.0 | ||
# | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,47 @@ | ||
# Copyright The FMS HF Tuning Authors | ||
# | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# | ||
# http://www.apache.org/licenses/LICENSE-2.0 | ||
# | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. | ||
|
||
|
||
def create_mock_plugin_class_and_spy(class_name, plugin_cls): | ||
"helper function to create plugin class" | ||
|
||
spy = { | ||
"model_loader_calls": 0, | ||
"augmentation_calls": 0, | ||
"get_ready_for_train_calls": 0, | ||
} | ||
|
||
def model_loader(self, *args, **kwargs): | ||
spy["model_loader_calls"] += 1 | ||
return plugin_cls.model_loader(self, *args, **kwargs) | ||
|
||
def augmentation( | ||
self, | ||
*args, | ||
**kwargs, | ||
): | ||
spy["augmentation_calls"] += 1 | ||
return plugin_cls.augmentation(self, *args, **kwargs) | ||
|
||
def get_callbacks_and_ready_for_train(self, *args, **kwargs): | ||
spy["get_ready_for_train_calls"] += 1 | ||
return plugin_cls.get_callbacks_and_ready_for_train(self, args, **kwargs) | ||
|
||
attributes = { | ||
"model_loader": model_loader, | ||
"augmentation": augmentation, | ||
"get_callbacks_and_ready_for_train": get_callbacks_and_ready_for_train, | ||
} | ||
|
||
return type(class_name, (plugin_cls,), attributes), spy |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,135 @@ | ||
# Copyright The FMS HF Tuning Authors | ||
# | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# | ||
# http://www.apache.org/licenses/LICENSE-2.0 | ||
# | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. | ||
|
||
# Standard | ||
|
||
# Third Party | ||
import pytest | ||
import transformers | ||
|
||
# Local | ||
from tuning.config.acceleration_configs import ( | ||
FusedOpsAndKernelsConfig, | ||
QuantizedLoraConfig, | ||
) | ||
from tuning.config.acceleration_configs.fused_ops_and_kernels import ( | ||
FastKernelsConfig, | ||
FusedLoraConfig, | ||
) | ||
from tuning.config.acceleration_configs.quantized_lora_config import ( | ||
AutoGPTQLoraConfig, | ||
BNBQLoraConfig, | ||
) | ||
|
||
|
||
def test_dataclass_parse_successfully(): | ||
parser = transformers.HfArgumentParser(dataclass_types=QuantizedLoraConfig) | ||
|
||
# if nothing is specified then it will parse into the null class | ||
(cfg, _) = parser.parse_args_into_dataclasses(return_remaining_strings=True) | ||
assert cfg.auto_gptq is None | ||
assert cfg.bnb_qlora is None | ||
|
||
# 1.1 specifying "--auto_gptq" with the first item of AutoGPTQLoraConfig | ||
# will parse | ||
(cfg,) = parser.parse_args_into_dataclasses( | ||
["--auto_gptq", "triton_v2"], | ||
) | ||
assert isinstance(cfg.auto_gptq, AutoGPTQLoraConfig) | ||
assert cfg.bnb_qlora is None | ||
|
||
# 1.2 specifying "--auto_gptq" with the two items of AutoGPTQLoraConfig | ||
# will parse | ||
(cfg,) = parser.parse_args_into_dataclasses( | ||
["--auto_gptq", "triton_v2", "true"], | ||
) | ||
assert isinstance(cfg.auto_gptq, AutoGPTQLoraConfig) | ||
assert cfg.bnb_qlora is None | ||
|
||
# 2. specifying "--bnb_qlora" with the first item of BNBQLoraConfig | ||
# will parse | ||
(cfg,) = parser.parse_args_into_dataclasses( | ||
["--bnb_qlora", "nf4"], | ||
) | ||
assert cfg.auto_gptq is None | ||
assert isinstance(cfg.bnb_qlora, BNBQLoraConfig) | ||
|
||
|
||
def test_two_dataclasses_parse_successfully_together(): | ||
"""Ensure that the two dataclasses can parse arguments successfully | ||
together. | ||
""" | ||
parser = transformers.HfArgumentParser( | ||
dataclass_types=(QuantizedLoraConfig, FusedOpsAndKernelsConfig) | ||
) | ||
|
||
# 1. specifying "--auto_gptq" together with "--fused_lora" and | ||
# "--fast_kernels" will parse. | ||
cfg, cfg2 = parser.parse_args_into_dataclasses( | ||
[ | ||
"--auto_gptq", | ||
"triton_v2", | ||
"--fused_lora", | ||
"auto_gptq", | ||
"true", | ||
"--fast_kernels", | ||
"true", | ||
"true", | ||
"true", | ||
], | ||
) | ||
assert isinstance(cfg.auto_gptq, AutoGPTQLoraConfig) | ||
assert cfg.bnb_qlora is None | ||
assert isinstance(cfg2.fused_lora, FusedLoraConfig) | ||
assert isinstance(cfg2.fast_kernels, FastKernelsConfig) | ||
|
||
|
||
def test_dataclass_will_fail_to_parse_with_no_args(): | ||
"""Ensure that the dataclass arg parser will refuse to parse if | ||
only the key is specified without any following arguments. | ||
""" | ||
parser = transformers.HfArgumentParser(dataclass_types=QuantizedLoraConfig) | ||
|
||
# 1. passing only the key without any body will fail | ||
# - at least the first argument of the dataclass will be expected. | ||
with pytest.raises( | ||
SystemExit, # argparse will exit | ||
): | ||
(_,) = parser.parse_args_into_dataclasses( | ||
["--auto_gptq"], | ||
) | ||
|
||
|
||
def test_dataclass_will_fail_to_accept_illegal_args(): | ||
"""Ensure that some basic rules that are put in the dataclasses will | ||
fail at initialization of the class. | ||
""" | ||
|
||
# 1. auto_gptq does not support from_quantized at the moment. | ||
with pytest.raises( | ||
ValueError, match="only 'from_quantized' == True currently supported." | ||
): | ||
AutoGPTQLoraConfig(from_quantized=False) | ||
|
||
# 1.1 auto_gptq only supports triton_v2 at the moment | ||
with pytest.raises( | ||
ValueError, match="only 'triton_v2' kernel currently supported." | ||
): | ||
AutoGPTQLoraConfig(kernel="fake-kernel") | ||
|
||
# 2 bnb only supports two quant types | ||
with pytest.raises( | ||
ValueError, match="quant_type can only be either 'nf4' or 'fp4." | ||
): | ||
BNBQLoraConfig(quant_type="fake-quant-type") |
Oops, something went wrong.