Skip to content

Commit 81beafc

Browse files
authored
Adapt transformers v4.57.0 (#2305)
Signed-off-by: Kaihui-intel <[email protected]>
1 parent 74218cf commit 81beafc

File tree

1 file changed

+2 -2 lines changed (2 additions, 2 deletions)

1 file changed

+2
-2
lines changed

neural_compressor/transformers/models/modeling_auto.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -745,13 +745,13 @@ def load_low_bit(cls, pretrained_model_name_or_path, *model_args, **kwargs):
745745
tmp_kwargs = {
746746
"sharded_metadata": sharded_metadata,
747747
"disk_offload_folder": offload_folder,
748-
"offload_state_dict": offload_state_dict,
749748
"dtype": torch_dtype,
750749
}
750+
if parse(transformers.__version__) < parse("4.57"):
751+
tmp_kwargs["offload_state_dict"] = offload_state_dict
751752
if parse(transformers.__version__) < parse("4.51"):
752753
tmp_kwargs["_fast_init"] = _fast_init
753754
tmp_kwargs["low_cpu_mem_usage"] = True
754-
755755
model_message = model_class._load_pretrained_model(*tmp_args, **tmp_kwargs)
756756
model = model_message[0]
757757

0 commit comments

Comments (0)