mirror of
https://github.com/wassname/SimPO.git
synced 2026-06-27 16:43:59 +08:00
change attn implementation arg
This commit is contained in:
@@ -213,7 +213,6 @@ def main():
|
|||||||
model_kwargs = dict(
|
model_kwargs = dict(
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
trust_remote_code=model_args.trust_remote_code,
|
trust_remote_code=model_args.trust_remote_code,
|
||||||
use_flash_attention_2=model_args.use_flash_attention_2,
|
|
||||||
torch_dtype=torch_dtype,
|
torch_dtype=torch_dtype,
|
||||||
use_cache=False if training_args.gradient_checkpointing else True,
|
use_cache=False if training_args.gradient_checkpointing else True,
|
||||||
device_map=get_kbit_device_map() if quantization_config is not None else None,
|
device_map=get_kbit_device_map() if quantization_config is not None else None,
|
||||||
|
|||||||
Reference in New Issue
Block a user