mirror of
https://github.com/wassname/SimPO.git
synced 2026-06-27 15:13:50 +08:00
Change the attention implementation argument
This commit is contained in:
@@ -213,7 +213,6 @@ def main():
|
||||
model_kwargs = dict(
|
||||
revision=model_args.model_revision,
|
||||
trust_remote_code=model_args.trust_remote_code,
|
||||
use_flash_attention_2=model_args.use_flash_attention_2,
|
||||
torch_dtype=torch_dtype,
|
||||
use_cache=False if training_args.gradient_checkpointing else True,
|
||||
device_map=get_kbit_device_map() if quantization_config is not None else None,
|
||||
|
||||
Reference in New Issue
Block a user