This commit is contained in:
parent
4ad2be2d34
commit
1e989784d3
|
|
@ -487,7 +487,7 @@ def main():
|
||||||
torch_dtype=dtype,
|
torch_dtype=dtype,
|
||||||
low_cpu_mem_usage=True,
|
low_cpu_mem_usage=True,
|
||||||
trust_remote_code=True,
|
trust_remote_code=True,
|
||||||
attn_implementation="flash_attention_2"
|
attn_implementation="sdpa"
|
||||||
)
|
)
|
||||||
|
|
||||||
print(f"GC enabled? {getattr(model, 'is_gradient_checkpointing', False)}", flush=True)
|
print(f"GC enabled? {getattr(model, 'is_gradient_checkpointing', False)}", flush=True)
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue