mirror of
https://github.com/lilakk/BLEUBERI.git
synced 2026-04-19 12:58:12 +00:00
13 lines
372 B
Python
13 lines
372 B
Python
"""Launch FastChat training with xformers attention patched into LLaMA.

The LLaMA attention implementation is monkey patched with the xformers
variant to make training more memory efficient.
"""

# The patch has to be applied before transformers is imported, so this import
# and the call right below it must stay ahead of every other import here.
from fastchat.train.llama_xformers_attn_monkey_patch import replace_llama_attn_with_xformers_attn

replace_llama_attn_with_xformers_attn()

# Deliberately placed after the patch call (presumably this module pulls in
# transformers); do not let an import sorter hoist it to the top of the file.
from fastchat.train.train import train  # noqa: E402

if __name__ == "__main__":
    # Run the regular FastChat training entry point, now using the patched attention.
    train()
|