LLaMA-3-V / llava /train /train_xformers.py
mmaaz60's picture
Adds code to host LLaVA-LLaMA-3 demo on HF space.
143d7a9
raw
history blame contribute delete
No virus
366 Bytes
# Training entry point that makes LLaMA more memory efficient by monkey
# patching the model with xformers attention.
#
# The patch needs to be applied before transformers is imported, so the
# statement order below is deliberate: import the patch helper, apply it, and
# only then import the training code. Do not regroup these imports at the top.
from llava.train.llama_xformers_attn_monkey_patch import (
    replace_llama_attn_with_xformers_attn,
)

replace_llama_attn_with_xformers_attn()

# Imported after the patch on purpose (presumably this module pulls in
# transformers -- confirm before moving it).
from llava.train.train import train  # noqa: E402

if __name__ == "__main__":
    # Only start training when executed as a script, not when imported.
    train()