RxnIM / mllm/pipeline/finetune_mem.py
# Adopted from https://github.com/lm-sys/FastChat. Below is the original copyright:
# Adopted from tatsu-lab@stanford_alpaca. Below is the original copyright:
# Make it more memory efficient by monkey patching the LLaMA model with FlashAttn.
import sys
import pathlib
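
# Make the project root importable so that `mllm.*` modules resolve when this
# script is run directly rather than as an installed package.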
project_path = pathlib.Path(__file__).parent.parent.parent
sys.path.append(str(project_path))

# Need to call this before importing transformers.
from mllm.utils.llama_flash_attn_monkey_patch import replace_llama_attn_with_flash_attn

replace_llama_attn_with_flash_attn()

from mllm.pipeline.finetune import main

# noinspection PyUnusedLocal
def _mp_fn(index):
    # For xla_spawn (TPUs)
    main()


if __name__ == "__main__":
    main()