CuMo-7b-zero / cumo /train /train_mem.py
jiachenl
update
c3f3b0b
raw
history blame
114 Bytes
from cumo.train.train import train
# Script entry point: start training only when this file is executed directly
# (e.g. `python train_mem.py ...`), never as a side effect of importing it.
if __name__ == "__main__":
    # Forward the attention-implementation choice to train() as a keyword.
    # NOTE(review): presumably this selects the FlashAttention-2 kernels and
    # requires the flash-attn package at runtime — confirm against train().
    train(attn_implementation="flash_attention_2")