Feat: Add rope scaling (#343)
* Feat: Add rope scaling
* fix: move rope config

Files changed:
- README.md +4 -0
- src/axolotl/utils/models.py +3 -1
README.md
```diff
@@ -474,6 +474,10 @@ landmark_attention:
 # xpos RoPE see https://github.com/kaiokendev/cutoff-len-is-context-len/blob/main/util/xpos_rope_llama_monkey_patch.py
 # llama only
 xpos_rope:
+# RoPE Scaling https://github.com/huggingface/transformers/pull/24653
+rope_scaling:
+  type: # linear | dynamic
+  factor: # float
 
 # resume from a specific checkpoint dir
 resume_from_checkpoint:
```
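For context: the two new keys are passed straight through as the `rope_scaling` dict that transformers PR #24653 added to `LlamaConfig`. A minimal sketch of the equivalent direct transformers usage (the model id here is illustrative, not part of this PR):

```python
from transformers import LlamaConfig, LlamaForCausalLM

# Illustrative model id; not taken from this PR.
base = "huggyllama/llama-7b"

# Equivalent of `rope_scaling: {type: linear, factor: 2.0}` in the axolotl
# config: linear scaling interpolates positions by 1/factor, stretching a
# 2048-token pretraining window to roughly 4096 tokens.
config = LlamaConfig.from_pretrained(
    base, rope_scaling={"type": "linear", "factor": 2.0}
)
model = LlamaForCausalLM.from_pretrained(base, config=config)
```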
src/axolotl/utils/models.py
```diff
@@ -219,7 +219,9 @@ def load_model(
     elif cfg.is_llama_derived_model and not cfg.trust_remote_code:
         from transformers import LlamaForCausalLM
 
-        config = LlamaConfig.from_pretrained(base_model_config)
+        config = LlamaConfig.from_pretrained(
+            base_model_config, rope_scaling=cfg.rope_scaling
+        )
         model = LlamaForCausalLM.from_pretrained(
             base_model,
             config=config,
```
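Since `LlamaConfig` defaults `rope_scaling` to `None`, passing `cfg.rope_scaling` through unconditionally is a no-op when the key is omitted from the YAML. A sketch of the three shapes the option can take (model id illustrative; as of this PR, transformers validates that `type` is `linear` or `dynamic` and that `factor` is a float greater than 1.0):

```python
from transformers import LlamaConfig

# Illustrative model id standing in for cfg.base_model_config.
base_model_config = "huggyllama/llama-7b"

for rope_scaling in (
    None,                                # key omitted in YAML: no scaling
    {"type": "linear", "factor": 2.0},   # position interpolation
    {"type": "dynamic", "factor": 2.0},  # dynamic NTK-aware scaling
):
    config = LlamaConfig.from_pretrained(base_model_config, rope_scaling=rope_scaling)
    print(config.rope_scaling)
```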