
Commit

Remove xpos and llama-landmark [bad merge]
joecummings committed Jan 11, 2024
1 parent 3019d1f commit 7628056
Showing 2 changed files with 0 additions and 26 deletions.
7 changes: 0 additions & 7 deletions README.md
@@ -825,15 +825,8 @@ flash_attn_fuse_mlp: # Whether to fuse part of the MLP into a single operation
 # Whether to use scaled-dot-product attention
 # https://pytorch.org/docs/stable/generated/torch.nn.functional.scaled_dot_product_attention.html
 sdp_attention:
-# Landmark attention (only llama)
-landmark_attention:
 # Shifted-sparse attention (only llama)
 s2_attention:
-
-# xpos RoPE see https://github.com/kaiokendev/cutoff-len-is-context-len/blob/main/util/xpos_rope_llama_monkey_patch.py
-# LLaMA only
-xpos_rope:
-
 # Resume from a specific checkpoint dir
 resume_from_checkpoint:
 # If resume_from_checkpoint isn't set and you simply want it to start where it left off.
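
For reference, the scaled-dot-product and shifted-sparse attention keys documented above remain after this commit; only the landmark and xpos entries go away. A minimal sketch of how the surviving options might be toggled in an axolotl YAML config (the boolean values are illustrative assumptions; the key names come from the README excerpt above):

    # Illustrative sketch only: typically enable at most one attention option.
    sdp_attention: true    # use torch.nn.functional.scaled_dot_product_attention
    # s2_attention: true   # shifted-sparse attention (llama only)
    # landmark_attention: and xpos_rope: are removed by this commit and should no longer be set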
19 changes: 0 additions & 19 deletions src/axolotl/utils/models.py
@@ -299,30 +299,11 @@ def load_model(
 
             LOG.info("patching with sdp attention")
             hijack_llama_sdp_attention()
-        elif cfg.landmark_attention:
-            from axolotl.monkeypatch.llama_landmark_attn import (
-                MEM_TOKEN,
-                patch_llama_with_landmark_attn,
-            )
-
-            LOG.info("patching with landmark attention")
-            patch_llama_with_landmark_attn()
-
-            # Note: This might overwrite previous additional_special_tokens
-            tokenizer.add_special_tokens({"additional_special_tokens": [MEM_TOKEN]})
         elif cfg.s2_attention:
             raise NotImplementedError(
                 "Shifted-sparse attention not currently implemented without flash attention."
             )
 
-        if cfg.xpos_rope:
-            from axolotl.monkeypatch.xpos_rope_llama_monkey_patch import (
-                replace_llama_rope_with_xpos_rope,
-            )
-
-            LOG.info("patching with xpos rope")
-            replace_llama_rope_with_xpos_rope()
-
             LOG.info("patching with sdp attention")
             hijack_llama_sdp_attention()
 
