Motif-Technologies
/

Motif-2.6B

Text Generation

text-generation-inference

Model card Files Files and versions

leejunhyeok committed on Jun 9

Commit

607612f

·

verified ·

1 Parent(s): 0d851ca

Update modeling_motif.py

Files changed (1) hide show

modeling_motif.py +6 -5

modeling_motif.py CHANGED Viewed

@@ -615,11 +615,12 @@ class MotifFlashAttention2(MotifAttention):
             cos, sin = (self.rotary_emb(value_states, q_len + past_key_value.get_usable_length(q_len, self.layer_idx))
                         if use_cache else position_embeddings)
-        query_states, key_states = apply_rotary_pos_emb(query_states,
-                                                        key_states,
-                                                        cos,
-                                                        sin,
-                                                        fused_rope=True)
         if past_key_value is not None:
             cache_kwargs = {"sin": sin, "cos": cos, "cache_position": cache_position}  # Specific to RoPE models

             cos, sin = (self.rotary_emb(value_states, q_len + past_key_value.get_usable_length(q_len, self.layer_idx))
                         if use_cache else position_embeddings)
+        query_states, key_states = apply_rotary_pos_emb(
+            query_states,
+            key_states,
+            cos,
+            sin
+        )
         if past_key_value is not None:
             cache_kwargs = {"sin": sin, "cos": cos, "cache_position": cache_position}  # Specific to RoPE models