Skip to content

Commit

Permalink
attn one kv
Browse files Browse the repository at this point in the history
  • Loading branch information
Kye committed Aug 28, 2023
1 parent c37d1cb commit 72cf984
Show file tree
Hide file tree
Showing 2 changed files with 13 additions and 24 deletions.
35 changes: 12 additions & 23 deletions Andromeda/configs.py
Original file line number Diff line number Diff line change
Expand Up @@ -12,9 +12,8 @@
 alibi_pos_bias=True,
 alibi_num_heads=4,
 rotary_xpos=True,
-attn_flash=True,
-# shift_tokens=1,
-attn_one_kv_head=True,
+attn_flash=True,
+attn_kv_heads = 2,
 qk_norm=True,
 attn_qk_norm=True,
 attn_qk_norm_dim_scale=True,
Expand All @@ -32,10 +31,8 @@
 use_abs_pos_emb=False,
 alibi_pos_bias=True,
 alibi_num_heads=6,
-rotary_xpos=True,
-attn_flash=True,
-shift_tokens=1,
-attn_one_kv_head=True,
+rotary_xpos=True,
+attn_kv_heads = 2,
 qk_norm=True,
 attn_qk_norm=True,
 attn_qk_norm_dim_scale=True,
Expand All @@ -53,10 +50,8 @@
 use_abs_pos_emb=False,
 alibi_pos_bias=True,
 alibi_num_heads=8,
-rotary_xpos=True,
-attn_flash=True,
-shift_tokens=1,
-attn_one_kv_head=True,
+rotary_xpos=True,
+attn_kv_heads = 2,
 qk_norm=True,
 attn_qk_norm=True,
 attn_qk_norm_dim_scale=True,
Expand All @@ -72,10 +67,8 @@
 use_abs_pos_emb=False,
 alibi_pos_bias=True,
 alibi_num_heads=4,
-rotary_xpos=True,
-attn_flash=True,
-shift_tokens=1,
-attn_one_kv_head=True,
+rotary_xpos=True,
+attn_kv_heads = 2,
 qk_norm=True,
 attn_qk_norm=True,
 attn_qk_norm_dim_scale=True,
Expand All @@ -91,10 +84,8 @@
 use_abs_pos_emb=False,
 alibi_pos_bias=True,
 alibi_num_heads=4,
-rotary_xpos=True,
-attn_flash=True,
-shift_tokens=1,
-attn_one_kv_head=True,
+rotary_xpos=True,
+attn_kv_heads = 2,
 qk_norm=True,
 attn_qk_norm=True,
 attn_qk_norm_dim_scale=True,
Expand All @@ -110,10 +101,8 @@
 use_abs_pos_emb=False,
 alibi_pos_bias=True,
 alibi_num_heads=4,
-rotary_xpos=True,
-attn_flash=True,
-shift_tokens=1,
-attn_one_kv_head=True,
+rotary_xpos=True,
+attn_kv_heads = 2,
 qk_norm=True,
 attn_qk_norm=True,
 attn_qk_norm_dim_scale=True,
Expand Down
2 changes: 1 addition & 1 deletion Andromeda/model.py
Original file line number Diff line number Diff line change
Expand Up @@ -48,7 +48,7 @@ def __init__(self,
 alibi_num_heads=12,
 rotary_xpos=True,
 attn_flash=True,
-attn_kv_heads = 2,
+attn_kv_heads = 2,
 qk_norm=True,
 attn_qk_norm=True,
 attn_qk_norm_dim_scale=True,
Expand Down

0 comments on commit 72cf984

Please sign in to comment.