patches to make llama4 performant

This commit is contained in:
Wing Lian
2025-04-06 22:50:48 -04:00
parent 4b28b2a0b4
commit 37630fc6ef
10 changed files with 364 additions and 7 deletions

View File

@@ -6,7 +6,7 @@ triton>=3.0.0
mamba-ssm==1.2.0.post1
xformers>=0.0.23.post1
autoawq==0.2.7.post3
-liger-kernel==0.5.5
+liger-kernel==0.5.6
# END section
packaging==23.2