Remove stray debug print(n) from patch_flex_make_mask, add llama4 to the ChatTemplate enum in the schema, and bump peft from 0.15.0 to 0.15.1
This commit is contained in:
@@ -11,7 +11,7 @@ liger-kernel==0.5.5
|
|||||||
|
|
||||||
packaging==23.2
|
packaging==23.2
|
||||||
|
|
||||||
peft==0.15.0
|
peft==0.15.1
|
||||||
transformers==4.51.0
|
transformers==4.51.0
|
||||||
tokenizers>=0.21.1
|
tokenizers>=0.21.1
|
||||||
accelerate==1.6.0
|
accelerate==1.6.0
|
||||||
|
|||||||
@@ -162,7 +162,6 @@ def patch_flex_make_mask():
|
|||||||
for n in tuple(sys.modules):
|
for n in tuple(sys.modules):
|
||||||
if ".modeling_" in n and "llama4" not in n:
|
if ".modeling_" in n and "llama4" not in n:
|
||||||
if hasattr(sys.modules[n], "make_flex_block_causal_mask"):
|
if hasattr(sys.modules[n], "make_flex_block_causal_mask"):
|
||||||
print(n)
|
|
||||||
sys.modules[n].make_flex_block_causal_mask = (
|
sys.modules[n].make_flex_block_causal_mask = (
|
||||||
patched_make_flex_block_causal_mask
|
patched_make_flex_block_causal_mask
|
||||||
)
|
)
|
||||||
|
|||||||
@@ -26,6 +26,7 @@ class ChatTemplate(str, Enum):
|
|||||||
gemma = "gemma" # pylint: disable=invalid-name
|
gemma = "gemma" # pylint: disable=invalid-name
|
||||||
cohere = "cohere" # pylint: disable=invalid-name
|
cohere = "cohere" # pylint: disable=invalid-name
|
||||||
llama3 = "llama3" # pylint: disable=invalid-name
|
llama3 = "llama3" # pylint: disable=invalid-name
|
||||||
|
llama4 = "llama4" # pylint: disable=invalid-name
|
||||||
llama3_2_vision = "llama3_2_vision" # pylint: disable=invalid-name
|
llama3_2_vision = "llama3_2_vision" # pylint: disable=invalid-name
|
||||||
phi_3 = "phi_3" # pylint: disable=invalid-name
|
phi_3 = "phi_3" # pylint: disable=invalid-name
|
||||||
phi_35 = "phi_35" # pylint: disable=invalid-name
|
phi_35 = "phi_35" # pylint: disable=invalid-name
|
||||||
|
|||||||
Reference in New Issue
Block a user