granite chat multipack support and example
This commit is contained in:
@@ -36,6 +36,8 @@ SUPPORTED_MULTIPACK_MODEL_TYPES = [
|
|||||||
"glm",
|
"glm",
|
||||||
"glm4",
|
"glm4",
|
||||||
"smollm3",
|
"smollm3",
|
||||||
|
"granite",
|
||||||
|
"granitemoe",
|
||||||
]
|
]
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
@@ -644,6 +644,19 @@ class LoRAValidationMixin:
|
|||||||
)
|
)
|
||||||
return data
|
return data
|
||||||
|
|
||||||
|
@model_validator(mode="before")
@classmethod
def check_lora_dropout_parameters(cls, data):
    """Reject a positive `lora_dropout` combined with `lora_target_parameters`.

    Args:
        data: Raw config mapping passed to the model before field validation.

    Returns:
        The same `data` object, unmodified, so validation can continue.

    Raises:
        ValueError: If `lora_dropout` is greater than 0 while
            `lora_target_parameters` is set.
    """
    # A missing or explicitly-null `lora_dropout` is treated as 0.0.
    lora_dropout = data.get("lora_dropout") or 0.0
    if lora_dropout > 0.0 and data.get("lora_target_parameters"):
        # lora.ParamWrapper does not work with lora_dropout != 0
        raise ValueError(
            "`lora_dropout` does not work when using `lora_target_parameters`"
        )
    # A "before" validator must hand the input back; returning None here
    # would replace the whole config with None for the rest of validation.
    return data
|
||||||
|
|
||||||
|
|
||||||
class RLValidationMixin:
|
class RLValidationMixin:
|
||||||
"""Validation methods related to RL training configuration."""
|
"""Validation methods related to RL training configuration."""
|
||||||
|
|||||||
Reference in New Issue
Block a user