fix: use existing model config
This commit is contained in:
@@ -49,12 +49,9 @@ def do_linearize(cfg: DictDefault, cli_args: TrainerCliArgs) -> None:
|
|||||||
for p in model.parameters():
|
for p in model.parameters():
|
||||||
p.requires_grad = False
|
p.requires_grad = False
|
||||||
|
|
||||||
# load config
|
|
||||||
base_config = load_model_config(cfg)
|
|
||||||
|
|
||||||
# convert to linear llama
|
# convert to linear llama
|
||||||
linear_llama_config = LinearLlamaConfig.from_llama(
|
linear_llama_config = LinearLlamaConfig.from_llama(
|
||||||
base_config, cfg.attention_config
|
model.config, cfg.attention_config
|
||||||
)
|
)
|
||||||
model = LinearLlamaForCausalLM.from_llama(
|
model = LinearLlamaForCausalLM.from_llama(
|
||||||
model, config=linear_llama_config, train_attention=True
|
model, config=linear_llama_config, train_attention=True
|
||||||
|
|||||||
Reference in New Issue
Block a user