Don't divide the delta by `scaling` before the low-rank decomposition
This commit is contained in:
@@ -134,7 +134,7 @@ def decompose_delta_weight(layer_weight, avg_weight, alpha, rank):
|
|||||||
|
|
||||||
delta_first_pass = final_weight - base_weight
|
delta_first_pass = final_weight - base_weight
|
||||||
|
|
||||||
delta_for_svd = delta_first_pass / scaling
|
delta_for_svd = delta_first_pass
|
||||||
|
|
||||||
# 3. Low-rank factorization of the delta direction
|
# 3. Low-rank factorization of the delta direction
|
||||||
lora_A, lora_B = low_rank_decomposition(delta_for_svd, rank)
|
lora_A, lora_B = low_rank_decomposition(delta_for_svd, rank)
|
||||||
|
|||||||
Reference in New Issue
Block a user