
Commit 5d5af74

sayakpaul and linoytsaban authored and committed
[training] use the lr when using 8bit adam. (#9796)
* use the lr when using 8bit adam.

* remove lr as we pack it in params_to_optimize.

--------

Co-authored-by: Linoy Tsaban <[email protected]>
1 parent 3e12251 commit 5d5af74

11 files changed (+6, −33 lines)
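Why dropping the keyword is safe: each entry in params_to_optimize is a PyTorch param-group dict that already carries its own "lr" key, and a group's own "lr" takes precedence over the optimizer-level lr= argument, which only acts as a default for groups that omit it. Once every group packs a learning rate, lr=args.learning_rate is redundant. A minimal sketch of that mechanism, using plain torch.optim.AdamW and illustrative values rather than the training scripts themselves:

```python
# Minimal sketch: per-group "lr" entries override the optimizer-level
# default, so the lr= kwarg adds nothing once every group carries one.
import torch

transformer = torch.nn.Linear(8, 8)
text_encoder = torch.nn.Linear(8, 8)

# Mirrors how the scripts build params_to_optimize (values illustrative).
params_to_optimize = [
    {"params": transformer.parameters(), "lr": 1e-4},
    {"params": text_encoder.parameters(), "lr": 5e-5},
]

# No lr= here: each group's own "lr" is what the optimizer actually uses.
optimizer = torch.optim.AdamW(params_to_optimize, betas=(0.9, 0.999))

print([group["lr"] for group in optimizer.param_groups])  # [0.0001, 5e-05]
```

The same precedence rule is what lets the 8-bit Adam path in the first diff below set the last group's "lr" directly instead of relying on the keyword.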

examples/advanced_diffusion_training/train_dreambooth_lora_flux_advanced.py

Lines changed: 3 additions & 11 deletions
@@ -1778,15 +1778,10 @@ def load_model_hook(models, input_dir):
         if not args.enable_t5_ti:
             # pure textual inversion - only clip
             if pure_textual_inversion:
-                params_to_optimize = [
-                    text_parameters_one_with_lr,
-                ]
+                params_to_optimize = [text_parameters_one_with_lr]
                 te_idx = 0
             else:  # regular te training or regular pivotal for clip
-                params_to_optimize = [
-                    transformer_parameters_with_lr,
-                    text_parameters_one_with_lr,
-                ]
+                params_to_optimize = [transformer_parameters_with_lr, text_parameters_one_with_lr]
                 te_idx = 1
         elif args.enable_t5_ti:
             # pivotal tuning of clip & t5
@@ -1809,9 +1804,7 @@ def load_model_hook(models, input_dir):
             ]
             te_idx = 1
         else:
-            params_to_optimize = [
-                transformer_parameters_with_lr,
-            ]
+            params_to_optimize = [transformer_parameters_with_lr]
 
     # Optimizer creation
     if not (args.optimizer.lower() == "prodigy" or args.optimizer.lower() == "adamw"):
@@ -1871,7 +1864,6 @@ def load_model_hook(models, input_dir):
             params_to_optimize[-1]["lr"] = args.learning_rate
         optimizer = optimizer_class(
             params_to_optimize,
-            lr=args.learning_rate,
             betas=(args.adam_beta1, args.adam_beta2),
             beta3=args.prodigy_beta3,
             weight_decay=args.adam_weight_decay,
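For orientation, a hedged sketch of the optimizer-selection branch these hunks sit in. The use_8bit_adam flag and bnb.optim.AdamW8bit follow the usual pattern in these scripts but are assumed here rather than shown in the diff; the standalone harness below is illustrative only:

```python
# Hedged sketch of the branch around the hunks above; args is a stand-in
# for the scripts' argparse namespace, and the bitsandbytes import is
# only exercised when use_8bit_adam is True.
import torch
from types import SimpleNamespace

args = SimpleNamespace(
    optimizer="adamw",
    use_8bit_adam=False,  # set True with bitsandbytes installed
    learning_rate=1e-4,
    adam_beta1=0.9,
    adam_beta2=0.999,
    adam_weight_decay=1e-2,
    adam_epsilon=1e-8,
)

if args.optimizer.lower() == "adamw" and args.use_8bit_adam:
    import bitsandbytes as bnb  # requires a CUDA-enabled bitsandbytes build

    optimizer_class = bnb.optim.AdamW8bit
else:
    optimizer_class = torch.optim.AdamW

# As in the diff: the learning rate travels inside the param-group dicts,
# not as a separate lr= keyword argument.
params_to_optimize = [
    {"params": torch.nn.Linear(4, 4).parameters(), "lr": args.learning_rate}
]
optimizer = optimizer_class(
    params_to_optimize,
    betas=(args.adam_beta1, args.adam_beta2),
    weight_decay=args.adam_weight_decay,
    eps=args.adam_epsilon,
)
```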

examples/advanced_diffusion_training/train_dreambooth_lora_sd15_advanced.py

Lines changed: 1 addition & 5 deletions
@@ -1358,10 +1358,7 @@ def load_model_hook(models, input_dir):
             else args.adam_weight_decay,
             "lr": args.text_encoder_lr if args.text_encoder_lr else args.learning_rate,
         }
-        params_to_optimize = [
-            unet_lora_parameters_with_lr,
-            text_lora_parameters_one_with_lr,
-        ]
+        params_to_optimize = [unet_lora_parameters_with_lr, text_lora_parameters_one_with_lr]
     else:
         params_to_optimize = [unet_lora_parameters_with_lr]
 
@@ -1423,7 +1420,6 @@ def load_model_hook(models, input_dir):
 
         optimizer = optimizer_class(
             params_to_optimize,
-            lr=args.learning_rate,
             betas=(args.adam_beta1, args.adam_beta2),
             beta3=args.prodigy_beta3,
             weight_decay=args.adam_weight_decay,

examples/advanced_diffusion_training/train_dreambooth_lora_sdxl_advanced.py

Lines changed: 0 additions & 1 deletion
@@ -1794,7 +1794,6 @@ def load_model_hook(models, input_dir):
 
         optimizer = optimizer_class(
             params_to_optimize,
-            lr=args.learning_rate,
             betas=(args.adam_beta1, args.adam_beta2),
             beta3=args.prodigy_beta3,
             weight_decay=args.adam_weight_decay,

examples/cogvideo/train_cogvideox_image_to_video_lora.py

Lines changed: 0 additions & 1 deletion
@@ -947,7 +947,6 @@ def get_optimizer(args, params_to_optimize, use_deepspeed: bool = False):
 
         optimizer = optimizer_class(
            params_to_optimize,
-            lr=args.learning_rate,
             betas=(args.adam_beta1, args.adam_beta2),
             beta3=args.prodigy_beta3,
             weight_decay=args.adam_weight_decay,

examples/cogvideo/train_cogvideox_lora.py

Lines changed: 0 additions & 1 deletion
@@ -969,7 +969,6 @@ def get_optimizer(args, params_to_optimize, use_deepspeed: bool = False):
 
         optimizer = optimizer_class(
            params_to_optimize,
-            lr=args.learning_rate,
             betas=(args.adam_beta1, args.adam_beta2),
             beta3=args.prodigy_beta3,
             weight_decay=args.adam_weight_decay,

examples/dreambooth/train_dreambooth_flux.py

Lines changed: 1 addition & 5 deletions
@@ -1226,10 +1226,7 @@ def load_model_hook(models, input_dir):
             "weight_decay": args.adam_weight_decay_text_encoder,
             "lr": args.text_encoder_lr if args.text_encoder_lr else args.learning_rate,
         }
-        params_to_optimize = [
-            transformer_parameters_with_lr,
-            text_parameters_one_with_lr,
-        ]
+        params_to_optimize = [transformer_parameters_with_lr, text_parameters_one_with_lr]
     else:
         params_to_optimize = [transformer_parameters_with_lr]
 
@@ -1291,7 +1288,6 @@ def load_model_hook(models, input_dir):
 
         optimizer = optimizer_class(
             params_to_optimize,
-            lr=args.learning_rate,
             betas=(args.adam_beta1, args.adam_beta2),
             beta3=args.prodigy_beta3,
             weight_decay=args.adam_weight_decay,

examples/dreambooth/train_dreambooth_lora_flux.py

Lines changed: 1 addition & 5 deletions
@@ -1335,10 +1335,7 @@ def load_model_hook(models, input_dir):
             "weight_decay": args.adam_weight_decay_text_encoder,
             "lr": args.text_encoder_lr if args.text_encoder_lr else args.learning_rate,
         }
-        params_to_optimize = [
-            transformer_parameters_with_lr,
-            text_parameters_one_with_lr,
-        ]
+        params_to_optimize = [transformer_parameters_with_lr, text_parameters_one_with_lr]
     else:
         params_to_optimize = [transformer_parameters_with_lr]
 
@@ -1400,7 +1397,6 @@ def load_model_hook(models, input_dir):
 
         optimizer = optimizer_class(
             params_to_optimize,
-            lr=args.learning_rate,
             betas=(args.adam_beta1, args.adam_beta2),
             beta3=args.prodigy_beta3,
             weight_decay=args.adam_weight_decay,

examples/dreambooth/train_dreambooth_lora_sd3.py

Lines changed: 0 additions & 1 deletion
@@ -1468,7 +1468,6 @@ def load_model_hook(models, input_dir):
 
         optimizer = optimizer_class(
             params_to_optimize,
-            lr=args.learning_rate,
             betas=(args.adam_beta1, args.adam_beta2),
             beta3=args.prodigy_beta3,
             weight_decay=args.adam_weight_decay,

examples/dreambooth/train_dreambooth_lora_sdxl.py

Lines changed: 0 additions & 1 deletion
@@ -1402,7 +1402,6 @@ def load_model_hook(models, input_dir):
 
         optimizer = optimizer_class(
             params_to_optimize,
-            lr=args.learning_rate,
             betas=(args.adam_beta1, args.adam_beta2),
             beta3=args.prodigy_beta3,
             weight_decay=args.adam_weight_decay,

examples/dreambooth/train_dreambooth_sd3.py

Lines changed: 0 additions & 1 deletion
@@ -1328,7 +1328,6 @@ def load_model_hook(models, input_dir):
 
         optimizer = optimizer_class(
             params_to_optimize,
-            lr=args.learning_rate,
             betas=(args.adam_beta1, args.adam_beta2),
             beta3=args.prodigy_beta3,
             weight_decay=args.adam_weight_decay,

examples/research_projects/scheduled_huber_loss_training/dreambooth/train_dreambooth_lora_sdxl.py

Lines changed: 0 additions & 1 deletion
@@ -1475,7 +1475,6 @@ def load_model_hook(models, input_dir):
 
         optimizer = optimizer_class(
             params_to_optimize,
-            lr=args.learning_rate,
             betas=(args.adam_beta1, args.adam_beta2),
             beta3=args.prodigy_beta3,
             weight_decay=args.adam_weight_decay,
