Skip to content

Commit

Permalink
Fix issue with max_train_steps
Browse files Browse the repository at this point in the history
  • Loading branch information
bmaltais committed Nov 17, 2024
1 parent d47e3e6 commit a6f0ff7
Show file tree
Hide file tree
Showing 4 changed files with 33 additions and 54 deletions.
34 changes: 17 additions & 17 deletions kohya_gui/dreambooth_gui.py
Original file line number Diff line number Diff line change
Expand Up @@ -781,23 +781,23 @@ def train_model(

log.info(f"Regularization factor: {reg_factor}")

if max_train_steps == 0:
# calculate max_train_steps
max_train_steps = int(
math.ceil(
float(total_steps)
/ int(train_batch_size)
/ int(gradient_accumulation_steps)
* int(epoch)
* int(reg_factor)
)
)
max_train_steps_info = f"max_train_steps ({total_steps} / {train_batch_size} / {gradient_accumulation_steps} * {epoch} * {reg_factor}) = {max_train_steps}"
else:
if max_train_steps == 0:
max_train_steps_info = f"Max train steps: 0. sd-scripts will therefore default to 1600. Please specify a different value if required."
else:
max_train_steps_info = f"Max train steps: {max_train_steps}"
# if max_train_steps == 0:
# # calculate max_train_steps
# max_train_steps = int(
# math.ceil(
# float(total_steps)
# / int(train_batch_size)
# / int(gradient_accumulation_steps)
# * int(epoch)
# * int(reg_factor)
# )
# )
# max_train_steps_info = f"max_train_steps ({total_steps} / {train_batch_size} / {gradient_accumulation_steps} * {epoch} * {reg_factor}) = {max_train_steps}"
# else:
# if max_train_steps == 0:
# max_train_steps_info = f"Max train steps: 0. sd-scripts will therefore default to 1600. Please specify a different value if required."
# else:
# max_train_steps_info = f"Max train steps: {max_train_steps}"

log.info(f"Total steps: {total_steps}")

Expand Down
20 changes: 10 additions & 10 deletions kohya_gui/finetune_gui.py
Original file line number Diff line number Diff line change
Expand Up @@ -846,16 +846,16 @@ def train_model(
repeats = int(image_num) * int(dataset_repeats)
log.info(f"repeats = {str(repeats)}")

if max_train_steps == 0:
# calculate max_train_steps
max_train_steps = int(
math.ceil(
float(repeats)
/ int(train_batch_size)
/ int(gradient_accumulation_steps)
* int(epoch)
)
)
# if max_train_steps == 0:
# # calculate max_train_steps
# max_train_steps = int(
# math.ceil(
# float(repeats)
# / int(train_batch_size)
# / int(gradient_accumulation_steps)
# * int(epoch)
# )
# )

        # Divide by two because flip augmentation creates two copies of the source images
if flip_aug and max_train_steps:
Expand Down
12 changes: 4 additions & 8 deletions kohya_gui/lora_gui.py
Original file line number Diff line number Diff line change
Expand Up @@ -1076,7 +1076,7 @@ def train_model(

log.info(f"Regularization factor: {reg_factor}")

if max_train_steps == 0:
if (max_train_steps == 0) and (stop_text_encoder_training != 0):
# calculate max_train_steps
max_train_steps = int(
math.ceil(
Expand All @@ -1094,13 +1094,9 @@ def train_model(
else:
max_train_steps_info = f"Max train steps: {max_train_steps}"

# calculate stop encoder training
if stop_text_encoder_training == 0:
stop_text_encoder_training = 0
else:
stop_text_encoder_training = math.ceil(
float(max_train_steps) / 100 * int(stop_text_encoder_training)
)
stop_text_encoder_training = math.ceil(
float(max_train_steps) / 100 * int(stop_text_encoder_training)
) if stop_text_encoder_training != 0 else 0

# Calculate lr_warmup_steps
if lr_warmup_steps > 0:
Expand Down
21 changes: 2 additions & 19 deletions kohya_gui/textual_inversion_gui.py
Original file line number Diff line number Diff line change
Expand Up @@ -664,22 +664,9 @@ def train_model(
log.info(f"Regularization factor: {reg_factor}")

if max_train_steps == 0:
# calculate max_train_steps
max_train_steps = int(
math.ceil(
float(total_steps)
/ int(train_batch_size)
/ int(gradient_accumulation_steps)
* int(epoch)
* int(reg_factor)
)
)
max_train_steps_info = f"max_train_steps ({total_steps} / {train_batch_size} / {gradient_accumulation_steps} * {epoch} * {reg_factor}) = {max_train_steps}"
max_train_steps_info = f"Max train steps: 0. sd-scripts will therefore default to 1600. Please specify a different value if required."
else:
if max_train_steps == 0:
max_train_steps_info = f"Max train steps: 0. sd-scripts will therefore default to 1600. Please specify a different value if required."
else:
max_train_steps_info = f"Max train steps: {max_train_steps}"
max_train_steps_info = f"Max train steps: {max_train_steps}"

# calculate stop encoder training
if stop_text_encoder_training_pct == 0:
Expand Down Expand Up @@ -1076,10 +1063,6 @@ def list_embedding_files(path):
step=1,
label="Vectors",
)
# max_train_steps = gr.Textbox(
# label='Max train steps',
# placeholder='(Optional) Maximum number of steps',
# )
template = gr.Dropdown(
label="Template",
choices=[
Expand Down

2 comments on commit a6f0ff7

@bbecausereasonss
Copy link

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This seems to have caused my issue with max_train_steps instead of fixing it.

#2969

@FurkanGozukara
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

@bmaltais sadly this broke the training :(

Please sign in to comment.