updated style-mimicking fine-tuning

2025-08-13 23:50:20 +00:00
parent 8847035d12
commit 1b46270afa
83 changed files with 2537260 additions and 378 deletions
@@ -56,11 +56,15 @@ model:
 # Training Configuration
 training:
  num_epochs: 3                             # Number of training epochs
-  batch_size: 16                            # Training batch size (adjust based on GPU memory)
-  learning_rate: 3e-5                       # Learning rate (typical range: 1e-5 to 5e-5 for fine-tuning)
+  batch_size: 4                             # Training batch size (adjust based on GPU memory)
+  learning_rate: 2.0e-4                     # Learning rate; keep the decimal point (PyYAML loads bare 2e-4 as a string). Above the 1e-5 to 5e-5 typical for full fine-tuning - confirm intended
  weight_decay: 0.01                        # Weight decay for optimizer (prevents overfitting)
-  warmup_ratio: 0.1                         # Warmup ratio for scheduler (0.0 to 1.0)
+  warmup_steps: 5                           # Warmup steps (fixed value instead of ratio)
+  max_steps: 60                             # Maximum training steps (NOTE(review): may take precedence over num_epochs depending on the trainer - confirm)
+  gradient_accumulation_steps: 4            # Gradient accumulation steps (with batch_size 4 this gives 16 samples per optimizer update)
  lr_scheduler_type: "linear"               # Scheduler type: "linear", "cosine", "polynomial"
+  seed: 3407                                # Random seed for reproducibility
+  model_output_dir: "./models/styling"  # Directory to save the trained model (updated to match actual location)

 # Inference Configuration
 inference: