Commit
·
25b6b65
1
Parent(s):
04c3d83
training notes
Browse files
locon/amber_(genshin_impact)/training settings.txt
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
$noise_offset=0
|
| 2 |
+
$keep_tokens=0
|
| 3 |
+
$learning_rate=0.5
|
| 4 |
+
$text_encoder_lr=0.25
|
| 5 |
+
$unet_lr=0.5
|
| 6 |
+
$lr_warmup_ratio = 0.0
|
| 7 |
+
$weight_decay = 0.2 # not currently used
|
| 8 |
+
$resolution=512
|
| 9 |
+
$train_batch_size = 4
|
| 10 |
+
$gradient_accumulation_steps=2 # not currently using
|
| 11 |
+
$num_epochs = 5
|
| 12 |
+
$save_every_n_epochs=1
|
| 13 |
+
$scheduler="cosine_with_restarts"
|
| 14 |
+
$network_dim=4 # linear layers
|
| 15 |
+
$network_alpha=4 # linear layers
|
| 16 |
+
$conv_dim=1
|
| 17 |
+
$conv_alpha=1 # due to code errors this was 4 (took value from network_alpha)
|
| 18 |
+
$network_args="conv_dim={0}" -f $conv_alpha
|
| 19 |
+
$network_args2="conv_alpha={1}" -f $conv_dim
|
| 20 |
+
$optimizer_args="weight_decay=0.60 decouple=True" # not used from settings, set directly in code
|
| 21 |
+
$optimizer_type="DAdaptation"
|