Trained on 52 images: some photos, some video screencaps, and some drawings (most by hotglossed).
May sometimes turn noses into mouths.
{
"engine": "kohya",
"unetLR": 0.0003,
"clipSkip": 1,
"loraType": "lora",
"keepTokens": 0,
"networkDim": 32,
"numRepeats": 10,
"resolution": 1024,
"lrScheduler": "cosine_with_restarts",
"minSnrGamma": 5,
"noiseOffset": 0.03,
"targetSteps": 1156,
"enableBucket": true,
"networkAlpha": 16,
"optimizerType": "AdamW8Bit",
"textEncoderLR": 0.00003,
"maxTrainEpochs": 20,
"shuffleCaption": true,
"trainBatchSize": 9,
"flipAugmentation": true,
"lrSchedulerNumCycles": 4
}