Eric Wang 3 лет назад
Родитель
Коммит
5cd474bcc0
1 изменённый файл: 1 добавление и 1 удаление
  1. 1 1
      finetune.py

+ 1 - 1
finetune.py

@@ -63,7 +63,7 @@ MICRO_BATCH_SIZE = 4  # this could actually be 5 but i like powers of 2
 BATCH_SIZE = 128
 GRADIENT_ACCUMULATION_STEPS = BATCH_SIZE // MICRO_BATCH_SIZE
 EPOCHS = 3  # from the result
-LEARNING_RATE = 3e-4  # the karpathy constant
+LEARNING_RATE = 2e-5  # also from the result
 CUTOFF_LEN = 256  # 256 accounts for about 96% of the data
 
 data = data.shuffle().map(