@@ -31,7 +31,7 @@ def train(
     micro_batch_size: int = 4,
     num_epochs: int = 3,
     learning_rate: float = 3e-4,
-    cutoff_len: int = 512,
+    cutoff_len: int = 256,
     val_set_size: int = 2000,
     # lora hyperparams
     lora_r: int = 8,
@@ -43,7 +43,7 @@ def train(
     ],
     # llm hyperparams
     train_on_inputs: bool = True,  # if False, masks out inputs in loss
-    group_by_length: bool = True,  # faster, but produces an odd training loss curve
+    group_by_length: bool = False,  # faster, but produces an odd training loss curve
 ):
     print(
         f"Training Alpaca-LoRA model with params:\n"