diff --git a/hf_roberta_base/03_train_pytorch_regression.py b/hf_roberta_base/03_train_pytorch_regression.py index 1b5eb30..1996cd0 100644 --- a/hf_roberta_base/03_train_pytorch_regression.py +++ b/hf_roberta_base/03_train_pytorch_regression.py @@ -12,6 +12,7 @@ from tqdm.auto import tqdm BATCH_SIZE = 4 EARLY_STOPPING = 3 WARMUP_STEPS = 10_000 +LR=1e-6 STEPS_EVAL = 5_000 if TEST: @@ -34,7 +35,7 @@ eval_dataloader_small = DataLoader(eval_dataset_small, batch_size=BATCH_SIZE) eval_dataloader_full = DataLoader(eval_dataset_full, batch_size=BATCH_SIZE) model = AutoModelForSequenceClassification.from_pretrained(MODEL, num_labels=1) -optimizer = AdamW(model.parameters(), lr=1e-6) +optimizer = AdamW(model.parameters(), lr=LR) num_epochs = 5