diff --git a/configs/train/finetune_gptj.yaml b/configs/train/finetune_gptj.yaml
index aa6bf4a8..ce6feef7 100644
--- a/configs/train/finetune_gptj.yaml
+++ b/configs/train/finetune_gptj.yaml
@@ -9,7 +9,7 @@ streaming: false
 num_proc: 64
 dataset_path: "nomic-ai/turbo-500k-multi"
 max_length: 1024
-batch_size: 16
+batch_size: 8
 
 # train dynamics
 lr: 2.0e-5