From 1a451445a21234cc8443603025eba5ab3572cb49 Mon Sep 17 00:00:00 2001 From: Wayner Barrios Date: Sat, 1 Apr 2023 23:52:25 -0400 Subject: [PATCH] DatasetDict to dataset object. --- data.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/data.py b/data.py index 0e356f7d..ff79924c 100644 --- a/data.py +++ b/data.py @@ -68,7 +68,7 @@ def load_data(config, tokenizer): dataset = load_dataset("json", data_files=files, split="train") else: - dataset = load_dataset(dataset_path) + dataset = load_dataset(dataset_path,split='train') dataset = dataset.train_test_split(test_size=.05, seed=config["seed"])