SengTak's picture
added necesary files-1
55890ea verified
raw
history blame
764 Bytes
from ..dataset import E5Data
from ..dataset import Wiki1M
def load_dataset(dataset_name, split="validation", file_path=None, **kwargs):
    """
    Build the dataset object registered under ``dataset_name``.

    Args:
        dataset_name (str): Key of the dataset class to use; the keys
            known to this function are "E5" and "Wiki1M".
        split (str): Which split to request; must be "train",
            "validation" or "test".
        file_path (str): Path to the dataset file, forwarded unchanged
            to the dataset class.
        **kwargs: Any further keyword arguments, forwarded unchanged to
            the dataset class.

    Returns:
        Whatever calling the selected dataset class with ``split``,
        ``file_path`` and ``**kwargs`` returns.

    Raises:
        NotImplementedError: If ``dataset_name`` is not a known key, or
            if ``split`` is not one of the accepted split names. The
            dataset name is validated before the split.
    """
    registry = {"E5": E5Data, "Wiki1M": Wiki1M}
    valid_splits = ("train", "validation", "test")

    # Resolve the class first so an unknown name is reported before a bad split.
    if dataset_name in registry:
        dataset_cls = registry[dataset_name]
    else:
        raise NotImplementedError(f"Dataset name {dataset_name} not supported.")

    if split not in valid_splits:
        raise NotImplementedError(f"Split {split} not supported.")

    return dataset_cls(split=split, file_path=file_path, **kwargs)