if return_X_y == True: A tuple of NumPy arrays containing (features, labels)
if dataset_name not in dataset_names:
raise ValueError("Data set not found in PMLB.")
dataset_url = "https://github.com/EpistasisLab/penn-ml-benchmarks/raw/master/datasets/{DATASET_NAME}/{DATASET_NAME}.csv.gz".format(DATASET_NAME=dataset_name)
if local_cache_dir is None:
dataset = pd.read_csv(dataset_url, sep="\t", compression="gzip")