2021-10-24 11:31:20 +00:00
|
|
|
# Download CIFAR dataset and create a dataset with ClearML's Dataset class
|
|
|
|
from clearml import StorageManager, Dataset
|
|
|
|
|
|
|
|
manager = StorageManager()

# Fetch the CIFAR-10 archive and get the path of the local copy.
cifar_url = "https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz"
dataset_path = manager.get_local_copy(remote_url=cifar_url)

# Per the ClearML docs, get_local_copy() returns None when the object cannot
# be retrieved. Stop here so that no empty dataset gets created on the server
# and the failure is reported with a clear message.
if dataset_path is None:
    raise RuntimeError("Failed to download {}".format(cifar_url))

# Create a new dataset entry to hold the downloaded files.
dataset = Dataset.create(
    dataset_name="cifar_dataset",
    dataset_project="dataset_examples",
)

# Prepare and clean data here before it is added to the dataset

# Register the downloaded files with the dataset.
dataset.add_files(path=dataset_path)

# Dataset is uploaded to the ClearML Server by default
dataset.upload()

# Close the dataset once the upload is done.
dataset.finalize()
|