File size: 385 Bytes
6ca4b94
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
from datasets import load_dataset
from src.config import config

def download_dataset():
    """Load the training split of the configured dataset and report its size.

    The dataset identifier is read from ``config.data.dataset_path`` and
    passed to ``datasets.load_dataset`` with ``split="train"``. The
    ``cache_dir`` is the relative path ``"cache"``, so it resolves against
    the current working directory.

    Progress is reported on stdout before and after the load.

    Returns:
        The object returned by ``load_dataset`` for the ``train`` split, so
        callers can use the data without loading it a second time.
    """
    dataset_path = config.data.dataset_path
    print(f"Downloading dataset: {dataset_path}")
    dataset = load_dataset(
        dataset_path,
        split="train",
        cache_dir="cache",
    )
    print(f"Dataset downloaded successfully: {len(dataset)} rows")
    # Hand the loaded split back instead of discarding it; callers that
    # only want the download side effect can simply ignore the result.
    return dataset

# Script entry point: run the download only when this file is executed
# directly, not when it is imported as a module.
if __name__ == "__main__":
    download_dataset()