diff --git a/download_data.sh b/download_data.sh index b9d4622..5acb12f 100755 --- a/download_data.sh +++ b/download_data.sh @@ -9,19 +9,19 @@ read -p "Enter the number corresponding to your choice: " choice case $choice in 2) - # Download 10m dataset - wget https://clickhouse-public-datasets.s3.amazonaws.com/bluesky/file_{0001..0010}.json.gz -P ~/data/bluesky -N + # Download 10m dataset: files 0001 to 0010 + wget --timestamping --directory-prefix ~/data/bluesky --input-file <(seq --format "https://clickhouse-public-datasets.s3.amazonaws.com/bluesky/file_%04g.json.gz" 1 10) ;; 3) - # Download 100m dataset - wget https://clickhouse-public-datasets.s3.amazonaws.com/bluesky/file_{0001..0100}.json.gz -P ~/data/bluesky -N + # Download 100m dataset: files 0001 to 0100 + wget --timestamping --directory-prefix ~/data/bluesky --input-file <(seq --format "https://clickhouse-public-datasets.s3.amazonaws.com/bluesky/file_%04g.json.gz" 1 100) ;; 4) - # Download 1000m dataset - wget https://clickhouse-public-datasets.s3.amazonaws.com/bluesky/file_{0001..1000}.json.gz -P ~/data/bluesky -N + # Download 1000m dataset: files 0001 to 1000 + wget --timestamping --directory-prefix ~/data/bluesky --input-file <(seq --format "https://clickhouse-public-datasets.s3.amazonaws.com/bluesky/file_%04g.json.gz" 1 1000) ;; *) - # Download 1m dataset - wget https://clickhouse-public-datasets.s3.amazonaws.com/bluesky/file_0001.json.gz -P ~/data/bluesky -N + # Download 1m dataset: single file + wget --timestamping --directory-prefix ~/data/bluesky "https://clickhouse-public-datasets.s3.amazonaws.com/bluesky/file_0001.json.gz" ;; -esac \ No newline at end of file +esac