-
Notifications
You must be signed in to change notification settings - Fork 0
/
get_data.sh
27 lines (22 loc) · 852 Bytes
/
get_data.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
#!/bin/sh
# Re-create the local input folder from scratch: delete it, then download
# each dataset archive from Google Drive and extract it into its own
# sub-directory. The downloaded .zip is kept next to the extracted folder
# (e.g. input/credit-risk.zip alongside input/credit-risk/).
#
# Requires: curl, unzip.

# Abort on the first failing command or unset variable, so a failed
# download is never followed by an unzip of a missing/partial archive.
set -eu

# dataset URLs
GOOGLE_DRIVE_URL="https://drive.google.com/uc?export=download&id="
CREDIT_RISK_URL="${GOOGLE_DRIVE_URL}1KM3MnRLpOxUKESUbqFXBmiDoU_cna927"
AMES_HOUSING_URL="${GOOGLE_DRIVE_URL}1VyekZ6K5ZRXg61ihwZKSZaCNn-OGSpSE"

# file paths
INPUT_DIR=input
CREDIT_RISK_DIR="$INPUT_DIR"/credit-risk
AMES_HOUSING_DIR="$INPUT_DIR"/ames-housing-test

# Download one dataset archive and extract it.
# Arguments: $1 - human-readable dataset name used in the progress message
#            $2 - download URL
#            $3 - destination directory; the archive is saved as "$3.zip"
# Returns:   non-zero (aborting the script under `set -e`) if any step fails
fetch_dataset() {
  echo "Downloading $1 data"
  mkdir -p "$3"
  # -f: treat HTTP errors as failures instead of saving the error page as
  #     the archive; -L: follow the redirects Google Drive issues.
  curl -fL "$2" -o "$3".zip
  unzip "$3".zip -d "$3"
}

# delete the input folder
echo "Deleting input folder"
# ${VAR:?} aborts instead of expanding to an empty path if INPUT_DIR is blank.
rm -rf -- "${INPUT_DIR:?}"

# download and extract credit risk data
fetch_dataset "credit risk" "$CREDIT_RISK_URL" "$CREDIT_RISK_DIR"

# download and extract Ames housing data
# (the original created $CREDIT_RISK_DIR a second time here instead of
# $AMES_HOUSING_DIR; the shared helper always creates the right directory)
fetch_dataset "Ames housing" "$AMES_HOUSING_URL" "$AMES_HOUSING_DIR"