# --- Local Python environment ------------------------------------------
# Create a virtual environment in ./myenv and activate it in this shell.
python3 -m venv myenv
. myenv/bin/activate
# Install the packages listed in requirements.txt.
pip install --requirement requirements.txt

# --- DVC bootstrap -----------------------------------------------------
# Initialise DVC in the current directory and record the result in Git.
dvc init
git add -- .dvc .gitignore
git commit --message "Initialize DVC"

# Run the project's dataset script.
# NOTE(review): presumably this produces data/imdb, which is tracked with
# DVC in a later step -- confirm against getDataset.py.
python3 getDataset.py
# --- S3 remote for DVC -------------------------------------------------
# Interactively store AWS CLI credentials and defaults (prompts for input).
aws configure

# Bucket name and region are defined once so that the bucket is created in
# the same region the DVC remote is configured for. Change region if needed.
s3_bucket="uottawa-dvc-bucket"
s3_region="us-west-2"

# Create the bucket explicitly in the chosen region rather than in whatever
# default region `aws configure` happened to store.
aws s3 mb "s3://${s3_bucket}" --region "${s3_region}"

# Register the bucket as a DVC remote and pin its region.
dvc remote add s3_remote "s3://${s3_bucket}"
dvc remote modify s3_remote region "${s3_region}"

# Credentials go into .dvc/config.local via --local. That file is ignored by
# Git, whereas plain `dvc remote modify` writes to the Git-tracked
# .dvc/config and would expose the secret to anyone with repository access
# as soon as that file is committed.
dvc remote modify --local s3_remote access_key_id YOUR_AWS_ACCESS_KEY_ID
dvc remote modify --local s3_remote secret_access_key YOUR_AWS_SECRET_ACCESS_KEY

# Make s3_remote the remote used by `dvc push` / `dvc pull` by default.
dvc remote default s3_remote
# --- Track the dataset and upload it -----------------------------------
# Put data/imdb under DVC control. This writes the pointer file
# data/imdb.dvc and adds an ignore entry for the data to data/.gitignore.
dvc add data/imdb

# Commit the pointer file together with the .gitignore that DVC just wrote.
# That file lives next to the tracked path (data/.gitignore), not at the
# repository root.
git add data/imdb.dvc data/.gitignore
git commit -m "Track IMDb dataset with DVC on S3"

# Upload the tracked data to the default DVC remote.
dvc push
# --- On another machine: obtain the project and its data ---------------
# Replace YOUR_REPO_URL with the repository's clone URL and YOUR_REPO_DIR
# with the directory the clone creates.
git clone YOUR_REPO_URL
# The remaining commands must run inside the cloned working tree.
cd YOUR_REPO_DIR

# NOTE(review): addRemote.sh is assumed to live in the repository root and
# to configure the DVC remote for this clone -- confirm against that script.
./addRemote.sh

# Download the DVC-tracked data referenced by the repository's .dvc files.
dvc pull