examples/github_issue_summarization/ks_app/components/download_data.sh

21 lines
432 B
Bash

#!/bin/bash
#
# Script to download the data
# Usage:
#   download_data.sh <URL of data> <data_dir>
# e.g.
# download_data.sh https://storage.googleapis.com/kubeflow-examples/github-issue-summarization-data/github-issues.zip /data
#
# Script expects data to be a zip file
# Strict mode:
#   -e           abort on the first command that fails
#   -u           treat use of an unset variable as an error
#   -x           trace each command to stderr as it runs
#   -o pipefail  a pipeline fails if any of its stages fails
set -euxo pipefail

# Both positional arguments are required and must be non-empty; fail early
# with a usage message instead of letting mkdir/wget fail with a confusing
# error. Extra arguments are ignored.
if [[ $# -lt 2 || -z "${1}" || -z "${2}" ]]; then
  printf 'Usage: %s <URL of data> <data_dir>\n' "${0##*/}" >&2
  exit 2
fi

# $1: URL of the zip archive to download.
URL=$1
# $2: directory the archive is downloaded into and extracted in.
DATA_DIR=$2

# All expansions are quoted so that paths containing spaces and URLs
# containing glob characters (e.g. '?' or '*') are passed through verbatim.
mkdir -p -- "${DATA_DIR}"
wget --directory-prefix="${DATA_DIR}" "${URL}"

# The archive's file name is taken to be the last path component of the URL.
TARGET=$(basename "${URL}")

# Extract the downloaded archive in place, into DATA_DIR.
unzip -d "${DATA_DIR}" "${DATA_DIR}/${TARGET}"