Skip to content

Commit

Permalink
Now downloading JOB data from my personal Google Drive link
Browse files Browse the repository at this point in the history
  • Loading branch information
wangpatrick57 committed Dec 21, 2024
1 parent 9a63b5c commit 73dc4ac
Show file tree
Hide file tree
Showing 2 changed files with 5 additions and 3 deletions.
7 changes: 4 additions & 3 deletions benchmark/job/cli.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,6 @@
import click

from benchmark.constants import DEFAULT_SCALE_FACTOR
from benchmark.job.load_info import JobLoadInfo
from util.log import DBGYM_LOGGER_NAME
from util.shell import subprocess_run
from util.workspace import (
Expand All @@ -13,7 +12,8 @@
link_result,
)

JOB_TABLES_URL = "https://homepages.cwi.nl/~boncz/job/imdb.tgz"
# JOB_TABLES_URL = "https://homepages.cwi.nl/~boncz/job/imdb.tgz"  # Original source; this link stopped working for me, so a Google Drive copy is used instead.
JOB_TABLES_URL = "https://drive.google.com/uc?id=19m0zDpphAw0Bu9Irr_ta9EGr5k85hiN1"
JOB_QUERY_NAMES = [
"1a",
"1b",
Expand Down Expand Up @@ -177,7 +177,8 @@ def _download_job_data(dbgym_cfg: DBGymConfig) -> None:

logging.getLogger(DBGYM_LOGGER_NAME).info(f"Downloading: {expected_symlink_dpath}")
real_data_path = dbgym_cfg.cur_task_runs_data_path(mkdir=True)
subprocess_run(f"curl -O {JOB_TABLES_URL}", cwd=real_data_path)
# subprocess_run(f"curl -O {JOB_TABLES_URL}", cwd=real_data_path)  # Use this instead when JOB_TABLES_URL is not a Google Drive link.
subprocess_run(f"gdown {JOB_TABLES_URL}", cwd=real_data_path)
job_data_dpath = dbgym_cfg.cur_task_runs_data_path(
default_tables_dname(DEFAULT_SCALE_FACTOR), mkdir=True
)
Expand Down
1 change: 1 addition & 0 deletions dependencies/requirements.txt
Original file line number Diff line number Diff line change
Expand Up @@ -135,3 +135,4 @@ Werkzeug==3.0.1
wrapt==1.14.1
zipp==3.17.0
streamlit==1.39.0
gdown==5.2.0

0 comments on commit 73dc4ac

Please sign in to comment.