File size: 2,593 Bytes
6bec1f5 92efc51 6bec1f5 c26894e 6bec1f5 92efc51 6bec1f5 92efc51 6bec1f5 92efc51 6bec1f5 c26894e 6bec1f5 9b36cb7 6bec1f5 9b36cb7 d599f4f f8a5547 9b36cb7 6bec1f5 8aabc99 6bec1f5 9b36cb7 6bec1f5 92356fe 92efc51 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 |
import os
import sys
import subprocess
from huggingface_hub import hf_hub_download
def run_command(command: str, cwd: "str | None" = None) -> tuple:
    """Run a shell command in the specified directory and return its output.

    The command line is handed to the system shell (``shell=True``), so it
    must only ever be built from trusted, hard-coded strings.

    Args:
        command: Shell command line to execute.
        cwd: Directory to run the command in. ``None`` runs it in the current
            working directory of this process.

    Returns:
        A ``(stdout, stderr)`` tuple holding the raw ``bytes`` captured from
        the process, whatever its exit status was.
    """
    completed = subprocess.run(
        command,
        shell=True,
        stdout=subprocess.PIPE,
        stderr=subprocess.PIPE,
        cwd=cwd,
        check=False,  # a failing command is reported below, not raised
    )
    # Decode leniently for display only: tool output is not guaranteed to be
    # valid UTF-8, and a strict decode would raise before we could return.
    if completed.returncode != 0:
        print(f"Error: {completed.stderr.decode(errors='replace')}")
    else:
        print(f"Output: {completed.stdout.decode(errors='replace')}")
    return completed.stdout, completed.stderr
def download_dataset():
    """Download the autocast dataset files from the Hugging Face Hub.

    Fetches each file listed in ``filenames`` from the ``valory/autocast``
    dataset repository into
    ``<cwd>/olas-predict-benchmark/benchmark/data/autocast``, creating that
    directory first when it does not exist yet.
    """
    print("Downloading the autocast dataset...")
    repo_id = "valory/autocast"
    output_dir = os.path.join(
        os.getcwd(), "olas-predict-benchmark", "benchmark", "data", "autocast"
    )
    # exist_ok=True already makes this a no-op for an existing directory, so
    # no separate (race-prone) os.path.exists() check is needed.
    os.makedirs(output_dir, exist_ok=True)

    filenames = (
        "autocast_questions_filtered.json",
        "autocast_questions_filtered.pkl",
    )
    for filename in filenames:
        hf_hub_download(
            repo_id=repo_id,
            filename=filename,
            local_dir=output_dir,
            repo_type="dataset",
        )
    print("Dataset downloaded successfully.")
def start():
    """Install the runtime dependencies, then download the dataset.

    Every ``(command, cwd)`` pair in ``commands`` is passed to
    ``run_command`` in order; their results are not inspected here, so a
    failing command does not stop the sequence. ``download_dataset`` is
    called afterwards.
    """
    print("Starting commands...")
    base_dir = os.getcwd()
    # olas_dir = os.path.join(base_dir, "olas-predict-benchmark")
    # mech_dir = os.path.join(olas_dir, "benchmark", "mech")

    commands = [
        # Disabled submodule setup steps, kept for reference:
        # ("git submodule init", base_dir),
        # no updates
        # ("git submodule update --init --recursive", base_dir),
        # ("git submodule update --remote --recursive", base_dir),
        # (
        #     'git config remote.origin.fetch "+refs/heads/*:refs/remotes/origin/*"',
        #     olas_dir,
        # ),
        # ("git remote update", olas_dir),
        # ("git fetch --all", olas_dir),
        # ("git checkout main", olas_dir),
        # ("git pull origin main", olas_dir),
        # ("git checkout 56ecf18a982c4548feac5efe787690a3ec37c835", mech_dir),
        # # ("git pull origin main", mech_dir),
        # ("pip install -e .", os.path.join(olas_dir, "benchmark")),
        # ("pip install -e .", mech_dir),
        #
        # The extras spec is quoted because the command goes through a shell,
        # where an unquoted "[...]" is a glob character class and could be
        # expanded against file names in the working directory.
        ('pip install "lxml[html_clean]"', base_dir),
        ("pip install --upgrade huggingface_hub", base_dir),
    ]

    for command, cwd in commands:
        run_command(command, cwd=cwd)

    # add benchmark to the path
    # sys.path.append(os.path.join(olas_dir, "benchmark"))

    # Download the dataset
    download_dataset()
# Module-level entry point: this call is not guarded, so start() runs whenever
# this file is executed or imported.
start()
|