Commit 52ab19fa authored by Hines, Jesse
Browse files

Marconi100 download

parent a1057945
Loading
Loading
Loading
Loading
+32 −17
Original line number Diff line number Diff line
@@ -20,12 +20,15 @@

# to analyze dataset
python -m raps.telemetry -f /path/to/job_table.parquet --system marconi100 -v

"""
import uuid
import numpy as np
import pandas as pd
from tqdm import tqdm
from pathlib import Path
from datetime import datetime
import requests
import urllib.request

from ..job import job_dict, Job
from ..utils import power_to_utilization, WorkloadData
@@ -241,3 +244,15 @@ def cdu_index_to_name(index: int, config: dict):
def cdu_pos(index: int, config: dict) -> tuple[int, int]:
    """
    Map a cdu index to its (row, col) position.

    Placeholder layout: every cdu is placed in row 0 with the index used as
    the column. `config` is accepted but not consulted yet.
    """
    row, col = 0, index  # TODO
    return row, col


def download(dest: Path, start: datetime | None, end: datetime | None):
    """
    Download the Marconi100 dataset files from Zenodo into `dest`.

    Queries the Zenodo API for record 10127767 and saves every file listed in
    the record to `dest / <file key>`.

    Args:
        dest: Directory to download into. It is created together with any
            missing parents; if it already exists, `mkdir` raises
            FileExistsError.
        start: Unused. The dataset is a single large parquet, so there is
            nothing to pre-filter by date.
        end: Unused, for the same reason as `start`.

    Raises:
        requests.HTTPError: If the Zenodo API answers with an error status.
        requests.Timeout: If the Zenodo API does not answer in time.
        FileExistsError: If `dest` already exists.
    """
    # Bound the metadata request so an unresponsive server cannot hang the
    # download forever, and fail loudly on HTTP errors instead of tripping
    # over a missing "files" key in an error payload.
    response = requests.get("https://zenodo.org/api/records/10127767", timeout=60)
    response.raise_for_status()
    files = response.json()["files"]

    # marconi100 is just one big parquet, nothing to pre-filter
    dest.mkdir(parents=True)
    for file in files:
        print(f"Downloading {file['key']}")
        urllib.request.urlretrieve(file['links']['self'], dest / file['key'])

    print("Done!")