Spaces:
Paused
Paused
| import os | |
| import re | |
| import glob | |
| import tqdm | |
| import dill as pickle | |
| import subprocess | |
| import pandas as pd | |
| import datetime | |
| from functools import lru_cache | |
| block_time_500k = datetime.datetime(2023, 5, 29, 5, 29, 0) | |
| block_time_800k = datetime.datetime(2023, 7, 9, 21, 32, 48) | |
| dt = (pd.Timestamp(block_time_800k)-pd.Timestamp(block_time_500k))/(800_000-500_000) | |
| def run_subprocess(command='python multigraph.py', *args): | |
| try: | |
| # Run the subprocess with stdout and stderr pipes connected | |
| command = command + " ".join(args) | |
| print(f'{"===="*20}\nRunning: {command!r}') | |
| process = subprocess.Popen( | |
| command, | |
| stdout=subprocess.PIPE, | |
| stderr=subprocess.STDOUT, | |
| universal_newlines=True, # Set to True for text mode | |
| bufsize=1, # Line buffered, so output is available line by line | |
| shell=True # Set to True to allow running shell commands (use with caution) | |
| ) | |
| print(f'Subprocess started with pid {process.pid} and streaming output from stdout:') | |
| with process.stdout as output: | |
| for line in output: | |
| print(line, end='', flush=True) # Print without adding an extra newline | |
| if match := re.search('(?P<done>\\d+)/(?P<total>\\d+)',line): | |
| print('---> match.groupdict():', match.groupdict()) | |
| # try yielding the line here | |
| # Wait for the subprocess to finish and get the return code | |
| process.wait() | |
| print("===="*20) | |
| return process.returncode | |
| except subprocess.CalledProcessError as e: | |
| # If the subprocess returns a non-zero exit code, this exception will be raised | |
| return e.returncode | |
| def load_metagraph(path, extra_cols=None, rm_cols=None): | |
| with open(path, 'rb') as f: | |
| metagraph = pickle.load(f) | |
| df = pd.DataFrame(metagraph.axons) | |
| df['block'] = metagraph.block.item() | |
| df['timestamp'] = block_time_500k + dt*(df['block']-500_000) | |
| df['difficulty'] = getattr(metagraph, 'difficulty', None) | |
| for c in extra_cols: | |
| vals = getattr(metagraph,c) | |
| df[c] = vals | |
| return df.drop(columns=rm_cols) | |
| def load_metagraphs(block_start, block_end, block_step=1000, datadir='data/metagraph/1/', extra_cols=None): | |
| if extra_cols is None: | |
| extra_cols = ['total_stake','ranks','incentive','emission','consensus','trust','validator_trust','dividends'] | |
| blocks = range(block_start, block_end, block_step) | |
| print(f'Loading blocks {blocks[0]}-{blocks[-1]} from {datadir}') | |
| filenames = sorted(filename for filename in os.listdir(datadir) if filename.split('.')[0].isdigit() and int(filename.split('.')[0]) in blocks) | |
| print(f'Found {len(filenames)} files in {datadir}') | |
| metagraphs = [] | |
| pbar = tqdm.tqdm(filenames) | |
| for filename in pbar: | |
| pbar.set_description(f'Processing {filename}') | |
| try: | |
| metagraph = load_metagraph(os.path.join(datadir, filename), extra_cols=extra_cols, rm_cols=['protocol','placeholder1','placeholder2']) | |
| metagraphs.append(metagraph) | |
| except Exception as e: | |
| print(f'filename {filename!r} generated an exception: { e }') | |
| return pd.concat(metagraphs) | |