ir_chinese_medqa / utility /utils /save_metadata.py
欧卫
'add_app_files'
58627fa
from colbert.utils.utils import dotdict
import os
import sys
import git
import time
import copy
import ujson
import socket
def get_metadata_only():
args = dotdict()
args.hostname = socket.gethostname()
try:
args.git_branch = git.Repo(search_parent_directories=True).active_branch.name
args.git_hash = git.Repo(search_parent_directories=True).head.object.hexsha
args.git_commit_datetime = str(git.Repo(search_parent_directories=True).head.object.committed_datetime)
except git.exc.InvalidGitRepositoryError as e:
pass
args.current_datetime = time.strftime('%b %d, %Y ; %l:%M%p %Z (%z)')
args.cmd = ' '.join(sys.argv)
return args
def get_metadata(args):
args = copy.deepcopy(args)
args.hostname = socket.gethostname()
args.git_branch = git.Repo(search_parent_directories=True).active_branch.name
args.git_hash = git.Repo(search_parent_directories=True).head.object.hexsha
args.git_commit_datetime = str(git.Repo(search_parent_directories=True).head.object.committed_datetime)
args.current_datetime = time.strftime('%b %d, %Y ; %l:%M%p %Z (%z)')
args.cmd = ' '.join(sys.argv)
try:
args.input_arguments = copy.deepcopy(args.input_arguments.__dict__)
except:
args.input_arguments = None
return dict(args.__dict__)
# TODO: No reason for deepcopy. But: (a) Call provenance() on objects that can, (b) Only save simple, small objects. No massive lists or models or weird stuff!
# With that, I think we don't even need (necessarily) to restrict things to input_arguments.
def format_metadata(metadata):
assert type(metadata) == dict
return ujson.dumps(metadata, indent=4)
def save_metadata(path, args):
assert not os.path.exists(path), path
with open(path, 'w') as output_metadata:
data = get_metadata(args)
output_metadata.write(format_metadata(data) + '\n')
return data