# Hugging Face Hub page header (not part of the script): last commit "update" (73d1e6e) by pminervini; file size 1.43 kB.
#!/usr/bin/env python
import os
import fnmatch
import json
from huggingface_hub import HfApi
def find_json_files(directory):
    """Recursively collect the paths of all ``*.json`` files under *directory*.

    Args:
        directory: Root directory to walk.

    Returns:
        A list of paths (each built by joining the walked folder with the
        file name), in ``os.walk`` traversal order. The list is empty when
        nothing matches.
    """
    # fnmatch.filter is applied to file names only, so directories whose
    # names end in ".json" are never reported themselves.
    return [
        os.path.join(root, filename)
        for root, _dirnames, filenames in os.walk(directory)
        for filename in fnmatch.filter(filenames, '*.json')
    ]
# Directory that is scanned recursively for request JSON files.
directory_path = '/Users/pasquale/workspace/eval/requests'
json_files = find_json_files(directory_path)

# Build an id -> model-info lookup from the Hub listing so each request file
# can be matched against it without a further API call.
# NOTE(review): list_models() is called without filters, so the whole listing
# is materialized up front; this may be slow — confirm that is acceptable.
api = HfApi()
model_lst = list(api.list_models())
id_to_model = {m.id: m for m in model_lst}

for path in json_files:
    with open(path, 'r', encoding='utf-8') as fr:
        data = json.load(fr)

    model_id = data['model']
    model = id_to_model.get(model_id)
    if model is None:
        print(f'Model {model_id} not found')
        continue

    to_overwrite = False

    # A "base_model:*" tag is treated as evidence of a fine-tune.
    # `tags` is guarded because it may be None on a listing entry
    # (presumably Optional in huggingface_hub — verify against the API docs).
    is_finetuned = any(tag.startswith('base_model:') for tag in (model.tags or []))
    if is_finetuned:
        data["model_type"] = "fine-tuned"
        to_overwrite = True

    # Name-based heuristic; 'nstruct' matches both "Instruct" and "instruct".
    # It is evaluated after the fine-tune check on purpose, so
    # "instruction-tuned" wins when both apply.
    # NOTE(review): 'chat' is matched case-sensitively ("Chat" is missed) —
    # confirm whether that is intended.
    is_instruction_tuned = ('nstruct' in model_id) or ('chat' in model_id)
    if is_instruction_tuned:
        data["model_type"] = "instruction-tuned"
        to_overwrite = True

    # Only rewrite the request file when a model_type was assigned above.
    if to_overwrite:
        with open(path, 'w', encoding='utf-8') as fw:
            json.dump(data, fw)