__all__ = ['block', 'make_clickable_model', 'make_clickable_user', 'get_submissions'] import gradio as gr import pandas as pd from huggingface_hub import HfApi, repocard #def is_duplicated(space_id:str)->None: # card = repocard.RepoCard.load(space_id, repo_type="space") # return getattr(card.data, "duplicated_from", None) is not None def make_clickable_model(model_name, repo_type, link=None): if link is None: if repo_type == "Dataset": link = "https://huggingface.co/" + "datasets/" + model_name else: link = "https://huggingface.co/" + model_name return f'{model_name.split("/")[-1]}' def get_repo_ids(repo_type): api = HfApi() if repo_type == "Model": notebooks = api.list_models(filter=["notebook-favorites"]) elif repo_type == "Dataset": notebooks = api.list_datasets(filter=["notebook-favorites"]) print(notebooks) notebook_ids = [x for x in notebooks] return notebook_ids def make_clickable_user(user_id): link = "https://huggingface.co/" + user_id return f'{user_id}' def get_submissions(repo_type): submissions = get_repo_ids(repo_type) leaderboard_models = [] for submission in submissions: # user, model, likes #if not is_duplicated(submission.id): user_id = submission.id.split("/")[0] leaderboard_models.append( ( make_clickable_user(user_id), make_clickable_model(submission.id, repo_type), submission.likes, ) ) df = pd.DataFrame(data=leaderboard_models, columns=["User", "Repository", "Likes"]) df.sort_values(by=["Likes"], ascending=False, inplace=True) df.insert(0, "Rank", list(range(1, len(df) + 1))) return df block = gr.Blocks() with block: gr.Markdown( """# Notebooks Leaderboard This Space compiles coolest model and dataset repositories that contain notebooks! """ ) with gr.Tabs(): with gr.TabItem("Notebooks in Model Repositories 🤖"): with gr.Row(): model_data = gr.components.Dataframe( type="pandas", datatype=["number", "markdown", "markdown", "number"] ) with gr.Row(): data_run = gr.Button("Refresh") data_run.click( get_submissions, inputs=gr.Variable("Model"), outputs=model_data ) with gr.TabItem("Notebooks in Dataset Repositories 📖"): with gr.Row(): dataset_data = gr.components.Dataframe( type="pandas", datatype=["number", "markdown", "markdown", "number"] ) with gr.Row(): data_run = gr.Button("Refresh") data_run.click( get_submissions, inputs=gr.Variable("Dataset"), outputs=dataset_data ) block.load(get_submissions, inputs=gr.Variable("Model"), outputs=model_data) block.load(get_submissions, inputs=gr.Variable("Dataset"), outputs=dataset_data) block.launch(debug=True)