LevelBot / app.py
lunarflu's picture
lunarflu HF staff
Update app.py
be6073e verified
import asyncio
import csv
import datetime
import json
import logging
import os
import os.path
import random
import re
import threading
import time
import discord
import gradio as gr
import gradio_client
import gspread
import numpy as np
import pandas as pd
import requests
from apscheduler.executors.pool import ThreadPoolExecutor
from apscheduler.schedulers.background import BackgroundScheduler
from discord import Color, Embed
from discord.ext import commands, tasks
from gradio_client import Client
from gspread_dataframe import get_as_dataframe, set_with_dataframe
from gspread_formatting.dataframe import format_with_dataframe
from huggingface_hub import HfApi, list_liked_repos, list_metrics, list_models
from tabulate import tabulate
from datetime import datetime
# --- Discord client ---------------------------------------------------------
DISCORD_TOKEN = os.environ.get("DISCORD_TOKEN")
intents = discord.Intents.all()
bot = commands.Bot(command_prefix='!', intents=intents)
#logger = logging.getLogger(__name__)
#logging.basicConfig(level=logging.DEBUG)

# --- Experience settings ----------------------------------------------------
XP_PER_MESSAGE = 10  # 100k messages = 1M exp = lvl 100

# --- Google Sheets access ---------------------------------------------------
# The service-account credentials are read as JSON from the KEY environment
# variable and dumped to a local file, whose path is then handed to gspread.
service_account = json.loads(os.environ.get('KEY'))
file_path = 'service_account.json'
with open(file_path, 'w') as json_file:
    json.dump(service_account, json_file)
gspread_bot = gspread.service_account(filename=file_path)
worksheet = gspread_bot.open("levelbot").sheet1
worksheet2 = gspread_bot.open("hf_discord_verified_users_test").sheet1

# --- Accounts that never earn experience ------------------------------------
bot_ids = [
    1136614989411655780,
    1166392942387265536,
    1158038249835610123,
    1130774761031610388,
    1155489509518098565,
    1155169841276260546,
    1152238037355474964,
    1154395078735953930,
]

# --- Hugging Face Hub client ------------------------------------------------
api = HfApi()

# --- In-memory tables -------------------------------------------------------
#csv_file = 'data.csv'
global_df = pd.DataFrame()
worksheet2_df = pd.DataFrame()
print(type(global_df))
community_global_df = pd.DataFrame()

# Both sheets are fetched once at import time through their CSV export URLs.
data = pd.read_csv(
    "https://docs.google.com/spreadsheets/d/1hQSsIg1Y9WdBF_CdNM1L1rUUREoxKqRTe3_ILo-WK8w/export?format=csv&gid=0"
)
data2 = pd.read_csv(
    "https://docs.google.com/spreadsheets/d/1T_twNONDSZ8zw7aDcYhw92DlawqPktti1xFw9ssJ13Y/export?format=csv&gid=0"
)
@bot.event
async def on_ready():
    """Load the sheet snapshots into the in-memory tables and start the leaderboard loop.

    `global_df` is bound to the module-level `data` frame (same object, not a
    copy) and `worksheet2_df` to a copy of `data2`; their ID columns are cast
    to `str`. Any exception is caught and printed.

    discord.py may dispatch `on_ready` more than once (for example after a
    reconnect), and starting an already-running `tasks.loop` raises
    `RuntimeError`, so the loop is only started when it is not running yet.
    """
    global global_df
    global worksheet2_df
    try:
        await asyncio.sleep(1.1)
        print(f'Logged in as {bot.user.name}')
        print(f"XP_PER_MESSAGE: {XP_PER_MESSAGE}")

        # import data from google sheets -> HF Space df
        # (doesn't make API call this way, as it's read-only)
        data['discord_user_id'] = data['discord_user_id'].astype(str)
        global_df = data
        print(f"csv successfully retrieved: \n {global_df}")

        worksheet2_df = data2.copy()
        worksheet2_df['discord_user_id'] = worksheet2_df['discord_user_id'].astype(str)
        worksheet2_df['id_recover_test'] = worksheet2_df['id_recover_test'].astype(str)
        print(worksheet2_df.dtypes)

        # updates both leaderboards; guarded because on_ready can fire again
        if not remove_huggingfolks.is_running():
            remove_huggingfolks.start()
        #await periodic_api_test()
        print(f"------------------------------------------------------------------------")
    except Exception as e:
        print(f"on_ready Error: {e}")
def update_google_sheet():
    """Push the in-memory `global_df` to the `worksheet` Google sheet.

    Writes the frame with `set_with_dataframe` and then applies a TEXT number
    format to column A (the original note counts this as 2 API calls). Any
    exception is caught and printed; nothing is returned.
    """
    try:
        print("Updating google sheets...")
        name = "levelbot"
        #worksheet = gspread_bot.open(name).sheet1

        ids_as_text = global_df['discord_user_id'].astype(str)
        global_df['discord_user_id'] = ids_as_text
        # could just do this / format
        set_with_dataframe(worksheet, global_df)

        # very important, otherwise gspread will force format IDs in scientific
        # notation by default (making them unusable)
        last_row = len(global_df.index) + 1
        text_format = {"numberFormat": {"type": 'TEXT'}}
        worksheet.format(f"A1:A{last_row}", text_format)

        timestamp = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
        print(f"Google sheet {name} successfully updated at {timestamp}! \n{global_df}")
        print(f"------------------------------------------------------------------------")
    except Exception as e:
        print(f"update_google_sheet Error: {e}")
# Background job: run update_google_sheet once a minute on a single worker,
# with at most one instance of the job active at a time.
executor = ThreadPoolExecutor(max_workers=1)
scheduler = BackgroundScheduler(executors={'default': executor})
scheduler.add_job(
    update_google_sheet,
    trigger='interval',
    minutes=1,
    max_instances=1,
)
scheduler.start()
def calculate_level(xp):
    """Return the level for `xp`: the largest integer whose cube is <= xp.

    The float expression ``xp ** (1/3)`` lands just below the true root for
    many perfect cubes (64 -> 3.999..., 1000 -> 9.999...), so truncating it
    reports one level too low exactly on a level threshold. The float value is
    therefore only used as a first guess and corrected with integer arithmetic.

    Args:
        xp: Experience total (int, float or NumPy scalar).

    Returns:
        The level as a Python int; 0 for zero or negative experience.
    """
    xp = int(xp)
    if xp <= 0:
        return 0
    level = round(xp ** (1.0 / 3.0))
    # Correct the floating-point estimate in either direction.
    while level ** 3 > xp:
        level -= 1
    while (level + 1) ** 3 <= xp:
        level += 1
    return level
def calculate_xp(level):
    """Return the experience needed for `level`: the cube of level, truncated to int."""
    cubed = pow(level, 3)
    return int(cubed)
# Hugging Face user names that periodic_api_test has already fetched
# successfully; it skips any name found here.
processed_users = set()
async def periodic_api_test():  # needs rewrite, can do same thing and interact with csv -> push to google sheets
    """Fetch Hub overview statistics for every user in `worksheet2_df`.

    For each `hf_user_name` not yet in `processed_users`, the user's overview
    endpoint is requested and, on HTTP 200, the seven counters are written
    into the `likes`..`upvotes` column slice of that row. Users are added to
    `processed_users` only after a successful fetch. Any exception is caught
    and printed, which ends the run.

    The HTTP request is executed in the default executor with a timeout:
    calling blocking `requests.get` directly inside a coroutine would stall
    the event loop for the whole duration of every request.
    """
    # this should be gspread type function (do not mix with discord at all)
    global worksheet2_df
    try:
        pd.set_option('display.max_rows', 30)
        loop = asyncio.get_running_loop()
        stat_keys = (
            "numLikes",
            "numModels",
            "numDatasets",
            "numSpaces",
            "numDiscussions",
            "numPapers",
            "numUpvotes",
        )
        # NOTE(review): `index` is the enumerate position and is used as a row
        # label below, which assumes worksheet2_df has a default 0..n-1 index.
        for index, user in enumerate(worksheet2_df['hf_user_name']):
            if user in processed_users:
                continue
            await asyncio.sleep(0.5)
            url = f"https://huggingface.co/api/users/{user}/overview"
            response = await loop.run_in_executor(
                None, lambda: requests.get(url, timeout=10)
            )
            if response.status_code == 200:
                overview = response.json()
                stats = [overview[key] for key in stat_keys]
                worksheet2_df.loc[index:index, 'likes':'upvotes'] = [stats]
                print(worksheet2_df)
                processed_users.add(user)
                print(processed_users)
            else:
                print(f"Failed to retrieve data for user {user}. Status code: {response.status_code}")
    except Exception as e:
        print(f"periodic_api_test Error: {e}")
# Role IDs for levels 1..30, in level order (position 0 is level 1).
_LEVEL_ROLE_IDS = (
    1171861537699397733,  # lvl1
    1171861595115245699,  # lvl2
    1171861626715115591,  # lvl3
    1171861657975259206,  # lvl4
    1171861686580412497,  # lvl5
    1171861900301172736,  # lvl6
    1171861936258941018,  # lvl7
    1171861968597024868,  # lvl8
    1171862009982242836,  # lvl9
    1164188093713223721,  # lvl10
    1171524944354607104,  # lvl11
    1171524990257082458,  # lvl12
    1171525021928263791,  # lvl13
    1171525062201966724,  # lvl14
    1171525098465918996,  # lvl15
    1176826165546201099,  # lvl16
    1176826221301092392,  # lvl17
    1176826260643659776,  # lvl18
    1176826288816791693,  # lvl19
    1176826319447801896,  # lvl20
    1195030831174008902,  # lvl21
    1195030883351150592,  # lvl22
    1196055555006009445,  # lvl23
    1196055640917938216,  # lvl24
    1196055712506318869,  # lvl25
    1196055775924195378,  # lvl26
    1196055837018435664,  # lvl27
    1196055908267081849,  # lvl28
    1196055970804150352,  # lvl29
    1196056027720847380,  # lvl30
)


def _leaderboard_rank(member_id):
    """Return the 1-based rank of `member_id` by `discord_exp`, or None if it has no row."""
    row = global_df[global_df['discord_user_id'] == str(member_id)]
    if row.empty:
        print(f"Discord ID {member_id} not found in the DataFrame.")
        return None
    target_exp = row['discord_exp'].values[0]
    rank = (global_df['discord_exp'] > target_exp).sum() + 1
    print(f"The rank for discord_id {member_id} based on discord_exp is: {rank}")
    return rank


def _build_levelup_embed(member, current_level, rank):
    """Build the level-up embed that is sent to `member` by direct message."""
    embed = Embed(color=Color.blue())
    embed.set_author(name=f"{member}", icon_url=member.avatar.url if member.avatar else bot.user.avatar.url)
    embed.title = f"Level Up! `{current_level-1}` -> `{current_level}`"
    msg = f'🤗 Congrats {member}! You just leveled up in the Hugging Face Discord server'
    embed.description = f"{msg}."
    shown_rank = rank if rank is not None else "N/A"
    embed.add_field(name="Leaderboard Ranking:", value=f"👑 **{shown_rank}**\n\nhttps://discord.com/channels/879548962464493619/1197143964994773023", inline=True)
    # can use ^ to track changes in leaderboard ranking and display in levelup message when climbing
    # (green red arrow thingies)
    # could also pull ranks above and below yourself (if they exist, i.e.)
    # 1 nateraw
    # 2 [you are here]
    # 3 osanseviero
    # also, ahead by how much exp, how many levels maybe
    msg3 = "- Posting\n- Reacting / being reacted to\n- Being active on the Hugging Face Hub (verify to link your Hub + Discord accounts!)"
    embed.add_field(name="How to Level Up:", value=msg3, inline=True)
    verification_link = "https://discord.com/channels/879548962464493619/900125909984624713"
    embed.add_field(name="Verify Here:", value=verification_link, inline=True)
    return embed


async def add_exp(member_id):
    """Add `XP_PER_MESSAGE` experience to `member_id`, creating a record if needed.

    Uses member_id to create a new record or update an old one in `global_df`
    (first column = Discord ID as string, `discord_exp` = experience).

    For an existing record the experience is incremented; when the resulting
    level is between 2 and 30 and the member does not yet hold that level's
    role, the role is granted, the previous level's role is removed and a
    level-up embed is sent by DM. For an unknown ID a new row
    `[id, name, xp, level]` is appended.

    Args:
        member_id: Discord user ID (int) of the member to reward.

    Returns:
        None. Every exception is caught and printed.
    """
    global global_df
    try:
        await asyncio.sleep(0.1)
        guild = bot.get_guild(879548962464493619)
        if guild is None:
            # Guild not in the cache: no roles or member to work with.
            print(f"add_exp Error: guild not available, skipping {member_id}")
            return
        # bot.get_user == User, guild.get_member == Member (not the same thing!)
        member = guild.get_member(member_id)
        lvls = {
            level: guild.get_role(role_id)
            for level, role_id in enumerate(_LEVEL_ROLE_IDS, start=1)
        }

        # xp = int64
        # member_name = string
        # discord_user_id = string
        member_key = str(member_id)
        # Resolve matching rows before any await, so rows appended by other
        # coroutines while this one is suspended cannot disturb the iteration.
        matching_rows = list(global_df.index[global_df.iloc[:, 0] == member_key])
        member_found = bool(matching_rows)

        for index in matching_rows:
            print(f"Record for {member} found at row {index + 1}, column 1")
            # increment the old experience value (better not to replace outright)
            old_xp = global_df.loc[index, 'discord_exp']
            new_xp = old_xp + XP_PER_MESSAGE
            global_df.loc[index, 'discord_exp'] = new_xp  # do not change column name
            print(f"Record for {member} updated from {old_xp} to {global_df.loc[index, 'discord_exp']} (+{XP_PER_MESSAGE}) ")

            # level up
            # NOTE(review): only discord_exp is written back here; the level
            # column stored when the row was created is not refreshed - confirm
            # whether that is intended.
            current_level = calculate_level(new_xp)
            print(f"Current_level for {member}: {current_level}")

            if member is None:
                # The ID has a record but is not a guild member: keep the
                # experience, skip roles and DM.
                print(f"Member {member_id} is not in the guild; skipping role update")
            elif 2 <= current_level <= 30:
                current_role = lvls[current_level]
                if current_role not in member.roles:  # if we leveled up
                    await member.add_roles(current_role)
                    print(f"Level Up! Gave {member} {current_role}")
                    await member.remove_roles(lvls[current_level-1])
                    print(f"Removed {lvls[current_level-1]} from {member}")
                    #print(f"{member} Level up! {current_level-1} -> {current_level}!")
                    if current_role in member.roles:  # needs update; reference exp reward for verification
                        rank = _leaderboard_rank(member_id)
                        embed = _build_levelup_embed(member, current_level, rank)
                        try:
                            await member.send(embed=embed)
                            print(f"Sent levelup embed to {member}")
                        except discord.HTTPException as dm_error:
                            # e.g. the member does not accept DMs; the role
                            # change above has already been applied.
                            print(f"Could not send levelup embed to {member}: {dm_error}")
                        #You can verify your account to earn 100 points! To verify, do A.
            print(f"------------------------------------------------------------------------")

        if not member_found:
            if member is None:
                print(f"Member {member_id} is not in the guild; no record created")
                return
            # if not, create new record
            print(f"creating new record for {member}")
            xp = XP_PER_MESSAGE
            member_name = str(member.name)
            current_level = calculate_level(xp)
            row_data = [member_key, member_name, xp, current_level]
            global_df.loc[len(global_df.index)] = row_data
            # initial role assignment
            lvl1 = lvls[1]
            if current_level == 1:
                if lvl1 not in member.roles:
                    await member.add_roles(lvl1)
                    print(f"Gave {member} {lvl1}")  # can log this better
            print(f"------------------------------------------------------------------------")
    except Exception as e:
        print(f"add_exp Error: {e}")
@bot.event
async def on_message(message):
    """Award experience for a message, then let the command framework process it.

    Authors whose ID is in `bot_ids` earn nothing. Messages that invoke the
    experience help command earn nothing either: the command is registered as
    `xp_help`, so "!xp_help" is exempt, and the older "!help_xp" spelling that
    was checked before stays exempt as well. Exceptions are caught and printed.
    """
    try:
        exempt_markers = ("!xp_help", "!help_xp")
        if message.author.id not in bot_ids:  # could change to if author does not have bot role (roleid)
            if not any(marker in message.content for marker in exempt_markers):
                print(f"adding exp from message {message.author}")
                await asyncio.sleep(0.1)
                await add_exp(message.author.id)
        await bot.process_commands(message)
    except Exception as e:
        print(f"on_message Error: {e}")
@bot.event
async def on_reaction_add(reaction, user):
    """Award experience to the reacting user and to the author of the reacted message.

    Nothing happens when the reacting user is listed in `bot_ids`. The message
    author is rewarded only when they are not in `bot_ids` either, so that bot
    accounts are kept out of the experience table the same way `on_message`
    keeps them out. Exceptions are caught and printed.
    """
    try:
        if user.id in bot_ids:
            return
        print(f"adding exp from react {user}")
        await asyncio.sleep(0.1)
        await add_exp(user.id)

        author_id = reaction.message.author.id
        if author_id not in bot_ids:
            await asyncio.sleep(0.1)
            await add_exp(author_id)
    except Exception as e:
        print(f"on_reaction_add Error: {e}")
@tasks.loop(minutes=1)
async def remove_huggingfolks():
    """Rebuild the community leaderboard and refresh the pinned Discord message.

    Rows whose first column matches the ID of a guild member holding role
    897376942817419265 are removed from a copy of `global_df`; the first
    column is dropped, `discord_exp` is made numeric and rows are ordered by
    it, highest first. The result is published as `community_global_df` and
    its top 30 rows are rendered into the leaderboard message.

    The frame is assembled in a local variable and assigned to the global in
    one step, so readers of `community_global_df` never observe a half-built
    table that still contains the ID column. The medal column is sized to the
    number of rows actually present, so fewer than 30 members no longer raises
    a length-mismatch error. Exceptions are caught and printed.
    """
    global community_global_df
    try:
        guild = bot.get_guild(879548962464493619)
        if guild is None:
            print("remove_huggingfolks Error: guild not available yet")
            return
        role = discord.utils.get(guild.roles, id=897376942817419265)

        # remove huggingfolks
        excluded_ids = {str(member.id) for member in guild.members if role in member.roles}
        board = global_df[~global_df.iloc[:, 0].isin(excluded_ids)].copy()
        board = board.drop(board.columns[0], axis=1)
        board['discord_exp'] = pd.to_numeric(board['discord_exp'])
        board = board.nlargest(len(board), 'discord_exp')
        community_global_df = board
        #print(community_global_df)

        top_30_exp = board.nlargest(30, 'discord_exp').copy()
        medals = ['🥇', '🥈', '🥉'] + [''] * 27
        top_30_exp['D'] = medals[:len(top_30_exp)]
        top_30_rows = top_30_exp.values.tolist()
        #print(top_30_rows)

        channel = bot.get_channel(1197143964994773023)
        message = await channel.fetch_message(1197148293164187678)
        # put into message / leaderboard
        new_table = tabulate(top_30_rows, headers=["Name", "Experience", "Level", "Rank"], tablefmt="plain")
        await message.edit(content=f"Updated Leaderboard:\n```\n{new_table}\n```")
        print(f"Updated discord leaderboard!")
    except Exception as e:
        print(f"remove_huggingfolks Error: {e}")
@bot.command(name='xp_help')
async def xp_help(ctx):
    """Send the invoking user a direct message explaining how experience is earned.

    A failure (for example when the DM cannot be delivered) is caught and
    printed under this command's own name; it was previously reported as an
    "on_message" error, which pointed at the wrong handler.
    """
    try:
        help_message = "How to earn Discord / Hub exp: Post messages, react, Like, discuss, create repos and papers"
        await ctx.author.send(help_message)
    except Exception as e:
        print(f"xp_help Error: {e}")
@bot.command()
async def count_users_with_role(ctx, role_id):
    """Reply with the number of guild members that hold the role `role_id`.

    Args:
        ctx: Command invocation context.
        role_id: Role ID as typed by the user (a string of digits).

    Invalid input is answered with a short message instead of raising: a
    non-numeric ID, an ID that matches no role in the guild, and use outside a
    guild (where `ctx.guild` is None) are each handled. The raw input is
    deliberately not echoed back, so a crafted argument cannot be reflected
    into the channel.
    """
    if ctx.guild is None:
        await ctx.send("This command can only be used inside a server.")
        return
    try:
        wanted_id = int(role_id)
    except ValueError:
        await ctx.send("The role ID must be a number.")
        return

    role = discord.utils.get(ctx.guild.roles, id=wanted_id)
    if role is None:
        await ctx.send(f"No role with ID {wanted_id} exists in this server.")
        return

    count = sum(1 for member in ctx.guild.members if role in member.roles)
    await ctx.send(f"Number of users with the role '{role.name}': {count}")
# embeds with user pfps?
# name, pfp, time in server....
# weekly do different count
# count number of messages per user for every channel (total messages)
# fix sheet if necessary
# add emojis for some color
# check if members are still in the server
# --- Start the Discord client on its own thread ------------------------------
DISCORD_TOKEN = os.environ.get("DISCORD_TOKEN")


def run_bot():
    """Run the Discord client with DISCORD_TOKEN (used as the thread target below)."""
    bot.run(DISCORD_TOKEN)


threading.Thread(target=run_bot).start()

# CSV export address of the sheet, derived from its edit URL.
URL = "https://docs.google.com/spreadsheets/d/1hQSsIg1Y9WdBF_CdNM1L1rUUREoxKqRTe3_ILo-WK8w/edit#gid=0"
csv_url = URL.replace('/edit#gid=', '/export?format=csv&gid=')
def get_data():
    """Return the current `community_global_df` (polled by the gradio table).

    Returns:
        The module-level `community_global_df`, or None when reading it
        fails; the failure is printed under this function's own name (it was
        previously mislabelled as an "on_message" error).
    """
    try:
        return community_global_df
    except Exception as e:
        print(f"get_data Error: {e}")
# Gradio front-end: a periodically refreshed leaderboard table next to a bar
# plot of how many members are at each level.
demo = gr.Blocks()
with demo:
    try:
        dataframe1 = pd.read_csv(csv_url)

        # Levels and their member counts both come from the same snapshot
        # (column 3 of dataframe1). Counting from a separately downloaded
        # frame could leave a level without a count if the two downloads
        # differed.
        level_counts = dataframe1.iloc[:, 3].value_counts().sort_index()
        dataframe2 = pd.DataFrame({
            'Levels': level_counts.index,
            'Members': level_counts.values,
        })
        print("\nDataframe 2:")
        print(dataframe2)

        TITLE = """<h1 align="center" id="space-title">🤗 Hugging Face Level Leaderboard</h1>"""
        gr.HTML(TITLE)
        with gr.Tabs(elem_classes="tab-buttons") as tabs:
            with gr.TabItem("🏅 Level leaderboard", elem_id="level-table", id=0):
                #gr.Markdown("# 📈 Experience Leaderboard")
                with gr.Row():
                    with gr.Column():
                        # get_data is re-evaluated through `every=5`
                        gr.DataFrame(get_data, every=5, height=500, interactive=False, col_count=(3, "fixed"), column_widths=["100px","100px","100px"])
                    with gr.Column():
                        gr.BarPlot(
                            value=dataframe2,
                            x="Levels",
                            y="Members",
                            title="Level Distribution",
                            height=450,
                            width=450,
                            interactive=False
                        )
            #with gr.TabItem("📈 Members of the Week", elem_id="week-table", id=1):
            #with gr.TabItem("📈 Hub-only leaderboard", elem_id="hub-table", id=2):
    except Exception as e:
        print(f"gradio demo Error: {e}")
demo.queue().launch()