Clémentine committed on
Commit
05bda40
1 Parent(s): c2cc6bf

change model types available at submission time

Browse files
app.py CHANGED
@@ -102,7 +102,7 @@ def update_table(
102
  hide_models: list,
103
  query: str,
104
  ):
105
- filtered_df = filter_models(hidden_df, type_query, size_query, precision_query, hide_models)
106
  filtered_df = filter_queries(query, filtered_df)
107
  df = select_columns(filtered_df, columns)
108
  return df
 
102
  hide_models: list,
103
  query: str,
104
  ):
105
+ filtered_df = filter_models(df=hidden_df, type_query=type_query, size_query=size_query, precision_query=precision_query, hide_models=hide_models)
106
  filtered_df = filter_queries(query, filtered_df)
107
  df = select_columns(filtered_df, columns)
108
  return df
src/display/about.py CHANGED
@@ -56,9 +56,8 @@ Side note on the baseline scores:
56
  ## Icons
57
  - {ModelType.PT.to_str(" : ")} model: new, base models, trained on a given corpora
58
  - {ModelType.FT.to_str(" : ")} model: pretrained models finetuned on more data
59
- Specific fine-tune subcategories (more adapted to chat):
60
- - {ModelType.IFT.to_str(" : ")} model: instruction fine-tunes, which are model fine-tuned specifically on datasets of task instruction
61
- - {ModelType.RL.to_str(" : ")} model: reinforcement fine-tunes, which usually change the model loss a bit with an added policy.
62
  If there is no icon, we have not uploaded the information on the model yet, feel free to open an issue with the model information!
63
 
64
  "Flagged" indicates that this model has been flagged by the community, and should probably be ignored! Clicking the link will redirect you to the discussion about the model.
 
56
  ## Icons
57
  - {ModelType.PT.to_str(" : ")} model: new, base models, trained on a given corpora
58
  - {ModelType.FT.to_str(" : ")} model: pretrained models finetuned on more data
59
+ - {ModelType.chat.to_str(" : ")} model: chat like fine-tunes, either using IFT (datasets of task instruction), RLHF or DPO (changing the model loss a bit with an added policy), etc
60
+ - {ModelType.merges.to_str(" : ")} model: merges or MoErges, models which have been merged or fused without additional fine-tuning.
 
61
  If there is no icon, we have not uploaded the information on the model yet, feel free to open an issue with the model information!
62
 
63
  "Flagged" indicates that this model has been flagged by the community, and should probably be ignored! Clicking the link will redirect you to the discussion about the model.
src/display/utils.py CHANGED
@@ -120,9 +120,9 @@ class ModelDetails:
120
 
121
  class ModelType(Enum):
122
  PT = ModelDetails(name="pretrained", symbol="🟢")
123
- FT = ModelDetails(name="fine-tuned", symbol="🔶")
124
- IFT = ModelDetails(name="instruction-tuned", symbol="")
125
- RL = ModelDetails(name="RL-tuned", symbol="🟦")
126
  Unknown = ModelDetails(name="", symbol="?")
127
 
128
  def to_str(self, separator=" "):
@@ -134,10 +134,10 @@ class ModelType(Enum):
134
  return ModelType.FT
135
  if "pretrained" in type or "🟢" in type:
136
  return ModelType.PT
137
- if "RL-tuned" in type or "🟦" in type:
138
- return ModelType.RL
139
- if "instruction-tuned" in type or "" in type:
140
- return ModelType.IFT
141
  return ModelType.Unknown
142
 
143
  class WeightType(Enum):
 
120
 
121
  class ModelType(Enum):
122
  PT = ModelDetails(name="pretrained", symbol="🟢")
123
+ FT = ModelDetails(name="fine-tuned on domain-specific datasets", symbol="🔶")
124
+ chat = ModelDetails(name="chat models (RLHF, DPO, IFT, ...)", symbol="💬")
125
+ merges = ModelDetails(name="merges and moerges", symbol="🤝")
126
  Unknown = ModelDetails(name="", symbol="?")
127
 
128
  def to_str(self, separator=" "):
 
134
  return ModelType.FT
135
  if "pretrained" in type or "🟢" in type:
136
  return ModelType.PT
137
+ if any([k in type for k in ["instruction-tuned", "RL-tuned", "chat", "🟦", "⭕", "💬"]]):
138
+ return ModelType.chat
139
+ if "merge" in type or "🤝" in type:
140
+ return ModelType.merges
141
  return ModelType.Unknown
142
 
143
  class WeightType(Enum):
src/leaderboard/filter_models.py CHANGED
@@ -133,6 +133,6 @@ def remove_forbidden_models(leaderboard_data: list[dict]):
133
  return leaderboard_data
134
 
135
 
136
- def filter_models(leaderboard_data: list[dict]):
137
  leaderboard_data = remove_forbidden_models(leaderboard_data)
138
  flag_models(leaderboard_data)
 
133
  return leaderboard_data
134
 
135
 
136
+ def filter_models_flags(leaderboard_data: list[dict]):
137
  leaderboard_data = remove_forbidden_models(leaderboard_data)
138
  flag_models(leaderboard_data)
src/populate.py CHANGED
@@ -5,7 +5,7 @@ import pandas as pd
5
 
6
  from src.display.formatting import has_no_nan_values, make_clickable_model
7
  from src.display.utils import AutoEvalColumn, EvalQueueColumn, baseline_row
8
- from src.leaderboard.filter_models import filter_models
9
  from src.leaderboard.read_evals import get_raw_eval_results
10
 
11
 
@@ -13,7 +13,7 @@ def get_leaderboard_df(results_path: str, requests_path: str, dynamic_path: str,
13
  raw_data = get_raw_eval_results(results_path=results_path, requests_path=requests_path, dynamic_path=dynamic_path)
14
  all_data_json = [v.to_dict() for v in raw_data]
15
  all_data_json.append(baseline_row)
16
- filter_models(all_data_json)
17
 
18
  df = pd.DataFrame.from_records(all_data_json)
19
  df = df.sort_values(by=[AutoEvalColumn.average.name], ascending=False)
 
5
 
6
  from src.display.formatting import has_no_nan_values, make_clickable_model
7
  from src.display.utils import AutoEvalColumn, EvalQueueColumn, baseline_row
8
+ from src.leaderboard.filter_models import filter_models_flags
9
  from src.leaderboard.read_evals import get_raw_eval_results
10
 
11
 
 
13
  raw_data = get_raw_eval_results(results_path=results_path, requests_path=requests_path, dynamic_path=dynamic_path)
14
  all_data_json = [v.to_dict() for v in raw_data]
15
  all_data_json.append(baseline_row)
16
+ filter_models_flags(all_data_json)
17
 
18
  df = pd.DataFrame.from_records(all_data_json)
19
  df = df.sort_values(by=[AutoEvalColumn.average.name], ascending=False)
src/scripts/update_all_request_files.py CHANGED
@@ -3,6 +3,7 @@ from huggingface_hub import ModelCard
3
 
4
  import json
5
  import time
 
6
  from src.submission.check_validity import is_model_on_hub, check_model_card, get_model_tags
7
  from src.envs import DYNAMIC_INFO_REPO, DYNAMIC_INFO_PATH, DYNAMIC_INFO_FILE_PATH, API, H4_TOKEN
8
 
@@ -85,3 +86,4 @@ def update_dynamic_files():
85
  commit_message=f"Daily request file update.",
86
  )
87
  print(f"UPDATE_DYNAMIC: pushed to hub")
 
 
3
 
4
  import json
5
  import time
6
+
7
  from src.submission.check_validity import is_model_on_hub, check_model_card, get_model_tags
8
  from src.envs import DYNAMIC_INFO_REPO, DYNAMIC_INFO_PATH, DYNAMIC_INFO_FILE_PATH, API, H4_TOKEN
9
 
 
86
  commit_message=f"Daily request file update.",
87
  )
88
  print(f"UPDATE_DYNAMIC: pushed to hub")
89
+
update_dynamic.py ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ from src.scripts.update_all_request_files import update_dynamic_files
2
+
3
+ if __name__ == "__main__":
4
+ update_dynamic_files()