lixuejing commited on
Commit
8545ff9
·
1 Parent(s): ff205eb

update metric

Browse files
app.py CHANGED
@@ -29,12 +29,13 @@ from src.display.utils import (
29
  from src.envs import API, EVAL_REQUESTS_PATH, EVAL_RESULTS_PATH, QUEUE_REPO, REPO_ID, RESULTS_REPO, TOKEN
30
  from src.populate import get_evaluation_queue_df, get_leaderboard_df
31
  from src.submission.submit import add_new_eval
32
- #from src.tools.collections import update_collections
33
- #from src.tools.plots import (
34
- # create_metric_plot_obj,
35
- # create_plot_df,
36
- # create_scores_df,
37
- #)
 
38
 
39
  def restart_space():
40
  API.restart_space(repo_id=REPO_ID)
@@ -58,18 +59,18 @@ def init_space():
58
  except Exception:
59
  restart_space()
60
 
61
- #raw_data, original_df = get_leaderboard_df(
62
- leaderboard_df = get_leaderboard_df(
63
  results_path=EVAL_RESULTS_PATH,
64
  requests_path=EVAL_REQUESTS_PATH,
65
  #dynamic_path=DYNAMIC_INFO_FILE_PATH,
66
  cols=COLS,
67
  benchmark_cols=BENCHMARK_COLS
68
  )
69
- #update_collections(original_df.copy())
70
- #leaderboard_df = original_df.copy()
71
 
72
- #plot_df = create_plot_df(create_scores_df(raw_data))
73
 
74
  (
75
  finished_eval_queue_df,
@@ -77,11 +78,12 @@ def init_space():
77
  pending_eval_queue_df,
78
  ) = get_evaluation_queue_df(EVAL_REQUESTS_PATH, EVAL_COLS)
79
 
80
- #return leaderboard_df, original_df, plot_df, finished_eval_queue_df, running_eval_queue_df, pending_eval_queue_df
81
- #leaderboard_df, original_df, plot_df, finished_eval_queue_df, running_eval_queue_df, pending_eval_queue_df = init_space()
82
- return leaderboard_df, finished_eval_queue_df, running_eval_queue_df, pending_eval_queue_df
 
83
 
84
- leaderboard_df, finished_eval_queue_df, running_eval_queue_df, pending_eval_queue_df = init_space()
85
 
86
 
87
  # Searching and filtering
@@ -297,8 +299,8 @@ with demo:
297
 
298
  # Dummy leaderboard for handling the case when the user uses backspace key
299
  hidden_leaderboard_table_for_search = gr.components.Dataframe(
300
- #value=original_df[COLS],
301
- value=leaderboard_df[COLS],
302
  headers=COLS,
303
  datatype=TYPES,
304
  visible=False,
@@ -351,6 +353,23 @@ with demo:
351
  queue=True,
352
  )
353
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
354
  with gr.TabItem("📝 About", elem_id="llm-benchmark-tab-table", id=2):
355
  gr.Markdown(LLM_BENCHMARKS_TEXT, elem_classes="markdown-text")
356
 
@@ -453,5 +472,6 @@ with demo:
453
 
454
  scheduler = BackgroundScheduler()
455
  scheduler.add_job(restart_space, "interval", seconds=1800)
 
456
  scheduler.start()
457
  demo.queue(default_concurrency_limit=40).launch()
 
29
  from src.envs import API, EVAL_REQUESTS_PATH, EVAL_RESULTS_PATH, QUEUE_REPO, REPO_ID, RESULTS_REPO, TOKEN
30
  from src.populate import get_evaluation_queue_df, get_leaderboard_df
31
  from src.submission.submit import add_new_eval
32
+ from src.scripts.update_all_request_files import update_dynamic_files
33
+ from src.tools.collections import update_collections
34
+ from src.tools.plots import (
35
+ create_metric_plot_obj,
36
+ create_plot_df,
37
+ create_scores_df,
38
+ )
39
 
40
  def restart_space():
41
  API.restart_space(repo_id=REPO_ID)
 
59
  except Exception:
60
  restart_space()
61
 
62
+ raw_data, original_df = get_leaderboard_df(
63
+ #leaderboard_df = get_leaderboard_df(
64
  results_path=EVAL_RESULTS_PATH,
65
  requests_path=EVAL_REQUESTS_PATH,
66
  #dynamic_path=DYNAMIC_INFO_FILE_PATH,
67
  cols=COLS,
68
  benchmark_cols=BENCHMARK_COLS
69
  )
70
+ update_collections(original_df.copy())
71
+ leaderboard_df = original_df.copy()
72
 
73
+ plot_df = create_plot_df(create_scores_df(raw_data))
74
 
75
  (
76
  finished_eval_queue_df,
 
78
  pending_eval_queue_df,
79
  ) = get_evaluation_queue_df(EVAL_REQUESTS_PATH, EVAL_COLS)
80
 
81
+ return leaderboard_df, original_df, plot_df, finished_eval_queue_df, running_eval_queue_df, pending_eval_queue_df
82
+
83
+ leaderboard_df, original_df, plot_df, finished_eval_queue_df, running_eval_queue_df, pending_eval_queue_df = init_space()
84
+ #return leaderboard_df, finished_eval_queue_df, running_eval_queue_df, pending_eval_queue_df
85
 
86
+ #leaderboard_df, finished_eval_queue_df, running_eval_queue_df, pending_eval_queue_df = init_space()
87
 
88
 
89
  # Searching and filtering
 
299
 
300
  # Dummy leaderboard for handling the case when the user uses backspace key
301
  hidden_leaderboard_table_for_search = gr.components.Dataframe(
302
+ value=original_df[COLS],
303
+ #value=leaderboard_df[COLS],
304
  headers=COLS,
305
  datatype=TYPES,
306
  visible=False,
 
353
  queue=True,
354
  )
355
 
356
+ with gr.TabItem("📈 Metrics through time", elem_id="llm-benchmark-tab-table", id=4):
357
+ with gr.Row():
358
+ with gr.Column():
359
+ chart = create_metric_plot_obj(
360
+ plot_df,
361
+ [AutoEvalColumn.average.name],
362
+ title="Average of Top Scores and Human Baseline Over Time (from last update)",
363
+ )
364
+ gr.Plot(value=chart, min_width=500)
365
+ with gr.Column():
366
+ chart = create_metric_plot_obj(
367
+ plot_df,
368
+ BENCHMARK_COLS,
369
+ title="Top Scores and Human Baseline Over Time (from last update)",
370
+ )
371
+ gr.Plot(value=chart, min_width=500)
372
+
373
  with gr.TabItem("📝 About", elem_id="llm-benchmark-tab-table", id=2):
374
  gr.Markdown(LLM_BENCHMARKS_TEXT, elem_classes="markdown-text")
375
 
 
472
 
473
  scheduler = BackgroundScheduler()
474
  scheduler.add_job(restart_space, "interval", seconds=1800)
475
+ scheduler.add_job(update_dynamic_files, "cron", minute=30) # launched every hour on the hour
476
  scheduler.start()
477
  demo.queue(default_concurrency_limit=40).launch()
src/about.py CHANGED
@@ -12,17 +12,16 @@ class Task:
12
  # ---------------------------------------------------
13
  class Tasks(Enum):
14
  # task_key in the json file, metric_key in the json file, name to display in the leaderboard
15
- task0 = Task("cmmmu", "acc", "CMMMU")
16
- task1 = Task("cmmu", "acc", "CMMU")
17
- task2 = Task("cv_bench", "acc", "CV_Bench")
18
- task3 = Task("hallusion_bench", "acc", "Hallusion_Bench")
19
- task4 = Task("mmmu", "acc", "MMMU")
20
- task5 = Task("mmmu_pro_standard", "acc", "MMMU_Pro_Standard")
21
- task6 = Task("mmmu_pro_vision", "acc", "MMMU_Pro_Vision")
22
- task7 = Task("ocrbench", "acc", "OCRBench")
23
- task8 = Task("math_vision", "acc", "Math_Vision")
24
- task9 = Task("cvbench", "acc", "CVBench")
25
- task10 = Task("ciibench", "acc", "CIIBench")
26
 
27
  NUM_FEWSHOT = 0 # Change with your few shot
28
  # ---------------------------------------------------
 
12
  # ---------------------------------------------------
13
  class Tasks(Enum):
14
  # task_key in the json file, metric_key in the json file, name to display in the leaderboard
15
+ cmmmu = Task("cmmmu", "acc", "CMMMU")
16
+ cmmu = Task("cmmu", "acc", "CMMU")
17
+ cv_bench = Task("cv_bench", "acc", "CV_Bench")
18
+ hallusion_bench = Task("hallusion_bench", "acc", "Hallusion_Bench")
19
+ mmmu = Task("mmmu", "acc", "MMMU")
20
+ mmmu_pro_standard = Task("mmmu_pro_standard", "acc", "MMMU_Pro_Standard")
21
+ mmmu_pro_vision = Task("mmmu_pro_vision", "acc", "MMMU_Pro_Vision")
22
+ ocrbench = Task("ocrbench", "acc", "OCRBench")
23
+ math_vision = Task("math_vision", "acc", "Math_Vision")
24
+ ciibench = Task("ciibench", "acc", "CIIBench")
 
25
 
26
  NUM_FEWSHOT = 0 # Change with your few shot
27
  # ---------------------------------------------------
src/display/utils.py CHANGED
@@ -136,3 +136,47 @@ NUMERIC_INTERVALS = {
136
  "~60": pd.Interval(45, 70, closed="right"),
137
  "70+": pd.Interval(70, 10000, closed="right"),
138
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
136
  "~60": pd.Interval(45, 70, closed="right"),
137
  "70+": pd.Interval(70, 10000, closed="right"),
138
  }
139
+
140
+ # Define the baselines
141
+ baseline_row = {
142
+ AutoEvalColumn.model.name: "<p>Baseline</p>",
143
+ AutoEvalColumn.revision.name: "N/A",
144
+ AutoEvalColumn.precision.name: None,
145
+ AutoEvalColumn.average.name: 92.75,
146
+ AutoEvalColumn.merged.name: False,
147
+ AutoEvalColumn.cmmmu.name: 100,
148
+ AutoEvalColumn.cmmu.name: 100,
149
+ AutoEvalColumn.cv_bench.name: 100,
150
+ AutoEvalColumn.hallusion_bench.name: 100,
151
+ AutoEvalColumn.mmmu.name: 100,
152
+ AutoEvalColumn.mmmu_pro_standard.name: 100,
153
+ AutoEvalColumn.mmmu_pro_vision.name: 100,
154
+ AutoEvalColumn.ocrbench.name: 100,
155
+ AutoEvalColumn.math_vision.name: 100,
156
+ AutoEvalColumn.ciibench.name: 100,
157
+ AutoEvalColumn.dummy.name: "baseline",
158
+ AutoEvalColumn.model_type.name: "",
159
+ AutoEvalColumn.flagged.name: False,
160
+ }
161
+
162
+ # Define the human baselines
163
+ human_baseline_row = {
164
+ AutoEvalColumn.model.name: "<p>Human performance</p>",
165
+ AutoEvalColumn.revision.name: "N/A",
166
+ AutoEvalColumn.precision.name: None,
167
+ AutoEvalColumn.average.name: 92.75,
168
+ AutoEvalColumn.merged.name: False,
169
+ AutoEvalColumn.cmmmu.name: 100,
170
+ AutoEvalColumn.cmmu.name: 100,
171
+ AutoEvalColumn.cv_bench.name: 100,
172
+ AutoEvalColumn.hallusion_bench.name: 100,
173
+ AutoEvalColumn.mmmu.name: 100,
174
+ AutoEvalColumn.mmmu_pro_standard.name: 100,
175
+ AutoEvalColumn.mmmu_pro_vision.name: 100,
176
+ AutoEvalColumn.ocrbench.name: 100,
177
+ AutoEvalColumn.math_vision.name: 100,
178
+ AutoEvalColumn.ciibench.name: 100,
179
+ AutoEvalColumn.dummy.name: "human_baseline",
180
+ AutoEvalColumn.model_type.name: "",
181
+ AutoEvalColumn.flagged.name: False,
182
+ }
src/envs.py CHANGED
@@ -6,12 +6,18 @@ from huggingface_hub import HfApi
6
  # ----------------------------------
7
  TOKEN = os.environ.get("HF_TOKEN") # A read/write token for your org
8
 
9
- OWNER = "demo-leaderboard-backend" # Change to your org - don't forget to create a results and request dataset, with the correct format!
 
10
  # ----------------------------------
11
 
12
- REPO_ID = f"{OWNER}/leaderboard"
13
- QUEUE_REPO = f"{OWNER}/requests"
14
- RESULTS_REPO = f"{OWNER}/results"
 
 
 
 
 
15
 
16
  # If you setup a cache later, just change HF_HOME
17
  CACHE_PATH=os.getenv("HF_HOME", ".")
@@ -21,5 +27,8 @@ EVAL_REQUESTS_PATH = os.path.join(CACHE_PATH, "eval-queue")
21
  EVAL_RESULTS_PATH = os.path.join(CACHE_PATH, "eval-results")
22
  EVAL_REQUESTS_PATH_BACKEND = os.path.join(CACHE_PATH, "eval-queue-bk")
23
  EVAL_RESULTS_PATH_BACKEND = os.path.join(CACHE_PATH, "eval-results-bk")
 
 
24
 
 
25
  API = HfApi(token=TOKEN)
 
6
  # ----------------------------------
7
  TOKEN = os.environ.get("HF_TOKEN") # A read/write token for your org
8
 
9
+
10
+ #OWNER = "BAAI/open_flageval_vlm_leaderboard" # Change to your org - don't forget to create a results and request dataset, with the correct format!
11
  # ----------------------------------
12
 
13
+ #REPO_ID = f"{OWNER}/leaderboard"
14
+ #QUEUE_REPO = f"{OWNER}/requests"
15
+ #RESULTS_REPO = f"{OWNER}/results"
16
+ #DYNAMIC_INFO_REPO = f"{OWNER}/dynamic_model_information"
17
+ REPO_ID = "BAAI/open_flageval_vlm_leaderboard"
18
+ QUEUE_REPO = "open-cn-llm-leaderboard/vlm_requests"
19
+ DYNAMIC_INFO_REPO = "open-cn-llm-leaderboard/vlm_dynamic_model_information"
20
+ RESULTS_REPO = "open-cn-llm-leaderboard/vlm_results"
21
 
22
  # If you setup a cache later, just change HF_HOME
23
  CACHE_PATH=os.getenv("HF_HOME", ".")
 
27
  EVAL_RESULTS_PATH = os.path.join(CACHE_PATH, "eval-results")
28
  EVAL_REQUESTS_PATH_BACKEND = os.path.join(CACHE_PATH, "eval-queue-bk")
29
  EVAL_RESULTS_PATH_BACKEND = os.path.join(CACHE_PATH, "eval-results-bk")
30
+ DYNAMIC_INFO_PATH = os.path.join(CACHE_PATH, "dynamic-info")
31
+ DYNAMIC_INFO_FILE_PATH = os.path.join(DYNAMIC_INFO_PATH, "model_infos.json")
32
 
33
+ PATH_TO_COLLECTION = "open-cn-llm-leaderboard/flageval-vlm-leaderboard-best-models-677e51cdc44f8123e02cbda1"
34
  API = HfApi(token=TOKEN)
src/populate.py CHANGED
@@ -4,7 +4,7 @@ import os
4
  import pandas as pd
5
 
6
  from src.display.formatting import has_no_nan_values, make_clickable_model
7
- from src.display.utils import AutoEvalColumn, EvalQueueColumn
8
  from src.leaderboard.read_evals import get_raw_eval_results
9
  from src.leaderboard.filter_models import filter_models_flags
10
 
@@ -13,6 +13,7 @@ def get_leaderboard_df(results_path: str, requests_path: str, cols: list, benchm
13
  """Creates a dataframe from all the individual experiment results"""
14
  raw_data = get_raw_eval_results(results_path, requests_path)
15
  all_data_json = [v.to_dict() for v in raw_data]
 
16
  filter_models_flags(all_data_json)
17
 
18
  df = pd.DataFrame.from_records(all_data_json)
@@ -21,7 +22,7 @@ def get_leaderboard_df(results_path: str, requests_path: str, cols: list, benchm
21
 
22
  # filter out if any of the benchmarks have not been produced
23
  df = df[has_no_nan_values(df, benchmark_cols)]
24
- return df
25
 
26
 
27
  def get_evaluation_queue_df(save_path: str, cols: list) -> list[pd.DataFrame]:
 
4
  import pandas as pd
5
 
6
  from src.display.formatting import has_no_nan_values, make_clickable_model
7
+ from src.display.utils import AutoEvalColumn, EvalQueueColumn, baseline_row
8
  from src.leaderboard.read_evals import get_raw_eval_results
9
  from src.leaderboard.filter_models import filter_models_flags
10
 
 
13
  """Creates a dataframe from all the individual experiment results"""
14
  raw_data = get_raw_eval_results(results_path, requests_path)
15
  all_data_json = [v.to_dict() for v in raw_data]
16
+ all_data_json.append(baseline_row)
17
  filter_models_flags(all_data_json)
18
 
19
  df = pd.DataFrame.from_records(all_data_json)
 
22
 
23
  # filter out if any of the benchmarks have not been produced
24
  df = df[has_no_nan_values(df, benchmark_cols)]
25
+ return raw_data, df
26
 
27
 
28
  def get_evaluation_queue_df(save_path: str, cols: list) -> list[pd.DataFrame]:
src/scripts/create_request_file.py ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import json
2
+ import os
3
+ import pprint
4
+ from datetime import datetime, timezone
5
+
6
+ import click
7
+ from colorama import Fore
8
+ from huggingface_hub import HfApi, snapshot_download
9
+
10
+ from src.submission.check_validity import get_model_size
11
+ from src.display.utils import ModelType, WeightType
12
+
13
+ EVAL_REQUESTS_PATH = "eval-queue"
14
+ QUEUE_REPO = "open-cn-llm-leaderboard/vlm_requests"
15
+
16
+ precisions = ("float16", "bfloat16", "8bit (LLM.int8)", "4bit (QLoRA / FP4)", "GPTQ")
17
+ model_types = [e.name for e in ModelType]
18
+ weight_types = [e.name for e in WeightType]
19
+
20
+
21
+ def main():
22
+ api = HfApi()
23
+ current_time = datetime.now(timezone.utc).strftime("%Y-%m-%dT%H:%M:%SZ")
24
+ snapshot_download(repo_id=QUEUE_REPO, revision="main", local_dir=EVAL_REQUESTS_PATH, repo_type="dataset")
25
+
26
+ model_name = click.prompt("Enter model name")
27
+ revision = click.prompt("Enter revision", default="main")
28
+ precision = click.prompt("Enter precision", default="float16", type=click.Choice(precisions))
29
+ model_type = click.prompt("Enter model type", type=click.Choice(model_types))
30
+ weight_type = click.prompt("Enter weight type", default="Original", type=click.Choice(weight_types))
31
+ base_model = click.prompt("Enter base model", default="")
32
+ status = click.prompt("Enter status", default="FINISHED")
33
+
34
+ try:
35
+ model_info = api.model_info(repo_id=model_name, revision=revision)
36
+ except Exception as e:
37
+ print(f"{Fore.RED}Could not find model info for {model_name} on the Hub\n{e}{Fore.RESET}")
38
+ return 1
39
+
40
+ model_size = get_model_size(model_info=model_info, precision=precision)
41
+
42
+ try:
43
+ license = model_info.cardData["license"]
44
+ except Exception:
45
+ license = "?"
46
+
47
+ eval_entry = {
48
+ "model": model_name,
49
+ "base_model": base_model,
50
+ "revision": revision,
51
+ "private": False,
52
+ "precision": precision,
53
+ "weight_type": weight_type,
54
+ "status": status,
55
+ "submitted_time": current_time,
56
+ "model_type": model_type,
57
+ "likes": model_info.likes,
58
+ "params": model_size,
59
+ "license": license,
60
+ }
61
+
62
+ user_name = ""
63
+ model_path = model_name
64
+ if "/" in model_name:
65
+ user_name = model_name.split("/")[0]
66
+ model_path = model_name.split("/")[1]
67
+
68
+ pprint.pprint(eval_entry)
69
+
70
+ if click.confirm("Do you want to continue? This request file will be pushed to the hub"):
71
+ click.echo("continuing...")
72
+
73
+ out_dir = f"{EVAL_REQUESTS_PATH}/{user_name}"
74
+ os.makedirs(out_dir, exist_ok=True)
75
+ out_path = f"{out_dir}/{model_path}_eval_request_{False}_{precision}_{weight_type}.json"
76
+
77
+ with open(out_path, "w") as f:
78
+ # f.write(json.dumps(eval_entry))
79
+ json.dump(eval_entry, f, indent=4)
80
+
81
+ api.upload_file(
82
+ path_or_fileobj=out_path,
83
+ path_in_repo=out_path.split(f"{EVAL_REQUESTS_PATH}/")[1],
84
+ repo_id=QUEUE_REPO,
85
+ repo_type="dataset",
86
+ commit_message=f"Add {model_name} to eval queue",
87
+ )
88
+ else:
89
+ click.echo("aborting...")
90
+
91
+
92
+ if __name__ == "__main__":
93
+ main()
src/scripts/update_all_request_files.py ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #from huggingface_hub import ModelFilter, snapshot_download
2
+ from huggingface_hub import snapshot_download
3
+ from huggingface_hub import ModelCard
4
+
5
+ import json
6
+ import time
7
+
8
+ from src.submission.check_validity import is_model_on_hub, check_model_card, get_model_tags
9
+ from src.envs import DYNAMIC_INFO_REPO, DYNAMIC_INFO_PATH, DYNAMIC_INFO_FILE_PATH, API, TOKEN
10
+
11
+ def update_models(file_path, models):
12
+ """
13
+ Search through all JSON files in the specified root folder and its subfolders,
14
+ and update the likes key in JSON dict from value of input dict
15
+ """
16
+ with open(file_path, "r") as f:
17
+ model_infos = json.load(f)
18
+ for model_id, data in model_infos.items():
19
+ if model_id not in models:
20
+ data['still_on_hub'] = False
21
+ data['likes'] = 0
22
+ data['downloads'] = 0
23
+ data['created_at'] = ""
24
+ continue
25
+
26
+ model_cfg = models[model_id]
27
+ data['likes'] = model_cfg.likes
28
+ data['downloads'] = model_cfg.downloads
29
+ data['created_at'] = str(model_cfg.created_at)
30
+ #data['params'] = get_model_size(model_cfg, data['precision'])
31
+ data['license'] = model_cfg.card_data.license if model_cfg.card_data is not None else ""
32
+
33
+ # Is the model still on the hub?
34
+ model_name = model_id
35
+ if model_cfg.card_data is not None and model_cfg.card_data.base_model is not None:
36
+ model_name = model_cfg.card_data.base_model # for adapters, we look at the parent model
37
+ still_on_hub, _, _ = is_model_on_hub(
38
+ model_name=model_name, revision=data.get("revision"), trust_remote_code=True, test_tokenizer=False, token=TOKEN
39
+ )
40
+ # If the model doesn't have a model card or a license, we consider it's deleted
41
+ if still_on_hub:
42
+ try:
43
+ status, _, model_card = check_model_card(model_id)
44
+ if status is False:
45
+ still_on_hub = False
46
+ except Exception:
47
+ model_card = None
48
+ still_on_hub = False
49
+ data['still_on_hub'] = still_on_hub
50
+
51
+ tags = get_model_tags(model_card, model_id) if still_on_hub else []
52
+
53
+ data["tags"] = tags
54
+
55
+ with open(file_path, 'w') as f:
56
+ json.dump(model_infos, f, indent=2)
57
+
58
+ def update_dynamic_files():
59
+ """ This will only update metadata for models already linked in the repo, not add missing ones.
60
+ """
61
+ snapshot_download(
62
+ repo_id=DYNAMIC_INFO_REPO, local_dir=DYNAMIC_INFO_PATH, repo_type="dataset", tqdm_class=None, etag_timeout=30
63
+ )
64
+
65
+ print("UPDATE_DYNAMIC: Loaded snapshot")
66
+ # Get models
67
+ start = time.time()
68
+
69
+ models = list(API.list_models(
70
+ #filter=ModelFilter(task="text-generation"),
71
+ task="text-generation",
72
+ full=False,
73
+ cardData=True,
74
+ fetch_config=True,
75
+ ))
76
+ id_to_model = {model.id : model for model in models}
77
+
78
+ print(f"UPDATE_DYNAMIC: Downloaded list of models in {time.time() - start:.2f} seconds")
79
+
80
+ start = time.time()
81
+
82
+ update_models(DYNAMIC_INFO_FILE_PATH, id_to_model)
83
+
84
+ print(f"UPDATE_DYNAMIC: updated in {time.time() - start:.2f} seconds")
85
+
86
+ API.upload_file(
87
+ path_or_fileobj=DYNAMIC_INFO_FILE_PATH,
88
+ path_in_repo=DYNAMIC_INFO_FILE_PATH.split("/")[-1],
89
+ repo_id=DYNAMIC_INFO_REPO,
90
+ repo_type="dataset",
91
+ commit_message=f"Daily request file update.",
92
+ )
93
+ print(f"UPDATE_DYNAMIC: pushed to hub")
94
+
src/tools/collections.py ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+
3
+ import pandas as pd
4
+ from huggingface_hub import add_collection_item, delete_collection_item, get_collection, update_collection_item
5
+ from huggingface_hub.utils._errors import HfHubHTTPError
6
+ from pandas import DataFrame
7
+
8
+ from src.display.utils import AutoEvalColumn, ModelType
9
+ from src.envs import TOKEN, PATH_TO_COLLECTION
10
+
11
+ # Specific intervals for the collections
12
+ intervals = {
13
+ "1B": pd.Interval(0, 1.5, closed="right"),
14
+ "3B": pd.Interval(2.5, 3.5, closed="neither"),
15
+ "7B": pd.Interval(6, 8, closed="neither"),
16
+ "13B": pd.Interval(10, 14, closed="neither"),
17
+ "30B": pd.Interval(25, 35, closed="neither"),
18
+ "65B": pd.Interval(60, 70, closed="neither"),
19
+ }
20
+
21
+
22
+ def update_collections(df: DataFrame):
23
+ """This function updates the Open LLM Leaderboard model collection with the latest best models for
24
+ each size category and type.
25
+ """
26
+ collection = get_collection(collection_slug=PATH_TO_COLLECTION, token=TOKEN)
27
+ params_column = pd.to_numeric(df[AutoEvalColumn.params.name], errors="coerce")
28
+
29
+ cur_best_models = []
30
+
31
+ ix = 0
32
+ for type in ModelType:
33
+ if type.value.name == "":
34
+ continue
35
+ for size in intervals:
36
+ # We filter the df to gather the relevant models
37
+ type_emoji = [t[0] for t in type.value.symbol]
38
+ filtered_df = df[df[AutoEvalColumn.model_type_symbol.name].isin(type_emoji)]
39
+
40
+ numeric_interval = pd.IntervalIndex([intervals[size]])
41
+ mask = params_column.apply(lambda x: any(numeric_interval.contains(x)))
42
+ filtered_df = filtered_df.loc[mask]
43
+
44
+ best_models = list(
45
+ filtered_df.sort_values(AutoEvalColumn.average.name, ascending=False)[AutoEvalColumn.dummy.name]
46
+ )
47
+ print(type.value.symbol, size, best_models[:10])
48
+
49
+ # We add them one by one to the leaderboard
50
+ for model in best_models:
51
+ ix += 1
52
+ cur_len_collection = len(collection.items)
53
+ try:
54
+ collection = add_collection_item(
55
+ PATH_TO_COLLECTION,
56
+ item_id=model,
57
+ item_type="model",
58
+ exists_ok=True,
59
+ note=f"Best {type.to_str(' ')} model of around {size} on the leaderboard today!",
60
+ token=TOKEN,
61
+ )
62
+ if (
63
+ len(collection.items) > cur_len_collection
64
+ ): # we added an item - we make sure its position is correct
65
+ item_object_id = collection.items[-1].item_object_id
66
+ update_collection_item(
67
+ collection_slug=PATH_TO_COLLECTION, item_object_id=item_object_id, position=ix
68
+ )
69
+ cur_len_collection = len(collection.items)
70
+ cur_best_models.append(model)
71
+ break
72
+ except HfHubHTTPError:
73
+ continue
74
+
75
+ collection = get_collection(PATH_TO_COLLECTION, token=TOKEN)
76
+ for item in collection.items:
77
+ if item.item_id not in cur_best_models:
78
+ try:
79
+ delete_collection_item(
80
+ collection_slug=PATH_TO_COLLECTION, item_object_id=item.item_object_id, token=TOKEN
81
+ )
82
+ except HfHubHTTPError:
83
+ continue
src/tools/model_backlinks.py ADDED
@@ -0,0 +1,1309 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ models = [
2
+ "uni-tianyan/Uni-TianYan",
3
+ "fangloveskari/ORCA_LLaMA_70B_QLoRA",
4
+ "garage-bAInd/Platypus2-70B-instruct",
5
+ "upstage/Llama-2-70b-instruct-v2",
6
+ "fangloveskari/Platypus_QLoRA_LLaMA_70b",
7
+ "yeontaek/llama-2-70B-ensemble-v5",
8
+ "TheBloke/Genz-70b-GPTQ",
9
+ "TheBloke/Platypus2-70B-Instruct-GPTQ",
10
+ "psmathur/model_007",
11
+ "yeontaek/llama-2-70B-ensemble-v4",
12
+ "psmathur/orca_mini_v3_70b",
13
+ "ehartford/Samantha-1.11-70b",
14
+ "MayaPH/GodziLLa2-70B",
15
+ "psmathur/model_007_v2",
16
+ "chargoddard/MelangeA-70b",
17
+ "ehartford/Samantha-1.1-70b",
18
+ "psmathur/model_009",
19
+ "upstage/Llama-2-70b-instruct",
20
+ "yeontaek/llama-2-70B-ensemble-v7",
21
+ "yeontaek/llama-2-70B-ensemble-v6",
22
+ "chargoddard/MelangeB-70b",
23
+ "yeontaek/llama-2-70B-ensemble-v3",
24
+ "chargoddard/MelangeC-70b",
25
+ "garage-bAInd/Camel-Platypus2-70B",
26
+ "yeontaek/llama-2-70B-ensemble-v2",
27
+ "garage-bAInd/Camel-Platypus2-70B",
28
+ "migtissera/Synthia-70B-v1.2",
29
+ "v2ray/LLaMA-2-Wizard-70B-QLoRA",
30
+ "quantumaikr/llama-2-70b-fb16-orca-chat-10k",
31
+ "v2ray/LLaMA-2-Wizard-70B-QLoRA",
32
+ "stabilityai/StableBeluga2",
33
+ "quantumaikr/llama-2-70b-fb16-guanaco-1k",
34
+ "garage-bAInd/Camel-Platypus2-70B",
35
+ "migtissera/Synthia-70B-v1.1",
36
+ "migtissera/Synthia-70B",
37
+ "psmathur/model_101",
38
+ "augtoma/qCammel70",
39
+ "augtoma/qCammel-70",
40
+ "augtoma/qCammel-70v1",
41
+ "augtoma/qCammel-70x",
42
+ "augtoma/qCammel-70-x",
43
+ "jondurbin/airoboros-l2-70b-gpt4-1.4.1",
44
+ "dfurman/llama-2-70b-dolphin-peft",
45
+ "jondurbin/airoboros-l2-70b-2.1",
46
+ "TheBloke/llama-2-70b-Guanaco-QLoRA-fp16",
47
+ "quantumaikr/QuantumLM-llama2-70B-Korean-LoRA",
48
+ "quantumaikr/quantumairk-llama-2-70B-instruct",
49
+ "psmathur/model_420",
50
+ "psmathur/model_51",
51
+ "garage-bAInd/Camel-Platypus2-70B",
52
+ "TheBloke/Airoboros-L2-70B-2.1-GPTQ",
53
+ "OpenAssistant/llama2-70b-oasst-sft-v10",
54
+ "garage-bAInd/Platypus2-70B",
55
+ "liuxiang886/llama2-70B-qlora-gpt4",
56
+ "upstage/llama-65b-instruct",
57
+ "quantumaikr/llama-2-70b-fb16-korean",
58
+ "NousResearch/Nous-Hermes-Llama2-70b",
59
+ "v2ray/LLaMA-2-Jannie-70B-QLoRA",
60
+ "jondurbin/airoboros-l2-70b-gpt4-m2.0",
61
+ "jondurbin/airoboros-l2-70b-gpt4-m2.0",
62
+ "OpenAssistant/llama2-70b-oasst-sft-v10",
63
+ "yeontaek/llama-2-70B-ensemble-v8",
64
+ "jondurbin/airoboros-l2-70b-gpt4-2.0",
65
+ "jarradh/llama2_70b_chat_uncensored",
66
+ "WizardLM/WizardMath-70B-V1.0",
67
+ "jordiclive/Llama-2-70b-oasst-1-200",
68
+ "WizardLM/WizardMath-70B-V1.0",
69
+ "jondurbin/airoboros-l2-70b-gpt4-2.0",
70
+ "OpenLemur/lemur-70b-chat-v1",
71
+ "tiiuae/falcon-180B",
72
+ "tiiuae/falcon-180B",
73
+ "stabilityai/StableBeluga1-Delta",
74
+ "psmathur/model_42_70b",
75
+ "psmathur/test_42_70b",
76
+ "TheBloke/fiction.live-Kimiko-V2-70B-fp16",
77
+ "tiiuae/falcon-180B",
78
+ "WizardLM/WizardMath-70B-V1.0",
79
+ "tiiuae/falcon-180B-chat",
80
+ "jondurbin/airoboros-l2-70b-gpt4-2.0",
81
+ "ehartford/samantha-1.1-llama-33b",
82
+ "ajibawa-2023/scarlett-33b",
83
+ "ddobokki/Llama-2-70b-orca-200k",
84
+ "TheBloke/gpt4-alpaca-lora_mlp-65B-HF",
85
+ "tiiuae/falcon-180B-chat",
86
+ "tiiuae/falcon-180B-chat",
87
+ "tiiuae/falcon-180B",
88
+ "TheBloke/Lemur-70B-Chat-v1-GPTQ",
89
+ "NousResearch/Nous-Puffin-70B",
90
+ "WizardLM/WizardLM-70B-V1.0",
91
+ "WizardLM/WizardMath-70B-V1.0",
92
+ "meta-llama/Llama-2-70b-hf",
93
+ "TheBloke/Llama-2-70B-fp16",
94
+ "Weyaxi/llama-2-alpacagpt4-1000step",
95
+ "WizardLM/WizardLM-70B-V1.0",
96
+ "simsim314/WizardLM-70B-V1.0-HF",
97
+ "simsim314/WizardLM-70B-V1.0-HF",
98
+ "WizardLM/WizardLM-70B-V1.0",
99
+ "openbmb/UltraLM-65b",
100
+ "psmathur/model_420_preview",
101
+ "WizardLM/WizardLM-70B-V1.0",
102
+ "simsim314/WizardLM-70B-V1.0-HF",
103
+ "OpenBuddy/openbuddy-llama2-70b-v10.1-bf16",
104
+ "upstage/llama-30b-instruct-2048",
105
+ "jondurbin/airoboros-65b-gpt4-1.2",
106
+ "TheBloke/guanaco-65B-HF",
107
+ "jondurbin/airoboros-65b-gpt4-1.3",
108
+ "meta-llama/Llama-2-70b-chat-hf",
109
+ "ValiantLabs/ShiningValiant",
110
+ "Faradaylab/Aria-70B",
111
+ "lilloukas/GPlatty-30B",
112
+ "TheBloke/VicUnlocked-alpaca-65B-QLoRA-fp16",
113
+ "jondurbin/airoboros-65b-gpt4-1.4-peft",
114
+ "jondurbin/airoboros-65b-gpt4-1.4",
115
+ "jondurbin/airoboros-65b-gpt4-2.0",
116
+ "TheBloke/WizardLM-70B-V1.0-GPTQ",
117
+ "TheBloke/WizardLM-70B-V1.0-GPTQ",
118
+ "ariellee/SuperPlatty-30B",
119
+ "jondurbin/airoboros-65b-gpt4-1.4",
120
+ "jondurbin/airoboros-65b-gpt4-2.0",
121
+ "yeontaek/llama-2-70b-IA3-guanaco",
122
+ "CalderaAI/30B-Lazarus",
123
+ "Aspik101/trurl-2-13b-pl-instruct_unload",
124
+ "ehartford/WizardLM-33B-V1.0-Uncensored",
125
+ "ehartford/WizardLM-33B-V1.0-Uncensored",
126
+ "OpenBuddy/openbuddy-llama-65b-v8-bf16",
127
+ "Aspik101/llama-30b-instruct-2048-PL-lora",
128
+ "h2oai/h2ogpt-research-oasst1-llama-65b",
129
+ "Aspik101/llama-30b-instruct-2048-PL-lora",
130
+ "CalderaAI/30B-Epsilon",
131
+ "Aspik101/llama-30b-2048-instruct-PL-lora_unload",
132
+ "jondurbin/airoboros-65b-gpt4-m2.0",
133
+ "jondurbin/airoboros-65b-gpt4-m2.0",
134
+ "Aeala/Alpaca-elina-65b",
135
+ "TheBloke/robin-65b-v2-fp16",
136
+ "TheBloke/gpt4-alpaca-lora-30b-HF",
137
+ "TheBloke/Llama-2-70B-chat-GPTQ",
138
+ "upstage/llama-30b-instruct",
139
+ "OpenLemur/lemur-70b-v1",
140
+ "lmsys/vicuna-33b-v1.3",
141
+ "ausboss/llama-30b-supercot",
142
+ "ai-business/Luban-13B",
143
+ "Henk717/airochronos-33B",
144
+ "lmsys/vicuna-33b-v1.3",
145
+ "Henk717/airochronos-33B",
146
+ "bavest/fin-llama-33b-merged",
147
+ "jondurbin/airoboros-33b-gpt4-1.4",
148
+ "YeungNLP/firefly-llama-30b",
149
+ "Aspik101/30B-Lazarus-instruct-PL-lora_unload",
150
+ "uukuguy/speechless-llama2-luban-orca-platypus-13b",
151
+ "xxyyy123/test_merge_p_ov1_w0.66_w0.5_n1",
152
+ "jondurbin/airoboros-33b-gpt4-1.2",
153
+ "TheBloke/alpaca-lora-65B-HF",
154
+ "bofenghuang/vigogne-33b-instruct",
155
+ "yeontaek/llama-2-13B-ensemble-v5",
156
+ "garage-bAInd/Platypus-30B",
157
+ "Open-Orca/OpenOrca-Platypus2-13B",
158
+ "kajdun/viwaai-30b_v4",
159
+ "lilloukas/Platypus-30B",
160
+ "Open-Orca/OpenOrca-Platypus2-13B",
161
+ "Henk717/chronoboros-33B",
162
+ "jondurbin/airoboros-33b-2.1",
163
+ "HiTZ/alpaca-lora-65b-en-pt-es-ca",
164
+ "quantumaikr/QuantumLM-70B-hf",
165
+ "uukuguy/speechless-llama2-13b",
166
+ "uukuguy/speechless-llama2-hermes-orca-platypus-13b",
167
+ "openaccess-ai-collective/manticore-30b-chat-pyg-alpha",
168
+ "LLMs/WizardLM-30B-V1.0",
169
+ "TheBloke/WizardLM-30B-fp16",
170
+ "openaccess-ai-collective/hippogriff-30b-chat",
171
+ "concedo/Vicuzard-30B-Uncensored",
172
+ "TFLai/OpenOrca-Platypus2-13B-QLoRA-0.80-epoch",
173
+ "huggingface/llama-65b",
174
+ "huggyllama/llama-65b",
175
+ "gaodrew/gaodrew-llama-30b-instruct-2048-Open-Platypus-100steps",
176
+ "uukuguy/speechless-llama2-hermes-orca-platypus-wizardlm-13b",
177
+ "Sao10K/Mythical-Destroyer-V2-L2-13B",
178
+ "camel-ai/CAMEL-33B-Combined-Data",
179
+ "dsvv-cair/alpaca-cleaned-llama-30b-bf16",
180
+ "MetaIX/GPT4-X-Alpasta-30b",
181
+ "garage-bAInd/Stable-Platypus2-13B",
182
+ "TFLai/Luban-Platypus2-13B-QLora-0.80-epoch",
183
+ "TheBloke/OpenOrca-Platypus2-13B-GPTQ",
184
+ "IkariDev/Athena-tmp",
185
+ "OpenBuddyEA/openbuddy-llama-30b-v7.1-bf16",
186
+ "OpenBuddyEA/openbuddy-llama-30b-v7.1-bf16",
187
+ "Open-Orca/OpenOrcaxOpenChat-Preview2-13B",
188
+ "psmathur/model_007_13b_v2",
189
+ "Aspik101/Vicuzard-30B-Uncensored-instruct-PL-lora_unload",
190
+ "jondurbin/airoboros-33b-gpt4-m2.0",
191
+ "Sao10K/Mythical-Destroyer-L2-13B",
192
+ "TheBloke/Wizard-Vicuna-30B-Uncensored-fp16",
193
+ "ehartford/Wizard-Vicuna-30B-Uncensored",
194
+ "TFLai/Nova-13B",
195
+ "TheBloke/robin-33B-v2-fp16",
196
+ "totally-not-an-llm/PuddleJumper-13b",
197
+ "Aeala/VicUnlocked-alpaca-30b",
198
+ "Yhyu13/oasst-rlhf-2-llama-30b-7k-steps-hf",
199
+ "jondurbin/airoboros-33b-gpt4",
200
+ "jondurbin/airoboros-33b-gpt4-m2.0",
201
+ "tiiuae/falcon-40b-instruct",
202
+ "psmathur/orca_mini_v3_13b",
203
+ "Aeala/GPT4-x-AlpacaDente-30b",
204
+ "MayaPH/GodziLLa-30B",
205
+ "jondurbin/airoboros-33b-gpt4-m2.0",
206
+ "TFLai/SpeechlessV1-Nova-13B",
207
+ "yeontaek/llama-2-13B-ensemble-v4",
208
+ "ajibawa-2023/carl-33b",
209
+ "jondurbin/airoboros-33b-gpt4-2.0",
210
+ "TFLai/Stable-Platypus2-13B-QLoRA-0.80-epoch",
211
+ "jondurbin/airoboros-33b-gpt4-1.3",
212
+ "TehVenom/oasst-sft-6-llama-33b-xor-MERGED-16bit",
213
+ "TFLai/OrcaMini-Platypus2-13B-QLoRA-0.80-epoch",
214
+ "jondurbin/airoboros-33b-gpt4-2.0",
215
+ "chargoddard/Chronorctypus-Limarobormes-13b",
216
+ "jondurbin/airoboros-33b-gpt4-1.3",
217
+ "Open-Orca/OpenOrca-Platypus2-13B",
218
+ "FelixChao/vicuna-33b-coder",
219
+ "FelixChao/vicuna-33b-coder",
220
+ "Gryphe/MythoMix-L2-13b",
221
+ "Aeala/Enterredaas-33b",
222
+ "yeontaek/llama-2-13B-ensemble-v1",
223
+ "TFLai/OpenOrcaPlatypus2-Platypus2-13B-QLora-0.80-epoch",
224
+ "TFLai/Ensemble5-Platypus2-13B-QLora-0.80-epoch",
225
+ "yeontaek/llama-2-13B-ensemble-v3",
226
+ "TFLai/MythoMix-Platypus2-13B-QLoRA-0.80-epoch",
227
+ "yihan6324/llama2-13b-instructmining-40k-sharegpt",
228
+ "timdettmers/guanaco-33b-merged",
229
+ "TFLai/EnsembleV5-Nova-13B",
230
+ "circulus/Llama-2-13b-orca-v1",
231
+ "Undi95/ReMM-SLERP-L2-13B",
232
+ "Gryphe/MythoMax-L2-13b",
233
+ "stabilityai/StableBeluga-13B",
234
+ "circulus/Llama-2-13b-orca-v1",
235
+ "ehartford/WizardLM-30B-Uncensored",
236
+ "The-Face-Of-Goonery/huginnv1.2",
237
+ "TheBloke/OpenOrcaxOpenChat-Preview2-13B-GPTQ",
238
+ "Sao10K/Stheno-L2-13B",
239
+ "bofenghuang/vigogne-2-13b-instruct",
240
+ "The-Face-Of-Goonery/Huginn-13b-FP16",
241
+ "grimpep/L2-MythoMax22b-instruct-Falseblock",
242
+ "TFLai/Nous-Hermes-Platypus2-13B-QLoRA-0.80-epoch",
243
+ "yeontaek/Platypus2xOpenOrca-13B-IA3-v4",
244
+ "yeontaek/Platypus2xOpenOrca-13B-IA3",
245
+ "yeontaek/Platypus2xOpenOrca-13B-IA3-ensemble",
246
+ "Open-Orca/LlongOrca-13B-16k",
247
+ "Sao10K/Stheno-Inverted-L2-13B",
248
+ "garage-bAInd/Camel-Platypus2-13B",
249
+ "digitous/Alpacino30b",
250
+ "NousResearch/Nous-Hermes-Llama2-13b",
251
+ "yeontaek/Platypus2xOpenOrca-13B-IA3-v3",
252
+ "TFLai/MythicalDestroyerV2-Platypus2-13B-QLora-0.80-epoch",
253
+ "TheBloke/VicUnlocked-30B-LoRA-HF",
254
+ "Undi95/Nous-Hermes-13B-Code",
255
+ "The-Face-Of-Goonery/Chronos-Beluga-v2-13bfp16",
256
+ "NousResearch/Nous-Hermes-Llama2-13b",
257
+ "Monero/WizardLM-Uncensored-SuperCOT-StoryTelling-30b",
258
+ "TheBloke/Wizard-Vicuna-30B-Uncensored-GPTQ",
259
+ "Open-Orca/OpenOrcaxOpenChat-Preview2-13B",
260
+ "Austism/chronos-hermes-13b-v2",
261
+ "yeontaek/Platypus2xOpenOrca-13B-IA3-v2.1",
262
+ "yeontaek/Platypus2xOpenOrca-13B-IA3-v2",
263
+ "Gryphe/MythoLogic-L2-13b",
264
+ "augtoma/qCammel-13",
265
+ "YeungNLP/firefly-llama2-13b-v1.2",
266
+ "Aspik101/StableBeluga-13B-instruct-PL-lora_unload",
267
+ "andreaskoepf/llama2-13b-megacode2_min100",
268
+ "rombodawg/LosslessMegaCoder-llama2-13b-mini",
269
+ "yulan-team/YuLan-Chat-2-13b-fp16",
270
+ "elinas/chronos-33b",
271
+ "YeungNLP/firefly-llama2-13b",
272
+ "Sao10K/Medusa-13b",
273
+ "OptimalScale/robin-65b-v2-delta",
274
+ "minlik/chinese-alpaca-33b-merged",
275
+ "OpenAssistant/llama2-13b-megacode2-oasst",
276
+ "TheBloke/OpenAssistant-SFT-7-Llama-30B-HF",
277
+ "Undi95/UndiMix-v1-13b",
278
+ "ehartford/Samantha-1.11-13b",
279
+ "beaugogh/Llama2-13b-sharegpt4",
280
+ "Aeala/GPT4-x-AlpacaDente2-30b",
281
+ "luffycodes/nash-vicuna-13b-v1dot5-ep2-w-rag-w-simple",
282
+ "WizardLM/WizardLM-13B-V1.1",
283
+ "uukuguy/speechless-orca-platypus-coig-lite-2k-0.6e-13b",
284
+ "huggyllama/llama-30b",
285
+ "Undi95/ReMM-L2-13B-PIPPA",
286
+ "Undi95/ReMM-L2-13B",
287
+ "gaodrew/gaodrew-gorgonzola-13b",
288
+ "lmsys/vicuna-13b-v1.5",
289
+ "yeontaek/Platypus2xOpenOrca-13B-LoRa",
290
+ "Yhyu13/llama-30B-hf-openassitant",
291
+ "huggingface/llama-30b",
292
+ "lmsys/vicuna-13b-v1.5",
293
+ "TFLai/Athena-Platypus2-13B-QLora-0.80-epoch",
294
+ "TheBloke/dromedary-65b-lora-HF",
295
+ "yeontaek/llama-2-13b-Beluga-QLoRA",
296
+ "The-Face-Of-Goonery/Huginn-13b-V4",
297
+ "The-Face-Of-Goonery/Huginn-13b-v4.5",
298
+ "The-Face-Of-Goonery/Huginn-v3-13b",
299
+ "tiiuae/falcon-40b",
300
+ "WhoTookMyAmogusNickname/NewHope_HF_not_official",
301
+ "gaodrew/OpenOrca-Platypus2-13B-thera-1250",
302
+ "SLAM-group/NewHope",
303
+ "garage-bAInd/Platypus2-13B",
304
+ "migtissera/Synthia-13B",
305
+ "elinas/chronos-13b-v2",
306
+ "mosaicml/mpt-30b-chat",
307
+ "CHIH-HUNG/llama-2-13b-OpenOrca_5w",
308
+ "uukuguy/speechless-hermes-coig-lite-13b",
309
+ "TheBloke/tulu-30B-fp16",
310
+ "uukuguy/speechless-hermes-coig-lite-13b",
311
+ "xDAN-AI/xDAN_13b_l2_lora",
312
+ "lmsys/vicuna-13b-v1.5-16k",
313
+ "openchat/openchat_v3.1",
314
+ "CHIH-HUNG/llama-2-13b-dolphin_5w",
315
+ "Aspik101/vicuna-13b-v1.5-PL-lora_unload",
316
+ "Undi95/MLewd-L2-13B",
317
+ "ehartford/minotaur-llama2-13b-qlora",
318
+ "kajdun/iubaris-13b-v3",
319
+ "TFLai/Limarp-Platypus2-13B-QLoRA-0.80-epoch",
320
+ "openchat/openchat_v3.1",
321
+ "uukuguy/speechless-orca-platypus-coig-lite-4k-0.6e-13b",
322
+ "ziqingyang/chinese-alpaca-2-13b",
323
+ "TFLai/Airboros2.1-Platypus2-13B-QLora-0.80-epoch",
324
+ "yeontaek/llama-2-13b-Guanaco-QLoRA",
325
+ "lmsys/vicuna-13b-v1.5-16k",
326
+ "ehartford/based-30b",
327
+ "kingbri/airolima-chronos-grad-l2-13B",
328
+ "openchat/openchat_v3.2",
329
+ "uukuguy/speechless-orca-platypus-coig-lite-4k-0.5e-13b",
330
+ "yeontaek/Platypus2-13B-LoRa",
331
+ "kingbri/chronolima-airo-grad-l2-13B",
332
+ "openchat/openchat_v3.2",
333
+ "TFLai/PuddleJumper-Platypus2-13B-QLoRA-0.80-epoch",
334
+ "shareAI/llama2-13b-Chinese-chat",
335
+ "ehartford/WizardLM-1.0-Uncensored-Llama2-13b",
336
+ "Aspik101/Redmond-Puffin-13B-instruct-PL-lora_unload",
337
+ "yeontaek/llama-2-13B-ensemble-v6",
338
+ "WizardLM/WizardLM-13B-V1.2",
339
+ "TheBloke/WizardLM-13B-V1.1-GPTQ",
340
+ "bhenrym14/airophin-13b-pntk-16k-fp16",
341
+ "ehartford/WizardLM-1.0-Uncensored-Llama2-13b",
342
+ "Mikael110/llama-2-13b-guanaco-fp16",
343
+ "yeontaek/airoboros-2.1-llama-2-13B-QLoRa",
344
+ "CalderaAI/13B-Legerdemain-L2",
345
+ "grimpep/llama2-22b-wizard_vicuna",
346
+ "grimpep/llama2-22B-GPLATTY",
347
+ "bhenrym14/airophin-13b-pntk-16k-fp16",
348
+ "yeontaek/llama-2-13b-QLoRA",
349
+ "OpenAssistant/llama2-13b-orca-8k-3319",
350
+ "TheBloke/WizardLM-13B-V1-1-SuperHOT-8K-fp16",
351
+ "duliadotio/dulia-13b-8k-alpha",
352
+ "Undi95/LewdEngine",
353
+ "OpenBuddy/openbuddy-llama2-13b-v8.1-fp16",
354
+ "CHIH-HUNG/llama-2-13b-open_orca_20w",
355
+ "bhenrym14/airoboros-33b-gpt4-1.4.1-lxctx-PI-16384-fp16",
356
+ "FlagAlpha/Llama2-Chinese-13b-Chat",
357
+ "LLMs/WizardLM-13B-V1.0",
358
+ "chansung/gpt4-alpaca-lora-13b-decapoda-1024",
359
+ "TheBloke/wizardLM-13B-1.0-fp16",
360
+ "digitous/13B-Chimera",
361
+ "yeontaek/Platypus2xOpenOrcaxGuanaco-13B-LoRa",
362
+ "jondurbin/airoboros-l2-13b-2.1",
363
+ "Monero/WizardLM-30B-Uncensored-Guanaco-SuperCOT-30b",
364
+ "TheBloke/UltraLM-13B-fp16",
365
+ "openaccess-ai-collective/minotaur-13b-fixed",
366
+ "NousResearch/Redmond-Puffin-13B",
367
+ "KoboldAI/LLaMA2-13B-Holomax",
368
+ "Lajonbot/WizardLM-13B-V1.2-PL-lora_unload",
369
+ "yeontaek/Platypus2-13B-LoRa-v2",
370
+ "TheBloke/airoboros-13B-HF",
371
+ "jondurbin/airoboros-13b",
372
+ "jjaaaww/posi_13b",
373
+ "CoolWP/llama-2-13b-guanaco-fp16",
374
+ "yeontaek/Platypus2-13B-QLoRa",
375
+ "h2oai/h2ogpt-research-oig-oasst1-512-30b",
376
+ "dfurman/llama-2-13b-guanaco-peft",
377
+ "NousResearch/Redmond-Puffin-13B",
378
+ "pe-nlp/llama-2-13b-platypus-vicuna-wizard",
379
+ "CHIH-HUNG/llama-2-13b-dolphin_20w",
380
+ "NousResearch/Nous-Hermes-13b",
381
+ "NobodyExistsOnTheInternet/GiftedConvo13bLoraNoEconsE4",
382
+ "ehartford/Wizard-Vicuna-13B-Uncensored",
383
+ "TheBloke/Wizard-Vicuna-13B-Uncensored-HF",
384
+ "openchat/openchat_v3.2_super",
385
+ "bhenrym14/airophin-v2-13b-PI-8k-fp16",
386
+ "openaccess-ai-collective/manticore-13b",
387
+ "The-Face-Of-Goonery/Huginn-22b-Prototype",
388
+ "jphme/Llama-2-13b-chat-german",
389
+ "grimpep/llama2-28B-Airo03",
390
+ "TheBloke/Kimiko-v2-13B-fp16",
391
+ "FPHam/Free_Sydney_13b_HF",
392
+ "lmsys/vicuna-13b-v1.3",
393
+ "FelixChao/llama2-13b-math1.1",
394
+ "CalderaAI/13B-BlueMethod",
395
+ "meta-llama/Llama-2-13b-chat-hf",
396
+ "deepse/CodeUp-Llama-2-13b-chat-hf",
397
+ "WizardLM/WizardMath-13B-V1.0",
398
+ "WizardLM/WizardMath-13B-V1.0",
399
+ "HyperbeeAI/Tulpar-7b-v0",
400
+ "xxyyy123/test_qkvo_adptor",
401
+ "xxyyy123/mc_data_30k_from_platpus_orca_7b_10k_v1_lora_qkvo_rank14_v2",
402
+ "openchat/openchat_v2_w",
403
+ "FelixChao/llama2-13b-math1.1",
404
+ "psmathur/orca_mini_v3_7b",
405
+ "TehVenom/Metharme-13b-Merged",
406
+ "xxyyy123/10k_v1_lora_qkvo_rank14_v3",
407
+ "OpenAssistant/llama2-13b-orca-v2-8k-3166",
408
+ "openaccess-ai-collective/wizard-mega-13b",
409
+ "jondurbin/airoboros-13b-gpt4-1.4",
410
+ "jondurbin/airoboros-13b-gpt4-1.4-fp16",
411
+ "Monero/Manticore-13b-Chat-Pyg-Guanaco",
412
+ "FelixChao/llama2-13b-math1.2",
413
+ "chargoddard/platypus-2-22b-relora",
414
+ "FelixChao/llama2-13b-math1.2",
415
+ "Gryphe/MythoBoros-13b",
416
+ "CalderaAI/13B-Ouroboros",
417
+ "OpenAssistant/llama2-13b-orca-v2-8k-3166",
418
+ "heegyu/LIMA2-13b-hf",
419
+ "digitous/13B-HyperMantis",
420
+ "Gryphe/MythoLogic-13b",
421
+ "TheBloke/Airoboros-L2-13B-2.1-GPTQ",
422
+ "chargoddard/platypus2-22b-relora",
423
+ "openchat/openchat_v2",
424
+ "yeontaek/Platypus2-13B-IA3",
425
+ "stabilityai/StableBeluga-7B",
426
+ "circulus/Llama-2-7b-orca-v1",
427
+ "budecosystem/genz-13b-v2",
428
+ "TheBloke/gpt4-x-vicuna-13B-HF",
429
+ "NobodyExistsOnTheInternet/GiftedConvo13bLoraNoEcons",
430
+ "zarakiquemparte/zarafusionex-1.1-l2-7b",
431
+ "Lajonbot/tableBeluga-7B-instruct-pl-lora_unload",
432
+ "jondurbin/airoboros-13b-gpt4",
433
+ "gaodrew/gaodrew-gorgonzola-13b",
434
+ "jondurbin/airoboros-13b-gpt4-1.1",
435
+ "TheBloke/gpt4-alpaca-lora-13B-HF",
436
+ "zarakiquemparte/zarablendex-vq-l2-7b",
437
+ "openaccess-ai-collective/manticore-13b-chat-pyg",
438
+ "Lajonbot/Llama-2-13b-hf-instruct-pl-lora_unload",
439
+ "NobodyExistsOnTheInternet/PuffedLIMA13bQLORA",
440
+ "xxyyy123/10k_v1_lora_qkvo_rank28_v2",
441
+ "jondurbin/airoboros-l2-13b-gpt4-1.4.1",
442
+ "dhmeltzer/Llama-2-13b-hf-eli5-wiki-1024_r_64_alpha_16",
443
+ "NobodyExistsOnTheInternet/PuffedConvo13bLoraE4",
444
+ "yihan6324/llama2-7b-instructmining-40k-sharegpt",
445
+ "CHIH-HUNG/llama-2-13b-Open_Platypus_and_ccp_2.6w",
446
+ "Aeala/GPT4-x-Alpasta-13b",
447
+ "psmathur/orca_mini_v2_13b",
448
+ "YeungNLP/firefly-llama-13b",
449
+ "psmathur/orca_mini_v2_13b",
450
+ "zarakiquemparte/zarafusionix-l2-7b",
451
+ "yihan6324/llama2-7b-instructmining-60k-sharegpt",
452
+ "yihan6324/llama-2-7b-instructmining-60k-sharegpt",
453
+ "layoric/llama-2-13b-code-alpaca",
454
+ "bofenghuang/vigogne-13b-instruct",
455
+ "Lajonbot/vicuna-13b-v1.3-PL-lora_unload",
456
+ "lvkaokao/llama2-7b-hf-chat-lora-v3",
457
+ "ehartford/dolphin-llama-13b",
458
+ "YeungNLP/firefly-llama-13b-v1.2",
459
+ "TheBloke/Kimiko-13B-fp16",
460
+ "kevinpro/Vicuna-13B-CoT",
461
+ "eachadea/vicuna-13b-1.1",
462
+ "pillowtalks-ai/delta13b",
463
+ "TheBloke/vicuna-13B-1.1-HF",
464
+ "TheBloke/Vicuna-13B-CoT-fp16",
465
+ "lmsys/vicuna-13b-delta-v1.1",
466
+ "lmsys/vicuna-13b-v1.1",
467
+ "xxyyy123/20k_v1_lora_qkvo_rank14_v2",
468
+ "TheBloke/guanaco-13B-HF",
469
+ "TheBloke/vicuna-13b-v1.3.0-GPTQ",
470
+ "edor/Stable-Platypus2-mini-7B",
471
+ "totally-not-an-llm/EverythingLM-13b-V2-16k",
472
+ "zarakiquemparte/zaraxe-l2-7b",
473
+ "beaugogh/Llama2-7b-openorca-mc-v2",
474
+ "TheBloke/Nous-Hermes-13B-SuperHOT-8K-fp16",
475
+ "quantumaikr/QuantumLM",
476
+ "jondurbin/airoboros-13b-gpt4-1.2",
477
+ "TheBloke/robin-13B-v2-fp16",
478
+ "TFLai/llama-2-13b-4bit-alpaca-gpt4",
479
+ "yihan6324/llama2-7b-instructmining-orca-40k",
480
+ "dvruette/oasst-llama-13b-2-epochs",
481
+ "Open-Orca/LlongOrca-7B-16k",
482
+ "Aspik101/Nous-Hermes-13b-pl-lora_unload",
483
+ "ehartford/Samantha-1.11-CodeLlama-34b",
484
+ "nkpz/llama2-22b-chat-wizard-uncensored",
485
+ "bofenghuang/vigogne-13b-chat",
486
+ "beaugogh/Llama2-7b-openorca-mc-v1",
487
+ "OptimalScale/robin-13b-v2-delta",
488
+ "pe-nlp/llama-2-13b-vicuna-wizard",
489
+ "chargoddard/llama2-22b",
490
+ "gywy/llama2-13b-chinese-v1",
491
+ "frank098/Wizard-Vicuna-13B-juniper",
492
+ "IGeniusDev/llama13B-quant8-testv1-openorca-customdataset",
493
+ "CHIH-HUNG/llama-2-13b-huangyt_Fintune_1_17w-gate_up_down_proj",
494
+ "eachadea/vicuna-13b",
495
+ "yihan6324/llama2-7b-instructmining-orca-90k",
496
+ "chargoddard/llama2-22b-blocktriangular",
497
+ "luffycodes/mcq-vicuna-13b-v1.5",
498
+ "Yhyu13/chimera-inst-chat-13b-hf",
499
+ "luffycodes/mcq-vicuna-13b-v1.5",
500
+ "chargoddard/ypotryll-22b-epoch2-qlora",
501
+ "totally-not-an-llm/EverythingLM-13b-16k",
502
+ "luffycodes/mcq-hal-vicuna-13b-v1.5",
503
+ "openaccess-ai-collective/minotaur-13b",
504
+ "IGeniusDev/llama13B-quant8-testv1-openorca-customdataset",
505
+ "chargoddard/llama2-22b-blocktriangular",
506
+ "TFLai/Platypus2-13B-QLoRA-0.80-epoch",
507
+ "meta-llama/Llama-2-13b-hf",
508
+ "CHIH-HUNG/llama-2-13b-huangyt_FINETUNE2_3w-gate_up_down_proj",
509
+ "luffycodes/mcq-hal-vicuna-13b-v1.5",
510
+ "TheBloke/Llama-2-13B-fp16",
511
+ "TaylorAI/Flash-Llama-13B",
512
+ "shareAI/bimoGPT-llama2-13b",
513
+ "wahaha1987/llama_13b_sharegpt94k_fastchat",
514
+ "openchat/openchat_8192",
515
+ "CHIH-HUNG/llama-2-13b-huangyt_Fintune_1_17w-q_k_v_o_proj",
516
+ "dvruette/llama-13b-pretrained-sft-do2",
517
+ "CHIH-HUNG/llama-2-13b-alpaca-test",
518
+ "OpenBuddy/openbuddy-llama2-13b-v11.1-bf16",
519
+ "CHIH-HUNG/llama-2-13b-FINETUNE2_TEST_2.2w",
520
+ "project-baize/baize-v2-13b",
521
+ "jondurbin/airoboros-l2-13b-gpt4-m2.0",
522
+ "yeontaek/Platypus2xOpenOrca-13B-LoRa-v2",
523
+ "CHIH-HUNG/llama-2-13b-huangyt_FINETUNE2_3w",
524
+ "xzuyn/Alpacino-SuperCOT-13B",
525
+ "jondurbin/airoboros-l2-13b-gpt4-2.0",
526
+ "aiplanet/effi-13b",
527
+ "clibrain/Llama-2-13b-ft-instruct-es",
528
+ "CHIH-HUNG/llama-2-13b-huangyt_Fintune_1_17w",
529
+ "bofenghuang/vigogne-2-7b-instruct",
530
+ "CHIH-HUNG/llama-2-13b-huangyt_FINETUNE2_3w-q_k_v_o_proj",
531
+ "bofenghuang/vigogne-2-7b-chat",
532
+ "aiplanet/effi-13b",
533
+ "haonan-li/bactrian-x-llama-13b-merged",
534
+ "beaugogh/Llama2-7b-sharegpt4",
535
+ "HWERI/Llama2-7b-sharegpt4",
536
+ "jondurbin/airoboros-13b-gpt4-1.3",
537
+ "jondurbin/airoboros-c34b-2.1",
538
+ "junelee/wizard-vicuna-13b",
539
+ "TheBloke/wizard-vicuna-13B-HF",
540
+ "Open-Orca/OpenOrca-Preview1-13B",
541
+ "TheBloke/h2ogpt-oasst1-512-30B-HF",
542
+ "TheBloke/Llama-2-13B-GPTQ",
543
+ "camel-ai/CAMEL-13B-Combined-Data",
544
+ "lmsys/vicuna-7b-v1.5",
545
+ "lmsys/vicuna-7b-v1.5-16k",
546
+ "lmsys/vicuna-7b-v1.5",
547
+ "ausboss/llama-13b-supercot",
548
+ "TheBloke/tulu-13B-fp16",
549
+ "NousResearch/Nous-Hermes-llama-2-7b",
550
+ "jlevin/guanaco-13b-llama-2",
551
+ "lmsys/vicuna-7b-v1.5-16k",
552
+ "dvruette/llama-13b-pretrained",
553
+ "nkpz/llama2-22b-daydreamer-v3",
554
+ "dvruette/llama-13b-pretrained-dropout",
555
+ "jondurbin/airoboros-l2-13b-2.1",
556
+ "LLMs/Stable-Vicuna-13B",
557
+ "64bits/LexPodLM-13B",
558
+ "lizhuang144/llama_mirror_13b_v1.0",
559
+ "TheBloke/stable-vicuna-13B-HF",
560
+ "zarakiquemparte/zaraxls-l2-7b",
561
+ "TheBloke/Llama-2-13B-GPTQ",
562
+ "Kiddyz/testlm-3",
563
+ "migtissera/Synthia-7B",
564
+ "zarakiquemparte/zarablend-l2-7b",
565
+ "mosaicml/mpt-30b-instruct",
566
+ "PocketDoc/Dans-PileOfSets-Mk1-llama-13b-merged",
567
+ "vonjack/Qwen-LLaMAfied-HFTok-7B-Chat",
568
+ "l3utterfly/llama2-7b-layla",
569
+ "Lajonbot/vicuna-7b-v1.5-PL-lora_unload",
570
+ "heegyu/LIMA-13b-hf",
571
+ "frank098/WizardLM_13B_juniper",
572
+ "ashercn97/manatee-7b",
573
+ "chavinlo/gpt4-x-alpaca",
574
+ "PocketDoc/Dans-PersonalityEngine-13b",
575
+ "ehartford/WizardLM-1.0-Uncensored-CodeLlama-34b",
576
+ "digitous/Alpacino13b",
577
+ "edor/Hermes-Platypus2-mini-7B",
578
+ "lvkaokao/llama2-7b-hf-chat-lora-v2",
579
+ "Kiddyz/testlm-1-1",
580
+ "Kiddyz/testlm",
581
+ "Kiddyz/testlm-1",
582
+ "Kiddyz/testlm2",
583
+ "radm/Philosophy-Platypus2-13b",
584
+ "aiplanet/effi-13b",
585
+ "Harshvir/Llama-2-7B-physics",
586
+ "YeungNLP/firefly-ziya-13b",
587
+ "LinkSoul/Chinese-Llama-2-7b",
588
+ "PeanutJar/LLaMa-2-PeanutButter_v10-7B",
589
+ "OpenBuddy/openbuddy-llama2-13b-v11-bf16",
590
+ "StudentLLM/Alpagasus-2-13B-QLoRA-pipeline",
591
+ "meta-llama/Llama-2-13b-hf",
592
+ "WizardLM/WizardCoder-Python-34B-V1.0",
593
+ "dvruette/llama-13b-pretrained-sft-epoch-1",
594
+ "camel-ai/CAMEL-13B-Role-Playing-Data",
595
+ "ziqingyang/chinese-llama-2-13b",
596
+ "rombodawg/LosslessMegaCoder-llama2-7b-mini",
597
+ "TheBloke/koala-13B-HF",
598
+ "lmsys/vicuna-7b-delta-v1.1",
599
+ "eachadea/vicuna-7b-1.1",
600
+ "Ejafa/vicuna_7B_vanilla_1.1",
601
+ "lvkaokao/llama2-7b-hf-chat-lora",
602
+ "OpenBuddy/openbuddy-atom-13b-v9-bf16",
603
+ "Norquinal/llama-2-7b-claude-chat-rp",
604
+ "Danielbrdz/Barcenas-7b",
605
+ "heegyu/WizardVicuna2-13b-hf",
606
+ "meta-llama/Llama-2-7b-chat-hf",
607
+ "PeanutJar/LLaMa-2-PeanutButter_v14-7B",
608
+ "PeanutJar/LLaMa-2-PeanutButter_v4-7B",
609
+ "davzoku/cria-llama2-7b-v1.3",
610
+ "OpenBuddy/openbuddy-atom-13b-v9-bf16",
611
+ "lvkaokao/llama2-7b-hf-instruction-lora",
612
+ "Tap-M/Luna-AI-Llama2-Uncensored",
613
+ "ehartford/Samantha-1.11-7b",
614
+ "WizardLM/WizardCoder-Python-34B-V1.0",
615
+ "TheBloke/Manticore-13B-Chat-Pyg-Guanaco-SuperHOT-8K-GPTQ",
616
+ "Mikael110/llama-2-7b-guanaco-fp16",
617
+ "garage-bAInd/Platypus2-7B",
618
+ "PeanutJar/LLaMa-2-PeanutButter_v18_B-7B",
619
+ "mosaicml/mpt-30b",
620
+ "garage-bAInd/Platypus2-7B",
621
+ "huggingface/llama-13b",
622
+ "dvruette/oasst-llama-13b-1000-steps",
623
+ "jordiclive/gpt4all-alpaca-oa-codealpaca-lora-13b",
624
+ "huggyllama/llama-13b",
625
+ "Voicelab/trurl-2-7b",
626
+ "TFLai/llama-13b-4bit-alpaca",
627
+ "gywy/llama2-13b-chinese-v2",
628
+ "lmsys/longchat-13b-16k",
629
+ "Aspik101/trurl-2-7b-pl-instruct_unload",
630
+ "WizardLM/WizardMath-7B-V1.0",
631
+ "Norquinal/llama-2-7b-claude-chat",
632
+ "TheTravellingEngineer/llama2-7b-chat-hf-dpo",
633
+ "HuggingFaceH4/starchat-beta",
634
+ "joehuangx/spatial-vicuna-7b-v1.5-LoRA",
635
+ "conceptofmind/LLongMA-2-13b-16k",
636
+ "tianyil1/denas-llama2",
637
+ "lmsys/vicuna-7b-v1.3",
638
+ "conceptofmind/LLongMA-2-13b-16k",
639
+ "openchat/opencoderplus",
640
+ "ajibawa-2023/scarlett-7b",
641
+ "dhmeltzer/llama-7b-SFT_eli5_wiki65k_1024_r_64_alpha_16_merged",
642
+ "psyche/kollama2-7b-v2",
643
+ "heegyu/LIMA2-7b-hf",
644
+ "dhmeltzer/llama-7b-SFT-qlora-eli5-wiki_DPO_ds_RM_top_2_1024_r_64_alpha_16",
645
+ "abhishek/llama2guanacotest",
646
+ "jondurbin/airoboros-l2-7b-2.1",
647
+ "llama-anon/instruct-13b",
648
+ "FelixChao/vicuna-7B-physics",
649
+ "Aspik101/Llama-2-7b-hf-instruct-pl-lora_unload",
650
+ "shibing624/chinese-alpaca-plus-13b-hf",
651
+ "davzoku/cria-llama2-7b-v1.3_peft",
652
+ "quantumaikr/llama-2-7b-hf-guanaco-1k",
653
+ "togethercomputer/Llama-2-7B-32K-Instruct",
654
+ "sia-ai/llama-2-7b-1-percent-open-orca-1000-steps-v0",
655
+ "TheTravellingEngineer/llama2-7b-hf-guanaco",
656
+ "Lajonbot/Llama-2-7b-chat-hf-instruct-pl-lora_unload",
657
+ "jondurbin/airoboros-l2-7b-gpt4-1.4.1",
658
+ "wahaha1987/llama_7b_sharegpt94k_fastchat",
659
+ "FelixChao/vicuna-7B-chemical",
660
+ "TinyPixel/llama2-7b-oa",
661
+ "chaoyi-wu/MedLLaMA_13B",
662
+ "edor/Platypus2-mini-7B",
663
+ "RoversX/llama-2-7b-hf-small-shards-Samantha-V1-SFT",
664
+ "venkycs/llama-v2-7b-32kC-Security",
665
+ "psyche/kollama2-7b",
666
+ "Fredithefish/Guanaco-7B-Uncensored",
667
+ "TheTravellingEngineer/llama2-7b-chat-hf-guanaco",
668
+ "ehartford/WizardLM-13B-Uncensored",
669
+ "PocketDoc/Dans-CreepingSenseOfDoom",
670
+ "wenge-research/yayi-7b-llama2",
671
+ "georgesung/llama2_7b_chat_uncensored",
672
+ "TinyPixel/llama2-7b-instruct",
673
+ "quantumaikr/QuantumLM-7B",
674
+ "xzuyn/MedicWizard-7B",
675
+ "wenge-research/yayi-7b-llama2",
676
+ "TinyPixel/lima-test",
677
+ "elyza/ELYZA-japanese-Llama-2-7b-instruct",
678
+ "lgaalves/llama-2-7b-hf_open-platypus",
679
+ "ziqingyang/chinese-alpaca-2-7b",
680
+ "TehVenom/Pygmalion-Vicuna-1.1-7b",
681
+ "meta-llama/Llama-2-7b-hf",
682
+ "bongchoi/test-llama2-7b",
683
+ "TaylorAI/Flash-Llama-7B",
684
+ "TheTravellingEngineer/llama2-7b-chat-hf-v2",
685
+ "TheTravellingEngineer/llama2-7b-chat-hf-v4",
686
+ "kashif/stack-llama-2",
687
+ "PeanutJar/LLaMa-2-PeanutButter_v18_A-7B",
688
+ "ToolBench/ToolLLaMA-7b-LoRA",
689
+ "Monero/WizardLM-13b-OpenAssistant-Uncensored",
690
+ "TheTravellingEngineer/llama2-7b-chat-hf-v2",
691
+ "TheTravellingEngineer/llama2-7b-chat-hf-v4",
692
+ "mrm8488/llama-2-coder-7b",
693
+ "elyza/ELYZA-japanese-Llama-2-7b-fast-instruct",
694
+ "clibrain/Llama-2-7b-ft-instruct-es",
695
+ "medalpaca/medalpaca-7b",
696
+ "TheBloke/tulu-7B-fp16",
697
+ "OpenBuddy/openbuddy-openllama-13b-v7-fp16",
698
+ "TaylorAI/FLAN-Llama-7B-2_Llama2-7B-Flash_868_full_model",
699
+ "Aspik101/vicuna-7b-v1.3-instruct-pl-lora_unload",
700
+ "jondurbin/airoboros-l2-7b-gpt4-2.0",
701
+ "dhmeltzer/llama-7b-SFT_ds_eli5_1024_r_64_alpha_16_merged",
702
+ "GOAT-AI/GOAT-7B-Community",
703
+ "AtomEchoAI/AtomGPT_56k",
704
+ "julianweng/Llama-2-7b-chat-orcah",
705
+ "TehVenom/Pygmalion-13b-Merged",
706
+ "jondurbin/airoboros-7b-gpt4-1.1",
707
+ "dhmeltzer/llama-7b-SFT_ds_wiki65k_1024_r_64_alpha_16_merged",
708
+ "bofenghuang/vigogne-7b-chat",
709
+ "lmsys/longchat-7b-v1.5-32k",
710
+ "jondurbin/airoboros-l2-7b-gpt4-m2.0",
711
+ "synapsoft/Llama-2-7b-chat-hf-flan2022-1.2M",
712
+ "jondurbin/airoboros-7b-gpt4-1.4",
713
+ "Charlie911/vicuna-7b-v1.5-lora-mctaco",
714
+ "yihan6324/instructmining-platypus-15k",
715
+ "meta-llama/Llama-2-7b-hf",
716
+ "TheTravellingEngineer/llama2-7b-chat-hf-v3",
717
+ "quantumaikr/KoreanLM-hf",
718
+ "openthaigpt/openthaigpt-1.0.0-alpha-7b-chat-ckpt-hf",
719
+ "TheBloke/Llama-2-7B-GPTQ",
720
+ "TheBloke/Llama-2-7B-GPTQ",
721
+ "LLMs/AlpacaGPT4-7B-elina",
722
+ "ehartford/Wizard-Vicuna-7B-Uncensored",
723
+ "TheBloke/Wizard-Vicuna-7B-Uncensored-HF",
724
+ "TheTravellingEngineer/llama2-7b-chat-hf-v3",
725
+ "golaxy/gowizardlm",
726
+ "ehartford/dolphin-llama2-7b",
727
+ "CHIH-HUNG/llama-2-7b-dolphin_10w-test",
728
+ "mncai/chatdoctor",
729
+ "psyche/kollama2-7b-v3",
730
+ "jondurbin/airoboros-7b-gpt4",
731
+ "jondurbin/airoboros-7b",
732
+ "TheBloke/airoboros-7b-gpt4-fp16",
733
+ "mosaicml/mpt-7b-8k-chat",
734
+ "elyza/ELYZA-japanese-Llama-2-7b",
735
+ "bofenghuang/vigogne-7b-instruct",
736
+ "jxhong/CAlign-alpaca-7b",
737
+ "golaxy/goims",
738
+ "jondurbin/airoboros-7b-gpt4-1.2",
739
+ "jphme/orca_mini_v2_ger_7b",
740
+ "psmathur/orca_mini_v2_7b",
741
+ "notstoic/PygmalionCoT-7b",
742
+ "golaxy/gogpt2-13b",
743
+ "golaxy/gogpt2-13b-chat",
744
+ "togethercomputer/LLaMA-2-7B-32K",
745
+ "TheBloke/wizardLM-7B-HF",
746
+ "keyfan/vicuna-chinese-replication-v1.1",
747
+ "golaxy/gogpt2-7b",
748
+ "aiplanet/effi-7b",
749
+ "arver/llama7b-qlora",
750
+ "titan087/OpenLlama13B-Guanaco",
751
+ "chavinlo/alpaca-native",
752
+ "project-baize/baize-healthcare-lora-7B",
753
+ "AlpinDale/pygmalion-instruct",
754
+ "openlm-research/open_llama_13b",
755
+ "jondurbin/airoboros-7b-gpt4-1.3",
756
+ "elyza/ELYZA-japanese-Llama-2-7b-fast",
757
+ "jondurbin/airoboros-gpt-3.5-turbo-100k-7b",
758
+ "uukuguy/speechless-codellama-orca-13b",
759
+ "bigcode/starcoderplus",
760
+ "TheBloke/guanaco-7B-HF",
761
+ "Neko-Institute-of-Science/metharme-7b",
762
+ "TigerResearch/tigerbot-7b-base",
763
+ "golaxy/gogpt-7b",
764
+ "togethercomputer/LLaMA-2-7B-32K",
765
+ "yhyhy3/open_llama_7b_v2_med_instruct",
766
+ "ajibawa-2023/carl-7b",
767
+ "stabilityai/stablelm-base-alpha-7b-v2",
768
+ "conceptofmind/LLongMA-2-7b-16k",
769
+ "TehVenom/Pygmalion_AlpacaLora-7b",
770
+ "jondurbin/airoboros-7b-gpt4-1.4.1-qlora",
771
+ "wannaphong/openthaigpt-0.1.0-beta-full-model_for_open_llm_leaderboard",
772
+ "ausboss/llama7b-wizardlm-unfiltered",
773
+ "project-baize/baize-v2-7b",
774
+ "LMFlow/Robin-v2",
775
+ "HanningZhang/Robin-v2",
776
+ "LMFlow/Robin-7b-v2",
777
+ "OptimalScale/robin-7b-v2-delta",
778
+ "uukuguy/speechless-codellama-platypus-13b",
779
+ "jerryjalapeno/nart-100k-7b",
780
+ "wenge-research/yayi-13b-llama2",
781
+ "fireballoon/baichuan-vicuna-chinese-7b",
782
+ "jlevin/guanaco-unchained-llama-2-7b",
783
+ "csitfun/llama-7b-logicot",
784
+ "DevaMalla/llama7b_alpaca_1gpu_bf16",
785
+ "WeOpenML/PandaLM-Alpaca-7B-v1",
786
+ "illuin/test-custom-llama",
787
+ "yeontaek/WizardCoder-Python-13B-LoRa",
788
+ "ashercn97/giraffe-7b",
789
+ "mosaicml/mpt-7b-chat",
790
+ "abhishek/autotrain-llama-alpaca-peft-52508123785",
791
+ "Neko-Institute-of-Science/pygmalion-7b",
792
+ "TFLai/llama-7b-4bit-alpaca",
793
+ "huggingface/llama-7b",
794
+ "TheBloke/Planner-7B-fp16",
795
+ "shibing624/chinese-llama-plus-13b-hf",
796
+ "AGI-inc/lora_moe_7b_baseline",
797
+ "DevaMalla/llama-base-7b",
798
+ "AGI-inc/lora_moe_7b",
799
+ "togethercomputer/GPT-JT-6B-v0",
800
+ "ehartford/WizardLM-7B-Uncensored",
801
+ "shibing624/chinese-alpaca-plus-7b-hf",
802
+ "beomi/llama-2-ko-7b",
803
+ "mosaicml/mpt-7b-8k-instruct",
804
+ "Enno-Ai/ennodata-7b",
805
+ "mosaicml/mpt-7b-instruct",
806
+ "facebook/opt-iml-max-30b",
807
+ "WeOpenML/Alpaca-7B-v1",
808
+ "TheBloke/Project-Baize-v2-7B-GPTQ",
809
+ "codellama/CodeLlama-13b-Instruct-hf",
810
+ "TheBloke/CodeLlama-13B-Instruct-fp16",
811
+ "facebook/galactica-30b",
812
+ "FreedomIntelligence/phoenix-inst-chat-7b",
813
+ "openlm-research/open_llama_7b_v2",
814
+ "GeorgiaTechResearchInstitute/galpaca-30b",
815
+ "THUDM/chatglm2-6b",
816
+ "togethercomputer/GPT-JT-6B-v1",
817
+ "TheBloke/koala-7B-HF",
818
+ "nathan0/mpt_delta_tuned_model_v3",
819
+ "nathan0/mpt_delta_tuned_model_v2",
820
+ "GeorgiaTechResearchInstitute/galpaca-30b",
821
+ "JosephusCheung/Guanaco",
822
+ "shareAI/CodeLLaMA-chat-13b-Chinese",
823
+ "TigerResearch/tigerbot-7b-sft",
824
+ "Writer/InstructPalmyra-20b",
825
+ "OpenAssistant/codellama-13b-oasst-sft-v10",
826
+ "bigscience/bloomz-7b1-mt",
827
+ "nathan0/mpt_delta_tuned_model_v3",
828
+ "VMware/open-llama-7b-open-instruct",
829
+ "baichuan-inc/Baichuan-7B",
830
+ "anas-awadalla/mpt-7b",
831
+ "mosaicml/mpt-7b",
832
+ "bigscience/bloomz-7b1",
833
+ "ziqingyang/chinese-llama-2-7b",
834
+ "OpenAssistant/codellama-13b-oasst-sft-v10",
835
+ "wenge-research/yayi-7b",
836
+ "tiiuae/falcon-7b",
837
+ "togethercomputer/RedPajama-INCITE-Instruct-7B-v0.1",
838
+ "togethercomputer/RedPajama-INCITE-7B-Instruct",
839
+ "TheBloke/landmark-attention-llama7b-fp16",
840
+ "togethercomputer/GPT-JT-Moderation-6B",
841
+ "h2oai/h2ogpt-gm-oasst1-en-1024-20b",
842
+ "dvruette/gpt-neox-20b-full-precision",
843
+ "TehVenom/Moderator-Chan_GPT-JT-6b",
844
+ "dvruette/oasst-gpt-neox-20b-1000-steps",
845
+ "AlekseyKorshuk/pygmalion-6b-vicuna-chatml",
846
+ "facebook/opt-66b",
847
+ "Salesforce/codegen-16B-nl",
848
+ "Vmware/open-llama-7b-v2-open-instruct",
849
+ "mosaicml/mpt-7b-storywriter",
850
+ "acrastt/Marx-3B-V2",
851
+ "openlm-research/open_llama_7b",
852
+ "Fredithefish/ReasonixPajama-3B-HF",
853
+ "togethercomputer/GPT-NeoXT-Chat-Base-20B",
854
+ "psmathur/orca_mini_13b",
855
+ "RWKV/rwkv-raven-14b",
856
+ "h2oai/h2ogpt-oasst1-512-20b",
857
+ "acrastt/Marx-3B",
858
+ "klosax/open_llama_13b_600bt_preview",
859
+ "synapsoft/Llama-2-7b-hf-flan2022-1.2M",
860
+ "OpenAssistant/oasst-sft-1-pythia-12b",
861
+ "golaxy/gogpt-7b-bloom",
862
+ "Writer/palmyra-large",
863
+ "psmathur/orca_mini_7b",
864
+ "dvruette/oasst-pythia-12b-6000-steps",
865
+ "NousResearch/CodeLlama-13b-hf",
866
+ "codellama/CodeLlama-13b-hf",
867
+ "h2oai/h2ogpt-gm-oasst1-multilang-1024-20b",
868
+ "VMware/open-llama-0.7T-7B-open-instruct-v1.1",
869
+ "dvruette/oasst-pythia-12b-flash-attn-5000-steps",
870
+ "dvruette/oasst-gpt-neox-20b-3000-steps",
871
+ "RobbeD/OpenLlama-Platypus-3B",
872
+ "facebook/opt-30b",
873
+ "acrastt/Puma-3B",
874
+ "OpenAssistant/oasst-sft-4-pythia-12b-epoch-3.5",
875
+ "dvruette/oasst-pythia-12b-pretrained-sft",
876
+ "digitous/GPT-R",
877
+ "acrastt/Griffin-3B",
878
+ "togethercomputer/RedPajama-INCITE-Base-7B-v0.1",
879
+ "togethercomputer/RedPajama-INCITE-7B-Base",
880
+ "CobraMamba/mamba-gpt-3b-v3",
881
+ "Danielbrdz/CodeBarcenas-7b",
882
+ "l3utterfly/open-llama-3b-v2-layla",
883
+ "CobraMamba/mamba-gpt-3b-v2",
884
+ "OpenAssistant/pythia-12b-sft-v8-7k-steps",
885
+ "KoboldAI/GPT-NeoX-20B-Erebus",
886
+ "RobbeD/Orca-Platypus-3B",
887
+ "h2oai/h2ogpt-gm-oasst1-en-1024-12b",
888
+ "OpenAssistant/pythia-12b-sft-v8-2.5k-steps",
889
+ "AlekseyKorshuk/chatml-pyg-v1",
890
+ "togethercomputer/RedPajama-INCITE-Chat-7B-v0.1",
891
+ "togethercomputer/RedPajama-INCITE-7B-Chat",
892
+ "digitous/Javelin-R",
893
+ "dvruette/oasst-pythia-12b-reference",
894
+ "EleutherAI/gpt-neox-20b",
895
+ "KoboldAI/fairseq-dense-13B",
896
+ "OpenAssistant/pythia-12b-sft-v8-rlhf-2k-steps",
897
+ "codellama/CodeLlama-7b-Instruct-hf",
898
+ "digitous/Javelin-GPTJ",
899
+ "KoboldAI/GPT-NeoX-20B-Skein",
900
+ "digitous/Javalion-R",
901
+ "h2oai/h2ogpt-oasst1-512-12b",
902
+ "acrastt/Bean-3B",
903
+ "KoboldAI/GPT-J-6B-Skein",
904
+ "nomic-ai/gpt4all-j",
905
+ "databricks/dolly-v2-12b",
906
+ "TehVenom/Dolly_Shygmalion-6b-Dev_V8P2",
907
+ "databricks/dolly-v2-7b",
908
+ "Aspik101/WizardVicuna-Uncensored-3B-instruct-PL-lora_unload",
909
+ "digitous/Adventien-GPTJ",
910
+ "openlm-research/open_llama_3b_v2",
911
+ "RWKV/rwkv-4-14b-pile",
912
+ "Lazycuber/Janemalion-6B",
913
+ "OpenAssistant/pythia-12b-pre-v8-12.5k-steps",
914
+ "digitous/Janin-R",
915
+ "kfkas/Llama-2-ko-7b-Chat",
916
+ "heegyu/WizardVicuna-Uncensored-3B-0719",
917
+ "h2oai/h2ogpt-gm-oasst1-en-1024-open-llama-7b-preview-400bt",
918
+ "TaylorAI/Flash-Llama-3B",
919
+ "kfkas/Llama-2-ko-7b-Chat",
920
+ "digitous/Skegma-GPTJ",
921
+ "digitous/Javalion-GPTJ",
922
+ "Pirr/pythia-13b-deduped-green_devil",
923
+ "TehVenom/PPO_Shygmalion-V8p4_Dev-6b",
924
+ "dvruette/oasst-pythia-6.9b-4000-steps",
925
+ "heegyu/WizardVicuna-3B-0719",
926
+ "psmathur/orca_mini_3b",
927
+ "OpenAssistant/galactica-6.7b-finetuned",
928
+ "frank098/orca_mini_3b_juniper",
929
+ "PygmalionAI/pygmalion-6b",
930
+ "TehVenom/PPO_Pygway-V8p4_Dev-6b",
931
+ "TFLai/gpt-neox-20b-4bit-alpaca",
932
+ "Corianas/gpt-j-6B-Dolly",
933
+ "TehVenom/Dolly_Shygmalion-6b",
934
+ "digitous/Janin-GPTJ",
935
+ "TehVenom/GPT-J-Pyg_PPO-6B-Dev-V8p4",
936
+ "EleutherAI/gpt-j-6b",
937
+ "KoboldAI/GPT-J-6B-Shinen",
938
+ "TehVenom/Dolly_Malion-6b",
939
+ "TehVenom/ChanMalion",
940
+ "Salesforce/codegen-6B-nl",
941
+ "Fredithefish/RedPajama-INCITE-Chat-3B-Instruction-Tuning-with-GPT-4",
942
+ "KoboldAI/GPT-J-6B-Janeway",
943
+ "togethercomputer/RedPajama-INCITE-Chat-3B-v1",
944
+ "togethercomputer/Pythia-Chat-Base-7B",
945
+ "heegyu/RedTulu-Uncensored-3B-0719",
946
+ "KoboldAI/PPO_Pygway-6b-Mix",
947
+ "KoboldAI/OPT-13B-Erebus",
948
+ "KoboldAI/fairseq-dense-6.7B",
949
+ "EleutherAI/pythia-12b-deduped",
950
+ "pszemraj/pythia-6.9b-HC3",
951
+ "Fredithefish/Guanaco-3B-Uncensored-v2",
952
+ "facebook/opt-13b",
953
+ "TehVenom/GPT-J-Pyg_PPO-6B",
954
+ "EleutherAI/pythia-6.9b-deduped",
955
+ "Devio/test-1400",
956
+ "Fredithefish/Guanaco-3B-Uncensored",
957
+ "codellama/CodeLlama-7b-hf",
958
+ "acrastt/RedPajama-INCITE-Chat-Instruct-3B-V1",
959
+ "Fredithefish/ScarletPajama-3B-HF",
960
+ "KoboldAI/OPT-13B-Nerybus-Mix",
961
+ "YeungNLP/firefly-bloom-7b1",
962
+ "DanielSc4/RedPajama-INCITE-Chat-3B-v1-RL-LoRA-8bit-test1",
963
+ "klosax/open_llama_7b_400bt_preview",
964
+ "KoboldAI/OPT-13B-Nerys-v2",
965
+ "TehVenom/PPO_Shygmalion-6b",
966
+ "amazon/LightGPT",
967
+ "KnutJaegersberg/black_goo_recipe_c",
968
+ "NousResearch/CodeLlama-7b-hf",
969
+ "togethercomputer/RedPajama-INCITE-Instruct-3B-v1",
970
+ "heegyu/WizardVicuna-open-llama-3b-v2",
971
+ "bigscience/bloom-7b1",
972
+ "Devio/test-22B",
973
+ "RWKV/rwkv-raven-7b",
974
+ "hakurei/instruct-12b",
975
+ "CobraMamba/mamba-gpt-3b",
976
+ "KnutJaegersberg/black_goo_recipe_a",
977
+ "acrastt/OmegLLaMA-3B",
978
+ "codellama/CodeLlama-7b-Instruct-hf",
979
+ "h2oai/h2ogpt-oig-oasst1-512-6_9b",
980
+ "KoboldAI/OPT-6.7B-Erebus",
981
+ "facebook/opt-6.7b",
982
+ "KnutJaegersberg/black_goo_recipe_d",
983
+ "KnutJaegersberg/LLongMA-3b-LIMA",
984
+ "KnutJaegersberg/black_goo_recipe_b",
985
+ "KoboldAI/OPT-6.7B-Nerybus-Mix",
986
+ "health360/Healix-3B",
987
+ "EleutherAI/pythia-12b",
988
+ "Fredithefish/RedPajama-INCITE-Chat-3B-ShareGPT-11K",
989
+ "GeorgiaTechResearchInstitute/galactica-6.7b-evol-instruct-70k",
990
+ "h2oai/h2ogpt-oig-oasst1-256-6_9b",
991
+ "ikala/bloom-zh-3b-chat",
992
+ "Taekyoon/llama2-ko-7b-test",
993
+ "anhnv125/pygmalion-6b-roleplay",
994
+ "TehVenom/DiffMerge_Pygmalion_Main-onto-V8P4",
995
+ "KoboldAI/OPT-6B-nerys-v2",
996
+ "Lazycuber/pyg-instruct-wizardlm",
997
+ "Devio/testC",
998
+ "KoboldAI/OPT-30B-Erebus",
999
+ "Fredithefish/CrimsonPajama",
1000
+ "togethercomputer/RedPajama-INCITE-Base-3B-v1",
1001
+ "bigscience/bloomz-3b",
1002
+ "conceptofmind/Open-LLongMA-3b",
1003
+ "RWKV/rwkv-4-7b-pile",
1004
+ "openlm-research/open_llama_3b",
1005
+ "ewof/koishi-instruct-3b",
1006
+ "DanielSc4/RedPajama-INCITE-Chat-3B-v1-FT-LoRA-8bit-test1",
1007
+ "cerebras/Cerebras-GPT-13B",
1008
+ "EleutherAI/pythia-6.7b",
1009
+ "aisquared/chopt-2_7b",
1010
+ "Azure99/blossom-v1-3b",
1011
+ "PSanni/Deer-3b",
1012
+ "bertin-project/bertin-gpt-j-6B-alpaca",
1013
+ "OpenBuddy/openbuddy-openllama-3b-v10-bf16",
1014
+ "KoboldAI/fairseq-dense-2.7B",
1015
+ "ehartford/CodeLlama-34b-Instruct-hf",
1016
+ "codellama/CodeLlama-34b-Instruct-hf",
1017
+ "TheBloke/CodeLlama-34B-Instruct-fp16",
1018
+ "h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt-v2",
1019
+ "openlm-research/open_llama_7b_700bt_preview",
1020
+ "NbAiLab/nb-gpt-j-6B-alpaca",
1021
+ "KoboldAI/OPT-2.7B-Erebus",
1022
+ "Writer/camel-5b-hf",
1023
+ "EleutherAI/pythia-2.7b",
1024
+ "facebook/xglm-7.5B",
1025
+ "EleutherAI/pythia-2.8b-deduped",
1026
+ "klosax/open_llama_3b_350bt_preview",
1027
+ "klosax/openllama-3b-350bt",
1028
+ "KoboldAI/OPT-2.7B-Nerybus-Mix",
1029
+ "KoboldAI/GPT-J-6B-Adventure",
1030
+ "cerebras/Cerebras-GPT-6.7B",
1031
+ "TFLai/pythia-2.8b-4bit-alpaca",
1032
+ "facebook/opt-2.7b",
1033
+ "KoboldAI/OPT-2.7B-Nerys-v2",
1034
+ "bigscience/bloom-3b",
1035
+ "Devio/test100",
1036
+ "RWKV/rwkv-raven-3b",
1037
+ "Azure99/blossom-v2-3b",
1038
+ "codellama/CodeLlama-34b-Python-hf",
1039
+ "bhenrym14/airoboros-33b-gpt4-1.4.1-PI-8192-fp16",
1040
+ "EleutherAI/gpt-neo-2.7B",
1041
+ "danielhanchen/open_llama_3b_600bt_preview",
1042
+ "HuggingFaceH4/starchat-alpha",
1043
+ "pythainlp/wangchanglm-7.5B-sft-en-sharded",
1044
+ "beaugogh/pythia-1.4b-deduped-sharegpt",
1045
+ "HWERI/pythia-1.4b-deduped-sharegpt",
1046
+ "OpenAssistant/stablelm-7b-sft-v7-epoch-3",
1047
+ "codellama/CodeLlama-7b-Python-hf",
1048
+ "aisquared/chopt-1_3b",
1049
+ "PygmalionAI/metharme-1.3b",
1050
+ "Linly-AI/Chinese-LLaMA-2-13B-hf",
1051
+ "chargoddard/llama-2-34b-uncode",
1052
+ "RWKV/rwkv-4-3b-pile",
1053
+ "pythainlp/wangchanglm-7.5B-sft-enth",
1054
+ "MBZUAI/LaMini-GPT-1.5B",
1055
+ "Writer/palmyra-base",
1056
+ "KoboldAI/fairseq-dense-1.3B",
1057
+ "EleutherAI/pythia-1.4b-deduped",
1058
+ "MBZUAI/lamini-neo-1.3b",
1059
+ "h2oai/h2ogpt-gm-oasst1-en-2048-open-llama-7b-preview-300bt",
1060
+ "sartmis1/starcoder-finetune-openapi",
1061
+ "MayaPH/opt-flan-iml-6.7b",
1062
+ "facebook/xglm-4.5B",
1063
+ "WizardLM/WizardCoder-15B-V1.0",
1064
+ "facebook/opt-iml-max-1.3b",
1065
+ "stabilityai/stablelm-tuned-alpha-7b",
1066
+ "aisquared/dlite-v2-1_5b",
1067
+ "stabilityai/stablelm-base-alpha-7b",
1068
+ "sartmis1/starcoder-finetune-selfinstruct",
1069
+ "lizhuang144/starcoder_mirror",
1070
+ "bigcode/starcoder",
1071
+ "TheBloke/CodeLlama-34B-Python-fp16",
1072
+ "open-llm-leaderboard/bloomz-1b7-4bit-alpaca-auto-eval-adapter-applied",
1073
+ "ehartford/CodeLlama-34b-Python-hf",
1074
+ "codellama/CodeLlama-7b-Python-hf",
1075
+ "GeorgiaTechResearchInstitute/starcoder-gpteacher-code-instruct",
1076
+ "LoupGarou/WizardCoder-Guanaco-15B-V1.0",
1077
+ "golaxy/gogpt-3b-bloom",
1078
+ "EleutherAI/pythia-1.3b",
1079
+ "codellama/CodeLlama-13b-Python-hf",
1080
+ "hakurei/lotus-12B",
1081
+ "NYTK/PULI-GPTrio",
1082
+ "facebook/opt-1.3b",
1083
+ "TheBloke/CodeLlama-13B-Python-fp16",
1084
+ "codellama/CodeLlama-13b-Python-hf",
1085
+ "RWKV/rwkv-raven-1b5",
1086
+ "PygmalionAI/pygmalion-2.7b",
1087
+ "bigscience/bloom-1b7",
1088
+ "gpt2-xl",
1089
+ "LoupGarou/WizardCoder-Guanaco-15B-V1.1",
1090
+ "RWKV/rwkv-4-1b5-pile",
1091
+ "codellama/CodeLlama-34b-hf",
1092
+ "NousResearch/CodeLlama-34b-hf",
1093
+ "rinna/bilingual-gpt-neox-4b-8k",
1094
+ "lxe/Cerebras-GPT-2.7B-Alpaca-SP",
1095
+ "cerebras/Cerebras-GPT-2.7B",
1096
+ "jzjiao/opt-1.3b-rlhf",
1097
+ "EleutherAI/gpt-neo-1.3B",
1098
+ "aisquared/dlite-v1-1_5b",
1099
+ "Corianas/Quokka_2.7b",
1100
+ "MrNJK/gpt2-xl-sft",
1101
+ "facebook/galactica-1.3b",
1102
+ "aisquared/dlite-v2-774m",
1103
+ "EleutherAI/pythia-1b-deduped",
1104
+ "Kunhao/pile-7b-250b-tokens",
1105
+ "w601sxs/b1ade-1b",
1106
+ "rinna/bilingual-gpt-neox-4b",
1107
+ "shaohang/SparseOPT-1.3B",
1108
+ "shaohang/Sparse0.5_OPT-1.3",
1109
+ "EleutherAI/polyglot-ko-12.8b",
1110
+ "Salesforce/codegen-6B-multi",
1111
+ "bigscience/bloom-1b1",
1112
+ "TFLai/gpt-neo-1.3B-4bit-alpaca",
1113
+ "FabbriSimo01/Bloom_1b_Quantized",
1114
+ "MBZUAI/LaMini-GPT-774M",
1115
+ "Locutusque/gpt2-large-conversational",
1116
+ "Devio/test-3b",
1117
+ "stabilityai/stablelm-tuned-alpha-3b",
1118
+ "PygmalionAI/pygmalion-1.3b",
1119
+ "KoboldAI/fairseq-dense-355M",
1120
+ "Rachneet/gpt2-xl-alpaca",
1121
+ "gpt2-large",
1122
+ "Mikivis/gpt2-large-lora-sft",
1123
+ "stabilityai/stablelm-base-alpha-3b",
1124
+ "gpt2-medium",
1125
+ "Kunhao/pile-7b",
1126
+ "aisquared/dlite-v1-774m",
1127
+ "aisquared/dlite-v2-355m",
1128
+ "YeungNLP/firefly-bloom-2b6-v2",
1129
+ "KnutJaegersberg/gpt-2-xl-EvolInstruct",
1130
+ "KnutJaegersberg/galactica-orca-wizardlm-1.3b",
1131
+ "cerebras/Cerebras-GPT-1.3B",
1132
+ "FabbriSimo01/Cerebras_1.3b_Quantized",
1133
+ "facebook/xglm-1.7B",
1134
+ "EleutherAI/pythia-410m-deduped",
1135
+ "TheBloke/GPlatty-30B-SuperHOT-8K-fp16",
1136
+ "DataLinguistic/DataLinguistic-34B-V1.0",
1137
+ "Corianas/Quokka_1.3b",
1138
+ "TheTravellingEngineer/bloom-560m-RLHF-v2",
1139
+ "Corianas/1.3b",
1140
+ "RWKV/rwkv-4-430m-pile",
1141
+ "porkorbeef/Llama-2-13b-sf",
1142
+ "xhyi/PT_GPTNEO350_ATG",
1143
+ "TheBloke/Wizard-Vicuna-13B-Uncensored-GPTQ",
1144
+ "bigscience/bloomz-560m",
1145
+ "TheBloke/medalpaca-13B-GPTQ-4bit",
1146
+ "TheBloke/Vicuna-33B-1-3-SuperHOT-8K-fp16",
1147
+ "aisquared/dlite-v1-355m",
1148
+ "uukuguy/speechless-codellama-orca-airoboros-13b-0.10e",
1149
+ "yhyhy3/med-orca-instruct-33b",
1150
+ "TheBloke/Wizard-Vicuna-30B-Superhot-8K-fp16",
1151
+ "TheTravellingEngineer/bloom-1b1-RLHF",
1152
+ "MBZUAI/lamini-cerebras-1.3b",
1153
+ "IDEA-CCNL/Ziya-LLaMA-13B-Pretrain-v1",
1154
+ "TheBloke/WizardLM-7B-uncensored-GPTQ",
1155
+ "TheBloke/EverythingLM-13B-16K-GPTQ",
1156
+ "quantumaikr/open_llama_7b_hf",
1157
+ "TheBloke/chronos-wizardlm-uc-scot-st-13B-GPTQ",
1158
+ "TheBloke/WizardLM-30B-Uncensored-GPTQ",
1159
+ "IDEA-CCNL/Ziya-LLaMA-13B-v1",
1160
+ "Phind/Phind-CodeLlama-34B-v1",
1161
+ "robowaifudev/megatron-gpt2-345m",
1162
+ "MayaPH/GodziLLa-30B-instruct",
1163
+ "TheBloke/CAMEL-33B-Combined-Data-SuperHOT-8K-fp16",
1164
+ "uukuguy/speechless-codellama-orca-platypus-13b-0.10e",
1165
+ "doas/test2",
1166
+ "BreadAi/PM_modelV2",
1167
+ "bigcode/santacoder",
1168
+ "TheBloke/wizard-vicuna-13B-GPTQ",
1169
+ "porkorbeef/Llama-2-13b",
1170
+ "TehVenom/DiffMerge-DollyGPT-Pygmalion",
1171
+ "PygmalionAI/pygmalion-350m",
1172
+ "TheBloke/orca_mini_v3_7B-GPTQ",
1173
+ "TheBloke/WizardLM-Uncensored-SuperCOT-StoryTelling-30B-GPTQ",
1174
+ "TheBloke/WizardLM-30B-GPTQ",
1175
+ "bigscience/bloom-560m",
1176
+ "TFLai/gpt2-turkish-uncased",
1177
+ "TheBloke/guanaco-33B-GPTQ",
1178
+ "TheBloke/openchat_v2_openorca_preview-GPTQ",
1179
+ "porkorbeef/Llama-2-13b-public",
1180
+ "TheBloke/LongChat-13B-GPTQ",
1181
+ "yhyhy3/med-orca-instruct-33b",
1182
+ "TheBloke/airoboros-33B-gpt4-1-4-SuperHOT-8K-fp16",
1183
+ "TheBloke/Chinese-Alpaca-33B-SuperHOT-8K-fp16",
1184
+ "MayaPH/FinOPT-Franklin",
1185
+ "TheBloke/WizardLM-33B-V1.0-Uncensored-GPTQ",
1186
+ "TheBloke/Project-Baize-v2-13B-GPTQ",
1187
+ "malhajar/Platypus2-70B-instruct-4bit-gptq",
1188
+ "KoboldAI/OPT-350M-Erebus",
1189
+ "rishiraj/bloom-560m-guanaco",
1190
+ "Panchovix/WizardLM-33B-V1.0-Uncensored-SuperHOT-8k",
1191
+ "doas/test5",
1192
+ "vicgalle/alpaca-7b",
1193
+ "beomi/KoAlpaca-Polyglot-5.8B",
1194
+ "Phind/Phind-CodeLlama-34B-Python-v1",
1195
+ "timdettmers/guanaco-65b-merged",
1196
+ "TheBloke/wizard-mega-13B-GPTQ",
1197
+ "MayaPH/GodziLLa-30B-plus",
1198
+ "TheBloke/Platypus-30B-SuperHOT-8K-fp16",
1199
+ "facebook/opt-350m",
1200
+ "KoboldAI/OPT-350M-Nerys-v2",
1201
+ "TheBloke/robin-33B-v2-GPTQ",
1202
+ "jaspercatapang/Echidna-30B",
1203
+ "TheBloke/llama-30b-supercot-SuperHOT-8K-fp16",
1204
+ "marcchew/test1",
1205
+ "Harshvir/LaMini-Neo-1.3B-Mental-Health_lora",
1206
+ "golaxy/gogpt-560m",
1207
+ "TheBloke/orca_mini_13B-GPTQ",
1208
+ "Panchovix/airoboros-33b-gpt4-1.2-SuperHOT-8k",
1209
+ "Aspik101/tulu-7b-instruct-pl-lora_unload",
1210
+ "Phind/Phind-CodeLlama-34B-v2",
1211
+ "BreadAi/MusePy-1-2",
1212
+ "cerebras/Cerebras-GPT-590M",
1213
+ "microsoft/CodeGPT-small-py",
1214
+ "victor123/WizardLM-13B-1.0",
1215
+ "OptimalScale/robin-65b-v2-delta",
1216
+ "voidful/changpt-bart",
1217
+ "FabbriSimo01/GPT_Large_Quantized",
1218
+ "MayaPH/FinOPT-Lincoln",
1219
+ "KoboldAI/fairseq-dense-125M",
1220
+ "SebastianSchramm/Cerebras-GPT-111M-instruction",
1221
+ "TheTravellingEngineer/bloom-560m-RLHF",
1222
+ "breadlicker45/dough-instruct-base-001",
1223
+ "WizardLM/WizardLM-30B-V1.0",
1224
+ "WizardLM/WizardLM-30B-V1.0",
1225
+ "WizardLM/WizardLM-30B-V1.0",
1226
+ "TaylorAI/Flash-Llama-30M-20001",
1227
+ "porkorbeef/Llama-2-13b-12_153950",
1228
+ "huggingtweets/bladeecity-jerma985",
1229
+ "KnutJaegersberg/megatron-GPT-2-345m-EvolInstruct",
1230
+ "bhenrym14/airoboros-33b-gpt4-1.4.1-lxctx-PI-16384-fp16",
1231
+ "microsoft/DialoGPT-small",
1232
+ "Corianas/590m",
1233
+ "facebook/xglm-564M",
1234
+ "EleutherAI/gpt-neo-125m",
1235
+ "EleutherAI/pythia-160m-deduped",
1236
+ "klosax/pythia-160m-deduped-step92k-193bt",
1237
+ "MBZUAI/lamini-neo-125m",
1238
+ "bigcode/tiny_starcoder_py",
1239
+ "concedo/OPT-19M-ChatSalad",
1240
+ "anton-l/gpt-j-tiny-random",
1241
+ "grantprice/Cerebras-GPT-590M-finetuned-DND",
1242
+ "deepnight-research/zsc-text",
1243
+ "WangZeJun/bloom-820m-chat",
1244
+ "cerebras/Cerebras-GPT-256M",
1245
+ "ai-forever/rugpt3large_based_on_gpt2",
1246
+ "alibidaran/medical_transcription_generator",
1247
+ "Deci/DeciCoder-1b",
1248
+ "microsoft/DialoGPT-medium",
1249
+ "ogimgio/gpt-neo-125m-neurallinguisticpioneers",
1250
+ "open-llm-leaderboard/bloom-560m-4bit-alpaca-auto-eval-adapter-applied",
1251
+ "BreadAi/gpt-YA-1-1_160M",
1252
+ "microsoft/DialoGPT-large",
1253
+ "facebook/opt-125m",
1254
+ "huggingtweets/jerma985",
1255
+ "Locutusque/gpt2-conversational-or-qa",
1256
+ "concedo/Pythia-70M-ChatSalad",
1257
+ "roneneldan/TinyStories-1M",
1258
+ "BreadAi/DiscordPy",
1259
+ "bigcode/gpt_bigcode-santacoder",
1260
+ "Tincando/fiction_story_generator",
1261
+ "klosax/pythia-70m-deduped-step44k-92bt",
1262
+ "Quake24/easyTermsSummerizer",
1263
+ "BreadAi/gpt-YA-1-1_70M",
1264
+ "EleutherAI/pythia-160m",
1265
+ "euclaise/gpt-neox-122m-minipile-digits",
1266
+ "MBZUAI/lamini-cerebras-590m",
1267
+ "nicholasKluge/Aira-124M",
1268
+ "MayaPH/FinOPT-Washington",
1269
+ "cyberagent/open-calm-large",
1270
+ "BreadAi/StoryPy",
1271
+ "EleutherAI/pythia-70m",
1272
+ "BreadAi/gpt-Youtube",
1273
+ "roneneldan/TinyStories-33M",
1274
+ "EleutherAI/pythia-70m-deduped",
1275
+ "lgaalves/gpt2_guanaco-dolly-platypus",
1276
+ "Corianas/Quokka_590m",
1277
+ "lgaalves/gpt2_platypus-dolly-guanaco",
1278
+ "cyberagent/open-calm-7b",
1279
+ "RWKV/rwkv-4-169m-pile",
1280
+ "gpt2",
1281
+ "roneneldan/TinyStories-28M",
1282
+ "lgaalves/gpt2_open-platypus",
1283
+ "gpt2",
1284
+ "SaylorTwift/gpt2_test",
1285
+ "roneneldan/TinyStories-3M",
1286
+ "nthngdy/pythia-owt2-70m-50k",
1287
+ "Corianas/256_5epoch",
1288
+ "roneneldan/TinyStories-8M",
1289
+ "lgaalves/gpt2-dolly",
1290
+ "nthngdy/pythia-owt2-70m-100k",
1291
+ "aisquared/dlite-v2-124m",
1292
+ "mncai/SGPT-1.3B-insurance-epoch10",
1293
+ "huggingtweets/gladosystem",
1294
+ "abhiramtirumala/DialoGPT-sarcastic-medium",
1295
+ "MBZUAI/lamini-cerebras-256m",
1296
+ "cerebras/Cerebras-GPT-111M",
1297
+ "uberkie/metharme-1.3b-finetuned",
1298
+ "MBZUAI/lamini-cerebras-111m",
1299
+ "psyche/kogpt",
1300
+ "Corianas/Quokka_256m",
1301
+ "vicgalle/gpt2-alpaca-gpt4",
1302
+ "aisquared/dlite-v1-124m",
1303
+ "Mikivis/xuanxuan",
1304
+ "MBZUAI/LaMini-GPT-124M",
1305
+ "vicgalle/gpt2-alpaca",
1306
+ "huashiyiqike/testmodel",
1307
+ "Corianas/111m",
1308
+ "baseline",
1309
+ ]
src/tools/plots.py ADDED
@@ -0,0 +1,155 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import pandas as pd
2
+ import numpy as np
3
+ import plotly.express as px
4
+ from plotly.graph_objs import Figure
5
+
6
+ from src.leaderboard.filter_models import FLAGGED_MODELS
7
+ from src.display.utils import human_baseline_row as HUMAN_BASELINE, AutoEvalColumn, BENCHMARK_COLS
8
+ from src.about import Tasks, Task
9
+ from src.leaderboard.read_evals import EvalResult
10
+
11
+
12
+
13
+ def create_scores_df(raw_data: list[EvalResult]) -> pd.DataFrame:
14
+ """
15
+ Generates a DataFrame containing the maximum scores until each date.
16
+
17
+ :param results_df: A DataFrame containing result information including metric scores and dates.
18
+ :return: A new DataFrame containing the maximum scores until each date for every metric.
19
+ """
20
+ # Step 1: Ensure 'date' is in datetime format and sort the DataFrame by it
21
+ results_df = pd.DataFrame(raw_data)
22
+ #results_df["date"] = pd.to_datetime(results_df["date"], format="mixed", utc=True)
23
+ results_df.sort_values(by="date", inplace=True)
24
+
25
+ # Step 2: Initialize the scores dictionary
26
+ scores = {k: [] for k in BENCHMARK_COLS + [AutoEvalColumn.average.name]}
27
+
28
+ # Step 3: Iterate over the rows of the DataFrame and update the scores dictionary
29
+ for task in [t.value for t in Tasks] + [Task("Average", "avg", AutoEvalColumn.average.name)]:
30
+ current_max = 0
31
+ last_date = ""
32
+ column = task.col_name
33
+ for _, row in results_df.iterrows():
34
+ current_model = row["full_model"]
35
+ if current_model in FLAGGED_MODELS:
36
+ continue
37
+
38
+ current_date = row["date"]
39
+ if task.benchmark == "Average":
40
+ current_score = np.mean(list(row["results"].values()))
41
+ else:
42
+ current_score = row["results"][task.benchmark]
43
+
44
+ if current_score > current_max:
45
+ if current_date == last_date and len(scores[column]) > 0:
46
+ scores[column][-1] = {"model": current_model, "date": current_date, "score": current_score}
47
+ else:
48
+ scores[column].append({"model": current_model, "date": current_date, "score": current_score})
49
+ current_max = current_score
50
+ last_date = current_date
51
+
52
+ # Step 4: Return all dictionaries as DataFrames
53
+ return {k: pd.DataFrame(v) for k, v in scores.items()}
54
+
55
+
56
+ def create_plot_df(scores_df: dict[str: pd.DataFrame]) -> pd.DataFrame:
57
+ """
58
+ Transforms the scores DataFrame into a new format suitable for plotting.
59
+
60
+ :param scores_df: A DataFrame containing metric scores and dates.
61
+ :return: A new DataFrame reshaped for plotting purposes.
62
+ """
63
+ # Initialize the list to store DataFrames
64
+ dfs = []
65
+
66
+ # Iterate over the cols and create a new DataFrame for each column
67
+ for col in BENCHMARK_COLS + [AutoEvalColumn.average.name]:
68
+ d = scores_df[col].reset_index(drop=True)
69
+ d["task"] = col
70
+ dfs.append(d)
71
+
72
+ # Concatenate all the created DataFrames
73
+ concat_df = pd.concat(dfs, ignore_index=True)
74
+
75
+ # Sort values by 'date'
76
+ concat_df.sort_values(by="date", inplace=True)
77
+ concat_df.reset_index(drop=True, inplace=True)
78
+ return concat_df
79
+
80
+
81
+ def create_metric_plot_obj(
82
+ df: pd.DataFrame, metrics: list[str], title: str
83
+ ) -> Figure:
84
+ """
85
+ Create a Plotly figure object with lines representing different metrics
86
+ and horizontal dotted lines representing human baselines.
87
+
88
+ :param df: The DataFrame containing the metric values, names, and dates.
89
+ :param metrics: A list of strings representing the names of the metrics
90
+ to be included in the plot.
91
+ :param title: A string representing the title of the plot.
92
+ :return: A Plotly figure object with lines representing metrics and
93
+ horizontal dotted lines representing human baselines.
94
+ """
95
+
96
+ # Filter the DataFrame based on the specified metrics
97
+ df = df[df["task"].isin(metrics)]
98
+
99
+ # Filter the human baselines based on the specified metrics
100
+ filtered_human_baselines = {k: v for k, v in HUMAN_BASELINE.items() if k in metrics}
101
+
102
+ # Create a line figure using plotly express with specified markers and custom data
103
+ fig = px.line(
104
+ df,
105
+ x="date",
106
+ y="score",
107
+ color="task",
108
+ markers=True,
109
+ custom_data=["task", "score", "model"],
110
+ title=title,
111
+ )
112
+
113
+ # Update hovertemplate for better hover interaction experience
114
+ fig.update_traces(
115
+ hovertemplate="<br>".join(
116
+ [
117
+ "Model Name: %{customdata[2]}",
118
+ "Metric Name: %{customdata[0]}",
119
+ "Date: %{x}",
120
+ "Metric Value: %{y}",
121
+ ]
122
+ )
123
+ )
124
+
125
+ # Update the range of the y-axis
126
+ fig.update_layout(yaxis_range=[0, 100])
127
+
128
+ # Create a dictionary to hold the color mapping for each metric
129
+ metric_color_mapping = {}
130
+
131
+ # Map each metric name to its color in the figure
132
+ for trace in fig.data:
133
+ metric_color_mapping[trace.name] = trace.line.color
134
+
135
+ # Iterate over filtered human baselines and add horizontal lines to the figure
136
+ #for metric, value in filtered_human_baselines.items():
137
+ # color = metric_color_mapping.get(metric, "blue") # Retrieve color from mapping; default to blue if not found
138
+ # location = "top left" if metric == "HellaSwag" else "bottom left" # Set annotation position
139
+ # # Add horizontal line with matched color and positioned annotation
140
+ # fig.add_hline(
141
+ # y=value,
142
+ # line_dash="dot",
143
+ # annotation_text=f"{metric} human baseline",
144
+ # annotation_position=location,
145
+ # annotation_font_size=10,
146
+ # annotation_font_color=color,
147
+ # line_color=color,
148
+ # )
149
+
150
+ return fig
151
+
152
+
153
+ # Example Usage:
154
+ # human_baselines dictionary is defined.
155
+ # chart = create_metric_plot_obj(scores_df, ["ARC", "HellaSwag", "MMLU", "TruthfulQA"], human_baselines, "Graph Title")