yentinglin committed on
Commit
65a9e72
1 Parent(s): d30a6b1

add tw tasks

Browse files
Files changed (1) hide show
  1. src/about.py +5 -3
src/about.py CHANGED
@@ -12,8 +12,9 @@ class Task:
12
  # ---------------------------------------------------
13
  class Tasks(Enum):
14
  # task_key in the json file, metric_key in the json file, name to display in the leaderboard
15
- task0 = Task("anli_r1", "acc", "ANLI")
16
- task1 = Task("logiqa", "acc_norm", "LogiQA")
 
17
 
18
  NUM_FEWSHOT = 0 # Change with your few shot
19
  # ---------------------------------------------------
@@ -35,6 +36,7 @@ LLM_BENCHMARKS_TEXT = f"""
35
  ## Reproducibility
36
  To reproduce our results, here is the commands you can run:
37
 
 
38
  """
39
 
40
  EVALUATION_QUEUE_TEXT = """
@@ -69,7 +71,7 @@ If everything is done, check you can launch the EleutherAIHarness on your model
69
 
70
  CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
71
  CITATION_BUTTON_TEXT = r"""
72
- @misc{open-ko-llm-leaderboard,
73
  author = {Yen{-}Ting Lin, Yun{-}Nung Chen},
74
  title = {Open TW-LLM Leaderboard},
75
  year = {2024},
 
12
  # ---------------------------------------------------
13
  class Tasks(Enum):
14
  # task_key in the json file, metric_key in the json file, name to display in the leaderboard
15
+ task2 = Task("tmlu", "acc", "TMLU")
16
+ task3 = Task("twllm_eval", "acc", "TW Truthful QA")
17
+ task4 = Task("tw_legal", "acc", "TW Legal Eval")
18
 
19
  NUM_FEWSHOT = 0 # Change with your few shot
20
  # ---------------------------------------------------
 
36
  ## Reproducibility
37
  To reproduce our results, here is the commands you can run:
38
 
39
+ please checkout this command https://github.com/adamlin120/lm-evaluation-harness/blob/main/run_all.sh
40
  """
41
 
42
  EVALUATION_QUEUE_TEXT = """
 
71
 
72
  CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
73
  CITATION_BUTTON_TEXT = r"""
74
+ @misc{open-tw-llm-leaderboard,
75
  author = {Yen{-}Ting Lin, Yun{-}Nung Chen},
76
  title = {Open TW-LLM Leaderboard},
77
  year = {2024},