.. |
__init__.py
|
[Feature] add dataset Fofo (#1224)
|
2024-06-06 11:40:48 +08:00 |
alignmentbench.py
|
[Sync] update taco (#1030)
|
2024-04-09 17:50:23 +08:00 |
all_obj.py
|
[Fix] Fix Math Evaluation with Judge Model Evaluator & Add README (#1103)
|
2024-04-28 21:58:58 +08:00 |
alpacaeval.py
|
[Feature] Add multi-model judge and fix some problems (#1016)
|
2024-04-02 11:52:06 +08:00 |
arenahard.py
|
[Fix] fix summarizer (#1217)
|
2024-05-31 11:40:47 +08:00 |
compass_arena.py
|
[Sync] deprecate old mbpps (#1064)
|
2024-04-19 20:49:46 +08:00 |
compassbench.py
|
[Sync] format (#1214)
|
2024-05-30 00:21:58 +08:00 |
corev2.py
|
reorganize subject files (#801)
|
2024-01-16 18:03:11 +08:00 |
creationbench.py
|
reorganize subject files (#801)
|
2024-01-16 18:03:11 +08:00 |
flames.py
|
[Feature] add support for Flames datasets (#1093)
|
2024-04-28 18:56:24 +08:00 |
fofo.py
|
[Feature] add dataset Fofo (#1224)
|
2024-06-06 11:40:48 +08:00 |
information_retrival.py
|
reorganize subject files (#801)
|
2024-01-16 18:03:11 +08:00 |
mtbench101.py
|
MT-Bench-101 (#1215)
|
2024-06-03 14:52:12 +08:00 |
mtbench.py
|
[Sync] deprecate old mbpps (#1064)
|
2024-04-19 20:49:46 +08:00 |
multiround.py
|
[Fix] Fix MultiRound Subjective Evaluation(#1043)
|
2024-04-22 12:06:03 +08:00 |
subjective_post_process.py
|
reorganize subject files (#801)
|
2024-01-16 18:03:11 +08:00 |
utils.py
|
fix compass arena (#854)
|
2024-01-30 16:34:38 +08:00 |