.. |
__init__.py
|
[Update] update docs and add compassarena (#1614)
|
2024-10-17 14:39:06 +08:00 |
alignbench.py
|
[Feature] Add Judgerbench and reorg subeval (#1593)
|
2024-10-15 16:36:05 +08:00 |
alpacaeval.py
|
[Feature] Add Judgerbench and reorg subeval (#1593)
|
2024-10-15 16:36:05 +08:00 |
arena_hard.py
|
[Feature] Add Judgerbench and reorg subeval (#1593)
|
2024-10-15 16:36:05 +08:00 |
compass_arena.py
|
[Update] update docs and add compassarena (#1614)
|
2024-10-17 14:39:06 +08:00 |
compassbench_checklist.py
|
[Feature] support compassbench Checklist evaluation (#1339)
|
2024-07-19 16:40:44 +08:00 |
compassbench_control_length_bias.py
|
[Refactor] Reorganize subjective eval (#1284)
|
2024-07-05 22:11:37 +08:00 |
compassbench.py
|
[Refactor] Reorganize subjective eval (#1284)
|
2024-07-05 22:11:37 +08:00 |
corev2.py
|
reorganize subject files (#801)
|
2024-01-16 18:03:11 +08:00 |
creationbench.py
|
reorganize subject files (#801)
|
2024-01-16 18:03:11 +08:00 |
flames.py
|
[Fix] fix Flames (#1599)
|
2024-10-12 14:34:59 +08:00 |
fofo.py
|
[Feature] Add Judgerbench and reorg subeval (#1593)
|
2024-10-15 16:36:05 +08:00 |
followbench.py
|
[Feature] Add Judgerbench and reorg subeval (#1593)
|
2024-10-15 16:36:05 +08:00 |
hellobench.py
|
Upload HelloBench (#1607)
|
2024-10-15 17:11:37 +08:00 |
judgerbench.py
|
[Feature] Add Judgerbench and reorg subeval (#1593)
|
2024-10-15 16:36:05 +08:00 |
mtbench101.py
|
[Feature] Add Judgerbench and reorg subeval (#1593)
|
2024-10-15 16:36:05 +08:00 |
mtbench.py
|
[Feature] Add Judgerbench and reorg subeval (#1593)
|
2024-10-15 16:36:05 +08:00 |
multiround.py
|
reorganize subject files (#801)
|
2024-01-16 18:03:11 +08:00 |
subjective_cmp.py
|
[Fix] Fix Slurm ENV (#1392)
|
2024-08-06 01:35:20 +08:00 |
utils.py
|
[Feature] Add Judgerbench and reorg subeval (#1593)
|
2024-10-15 16:36:05 +08:00 |
wildbench.py
|
[Feature] Add Judgerbench and reorg subeval (#1593)
|
2024-10-15 16:36:05 +08:00 |