|
Up
|
|
|
|
|
alpaca-eval.md
|
|
|
|
|
arena-hard-auto.md
|
|
|
|
|
arena-hard.md
|
|
|
|
|
berkeley-function-calling-leaderboard.md
|
|
|
|
|
comparing-llm-performance-anyscale.md
|
|
|
|
|
enterprise-scenarios-patronus.md
|
|
|
|
|
facts-grounding-leaderboard.md
|
|
|
|
|
gaia-benchmark.md
|
|
|
|
|
length-controlled-alpacaeval.md
|
|
|
|
|
llmperf-leaderboard.md
|
|
|
|
|
lmsys-arena.md
|
|
|
|
|
matharena.md
|
|
|
|
|
open-llm-leaderboard.md
|
|
|
|
|
vectara-hallucination-leaderboard.md
|
|
|
|
|
vidore-v2.md
|
|
|
|
|
zeroeval.md
|
|
|
|