Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
File size: 1,888 Bytes
a8ede2f 24eddae a8ede2f 24eddae a8ede2f dc1ba50 a8ede2f dc1ba50 a8ede2f dc1ba50 a8ede2f dc1ba50 a8ede2f |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 |
from src.display.utils import ModelType
# HTML heading for the Space; the emoji is stored as real UTF-8 text.
TITLE = """<h1 align="center" id="space-title">🤗 Open Hallucinations Leaderboard</h1>"""
# Markdown introduction blurb: states the leaderboard's goal, points to the
# "Submit" page, and links to the evaluation harness used by the backend.
INTRODUCTION_TEXT = """
📐 The 🤗 Open Hallucinations Leaderboard aims to track, rank and evaluate hallucinations in LLMs and chatbots.
🤗 Submit a model for automated evaluation on the 🤗 GPU cluster on the "Submit" page!
The leaderboard's backend runs the great [Eleuther AI Language Model Evaluation Harness](https://github.com/EleutherAI/lm-evaluation-harness) - read more details in the "About" page!
"""
# Body text describing the benchmarks.
# TODO: "XXX" looks like placeholder content - replace with the real text.
# Deliberately a plain (non-f) string: there is nothing to interpolate, and a
# plain literal keeps any future "{" / "}" in the text from being parsed as
# replacement fields.
LLM_BENCHMARKS_TEXT = """
XXX
"""

# Body text for the evaluation queue.
# TODO: "XXX" looks like placeholder content - replace with the real text.
EVALUATION_QUEUE_TEXT = """
XXX
"""
# Label for the citation snippet.
CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"

# BibTeX entries for the leaderboard itself and for the evaluation harness.
# Must stay a raw string: a "\u" sequence (as in "\url") is a syntax error in
# a normal string literal. Every "{" must have a matching "}" so the snippet
# remains valid BibTeX when copied.
CITATION_BUTTON_TEXT = r"""
@misc{hallucinations-leaderboard,
author = {Pasquale Minervini},
title = {Hallucinations Leaderboard},
year = {2023},
publisher = {Hugging Face},
howpublished = "\url{https://huggingface.co/spaces/hallucinations-leaderboard/leaderboard}"
}
@software{eval-harness,
author = {Gao, Leo and
Tow, Jonathan and
Biderman, Stella and
Black, Sid and
DiPofi, Anthony and
Foster, Charles and
Golding, Laurence and
Hsu, Jeffrey and
McDonell, Kyle and
Muennighoff, Niklas and
Phang, Jason and
Reynolds, Laria and
Tang, Eric and
Thite, Anish and
Wang, Ben and
Wang, Kevin and
Zou, Andy},
title = {A framework for few-shot language model evaluation},
month = sep,
year = 2021,
publisher = {Zenodo},
version = {v0.0.1},
doi = {10.5281/zenodo.5371628},
url = {https://doi.org/10.5281/zenodo.5371628}
}
"""
|