Spaces:
Running
Running
Andrea Seveso
committed on
Commit
·
7853dd1
1
Parent(s):
48d0e61
Add changelog
Browse files
- app.py +5 -1
- src/about.py +17 -0
app.py
CHANGED
|
@@ -14,6 +14,7 @@ from src.about import (
|
|
| 14 |
EVALUATION_QUEUE_TEXT,
|
| 15 |
QUESTION_FORMAT_TEXT,
|
| 16 |
MACRO_AREA_TEXT,
|
|
|
|
| 17 |
)
|
| 18 |
from src.display.css_html_js import custom_css
|
| 19 |
from src.display.utils import (
|
|
@@ -263,7 +264,10 @@ with demo:
|
|
| 263 |
with gr.TabItem("📝 About", elem_id="llm-benchmark-tab-table", id=2):
|
| 264 |
gr.Markdown(LLM_BENCHMARKS_TEXT, elem_classes="markdown-text")
|
| 265 |
|
| 266 |
-
with gr.TabItem("
|
|
|
|
|
|
|
|
|
|
| 267 |
with gr.Column():
|
| 268 |
with gr.Row():
|
| 269 |
gr.Markdown(EVALUATION_QUEUE_TEXT,
|
|
|
|
| 14 |
EVALUATION_QUEUE_TEXT,
|
| 15 |
QUESTION_FORMAT_TEXT,
|
| 16 |
MACRO_AREA_TEXT,
|
| 17 |
+
CHANGELOG_TEXT,
|
| 18 |
)
|
| 19 |
from src.display.css_html_js import custom_css
|
| 20 |
from src.display.utils import (
|
|
|
|
| 264 |
with gr.TabItem("📝 About", elem_id="llm-benchmark-tab-table", id=2):
|
| 265 |
gr.Markdown(LLM_BENCHMARKS_TEXT, elem_classes="markdown-text")
|
| 266 |
|
| 267 |
+
with gr.TabItem("🛠️ Changelog", elem_id="changelog-tab", id=3):
|
| 268 |
+
gr.Markdown(CHANGELOG_TEXT, elem_classes="markdown-text")
|
| 269 |
+
|
| 270 |
+
with gr.TabItem("🚀 Submit here! ", elem_id="llm-benchmark-tab-table", id=4):
|
| 271 |
with gr.Column():
|
| 272 |
with gr.Row():
|
| 273 |
gr.Markdown(EVALUATION_QUEUE_TEXT,
|
src/about.py
CHANGED
|
@@ -290,3 +290,20 @@ Categories are abbreviated as:
|
|
| 290 |
* _SY_: Syntax.
|
| 291 |
* _TP_: Textuality and pragmatics.
|
| 292 |
"""
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 290 |
* _SY_: Syntax.
|
| 291 |
* _TP_: Textuality and pragmatics.
|
| 292 |
"""
|
| 293 |
+
|
| 294 |
+
CHANGELOG_TEXT = """
|
| 295 |
+
## Changelog
|
| 296 |
+
|
| 297 |
+
### 27/06/2024
|
| 298 |
+
- π Added changelog.
|
| 299 |
+
- π New model: claude-3.5-sonnet
|
| 300 |
+
|
| 301 |
+
### 26/06/2024
|
| 302 |
+
- π Initial leaderboard launch.
|
| 303 |
+
- π Added evaluation metrics for the INVALSI benchmark.
|
| 304 |
+
- π Added leaderboard introduction.
|
| 305 |
+
- β Added INVALSI benchmark description.
|
| 306 |
+
- π Added evaluation queue form.
|
| 307 |
+
- π¬ Added citation button.
|
| 308 |
+
- π Added question format and macro area descriptions.
|
| 309 |
+
"""
|