llm-leaderboard / streamlit_app.py
Ludwig Stumpp
Add sources
3be1fea
raw
history blame
3.56 kB
import io
import pandas as pd
import requests
import streamlit as st
REPO_URL = "https://github.com/LudwigStumpp/llm-leaderboard"
def grab_file_from_repo(repo_url: str, filename: str) -> str:
"""Grabs a file from a GitHub repository.
Args:
repo_url (str): URL of the GitHub repository.
filename (str): Name of the file to grab.
Returns:
str: Content of the file.
"""
url = repo_url.replace("github.com", "raw.githubusercontent.com") + f"/main/{filename}"
return requests.get(url).text
def filter_dataframe(df: pd.DataFrame) -> pd.DataFrame:
"""
Adds a UI on top of a dataframe to let viewers filter columns
Modified from https://blog.streamlit.io/auto-generate-a-dataframe-filtering-ui-in-streamlit-with-filter_dataframe/
Args:
df (pd.DataFrame): Original dataframe
Returns:
pd.DataFrame: Filtered dataframe
"""
modify = st.checkbox("Add filters")
if not modify:
return df
df = df.copy()
modification_container = st.container()
with modification_container:
to_filter_index = st.multiselect("Filter by model:", df.index)
if to_filter_index:
df = pd.DataFrame(df.loc[to_filter_index])
to_filter_columns = st.multiselect("Filter by benchmark:", df.columns)
if to_filter_columns:
df = pd.DataFrame(df[to_filter_columns])
return df
def setup_basic():
title = "LLM-Leaderboard"
st.set_page_config(
page_title=title,
page_icon="πŸ†",
layout="wide",
)
st.title(title)
st.markdown(
"""
A joint community effort to create one central leaderboard for LLMs.
Visit [llm-leaderboard](https://github.com/LudwigStumpp/llm-leaderboard) to contribute.
"""
)
def setup_table():
csv_table = grab_file_from_repo(REPO_URL, "leaderboard.csv")
df = pd.read_csv(io.StringIO(csv_table), index_col=0)
df = df.sort_index(ascending=True)
df = df.replace(r"^\s*$", float("nan"), regex=True)
df = df.astype(float, errors="ignore")
st.markdown("### Leaderboard")
st.dataframe(filter_dataframe(df))
def setup_benchmarks():
csv_table = grab_file_from_repo(REPO_URL, "benchmarks.csv")
df = pd.read_csv(io.StringIO(csv_table), index_col=0)
df = df.sort_index(ascending=True)
st.markdown("### Covered Benchmarks")
selected_benchmark = st.selectbox("Select a benchmark to learn more:", df.index.unique())
df_selected = df.loc[selected_benchmark]
text = [
f"Name: {selected_benchmark} ",
]
for key in df_selected.keys():
text.append(f"{key}: {df_selected[key]} ")
st.markdown("\n".join(text))
def setup_sources():
csv_table = grab_file_from_repo(REPO_URL, "sources.csv")
df = pd.read_csv(io.StringIO(csv_table), index_col=0)
df = df.sort_index(ascending=True)
st.markdown("### Sources")
selected_source = st.selectbox("Select a source to learn more:", df.index.unique())
df_selected = df.loc[selected_source]
text = [
f"Author: {selected_source} ",
]
for key in df_selected.keys():
text.append(f"{key}: {df_selected[key]} ")
st.markdown("\n".join(text))
def setup_footer():
st.markdown(
"""
---
Made with ❀️ by the awesome open-source community from all over 🌍.
"""
)
def main():
setup_basic()
setup_table()
setup_benchmarks()
setup_sources()
setup_footer()
if __name__ == "__main__":
main()