# in-the-stack / app.py
# lvwerra's picture
# lvwerra HF staff
# Update app.py
# da1ef91
# raw
# history blame
# 1 kB
from datasets import load_dataset
import streamlit as st
# NOTE(review): newer Streamlit releases deprecate ``st.cache`` in favour of
# ``st.cache_data`` -- confirm the installed version before switching.
@st.cache()
def get_repo_names():
    """Return the repository names ("owner/repo") the app searches through.

    The list is hard-coded here; the result is memoised by Streamlit's
    cache decorator so it is not rebuilt on every script rerun.
    """
    return ["lvwerra/test", "lvwerra/test2", "numpy/numpy"]
# Page header and short description of what the tool does.
st.title("Am I in The Stack?")
st.markdown("This tool lets you check if a repository under a given username is part of [The Stack dataset](https://huggingface.co/datasets/bigcode/the-stack).")

# Names are expected in "owner/repo" form; the owner part is what gets matched.
repo_names = get_repo_names()
username = st.text_input("GitHub Username:")

if st.button("Check!"):
    # Normalise the typed name before comparing: surrounding whitespace from
    # copy/paste and differences in letter case should not cause a false
    # "no repository" answer (GitHub treats logins case-insensitively).
    wanted_owner = username.strip().casefold()
    list_of_repos = [
        repo_name
        for repo_name in repo_names
        # partition() yields the text before the first "/" (the owner).
        if repo_name.partition("/")[0].casefold() == wanted_owner
    ]

    if not list_of_repos:
        st.markdown("There is **no repository** under that username in The Stack.")
    else:
        # Pick singular/plural wording, then list the matches one per line.
        if len(list_of_repos) == 1:
            st.markdown("There is **1 repository** under that username in The Stack:")
        else:
            st.markdown(f"There are **{len(list_of_repos)} repositories** under that username in The Stack:")
        st.text("\n".join(list_of_repos))