"""Streamlit page: check whether a GitHub user's repositories are in The Stack."""

from datasets import load_dataset
import streamlit as st


# NOTE(review): `st.cache` is deprecated in newer Streamlit releases in favour
# of `st.cache_data` -- confirm the pinned Streamlit version before switching.
@st.cache()
def load_all_repository_names():
    """Return the list of repository names the page searches against.

    Only a single placeholder entry is returned for now. The real lookup,
    which is currently disabled, would be:

        load_dataset("bigcode/the-stack-paths", split="train")["repository_name"]

    The result is memoized by the ``st.cache`` decorator.
    """
    return ["test"]


# --- Page header -----------------------------------------------------------
st.title("Am I in The Stack?")
st.markdown(
    "This tool lets you check if a repository under a given username is part of "
    "[The Stack dataset](https://huggingface.co/datasets/bigcode/the-stack)."
)

# --- Data ------------------------------------------------------------------
repo_names = load_all_repository_names()
# Total number of known repositories; not used further in the visible script.
n_repos = len(repo_names)

# --- User input ------------------------------------------------------------
# The entered value is captured but not yet acted upon in the visible script.
username = st.text_input("GitHub Username:")

st.markdown("_Note_: this Space is currently under construction.")