# Ignore rules for this repository.
# Git reads exactly one pattern per line; several patterns separated by
# spaces on a single line are treated as ONE pattern containing literal
# spaces, so every entry below sits on its own line.
# A trailing "/" restricts a pattern to directories.

# Directories (purpose inferred from the names only; confirm with the project)
auto_evals/
venv/
__pycache__/

# Local environment file (presumably holds secrets/settings; keep untracked)
.env

# Notebook artifacts.
# NOTE(review): "*ipynb" has no dot, so it matches ANY name ending in
# "ipynb" (which includes "*.ipynb"). Kept as-is to preserve behavior;
# tighten to "*.ipynb" only if that broader match is unintended.
.ipynb_checkpoints
*ipynb

# Editor settings directory
.vscode/

# Evaluation queue/result directories and their "-bk" counterparts
eval-queue/
eval-results/
eval-queue-bk/
eval-results-bk/

# Other directories kept out of version control
logs/
envs/

# Individual files kept out of version control
tmp.py
print.py
leaderboard.tex