{"cells":[{"cell_type":"code","execution_count":1,"metadata":{"application/vnd.databricks.v1+cell":{"cellMetadata":{"byteLimit":2048000,"rowLimit":10000},"inputWidgets":{},"nuid":"0ea8b46b-839b-445b-8043-ccdf4e920ace","showTitle":false,"title":""},"executionInfo":{"elapsed":5,"status":"ok","timestamp":1720336753526,"user":{"displayName":"Inflaton Sng","userId":"00179918120580399412"},"user_tz":-480},"id":"KSWhkNUGHk6J"},"outputs":[],"source":["%load_ext autoreload\n","%autoreload 2"]},{"cell_type":"code","execution_count":2,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":18914,"status":"ok","timestamp":1720336772436,"user":{"displayName":"Inflaton Sng","userId":"00179918120580399412"},"user_tz":-480},"id":"O1N25gePH3nR","outputId":"d4dc260f-ea46-48f7-cb49-6d25beae279e"},"outputs":[{"output_type":"stream","name":"stdout","text":["Mounted at /content/drive\n"]}],"source":["from google.colab import drive\n","drive.mount('/content/drive')"]},{"cell_type":"code","execution_count":3,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":170894,"status":"ok","timestamp":1720336943324,"user":{"displayName":"Inflaton Sng","userId":"00179918120580399412"},"user_tz":-480},"id":"ExKl7VacH6Va","outputId":"39d09e8a-f5fe-48bc-86bf-ee997c9c3103"},"outputs":[{"output_type":"stream","name":"stdout","text":["/content\n","Cloning into 'LLaMA-Factory'...\n","remote: Enumerating objects: 15281, done.\u001b[K\n","remote: Counting objects: 100% (231/231), done.\u001b[K\n","remote: Compressing objects: 100% (99/99), done.\u001b[K\n","remote: Total 15281 (delta 141), reused 191 (delta 131), pack-reused 15050\u001b[K\n","Receiving objects: 100% (15281/15281), 221.43 MiB | 20.24 MiB/s, done.\n","Resolving deltas: 100% (11190/11190), done.\n","/content/LLaMA-Factory\n","\u001b[0m\u001b[01;34massets\u001b[0m/ \u001b[01;34mdocker\u001b[0m/ LICENSE pyproject.toml requirements.txt \u001b[01;34msrc\u001b[0m/\n","CITATION.cff 
\u001b[01;34mevaluation\u001b[0m/ Makefile README.md \u001b[01;34mscripts\u001b[0m/ \u001b[01;34mtests\u001b[0m/\n","\u001b[01;34mdata\u001b[0m/ \u001b[01;34mexamples\u001b[0m/ MANIFEST.in README_zh.md setup.py\n","Obtaining file:///content/LLaMA-Factory\n"," Installing build dependencies ... \u001b[?25l\u001b[?25hdone\n"," Checking if build backend supports build_editable ... \u001b[?25l\u001b[?25hdone\n"," Getting requirements to build editable ... \u001b[?25l\u001b[?25hdone\n"," Preparing editable metadata (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n","Requirement already satisfied: transformers>=4.41.2 in /usr/local/lib/python3.10/dist-packages (from llamafactory==0.8.3.dev0) (4.41.2)\n","Collecting datasets>=2.16.0 (from llamafactory==0.8.3.dev0)\n"," Downloading datasets-2.20.0-py3-none-any.whl (547 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m547.8/547.8 kB\u001b[0m \u001b[31m6.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting accelerate>=0.30.1 (from llamafactory==0.8.3.dev0)\n"," Downloading accelerate-0.32.1-py3-none-any.whl (314 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m314.1/314.1 kB\u001b[0m \u001b[31m8.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting peft>=0.11.1 (from llamafactory==0.8.3.dev0)\n"," Downloading peft-0.11.1-py3-none-any.whl (251 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m251.6/251.6 kB\u001b[0m \u001b[31m11.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting trl>=0.8.6 (from llamafactory==0.8.3.dev0)\n"," Downloading trl-0.9.4-py3-none-any.whl (226 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m226.7/226.7 kB\u001b[0m \u001b[31m10.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting gradio>=4.0.0 (from llamafactory==0.8.3.dev0)\n"," Downloading 
gradio-4.37.2-py3-none-any.whl (12.3 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m12.3/12.3 MB\u001b[0m \u001b[31m32.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: pandas>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from llamafactory==0.8.3.dev0) (2.0.3)\n","Requirement already satisfied: scipy in /usr/local/lib/python3.10/dist-packages (from llamafactory==0.8.3.dev0) (1.11.4)\n","Collecting einops (from llamafactory==0.8.3.dev0)\n"," Downloading einops-0.8.0-py3-none-any.whl (43 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m43.2/43.2 kB\u001b[0m \u001b[31m6.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: sentencepiece in /usr/local/lib/python3.10/dist-packages (from llamafactory==0.8.3.dev0) (0.1.99)\n","Collecting tiktoken (from llamafactory==0.8.3.dev0)\n"," Downloading tiktoken-0.7.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (1.1 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.1/1.1 MB\u001b[0m \u001b[31m61.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: protobuf in /usr/local/lib/python3.10/dist-packages (from llamafactory==0.8.3.dev0) (3.20.3)\n","Collecting uvicorn (from llamafactory==0.8.3.dev0)\n"," Downloading uvicorn-0.30.1-py3-none-any.whl (62 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m62.4/62.4 kB\u001b[0m \u001b[31m7.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: pydantic in /usr/local/lib/python3.10/dist-packages (from llamafactory==0.8.3.dev0) (2.8.0)\n","Collecting fastapi (from llamafactory==0.8.3.dev0)\n"," Downloading fastapi-0.111.0-py3-none-any.whl (91 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m92.0/92.0 kB\u001b[0m 
\u001b[31m13.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting sse-starlette (from llamafactory==0.8.3.dev0)\n"," Downloading sse_starlette-2.1.2-py3-none-any.whl (9.3 kB)\n","Requirement already satisfied: matplotlib>=3.7.0 in /usr/local/lib/python3.10/dist-packages (from llamafactory==0.8.3.dev0) (3.7.1)\n","Collecting fire (from llamafactory==0.8.3.dev0)\n"," Downloading fire-0.6.0.tar.gz (88 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m88.4/88.4 kB\u001b[0m \u001b[31m14.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25h Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n","Requirement already satisfied: packaging in /usr/local/lib/python3.10/dist-packages (from llamafactory==0.8.3.dev0) (24.1)\n","Requirement already satisfied: pyyaml in /usr/local/lib/python3.10/dist-packages (from llamafactory==0.8.3.dev0) (6.0.1)\n","Requirement already satisfied: numpy<2.0.0 in /usr/local/lib/python3.10/dist-packages (from llamafactory==0.8.3.dev0) (1.25.2)\n","Requirement already satisfied: torch>=1.13.1 in /usr/local/lib/python3.10/dist-packages (from llamafactory==0.8.3.dev0) (2.3.0+cu121)\n","Collecting bitsandbytes>=0.39.0 (from llamafactory==0.8.3.dev0)\n"," Downloading bitsandbytes-0.43.1-py3-none-manylinux_2_24_x86_64.whl (119.8 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m119.8/119.8 MB\u001b[0m \u001b[31m7.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: psutil in /usr/local/lib/python3.10/dist-packages (from accelerate>=0.30.1->llamafactory==0.8.3.dev0) (5.9.5)\n","Requirement already satisfied: huggingface-hub in /usr/local/lib/python3.10/dist-packages (from accelerate>=0.30.1->llamafactory==0.8.3.dev0) (0.23.4)\n","Requirement already satisfied: safetensors>=0.3.1 in /usr/local/lib/python3.10/dist-packages (from accelerate>=0.30.1->llamafactory==0.8.3.dev0) (0.4.3)\n","Requirement already 
satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->llamafactory==0.8.3.dev0) (3.15.4)\n","Collecting pyarrow>=15.0.0 (from datasets>=2.16.0->llamafactory==0.8.3.dev0)\n"," Downloading pyarrow-16.1.0-cp310-cp310-manylinux_2_28_x86_64.whl (40.8 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m40.8/40.8 MB\u001b[0m \u001b[31m19.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: pyarrow-hotfix in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->llamafactory==0.8.3.dev0) (0.6)\n","Collecting dill<0.3.9,>=0.3.0 (from datasets>=2.16.0->llamafactory==0.8.3.dev0)\n"," Downloading dill-0.3.8-py3-none-any.whl (116 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m116.3/116.3 kB\u001b[0m \u001b[31m14.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting requests>=2.32.2 (from datasets>=2.16.0->llamafactory==0.8.3.dev0)\n"," Downloading requests-2.32.3-py3-none-any.whl (64 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m64.9/64.9 kB\u001b[0m \u001b[31m9.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: tqdm>=4.66.3 in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->llamafactory==0.8.3.dev0) (4.66.4)\n","Collecting xxhash (from datasets>=2.16.0->llamafactory==0.8.3.dev0)\n"," Downloading xxhash-3.4.1-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (194 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m194.1/194.1 kB\u001b[0m \u001b[31m22.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting multiprocess (from datasets>=2.16.0->llamafactory==0.8.3.dev0)\n"," Downloading multiprocess-0.70.16-py310-none-any.whl (134 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m134.8/134.8 kB\u001b[0m 
\u001b[31m15.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: fsspec[http]<=2024.5.0,>=2023.1.0 in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->llamafactory==0.8.3.dev0) (2023.6.0)\n","Requirement already satisfied: aiohttp in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->llamafactory==0.8.3.dev0) (3.9.5)\n","Collecting aiofiles<24.0,>=22.0 (from gradio>=4.0.0->llamafactory==0.8.3.dev0)\n"," Downloading aiofiles-23.2.1-py3-none-any.whl (15 kB)\n","Requirement already satisfied: altair<6.0,>=4.2.0 in /usr/local/lib/python3.10/dist-packages (from gradio>=4.0.0->llamafactory==0.8.3.dev0) (4.2.2)\n","Collecting ffmpy (from gradio>=4.0.0->llamafactory==0.8.3.dev0)\n"," Downloading ffmpy-0.3.2.tar.gz (5.5 kB)\n"," Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n","Collecting gradio-client==1.0.2 (from gradio>=4.0.0->llamafactory==0.8.3.dev0)\n"," Downloading gradio_client-1.0.2-py3-none-any.whl (318 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m318.2/318.2 kB\u001b[0m \u001b[31m32.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting httpx>=0.24.1 (from gradio>=4.0.0->llamafactory==0.8.3.dev0)\n"," Downloading httpx-0.27.0-py3-none-any.whl (75 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m75.6/75.6 kB\u001b[0m \u001b[31m9.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: importlib-resources<7.0,>=1.3 in /usr/local/lib/python3.10/dist-packages (from gradio>=4.0.0->llamafactory==0.8.3.dev0) (6.4.0)\n","Requirement already satisfied: jinja2<4.0 in /usr/local/lib/python3.10/dist-packages (from gradio>=4.0.0->llamafactory==0.8.3.dev0) (3.1.4)\n","Requirement already satisfied: markupsafe~=2.0 in /usr/local/lib/python3.10/dist-packages (from gradio>=4.0.0->llamafactory==0.8.3.dev0) (2.1.5)\n","Collecting orjson~=3.0 (from 
gradio>=4.0.0->llamafactory==0.8.3.dev0)\n"," Downloading orjson-3.10.6-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (141 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m141.1/141.1 kB\u001b[0m \u001b[31m10.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: pillow<11.0,>=8.0 in /usr/local/lib/python3.10/dist-packages (from gradio>=4.0.0->llamafactory==0.8.3.dev0) (9.4.0)\n","Collecting pydub (from gradio>=4.0.0->llamafactory==0.8.3.dev0)\n"," Downloading pydub-0.25.1-py2.py3-none-any.whl (32 kB)\n","Collecting python-multipart>=0.0.9 (from gradio>=4.0.0->llamafactory==0.8.3.dev0)\n"," Downloading python_multipart-0.0.9-py3-none-any.whl (22 kB)\n","Collecting ruff>=0.2.2 (from gradio>=4.0.0->llamafactory==0.8.3.dev0)\n"," Downloading ruff-0.5.1-py3-none-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (10.1 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m10.1/10.1 MB\u001b[0m \u001b[31m75.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting semantic-version~=2.0 (from gradio>=4.0.0->llamafactory==0.8.3.dev0)\n"," Downloading semantic_version-2.10.0-py2.py3-none-any.whl (15 kB)\n","Collecting tomlkit==0.12.0 (from gradio>=4.0.0->llamafactory==0.8.3.dev0)\n"," Downloading tomlkit-0.12.0-py3-none-any.whl (37 kB)\n","Requirement already satisfied: typer<1.0,>=0.12 in /usr/local/lib/python3.10/dist-packages (from gradio>=4.0.0->llamafactory==0.8.3.dev0) (0.12.3)\n","Requirement already satisfied: typing-extensions~=4.0 in /usr/local/lib/python3.10/dist-packages (from gradio>=4.0.0->llamafactory==0.8.3.dev0) (4.12.2)\n","Requirement already satisfied: urllib3~=2.0 in /usr/local/lib/python3.10/dist-packages (from gradio>=4.0.0->llamafactory==0.8.3.dev0) (2.0.7)\n","Collecting websockets<12.0,>=10.0 (from gradio-client==1.0.2->gradio>=4.0.0->llamafactory==0.8.3.dev0)\n"," Downloading 
websockets-11.0.3-cp310-cp310-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl (129 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m129.9/129.9 kB\u001b[0m \u001b[31m23.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: contourpy>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib>=3.7.0->llamafactory==0.8.3.dev0) (1.2.1)\n","Requirement already satisfied: cycler>=0.10 in /usr/local/lib/python3.10/dist-packages (from matplotlib>=3.7.0->llamafactory==0.8.3.dev0) (0.12.1)\n","Requirement already satisfied: fonttools>=4.22.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib>=3.7.0->llamafactory==0.8.3.dev0) (4.53.0)\n","Requirement already satisfied: kiwisolver>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib>=3.7.0->llamafactory==0.8.3.dev0) (1.4.5)\n","Requirement already satisfied: pyparsing>=2.3.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib>=3.7.0->llamafactory==0.8.3.dev0) (3.1.2)\n","Requirement already satisfied: python-dateutil>=2.7 in /usr/local/lib/python3.10/dist-packages (from matplotlib>=3.7.0->llamafactory==0.8.3.dev0) (2.8.2)\n","Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.10/dist-packages (from pandas>=2.0.0->llamafactory==0.8.3.dev0) (2023.4)\n","Requirement already satisfied: tzdata>=2022.1 in /usr/local/lib/python3.10/dist-packages (from pandas>=2.0.0->llamafactory==0.8.3.dev0) (2024.1)\n","Requirement already satisfied: annotated-types>=0.4.0 in /usr/local/lib/python3.10/dist-packages (from pydantic->llamafactory==0.8.3.dev0) (0.7.0)\n","Requirement already satisfied: pydantic-core==2.20.0 in /usr/local/lib/python3.10/dist-packages (from pydantic->llamafactory==0.8.3.dev0) (2.20.0)\n","Requirement already satisfied: sympy in /usr/local/lib/python3.10/dist-packages (from torch>=1.13.1->llamafactory==0.8.3.dev0) (1.12.1)\n","Requirement already 
satisfied: networkx in /usr/local/lib/python3.10/dist-packages (from torch>=1.13.1->llamafactory==0.8.3.dev0) (3.3)\n","Collecting nvidia-cuda-nvrtc-cu12==12.1.105 (from torch>=1.13.1->llamafactory==0.8.3.dev0)\n"," Using cached nvidia_cuda_nvrtc_cu12-12.1.105-py3-none-manylinux1_x86_64.whl (23.7 MB)\n","Collecting nvidia-cuda-runtime-cu12==12.1.105 (from torch>=1.13.1->llamafactory==0.8.3.dev0)\n"," Using cached nvidia_cuda_runtime_cu12-12.1.105-py3-none-manylinux1_x86_64.whl (823 kB)\n","Collecting nvidia-cuda-cupti-cu12==12.1.105 (from torch>=1.13.1->llamafactory==0.8.3.dev0)\n"," Using cached nvidia_cuda_cupti_cu12-12.1.105-py3-none-manylinux1_x86_64.whl (14.1 MB)\n","Collecting nvidia-cudnn-cu12==8.9.2.26 (from torch>=1.13.1->llamafactory==0.8.3.dev0)\n"," Using cached nvidia_cudnn_cu12-8.9.2.26-py3-none-manylinux1_x86_64.whl (731.7 MB)\n","Collecting nvidia-cublas-cu12==12.1.3.1 (from torch>=1.13.1->llamafactory==0.8.3.dev0)\n"," Using cached nvidia_cublas_cu12-12.1.3.1-py3-none-manylinux1_x86_64.whl (410.6 MB)\n","Collecting nvidia-cufft-cu12==11.0.2.54 (from torch>=1.13.1->llamafactory==0.8.3.dev0)\n"," Using cached nvidia_cufft_cu12-11.0.2.54-py3-none-manylinux1_x86_64.whl (121.6 MB)\n","Collecting nvidia-curand-cu12==10.3.2.106 (from torch>=1.13.1->llamafactory==0.8.3.dev0)\n"," Using cached nvidia_curand_cu12-10.3.2.106-py3-none-manylinux1_x86_64.whl (56.5 MB)\n","Collecting nvidia-cusolver-cu12==11.4.5.107 (from torch>=1.13.1->llamafactory==0.8.3.dev0)\n"," Using cached nvidia_cusolver_cu12-11.4.5.107-py3-none-manylinux1_x86_64.whl (124.2 MB)\n","Collecting nvidia-cusparse-cu12==12.1.0.106 (from torch>=1.13.1->llamafactory==0.8.3.dev0)\n"," Using cached nvidia_cusparse_cu12-12.1.0.106-py3-none-manylinux1_x86_64.whl (196.0 MB)\n","Collecting nvidia-nccl-cu12==2.20.5 (from torch>=1.13.1->llamafactory==0.8.3.dev0)\n"," Using cached nvidia_nccl_cu12-2.20.5-py3-none-manylinux2014_x86_64.whl (176.2 MB)\n","Collecting nvidia-nvtx-cu12==12.1.105 (from 
torch>=1.13.1->llamafactory==0.8.3.dev0)\n"," Using cached nvidia_nvtx_cu12-12.1.105-py3-none-manylinux1_x86_64.whl (99 kB)\n","Requirement already satisfied: triton==2.3.0 in /usr/local/lib/python3.10/dist-packages (from torch>=1.13.1->llamafactory==0.8.3.dev0) (2.3.0)\n","Collecting nvidia-nvjitlink-cu12 (from nvidia-cusolver-cu12==11.4.5.107->torch>=1.13.1->llamafactory==0.8.3.dev0)\n"," Downloading nvidia_nvjitlink_cu12-12.5.82-py3-none-manylinux2014_x86_64.whl (21.3 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m21.3/21.3 MB\u001b[0m \u001b[31m72.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.10/dist-packages (from transformers>=4.41.2->llamafactory==0.8.3.dev0) (2024.5.15)\n","Requirement already satisfied: tokenizers<0.20,>=0.19 in /usr/local/lib/python3.10/dist-packages (from transformers>=4.41.2->llamafactory==0.8.3.dev0) (0.19.1)\n","Collecting tyro>=0.5.11 (from trl>=0.8.6->llamafactory==0.8.3.dev0)\n"," Downloading tyro-0.8.5-py3-none-any.whl (103 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m103.4/103.4 kB\u001b[0m \u001b[31m14.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: click>=7.0 in /usr/local/lib/python3.10/dist-packages (from uvicorn->llamafactory==0.8.3.dev0) (8.1.7)\n","Collecting h11>=0.8 (from uvicorn->llamafactory==0.8.3.dev0)\n"," Downloading h11-0.14.0-py3-none-any.whl (58 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m58.3/58.3 kB\u001b[0m \u001b[31m8.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting starlette<0.38.0,>=0.37.2 (from fastapi->llamafactory==0.8.3.dev0)\n"," Downloading starlette-0.37.2-py3-none-any.whl (71 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m71.9/71.9 kB\u001b[0m \u001b[31m7.9 MB/s\u001b[0m eta 
\u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting fastapi-cli>=0.0.2 (from fastapi->llamafactory==0.8.3.dev0)\n"," Downloading fastapi_cli-0.0.4-py3-none-any.whl (9.5 kB)\n","Collecting ujson!=4.0.2,!=4.1.0,!=4.2.0,!=4.3.0,!=5.0.0,!=5.1.0,>=4.0.1 (from fastapi->llamafactory==0.8.3.dev0)\n"," Downloading ujson-5.10.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (53 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m53.6/53.6 kB\u001b[0m \u001b[31m7.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting email_validator>=2.0.0 (from fastapi->llamafactory==0.8.3.dev0)\n"," Downloading email_validator-2.2.0-py3-none-any.whl (33 kB)\n","Requirement already satisfied: six in /usr/local/lib/python3.10/dist-packages (from fire->llamafactory==0.8.3.dev0) (1.16.0)\n","Requirement already satisfied: termcolor in /usr/local/lib/python3.10/dist-packages (from fire->llamafactory==0.8.3.dev0) (2.4.0)\n","Requirement already satisfied: anyio in /usr/local/lib/python3.10/dist-packages (from sse-starlette->llamafactory==0.8.3.dev0) (3.7.1)\n","Requirement already satisfied: entrypoints in /usr/local/lib/python3.10/dist-packages (from altair<6.0,>=4.2.0->gradio>=4.0.0->llamafactory==0.8.3.dev0) (0.4)\n","Requirement already satisfied: jsonschema>=3.0 in /usr/local/lib/python3.10/dist-packages (from altair<6.0,>=4.2.0->gradio>=4.0.0->llamafactory==0.8.3.dev0) (4.19.2)\n","Requirement already satisfied: toolz in /usr/local/lib/python3.10/dist-packages (from altair<6.0,>=4.2.0->gradio>=4.0.0->llamafactory==0.8.3.dev0) (0.12.1)\n","Collecting dnspython>=2.0.0 (from email_validator>=2.0.0->fastapi->llamafactory==0.8.3.dev0)\n"," Downloading dnspython-2.6.1-py3-none-any.whl (307 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m307.7/307.7 kB\u001b[0m \u001b[31m33.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: idna>=2.0.0 in 
/usr/local/lib/python3.10/dist-packages (from email_validator>=2.0.0->fastapi->llamafactory==0.8.3.dev0) (3.7)\n","Requirement already satisfied: aiosignal>=1.1.2 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.16.0->llamafactory==0.8.3.dev0) (1.3.1)\n","Requirement already satisfied: attrs>=17.3.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.16.0->llamafactory==0.8.3.dev0) (23.2.0)\n","Requirement already satisfied: frozenlist>=1.1.1 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.16.0->llamafactory==0.8.3.dev0) (1.4.1)\n","Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.16.0->llamafactory==0.8.3.dev0) (6.0.5)\n","Requirement already satisfied: yarl<2.0,>=1.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.16.0->llamafactory==0.8.3.dev0) (1.9.4)\n","Requirement already satisfied: async-timeout<5.0,>=4.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.16.0->llamafactory==0.8.3.dev0) (4.0.3)\n","Requirement already satisfied: certifi in /usr/local/lib/python3.10/dist-packages (from httpx>=0.24.1->gradio>=4.0.0->llamafactory==0.8.3.dev0) (2024.6.2)\n","Collecting httpcore==1.* (from httpx>=0.24.1->gradio>=4.0.0->llamafactory==0.8.3.dev0)\n"," Downloading httpcore-1.0.5-py3-none-any.whl (77 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m77.9/77.9 kB\u001b[0m \u001b[31m11.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: sniffio in /usr/local/lib/python3.10/dist-packages (from httpx>=0.24.1->gradio>=4.0.0->llamafactory==0.8.3.dev0) (1.3.1)\n","Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests>=2.32.2->datasets>=2.16.0->llamafactory==0.8.3.dev0) (3.3.2)\n","Requirement already satisfied: exceptiongroup in 
/usr/local/lib/python3.10/dist-packages (from anyio->sse-starlette->llamafactory==0.8.3.dev0) (1.2.1)\n","Requirement already satisfied: shellingham>=1.3.0 in /usr/local/lib/python3.10/dist-packages (from typer<1.0,>=0.12->gradio>=4.0.0->llamafactory==0.8.3.dev0) (1.5.4)\n","Requirement already satisfied: rich>=10.11.0 in /usr/local/lib/python3.10/dist-packages (from typer<1.0,>=0.12->gradio>=4.0.0->llamafactory==0.8.3.dev0) (13.7.1)\n","Requirement already satisfied: docstring-parser>=0.16 in /usr/local/lib/python3.10/dist-packages (from tyro>=0.5.11->trl>=0.8.6->llamafactory==0.8.3.dev0) (0.16)\n","Collecting shtab>=1.5.6 (from tyro>=0.5.11->trl>=0.8.6->llamafactory==0.8.3.dev0)\n"," Downloading shtab-1.7.1-py3-none-any.whl (14 kB)\n","Collecting httptools>=0.5.0 (from uvicorn->llamafactory==0.8.3.dev0)\n"," Downloading httptools-0.6.1-cp310-cp310-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl (341 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m341.4/341.4 kB\u001b[0m \u001b[31m28.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting python-dotenv>=0.13 (from uvicorn->llamafactory==0.8.3.dev0)\n"," Downloading python_dotenv-1.0.1-py3-none-any.whl (19 kB)\n","Collecting uvloop!=0.15.0,!=0.15.1,>=0.14.0 (from uvicorn->llamafactory==0.8.3.dev0)\n"," Downloading uvloop-0.19.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (3.4 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m3.4/3.4 MB\u001b[0m \u001b[31m63.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting watchfiles>=0.13 (from uvicorn->llamafactory==0.8.3.dev0)\n"," Downloading watchfiles-0.22.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (1.2 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.2/1.2 MB\u001b[0m \u001b[31m50.4 MB/s\u001b[0m eta 
\u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: mpmath<1.4.0,>=1.1.0 in /usr/local/lib/python3.10/dist-packages (from sympy->torch>=1.13.1->llamafactory==0.8.3.dev0) (1.3.0)\n","Requirement already satisfied: jsonschema-specifications>=2023.03.6 in /usr/local/lib/python3.10/dist-packages (from jsonschema>=3.0->altair<6.0,>=4.2.0->gradio>=4.0.0->llamafactory==0.8.3.dev0) (2023.12.1)\n","Requirement already satisfied: referencing>=0.28.4 in /usr/local/lib/python3.10/dist-packages (from jsonschema>=3.0->altair<6.0,>=4.2.0->gradio>=4.0.0->llamafactory==0.8.3.dev0) (0.35.1)\n","Requirement already satisfied: rpds-py>=0.7.1 in /usr/local/lib/python3.10/dist-packages (from jsonschema>=3.0->altair<6.0,>=4.2.0->gradio>=4.0.0->llamafactory==0.8.3.dev0) (0.18.1)\n","Requirement already satisfied: markdown-it-py>=2.2.0 in /usr/local/lib/python3.10/dist-packages (from rich>=10.11.0->typer<1.0,>=0.12->gradio>=4.0.0->llamafactory==0.8.3.dev0) (3.0.0)\n","Requirement already satisfied: pygments<3.0.0,>=2.13.0 in /usr/local/lib/python3.10/dist-packages (from rich>=10.11.0->typer<1.0,>=0.12->gradio>=4.0.0->llamafactory==0.8.3.dev0) (2.16.1)\n","Requirement already satisfied: mdurl~=0.1 in /usr/local/lib/python3.10/dist-packages (from markdown-it-py>=2.2.0->rich>=10.11.0->typer<1.0,>=0.12->gradio>=4.0.0->llamafactory==0.8.3.dev0) (0.1.2)\n","Building wheels for collected packages: fire, llamafactory, ffmpy\n"," Building wheel for fire (setup.py) ... \u001b[?25l\u001b[?25hdone\n"," Created wheel for fire: filename=fire-0.6.0-py2.py3-none-any.whl size=117029 sha256=c64ebd407f170d7db51aceffccdd092ec79d86844c8552e251c40660637453bc\n"," Stored in directory: /root/.cache/pip/wheels/d6/6d/5d/5b73fa0f46d01a793713f8859201361e9e581ced8c75e5c6a3\n"," Building editable for llamafactory (pyproject.toml) ... 
\u001b[?25l\u001b[?25hdone\n"," Created wheel for llamafactory: filename=llamafactory-0.8.3.dev0-0.editable-py3-none-any.whl size=20620 sha256=36ad2730270a69171004741bc1f5182879cb8a0a88956fd12806e360bcc50120\n"," Stored in directory: /tmp/pip-ephem-wheel-cache-3yg6uk3a/wheels/de/aa/c5/27b5682c5592b7c0eecc3e208f176dedf6b11a61cf2a910b85\n"," Building wheel for ffmpy (setup.py) ... \u001b[?25l\u001b[?25hdone\n"," Created wheel for ffmpy: filename=ffmpy-0.3.2-py3-none-any.whl size=5584 sha256=fe676a1c4325d83b3ea67bc0abbd0573e5b110e737679343aecb9e5c5e44d5bb\n"," Stored in directory: /root/.cache/pip/wheels/bd/65/9a/671fc6dcde07d4418df0c592f8df512b26d7a0029c2a23dd81\n","Successfully built fire llamafactory ffmpy\n","Installing collected packages: pydub, ffmpy, xxhash, websockets, uvloop, ujson, tomlkit, shtab, semantic-version, ruff, requests, python-multipart, python-dotenv, pyarrow, orjson, nvidia-nvtx-cu12, nvidia-nvjitlink-cu12, nvidia-nccl-cu12, nvidia-curand-cu12, nvidia-cufft-cu12, nvidia-cuda-runtime-cu12, nvidia-cuda-nvrtc-cu12, nvidia-cuda-cupti-cu12, nvidia-cublas-cu12, httptools, h11, fire, einops, dnspython, dill, aiofiles, watchfiles, uvicorn, tiktoken, starlette, nvidia-cusparse-cu12, nvidia-cudnn-cu12, multiprocess, httpcore, email_validator, tyro, sse-starlette, nvidia-cusolver-cu12, httpx, gradio-client, fastapi-cli, datasets, fastapi, bitsandbytes, accelerate, trl, peft, gradio, llamafactory\n"," Attempting uninstall: requests\n"," Found existing installation: requests 2.31.0\n"," Uninstalling requests-2.31.0:\n"," Successfully uninstalled requests-2.31.0\n"," Attempting uninstall: pyarrow\n"," Found existing installation: pyarrow 14.0.2\n"," Uninstalling pyarrow-14.0.2:\n"," Successfully uninstalled pyarrow-14.0.2\n","\u001b[31mERROR: pip's dependency resolver does not currently take into account all the packages that are installed. 
This behaviour is the source of the following dependency conflicts.\n","cudf-cu12 24.4.1 requires pyarrow<15.0.0a0,>=14.0.1, but you have pyarrow 16.1.0 which is incompatible.\n","google-colab 1.0.0 requires requests==2.31.0, but you have requests 2.32.3 which is incompatible.\n","ibis-framework 8.0.0 requires pyarrow<16,>=2, but you have pyarrow 16.1.0 which is incompatible.\u001b[0m\u001b[31m\n","\u001b[0mSuccessfully installed accelerate-0.32.1 aiofiles-23.2.1 bitsandbytes-0.43.1 datasets-2.20.0 dill-0.3.8 dnspython-2.6.1 einops-0.8.0 email_validator-2.2.0 fastapi-0.111.0 fastapi-cli-0.0.4 ffmpy-0.3.2 fire-0.6.0 gradio-4.37.2 gradio-client-1.0.2 h11-0.14.0 httpcore-1.0.5 httptools-0.6.1 httpx-0.27.0 llamafactory-0.8.3.dev0 multiprocess-0.70.16 nvidia-cublas-cu12-12.1.3.1 nvidia-cuda-cupti-cu12-12.1.105 nvidia-cuda-nvrtc-cu12-12.1.105 nvidia-cuda-runtime-cu12-12.1.105 nvidia-cudnn-cu12-8.9.2.26 nvidia-cufft-cu12-11.0.2.54 nvidia-curand-cu12-10.3.2.106 nvidia-cusolver-cu12-11.4.5.107 nvidia-cusparse-cu12-12.1.0.106 nvidia-nccl-cu12-2.20.5 nvidia-nvjitlink-cu12-12.5.82 nvidia-nvtx-cu12-12.1.105 orjson-3.10.6 peft-0.11.1 pyarrow-16.1.0 pydub-0.25.1 python-dotenv-1.0.1 python-multipart-0.0.9 requests-2.32.3 ruff-0.5.1 semantic-version-2.10.0 shtab-1.7.1 sse-starlette-2.1.2 starlette-0.37.2 tiktoken-0.7.0 tomlkit-0.12.0 trl-0.9.4 tyro-0.8.5 ujson-5.10.0 uvicorn-0.30.1 uvloop-0.19.0 watchfiles-0.22.0 websockets-11.0.3 xxhash-3.4.1\n","Collecting unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git\n"," Cloning https://github.com/unslothai/unsloth.git to /tmp/pip-install-3p7tr3jg/unsloth_2bf70fff93774cd9be69ff218e188a9d\n"," Running command git clone --filter=blob:none --quiet https://github.com/unslothai/unsloth.git /tmp/pip-install-3p7tr3jg/unsloth_2bf70fff93774cd9be69ff218e188a9d\n"," Resolved https://github.com/unslothai/unsloth.git to commit dd6ea68d609ba14fcdd13b4a200d1f11135411f2\n"," Installing build dependencies ... 
\u001b[?25l\u001b[?25hdone\n"," Getting requirements to build wheel ... \u001b[?25l\u001b[?25hdone\n"," Preparing metadata (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n","Requirement already satisfied: tyro in /usr/local/lib/python3.10/dist-packages (from unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (0.8.5)\n","Collecting transformers>=4.42.3 (from unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git)\n"," Downloading transformers-4.42.3-py3-none-any.whl (9.3 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m9.3/9.3 MB\u001b[0m \u001b[31m21.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: datasets>=2.16.0 in /usr/local/lib/python3.10/dist-packages (from unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (2.20.0)\n","Collecting sentencepiece>=0.2.0 (from unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git)\n"," Downloading sentencepiece-0.2.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (1.3 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.3/1.3 MB\u001b[0m \u001b[31m42.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: tqdm in /usr/local/lib/python3.10/dist-packages (from unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (4.66.4)\n","Requirement already satisfied: psutil in /usr/local/lib/python3.10/dist-packages (from unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (5.9.5)\n","Requirement already satisfied: wheel>=0.42.0 in /usr/local/lib/python3.10/dist-packages (from unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (0.43.0)\n","Requirement already satisfied: numpy in /usr/local/lib/python3.10/dist-packages (from unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (1.25.2)\n","Requirement already satisfied: protobuf<4.0.0 in 
/usr/local/lib/python3.10/dist-packages (from unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (3.20.3)\n","Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (3.15.4)\n","Requirement already satisfied: pyarrow>=15.0.0 in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (16.1.0)\n","Requirement already satisfied: pyarrow-hotfix in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (0.6)\n","Requirement already satisfied: dill<0.3.9,>=0.3.0 in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (0.3.8)\n","Requirement already satisfied: pandas in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (2.0.3)\n","Requirement already satisfied: requests>=2.32.2 in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (2.32.3)\n","Requirement already satisfied: xxhash in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (3.4.1)\n","Requirement already satisfied: multiprocess in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (0.70.16)\n","Requirement already satisfied: fsspec[http]<=2024.5.0,>=2023.1.0 in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (2023.6.0)\n","Requirement already satisfied: aiohttp in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->unsloth[colab-new]@ 
git+https://github.com/unslothai/unsloth.git) (3.9.5)\n","Requirement already satisfied: huggingface-hub>=0.21.2 in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (0.23.4)\n","Requirement already satisfied: packaging in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (24.1)\n","Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (6.0.1)\n","Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.10/dist-packages (from transformers>=4.42.3->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (2024.5.15)\n","Requirement already satisfied: safetensors>=0.4.1 in /usr/local/lib/python3.10/dist-packages (from transformers>=4.42.3->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (0.4.3)\n","Requirement already satisfied: tokenizers<0.20,>=0.19 in /usr/local/lib/python3.10/dist-packages (from transformers>=4.42.3->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (0.19.1)\n","Requirement already satisfied: docstring-parser>=0.16 in /usr/local/lib/python3.10/dist-packages (from tyro->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (0.16)\n","Requirement already satisfied: typing-extensions>=4.7.0 in /usr/local/lib/python3.10/dist-packages (from tyro->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (4.12.2)\n","Requirement already satisfied: rich>=11.1.0 in /usr/local/lib/python3.10/dist-packages (from tyro->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (13.7.1)\n","Requirement already satisfied: shtab>=1.5.6 in /usr/local/lib/python3.10/dist-packages (from tyro->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (1.7.1)\n","Requirement already satisfied: 
aiosignal>=1.1.2 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (1.3.1)\n","Requirement already satisfied: attrs>=17.3.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (23.2.0)\n","Requirement already satisfied: frozenlist>=1.1.1 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (1.4.1)\n","Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (6.0.5)\n","Requirement already satisfied: yarl<2.0,>=1.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (1.9.4)\n","Requirement already satisfied: async-timeout<5.0,>=4.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (4.0.3)\n","Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests>=2.32.2->datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (3.3.2)\n","Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests>=2.32.2->datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (3.7)\n","Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests>=2.32.2->datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (2.0.7)\n","Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests>=2.32.2->datasets>=2.16.0->unsloth[colab-new]@ 
git+https://github.com/unslothai/unsloth.git) (2024.6.2)\n","Requirement already satisfied: markdown-it-py>=2.2.0 in /usr/local/lib/python3.10/dist-packages (from rich>=11.1.0->tyro->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (3.0.0)\n","Requirement already satisfied: pygments<3.0.0,>=2.13.0 in /usr/local/lib/python3.10/dist-packages (from rich>=11.1.0->tyro->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (2.16.1)\n","Requirement already satisfied: python-dateutil>=2.8.2 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (2.8.2)\n","Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (2023.4)\n","Requirement already satisfied: tzdata>=2022.1 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (2024.1)\n","Requirement already satisfied: mdurl~=0.1 in /usr/local/lib/python3.10/dist-packages (from markdown-it-py>=2.2.0->rich>=11.1.0->tyro->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (0.1.2)\n","Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.10/dist-packages (from python-dateutil>=2.8.2->pandas->datasets>=2.16.0->unsloth[colab-new]@ git+https://github.com/unslothai/unsloth.git) (1.16.0)\n","Building wheels for collected packages: unsloth\n"," Building wheel for unsloth (pyproject.toml) ... 
\u001b[?25l\u001b[?25hdone\n"," Created wheel for unsloth: filename=unsloth-2024.7-py3-none-any.whl size=127188 sha256=fd4982defa26e9fe5729cc146526e76bfd32ee2557bbb95ae67b068560ee8a87\n"," Stored in directory: /tmp/pip-ephem-wheel-cache-pjrrubd4/wheels/ed/d4/e9/76fb290ee3df0a5fc21ce5c2c788e29e9607a2353d8342fd0d\n","Successfully built unsloth\n","Installing collected packages: sentencepiece, unsloth, transformers\n"," Attempting uninstall: sentencepiece\n"," Found existing installation: sentencepiece 0.1.99\n"," Uninstalling sentencepiece-0.1.99:\n"," Successfully uninstalled sentencepiece-0.1.99\n"," Attempting uninstall: transformers\n"," Found existing installation: transformers 4.41.2\n"," Uninstalling transformers-4.41.2:\n"," Successfully uninstalled transformers-4.41.2\n","Successfully installed sentencepiece-0.2.0 transformers-4.42.3 unsloth-2024.7\n","Collecting xformers\n"," Downloading xformers-0.0.26.post1-cp310-cp310-manylinux2014_x86_64.whl (222.7 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m222.7/222.7 MB\u001b[0m \u001b[31m5.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting trl<0.9.0\n"," Downloading trl-0.8.6-py3-none-any.whl (245 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m245.2/245.2 kB\u001b[0m \u001b[31m30.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: peft in /usr/local/lib/python3.10/dist-packages (0.11.1)\n","Requirement already satisfied: accelerate in /usr/local/lib/python3.10/dist-packages (0.32.1)\n","Requirement already satisfied: bitsandbytes in /usr/local/lib/python3.10/dist-packages (0.43.1)\n","Installing collected packages: xformers, trl\n"," Attempting uninstall: trl\n"," Found existing installation: trl 0.9.4\n"," Uninstalling trl-0.9.4:\n"," Successfully uninstalled trl-0.9.4\n","Successfully installed trl-0.8.6 xformers-0.0.26.post1\n","CPU times: user 1.2 s, sys: 222 ms, 
total: 1.42 s\n","Wall time: 2min 50s\n"]}],"source":["%%time\n","\n","%cd /content/\n","%rm -rf LLaMA-Factory\n","!git clone https://github.com/hiyouga/LLaMA-Factory.git\n","%cd LLaMA-Factory\n","%ls\n","!pip install -e .[torch,bitsandbytes]\n","# Installs Unsloth, Xformers (Flash Attention) and all other packages!\n","!pip install \"unsloth[colab-new] @ git+https://github.com/unslothai/unsloth.git\"\n","!pip install --no-deps xformers \"trl<0.9.0\" peft accelerate bitsandbytes"]},{"cell_type":"code","execution_count":4,"metadata":{"application/vnd.databricks.v1+cell":{"cellMetadata":{"byteLimit":2048000,"rowLimit":10000},"inputWidgets":{},"nuid":"6d394937-6c99-4a7c-9d32-7600a280032f","showTitle":false,"title":""},"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":10,"status":"ok","timestamp":1720336943325,"user":{"displayName":"Inflaton Sng","userId":"00179918120580399412"},"user_tz":-480},"id":"aVAhR0LPHk6J","outputId":"02fb829d-275d-48bd-803c-8cddd3d4bc19"},"outputs":[{"output_type":"stream","name":"stdout","text":["workding dir: /content/drive/MyDrive/logical-reasoning/\n"]}],"source":["import os\n","import sys\n","from pathlib import Path\n","\n","workding_dir = \"/content/drive/MyDrive/logical-reasoning/\"\n","os.chdir(workding_dir)\n","sys.path.append(workding_dir)\n","print(\"workding dir:\", workding_dir)"]},{"cell_type":"code","execution_count":5,"metadata":{"application/vnd.databricks.v1+cell":{"cellMetadata":{"byteLimit":2048000,"rowLimit":10000},"inputWidgets":{},"nuid":"ac667aba-076e-4de6-9984-8f6a67cb09cd","showTitle":false,"title":""},"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":5,"status":"ok","timestamp":1720336943325,"user":{"displayName":"Inflaton 
Sng","userId":"00179918120580399412"},"user_tz":-480},"id":"pQYZ1k-4Hk6J","outputId":"26c2eedb-c639-426a-c38e-fcc0e96b7d51"},"outputs":[{"output_type":"execute_result","data":{"text/plain":["True"]},"metadata":{},"execution_count":5}],"source":["need_to_setup_env = True\n","need_to_setup_env"]},{"cell_type":"code","execution_count":6,"metadata":{"application/vnd.databricks.v1+cell":{"cellMetadata":{"byteLimit":2048000,"rowLimit":10000},"inputWidgets":{},"nuid":"72f9cf79-7b0d-4d9e-90a0-1fa5251b947f","showTitle":false,"title":""},"colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"elapsed":31967,"status":"ok","timestamp":1720336975288,"user":{"displayName":"Inflaton Sng","userId":"00179918120580399412"},"user_tz":-480},"id":"Ant0nzR8Hk6J","outputId":"d949471f-ba20-4c7e-8d12-adac2b598972"},"outputs":[{"output_type":"stream","name":"stdout","text":["Collecting huggingface_hub==0.23.2 (from -r requirements.txt (line 1))\n"," Downloading huggingface_hub-0.23.2-py3-none-any.whl (401 kB)\n","\u001b[?25l \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m0.0/401.7 kB\u001b[0m \u001b[31m?\u001b[0m eta \u001b[36m-:--:--\u001b[0m\r\u001b[2K \u001b[91m━━━━━━━━━━\u001b[0m\u001b[90m╺\u001b[0m\u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m102.4/401.7 kB\u001b[0m \u001b[31m2.9 MB/s\u001b[0m eta \u001b[36m0:00:01\u001b[0m\r\u001b[2K \u001b[91m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m\u001b[91m╸\u001b[0m \u001b[32m399.4/401.7 kB\u001b[0m \u001b[31m5.9 MB/s\u001b[0m eta \u001b[36m0:00:01\u001b[0m\r\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m401.7/401.7 kB\u001b[0m \u001b[31m5.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: nltk==3.8.1 in /usr/local/lib/python3.10/dist-packages (from -r requirements.txt (line 2)) (3.8.1)\n","Requirement already satisfied: python-dotenv==1.0.1 in /usr/local/lib/python3.10/dist-packages (from -r requirements.txt (line 3)) 
(1.0.1)\n","Collecting black==24.4.0 (from -r requirements.txt (line 4))\n"," Downloading black-24.4.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (1.7 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.7/1.7 MB\u001b[0m \u001b[31m13.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting evaluate==0.4.2 (from -r requirements.txt (line 5))\n"," Downloading evaluate-0.4.2-py3-none-any.whl (84 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m84.1/84.1 kB\u001b[0m \u001b[31m12.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting rouge_score==0.1.2 (from -r requirements.txt (line 6))\n"," Downloading rouge_score-0.1.2.tar.gz (17 kB)\n"," Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n","Collecting pytest==8.2.1 (from -r requirements.txt (line 7))\n"," Downloading pytest-8.2.1-py3-none-any.whl (339 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m339.6/339.6 kB\u001b[0m \u001b[31m16.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting seaborn==0.13.2 (from -r requirements.txt (line 8))\n"," Downloading seaborn-0.13.2-py3-none-any.whl (294 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m294.9/294.9 kB\u001b[0m \u001b[31m17.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting scikit-learn==1.5.0 (from -r requirements.txt (line 9))\n"," Downloading scikit_learn-1.5.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (13.3 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m13.3/13.3 MB\u001b[0m \u001b[31m12.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting jupyter (from -r requirements.txt (line 10))\n"," Downloading jupyter-1.0.0-py2.py3-none-any.whl (2.7 kB)\n","Requirement already satisfied: ipywidgets in /usr/local/lib/python3.10/dist-packages 
(from -r requirements.txt (line 11)) (7.7.1)\n","Requirement already satisfied: packaging in /usr/local/lib/python3.10/dist-packages (from -r requirements.txt (line 12)) (24.1)\n","Collecting langchain_openai==0.1.13 (from -r requirements.txt (line 13))\n"," Downloading langchain_openai-0.1.13-py3-none-any.whl (45 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m45.9/45.9 kB\u001b[0m \u001b[31m6.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting wandb==0.17.4 (from -r requirements.txt (line 14))\n"," Downloading wandb-0.17.4-py3-none-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl (6.9 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m6.9/6.9 MB\u001b[0m \u001b[31m69.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from huggingface_hub==0.23.2->-r requirements.txt (line 1)) (3.15.4)\n","Requirement already satisfied: fsspec>=2023.5.0 in /usr/local/lib/python3.10/dist-packages (from huggingface_hub==0.23.2->-r requirements.txt (line 1)) (2023.6.0)\n","Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from huggingface_hub==0.23.2->-r requirements.txt (line 1)) (6.0.1)\n","Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from huggingface_hub==0.23.2->-r requirements.txt (line 1)) (2.32.3)\n","Requirement already satisfied: tqdm>=4.42.1 in /usr/local/lib/python3.10/dist-packages (from huggingface_hub==0.23.2->-r requirements.txt (line 1)) (4.66.4)\n","Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface_hub==0.23.2->-r requirements.txt (line 1)) (4.12.2)\n","Requirement already satisfied: click in /usr/local/lib/python3.10/dist-packages (from nltk==3.8.1->-r requirements.txt (line 2)) 
(8.1.7)\n","Requirement already satisfied: joblib in /usr/local/lib/python3.10/dist-packages (from nltk==3.8.1->-r requirements.txt (line 2)) (1.4.2)\n","Requirement already satisfied: regex>=2021.8.3 in /usr/local/lib/python3.10/dist-packages (from nltk==3.8.1->-r requirements.txt (line 2)) (2024.5.15)\n","Collecting mypy-extensions>=0.4.3 (from black==24.4.0->-r requirements.txt (line 4))\n"," Downloading mypy_extensions-1.0.0-py3-none-any.whl (4.7 kB)\n","Collecting pathspec>=0.9.0 (from black==24.4.0->-r requirements.txt (line 4))\n"," Downloading pathspec-0.12.1-py3-none-any.whl (31 kB)\n","Requirement already satisfied: platformdirs>=2 in /usr/local/lib/python3.10/dist-packages (from black==24.4.0->-r requirements.txt (line 4)) (4.2.2)\n","Requirement already satisfied: tomli>=1.1.0 in /usr/local/lib/python3.10/dist-packages (from black==24.4.0->-r requirements.txt (line 4)) (2.0.1)\n","Requirement already satisfied: datasets>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from evaluate==0.4.2->-r requirements.txt (line 5)) (2.20.0)\n","Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from evaluate==0.4.2->-r requirements.txt (line 5)) (1.25.2)\n","Requirement already satisfied: dill in /usr/local/lib/python3.10/dist-packages (from evaluate==0.4.2->-r requirements.txt (line 5)) (0.3.8)\n","Requirement already satisfied: pandas in /usr/local/lib/python3.10/dist-packages (from evaluate==0.4.2->-r requirements.txt (line 5)) (2.0.3)\n","Requirement already satisfied: xxhash in /usr/local/lib/python3.10/dist-packages (from evaluate==0.4.2->-r requirements.txt (line 5)) (3.4.1)\n","Requirement already satisfied: multiprocess in /usr/local/lib/python3.10/dist-packages (from evaluate==0.4.2->-r requirements.txt (line 5)) (0.70.16)\n","Requirement already satisfied: absl-py in /usr/local/lib/python3.10/dist-packages (from rouge_score==0.1.2->-r requirements.txt (line 6)) (1.4.0)\n","Requirement already satisfied: six>=1.14.0 in 
/usr/local/lib/python3.10/dist-packages (from rouge_score==0.1.2->-r requirements.txt (line 6)) (1.16.0)\n","Requirement already satisfied: iniconfig in /usr/local/lib/python3.10/dist-packages (from pytest==8.2.1->-r requirements.txt (line 7)) (2.0.0)\n","Requirement already satisfied: pluggy<2.0,>=1.5 in /usr/local/lib/python3.10/dist-packages (from pytest==8.2.1->-r requirements.txt (line 7)) (1.5.0)\n","Requirement already satisfied: exceptiongroup>=1.0.0rc8 in /usr/local/lib/python3.10/dist-packages (from pytest==8.2.1->-r requirements.txt (line 7)) (1.2.1)\n","Requirement already satisfied: matplotlib!=3.6.1,>=3.4 in /usr/local/lib/python3.10/dist-packages (from seaborn==0.13.2->-r requirements.txt (line 8)) (3.7.1)\n","Requirement already satisfied: scipy>=1.6.0 in /usr/local/lib/python3.10/dist-packages (from scikit-learn==1.5.0->-r requirements.txt (line 9)) (1.11.4)\n","Requirement already satisfied: threadpoolctl>=3.1.0 in /usr/local/lib/python3.10/dist-packages (from scikit-learn==1.5.0->-r requirements.txt (line 9)) (3.5.0)\n","Collecting langchain-core<0.3,>=0.2.2 (from langchain_openai==0.1.13->-r requirements.txt (line 13))\n"," Downloading langchain_core-0.2.11-py3-none-any.whl (337 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m337.4/337.4 kB\u001b[0m \u001b[31m37.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting openai<2.0.0,>=1.32.0 (from langchain_openai==0.1.13->-r requirements.txt (line 13))\n"," Downloading openai-1.35.10-py3-none-any.whl (328 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m328.3/328.3 kB\u001b[0m \u001b[31m38.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: tiktoken<1,>=0.7 in /usr/local/lib/python3.10/dist-packages (from langchain_openai==0.1.13->-r requirements.txt (line 13)) (0.7.0)\n","Collecting docker-pycreds>=0.4.0 (from wandb==0.17.4->-r requirements.txt (line 14))\n"," 
Downloading docker_pycreds-0.4.0-py2.py3-none-any.whl (9.0 kB)\n","Collecting gitpython!=3.1.29,>=1.0.0 (from wandb==0.17.4->-r requirements.txt (line 14))\n"," Downloading GitPython-3.1.43-py3-none-any.whl (207 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m207.3/207.3 kB\u001b[0m \u001b[31m27.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: protobuf!=4.21.0,<6,>=3.19.0 in /usr/local/lib/python3.10/dist-packages (from wandb==0.17.4->-r requirements.txt (line 14)) (3.20.3)\n","Requirement already satisfied: psutil>=5.0.0 in /usr/local/lib/python3.10/dist-packages (from wandb==0.17.4->-r requirements.txt (line 14)) (5.9.5)\n","Collecting sentry-sdk>=1.0.0 (from wandb==0.17.4->-r requirements.txt (line 14))\n"," Downloading sentry_sdk-2.7.1-py2.py3-none-any.whl (300 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m300.2/300.2 kB\u001b[0m \u001b[31m37.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting setproctitle (from wandb==0.17.4->-r requirements.txt (line 14))\n"," Downloading setproctitle-1.3.3-cp310-cp310-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl (30 kB)\n","Requirement already satisfied: setuptools in /usr/local/lib/python3.10/dist-packages (from wandb==0.17.4->-r requirements.txt (line 14)) (67.7.2)\n","Requirement already satisfied: notebook in /usr/local/lib/python3.10/dist-packages (from jupyter->-r requirements.txt (line 10)) (6.5.5)\n","Collecting qtconsole (from jupyter->-r requirements.txt (line 10))\n"," Downloading qtconsole-5.5.2-py3-none-any.whl (123 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m123.4/123.4 kB\u001b[0m \u001b[31m18.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: jupyter-console in /usr/local/lib/python3.10/dist-packages (from jupyter->-r requirements.txt (line 
10)) (6.1.0)\n","Requirement already satisfied: nbconvert in /usr/local/lib/python3.10/dist-packages (from jupyter->-r requirements.txt (line 10)) (6.5.4)\n","Requirement already satisfied: ipykernel in /usr/local/lib/python3.10/dist-packages (from jupyter->-r requirements.txt (line 10)) (5.5.6)\n","Requirement already satisfied: ipython-genutils~=0.2.0 in /usr/local/lib/python3.10/dist-packages (from ipywidgets->-r requirements.txt (line 11)) (0.2.0)\n","Requirement already satisfied: traitlets>=4.3.1 in /usr/local/lib/python3.10/dist-packages (from ipywidgets->-r requirements.txt (line 11)) (5.7.1)\n","Requirement already satisfied: widgetsnbextension~=3.6.0 in /usr/local/lib/python3.10/dist-packages (from ipywidgets->-r requirements.txt (line 11)) (3.6.6)\n","Requirement already satisfied: ipython>=4.0.0 in /usr/local/lib/python3.10/dist-packages (from ipywidgets->-r requirements.txt (line 11)) (7.34.0)\n","Requirement already satisfied: jupyterlab-widgets>=1.0.0 in /usr/local/lib/python3.10/dist-packages (from ipywidgets->-r requirements.txt (line 11)) (3.0.11)\n","Requirement already satisfied: pyarrow>=15.0.0 in /usr/local/lib/python3.10/dist-packages (from datasets>=2.0.0->evaluate==0.4.2->-r requirements.txt (line 5)) (16.1.0)\n","Requirement already satisfied: pyarrow-hotfix in /usr/local/lib/python3.10/dist-packages (from datasets>=2.0.0->evaluate==0.4.2->-r requirements.txt (line 5)) (0.6)\n","Requirement already satisfied: aiohttp in /usr/local/lib/python3.10/dist-packages (from datasets>=2.0.0->evaluate==0.4.2->-r requirements.txt (line 5)) (3.9.5)\n","Collecting gitdb<5,>=4.0.1 (from gitpython!=3.1.29,>=1.0.0->wandb==0.17.4->-r requirements.txt (line 14))\n"," Downloading gitdb-4.0.11-py3-none-any.whl (62 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m62.7/62.7 kB\u001b[0m \u001b[31m9.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: jupyter-client in 
/usr/local/lib/python3.10/dist-packages (from ipykernel->jupyter->-r requirements.txt (line 10)) (6.1.12)\n","Requirement already satisfied: tornado>=4.2 in /usr/local/lib/python3.10/dist-packages (from ipykernel->jupyter->-r requirements.txt (line 10)) (6.3.3)\n","Collecting jedi>=0.16 (from ipython>=4.0.0->ipywidgets->-r requirements.txt (line 11))\n"," Downloading jedi-0.19.1-py2.py3-none-any.whl (1.6 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.6/1.6 MB\u001b[0m \u001b[31m78.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: decorator in /usr/local/lib/python3.10/dist-packages (from ipython>=4.0.0->ipywidgets->-r requirements.txt (line 11)) (4.4.2)\n","Requirement already satisfied: pickleshare in /usr/local/lib/python3.10/dist-packages (from ipython>=4.0.0->ipywidgets->-r requirements.txt (line 11)) (0.7.5)\n","Requirement already satisfied: prompt-toolkit!=3.0.0,!=3.0.1,<3.1.0,>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from ipython>=4.0.0->ipywidgets->-r requirements.txt (line 11)) (3.0.47)\n","Requirement already satisfied: pygments in /usr/local/lib/python3.10/dist-packages (from ipython>=4.0.0->ipywidgets->-r requirements.txt (line 11)) (2.16.1)\n","Requirement already satisfied: backcall in /usr/local/lib/python3.10/dist-packages (from ipython>=4.0.0->ipywidgets->-r requirements.txt (line 11)) (0.2.0)\n","Requirement already satisfied: matplotlib-inline in /usr/local/lib/python3.10/dist-packages (from ipython>=4.0.0->ipywidgets->-r requirements.txt (line 11)) (0.1.7)\n","Requirement already satisfied: pexpect>4.3 in /usr/local/lib/python3.10/dist-packages (from ipython>=4.0.0->ipywidgets->-r requirements.txt (line 11)) (4.9.0)\n","Collecting jsonpatch<2.0,>=1.33 (from langchain-core<0.3,>=0.2.2->langchain_openai==0.1.13->-r requirements.txt (line 13))\n"," Downloading jsonpatch-1.33-py2.py3-none-any.whl (12 kB)\n","Collecting langsmith<0.2.0,>=0.1.75 (from 
langchain-core<0.3,>=0.2.2->langchain_openai==0.1.13->-r requirements.txt (line 13))\n"," Downloading langsmith-0.1.83-py3-none-any.whl (127 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m127.5/127.5 kB\u001b[0m \u001b[31m15.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: pydantic<3,>=1 in /usr/local/lib/python3.10/dist-packages (from langchain-core<0.3,>=0.2.2->langchain_openai==0.1.13->-r requirements.txt (line 13)) (2.8.0)\n","Requirement already satisfied: tenacity!=8.4.0,<9.0.0,>=8.1.0 in /usr/local/lib/python3.10/dist-packages (from langchain-core<0.3,>=0.2.2->langchain_openai==0.1.13->-r requirements.txt (line 13)) (8.4.2)\n","Requirement already satisfied: contourpy>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib!=3.6.1,>=3.4->seaborn==0.13.2->-r requirements.txt (line 8)) (1.2.1)\n","Requirement already satisfied: cycler>=0.10 in /usr/local/lib/python3.10/dist-packages (from matplotlib!=3.6.1,>=3.4->seaborn==0.13.2->-r requirements.txt (line 8)) (0.12.1)\n","Requirement already satisfied: fonttools>=4.22.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib!=3.6.1,>=3.4->seaborn==0.13.2->-r requirements.txt (line 8)) (4.53.0)\n","Requirement already satisfied: kiwisolver>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib!=3.6.1,>=3.4->seaborn==0.13.2->-r requirements.txt (line 8)) (1.4.5)\n","Requirement already satisfied: pillow>=6.2.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib!=3.6.1,>=3.4->seaborn==0.13.2->-r requirements.txt (line 8)) (9.4.0)\n","Requirement already satisfied: pyparsing>=2.3.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib!=3.6.1,>=3.4->seaborn==0.13.2->-r requirements.txt (line 8)) (3.1.2)\n","Requirement already satisfied: python-dateutil>=2.7 in /usr/local/lib/python3.10/dist-packages (from matplotlib!=3.6.1,>=3.4->seaborn==0.13.2->-r requirements.txt (line 8)) 
(2.8.2)\n","Requirement already satisfied: anyio<5,>=3.5.0 in /usr/local/lib/python3.10/dist-packages (from openai<2.0.0,>=1.32.0->langchain_openai==0.1.13->-r requirements.txt (line 13)) (3.7.1)\n","Requirement already satisfied: distro<2,>=1.7.0 in /usr/lib/python3/dist-packages (from openai<2.0.0,>=1.32.0->langchain_openai==0.1.13->-r requirements.txt (line 13)) (1.7.0)\n","Requirement already satisfied: httpx<1,>=0.23.0 in /usr/local/lib/python3.10/dist-packages (from openai<2.0.0,>=1.32.0->langchain_openai==0.1.13->-r requirements.txt (line 13)) (0.27.0)\n","Requirement already satisfied: sniffio in /usr/local/lib/python3.10/dist-packages (from openai<2.0.0,>=1.32.0->langchain_openai==0.1.13->-r requirements.txt (line 13)) (1.3.1)\n","Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.10/dist-packages (from pandas->evaluate==0.4.2->-r requirements.txt (line 5)) (2023.4)\n","Requirement already satisfied: tzdata>=2022.1 in /usr/local/lib/python3.10/dist-packages (from pandas->evaluate==0.4.2->-r requirements.txt (line 5)) (2024.1)\n","Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests->huggingface_hub==0.23.2->-r requirements.txt (line 1)) (3.3.2)\n","Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->huggingface_hub==0.23.2->-r requirements.txt (line 1)) (3.7)\n","Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->huggingface_hub==0.23.2->-r requirements.txt (line 1)) (2.0.7)\n","Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->huggingface_hub==0.23.2->-r requirements.txt (line 1)) (2024.6.2)\n","Requirement already satisfied: jinja2 in /usr/local/lib/python3.10/dist-packages (from notebook->jupyter->-r requirements.txt (line 10)) (3.1.4)\n","Requirement already satisfied: pyzmq<25,>=17 in 
/usr/local/lib/python3.10/dist-packages (from notebook->jupyter->-r requirements.txt (line 10)) (24.0.1)\n","Requirement already satisfied: argon2-cffi in /usr/local/lib/python3.10/dist-packages (from notebook->jupyter->-r requirements.txt (line 10)) (23.1.0)\n","Requirement already satisfied: jupyter-core>=4.6.1 in /usr/local/lib/python3.10/dist-packages (from notebook->jupyter->-r requirements.txt (line 10)) (5.7.2)\n","Requirement already satisfied: nbformat in /usr/local/lib/python3.10/dist-packages (from notebook->jupyter->-r requirements.txt (line 10)) (5.10.4)\n","Requirement already satisfied: nest-asyncio>=1.5 in /usr/local/lib/python3.10/dist-packages (from notebook->jupyter->-r requirements.txt (line 10)) (1.6.0)\n","Requirement already satisfied: Send2Trash>=1.8.0 in /usr/local/lib/python3.10/dist-packages (from notebook->jupyter->-r requirements.txt (line 10)) (1.8.3)\n","Requirement already satisfied: terminado>=0.8.3 in /usr/local/lib/python3.10/dist-packages (from notebook->jupyter->-r requirements.txt (line 10)) (0.18.1)\n","Requirement already satisfied: prometheus-client in /usr/local/lib/python3.10/dist-packages (from notebook->jupyter->-r requirements.txt (line 10)) (0.20.0)\n","Requirement already satisfied: nbclassic>=0.4.7 in /usr/local/lib/python3.10/dist-packages (from notebook->jupyter->-r requirements.txt (line 10)) (1.1.0)\n","Requirement already satisfied: lxml in /usr/local/lib/python3.10/dist-packages (from nbconvert->jupyter->-r requirements.txt (line 10)) (4.9.4)\n","Requirement already satisfied: beautifulsoup4 in /usr/local/lib/python3.10/dist-packages (from nbconvert->jupyter->-r requirements.txt (line 10)) (4.12.3)\n","Requirement already satisfied: bleach in /usr/local/lib/python3.10/dist-packages (from nbconvert->jupyter->-r requirements.txt (line 10)) (6.1.0)\n","Requirement already satisfied: defusedxml in /usr/local/lib/python3.10/dist-packages (from nbconvert->jupyter->-r requirements.txt (line 10)) 
(0.7.1)\n","Requirement already satisfied: entrypoints>=0.2.2 in /usr/local/lib/python3.10/dist-packages (from nbconvert->jupyter->-r requirements.txt (line 10)) (0.4)\n","Requirement already satisfied: jupyterlab-pygments in /usr/local/lib/python3.10/dist-packages (from nbconvert->jupyter->-r requirements.txt (line 10)) (0.3.0)\n","Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.10/dist-packages (from nbconvert->jupyter->-r requirements.txt (line 10)) (2.1.5)\n","Requirement already satisfied: mistune<2,>=0.8.1 in /usr/local/lib/python3.10/dist-packages (from nbconvert->jupyter->-r requirements.txt (line 10)) (0.8.4)\n","Requirement already satisfied: nbclient>=0.5.0 in /usr/local/lib/python3.10/dist-packages (from nbconvert->jupyter->-r requirements.txt (line 10)) (0.10.0)\n","Requirement already satisfied: pandocfilters>=1.4.1 in /usr/local/lib/python3.10/dist-packages (from nbconvert->jupyter->-r requirements.txt (line 10)) (1.5.1)\n","Requirement already satisfied: tinycss2 in /usr/local/lib/python3.10/dist-packages (from nbconvert->jupyter->-r requirements.txt (line 10)) (1.3.0)\n","Collecting qtpy>=2.4.0 (from qtconsole->jupyter->-r requirements.txt (line 10))\n"," Downloading QtPy-2.4.1-py3-none-any.whl (93 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m93.5/93.5 kB\u001b[0m \u001b[31m12.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: aiosignal>=1.1.2 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.0.0->evaluate==0.4.2->-r requirements.txt (line 5)) (1.3.1)\n","Requirement already satisfied: attrs>=17.3.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.0.0->evaluate==0.4.2->-r requirements.txt (line 5)) (23.2.0)\n","Requirement already satisfied: frozenlist>=1.1.1 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.0.0->evaluate==0.4.2->-r requirements.txt (line 5)) 
(1.4.1)\n","Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.0.0->evaluate==0.4.2->-r requirements.txt (line 5)) (6.0.5)\n","Requirement already satisfied: yarl<2.0,>=1.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.0.0->evaluate==0.4.2->-r requirements.txt (line 5)) (1.9.4)\n","Requirement already satisfied: async-timeout<5.0,>=4.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets>=2.0.0->evaluate==0.4.2->-r requirements.txt (line 5)) (4.0.3)\n","Collecting smmap<6,>=3.0.1 (from gitdb<5,>=4.0.1->gitpython!=3.1.29,>=1.0.0->wandb==0.17.4->-r requirements.txt (line 14))\n"," Downloading smmap-5.0.1-py3-none-any.whl (24 kB)\n","Requirement already satisfied: httpcore==1.* in /usr/local/lib/python3.10/dist-packages (from httpx<1,>=0.23.0->openai<2.0.0,>=1.32.0->langchain_openai==0.1.13->-r requirements.txt (line 13)) (1.0.5)\n","Requirement already satisfied: h11<0.15,>=0.13 in /usr/local/lib/python3.10/dist-packages (from httpcore==1.*->httpx<1,>=0.23.0->openai<2.0.0,>=1.32.0->langchain_openai==0.1.13->-r requirements.txt (line 13)) (0.14.0)\n","Requirement already satisfied: parso<0.9.0,>=0.8.3 in /usr/local/lib/python3.10/dist-packages (from jedi>=0.16->ipython>=4.0.0->ipywidgets->-r requirements.txt (line 11)) (0.8.4)\n","Collecting jsonpointer>=1.9 (from jsonpatch<2.0,>=1.33->langchain-core<0.3,>=0.2.2->langchain_openai==0.1.13->-r requirements.txt (line 13))\n"," Downloading jsonpointer-3.0.0-py2.py3-none-any.whl (7.6 kB)\n","Requirement already satisfied: orjson<4.0.0,>=3.9.14 in /usr/local/lib/python3.10/dist-packages (from langsmith<0.2.0,>=0.1.75->langchain-core<0.3,>=0.2.2->langchain_openai==0.1.13->-r requirements.txt (line 13)) (3.10.6)\n","Requirement already satisfied: notebook-shim>=0.2.3 in /usr/local/lib/python3.10/dist-packages (from nbclassic>=0.4.7->notebook->jupyter->-r requirements.txt (line 10)) (0.2.4)\n","Requirement already 
satisfied: fastjsonschema>=2.15 in /usr/local/lib/python3.10/dist-packages (from nbformat->notebook->jupyter->-r requirements.txt (line 10)) (2.20.0)\n","Requirement already satisfied: jsonschema>=2.6 in /usr/local/lib/python3.10/dist-packages (from nbformat->notebook->jupyter->-r requirements.txt (line 10)) (4.19.2)\n","Requirement already satisfied: ptyprocess>=0.5 in /usr/local/lib/python3.10/dist-packages (from pexpect>4.3->ipython>=4.0.0->ipywidgets->-r requirements.txt (line 11)) (0.7.0)\n","Requirement already satisfied: wcwidth in /usr/local/lib/python3.10/dist-packages (from prompt-toolkit!=3.0.0,!=3.0.1,<3.1.0,>=2.0.0->ipython>=4.0.0->ipywidgets->-r requirements.txt (line 11)) (0.2.13)\n","Requirement already satisfied: annotated-types>=0.4.0 in /usr/local/lib/python3.10/dist-packages (from pydantic<3,>=1->langchain-core<0.3,>=0.2.2->langchain_openai==0.1.13->-r requirements.txt (line 13)) (0.7.0)\n","Requirement already satisfied: pydantic-core==2.20.0 in /usr/local/lib/python3.10/dist-packages (from pydantic<3,>=1->langchain-core<0.3,>=0.2.2->langchain_openai==0.1.13->-r requirements.txt (line 13)) (2.20.0)\n","Requirement already satisfied: argon2-cffi-bindings in /usr/local/lib/python3.10/dist-packages (from argon2-cffi->notebook->jupyter->-r requirements.txt (line 10)) (21.2.0)\n","Requirement already satisfied: soupsieve>1.2 in /usr/local/lib/python3.10/dist-packages (from beautifulsoup4->nbconvert->jupyter->-r requirements.txt (line 10)) (2.5)\n","Requirement already satisfied: webencodings in /usr/local/lib/python3.10/dist-packages (from bleach->nbconvert->jupyter->-r requirements.txt (line 10)) (0.5.1)\n","Requirement already satisfied: jsonschema-specifications>=2023.03.6 in /usr/local/lib/python3.10/dist-packages (from jsonschema>=2.6->nbformat->notebook->jupyter->-r requirements.txt (line 10)) (2023.12.1)\n","Requirement already satisfied: referencing>=0.28.4 in /usr/local/lib/python3.10/dist-packages (from 
jsonschema>=2.6->nbformat->notebook->jupyter->-r requirements.txt (line 10)) (0.35.1)\n","Requirement already satisfied: rpds-py>=0.7.1 in /usr/local/lib/python3.10/dist-packages (from jsonschema>=2.6->nbformat->notebook->jupyter->-r requirements.txt (line 10)) (0.18.1)\n","Requirement already satisfied: jupyter-server<3,>=1.8 in /usr/local/lib/python3.10/dist-packages (from notebook-shim>=0.2.3->nbclassic>=0.4.7->notebook->jupyter->-r requirements.txt (line 10)) (1.24.0)\n","Requirement already satisfied: cffi>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from argon2-cffi-bindings->argon2-cffi->notebook->jupyter->-r requirements.txt (line 10)) (1.16.0)\n","Requirement already satisfied: pycparser in /usr/local/lib/python3.10/dist-packages (from cffi>=1.0.1->argon2-cffi-bindings->argon2-cffi->notebook->jupyter->-r requirements.txt (line 10)) (2.22)\n","Requirement already satisfied: websocket-client in /usr/local/lib/python3.10/dist-packages (from jupyter-server<3,>=1.8->notebook-shim>=0.2.3->nbclassic>=0.4.7->notebook->jupyter->-r requirements.txt (line 10)) (1.8.0)\n","Building wheels for collected packages: rouge_score\n"," Building wheel for rouge_score (setup.py) ... 
# --- cell: optional dependency install -------------------------------------
# Installs the project's requirements into the kernel environment, but only
# when `need_to_setup_env` is truthy.
# NOTE(review): `need_to_setup_env` is defined in an earlier cell that is not
# visible here - confirm it is set before this cell on a fresh kernel.
if need_to_setup_env:
    %pip install -r requirements.txt

# --- cell: load environment variables from a dotenv file -------------------
from dotenv import find_dotenv, load_dotenv

# Prefer a real `.env`; fall back to the `.env.example` template when the
# first lookup comes back empty.
found_dotenv = find_dotenv(".env")

if len(found_dotenv) == 0:
    found_dotenv = find_dotenv(".env.example")
print(f"loading env vars from: {found_dotenv}")
# override=True: values from the file replace variables that are already set
# in the process environment. Being the last expression of the cell, the
# return value of load_dotenv is what the cell displays.
load_dotenv(found_dotenv, override=True)

# --- cell: read run configuration from the environment ---------------------
import os

model_name = os.getenv("MODEL_NAME")
# `or None` normalises an empty HF_TOKEN to None.
token = os.getenv("HF_TOKEN") or None
# Exact, case-sensitive match: anything other than the literal "true"
# (including an unset variable) yields False.
load_in_4bit = os.getenv("LOAD_IN_4BIT") == "true"
local_model = os.getenv("LOCAL_MODEL")
hub_model = os.getenv("HUB_MODEL")
# Unset or empty NUM_TRAIN_EPOCHS falls back to 0.
num_train_epochs = int(os.getenv("NUM_TRAIN_EPOCHS") or 0)
data_path = os.getenv("LOGICAL_REASONING_DATA_PATH")
results_path = os.getenv("LOGICAL_REASONING_RESULTS_PATH")

max_seq_length = 2048 # Choose any! We auto support RoPE Scaling internally!
dtype = (
    None # None for auto detection. Float16 for Tesla T4, V100, Bfloat16 for Ampere+
)

# Display the effective configuration as the cell output. `token` is not part
# of this tuple, so the secret does not end up in the saved notebook - keep it
# out when adding fields.
model_name, load_in_4bit, local_model, hub_model, max_seq_length, num_train_epochs, dtype, data_path, results_path, os.getenv("DISABLE_MLFLOW_INTEGRATION"), os.getenv("WANDB_DISABLED")

# --- cell: GPU status -------------------------------------------------------
!nvidia-smi

# --- cell: interpreter version and flash-attn availability -----------------
# (`%%time` is a cell magic and has to stay the first line of its own cell.)
%%time
!python --version
!pip show flash-attn
def evaluate_model_all_epochs(
    model_name,
    num_train_epochs,
    adapter_path_base,
    load_in_4bit=True,
    num_of_entries=-1,
    steps_per_epoch=560,
):
    """Run the evaluation script once per epoch checkpoint, plus once with no adapter.

    Configuration is handed to ``llm_toolkit/eval_logical_reasoning.py``
    through environment variables, which this function mutates in
    ``os.environ`` (the changes persist after it returns):

    * ``MODEL_NAME`` is set to ``model_name``.
    * ``LOAD_IN_4BIT`` is set to ``"true"`` or ``"false"``.
    * ``ADAPTER_NAME_OR_PATH`` is removed for epoch 0 and set to
      ``{adapter_path_base}/checkpoint-{steps_per_epoch * epoch}`` for every
      later epoch.

    Args:
        model_name: Value exported as ``MODEL_NAME``.
        num_train_epochs: Number of trained epochs; the script is run
            ``num_train_epochs + 1`` times (epochs ``0..num_train_epochs``).
        adapter_path_base: Directory that contains the ``checkpoint-<step>``
            sub-directories.
        load_in_4bit: Exported as ``LOAD_IN_4BIT``.
        num_of_entries: Passed verbatim as the script's only command-line
            argument. NOTE(review): presumably limits how many entries are
            evaluated, with -1 meaning "all" - confirm in the script.
        steps_per_epoch: Step distance between consecutive epoch checkpoints.
            Defaults to 560, the value that used to be hard-coded.

    Returns:
        None. The script's output is streamed by the IPython shell.
    """
    os.environ["MODEL_NAME"] = model_name
    os.environ["LOAD_IN_4BIT"] = "true" if load_in_4bit else "false"

    for epoch in range(num_train_epochs + 1):
        print(f"Epoch {epoch}")
        if epoch == 0:
            # Remove the key from os.environ itself rather than calling
            # os.unsetenv(): unsetenv() does not update the os.environ
            # mapping, so a value left over from a previous run (or from
            # load_dotenv) would still be visible to anything that builds a
            # child environment from os.environ.
            os.environ.pop("ADAPTER_NAME_OR_PATH", None)
        else:
            checkpoint_step = steps_per_epoch * epoch
            os.environ["ADAPTER_NAME_OR_PATH"] = (
                f"{adapter_path_base}/checkpoint-{checkpoint_step}"
            )

        # Same call IPython generates for `!python ...`; spelled out so the
        # function body is plain Python and not notebook-only syntax.
        get_ipython().system(
            f"python llm_toolkit/eval_logical_reasoning.py {num_of_entries}"
        )
registered\n","2024-07-07 07:23:07.540099: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n","To enable the following instructions: AVX2 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n","2024-07-07 07:23:09.638184: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n","loading /content/drive/.shortcut-targets-by-id/1E09lTnfbsjtTgQg65dQ3y9D2R6l8waxR/logical-reasoning/llm_toolkit/logical_reasoning_utils.py\n","internlm/internlm2_5-7b-chat-1m None False datasets/mgtv results/mgtv-results_colab.csv\n","(1) GPU = Tesla T4. Max memory = 14.748 GB.\n","0.002 GB of memory reserved.\n","loading model: internlm/internlm2_5-7b-chat-1m\n","tokenizer_config.json: 100% 2.51k/2.51k [00:00<00:00, 18.3MB/s]\n","tokenization_internlm2_fast.py: 100% 7.80k/7.80k [00:00<00:00, 47.2MB/s]\n","tokenization_internlm2.py: 100% 8.81k/8.81k [00:00<00:00, 50.5MB/s]\n","A new version of the following files was downloaded from https://huggingface.co/internlm/internlm2_5-7b-chat-1m:\n","- tokenization_internlm2.py\n",". Make sure to double-check they do not contain any added malicious code. To avoid downloading new versions of the code file, you can pin a revision.\n","A new version of the following files was downloaded from https://huggingface.co/internlm/internlm2_5-7b-chat-1m:\n","- tokenization_internlm2_fast.py\n","- tokenization_internlm2.py\n",". Make sure to double-check they do not contain any added malicious code. 
To avoid downloading new versions of the code file, you can pin a revision.\n","tokenizer.model: 100% 1.48M/1.48M [00:00<00:00, 36.0MB/s]\n","special_tokens_map.json: 100% 713/713 [00:00<00:00, 4.71MB/s]\n","config.json: 100% 895/895 [00:00<00:00, 6.55MB/s]\n","configuration_internlm2.py: 100% 8.84k/8.84k [00:00<00:00, 48.9MB/s]\n","A new version of the following files was downloaded from https://huggingface.co/internlm/internlm2_5-7b-chat-1m:\n","- configuration_internlm2.py\n",". Make sure to double-check they do not contain any added malicious code. To avoid downloading new versions of the code file, you can pin a revision.\n","modeling_internlm2.py: 100% 80.7k/80.7k [00:00<00:00, 13.4MB/s]\n","A new version of the following files was downloaded from https://huggingface.co/internlm/internlm2_5-7b-chat-1m:\n","- modeling_internlm2.py\n",". Make sure to double-check they do not contain any added malicious code. To avoid downloading new versions of the code file, you can pin a revision.\n","model.safetensors.index.json: 100% 18.2k/18.2k [00:00<00:00, 85.6MB/s]\n","Downloading shards: 0% 0/8 [00:00, ?it/s]\n","model-00001-of-00008.safetensors: 0% 0.00/1.95G [00:00, ?B/s]\u001b[A\n","model-00001-of-00008.safetensors: 1% 21.0M/1.95G [00:00<00:11, 173MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 3% 52.4M/1.95G [00:00<00:07, 249MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 4% 83.9M/1.95G [00:00<00:07, 250MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 6% 115M/1.95G [00:00<00:07, 239MB/s] \u001b[A\n","model-00001-of-00008.safetensors: 8% 147M/1.95G [00:00<00:08, 211MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 9% 178M/1.95G [00:00<00:08, 208MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 11% 210M/1.95G [00:00<00:08, 208MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 12% 241M/1.95G [00:01<00:08, 202MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 13% 262M/1.95G [00:01<00:08, 200MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 15% 
283M/1.95G [00:01<00:08, 202MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 16% 315M/1.95G [00:01<00:07, 209MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 17% 336M/1.95G [00:01<00:07, 209MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 19% 367M/1.95G [00:01<00:07, 215MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 20% 398M/1.95G [00:01<00:07, 221MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 22% 430M/1.95G [00:01<00:06, 230MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 24% 461M/1.95G [00:02<00:06, 235MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 25% 493M/1.95G [00:02<00:06, 224MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 27% 524M/1.95G [00:02<00:06, 206MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 29% 556M/1.95G [00:02<00:06, 211MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 30% 587M/1.95G [00:02<00:06, 225MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 32% 619M/1.95G [00:02<00:06, 211MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 33% 650M/1.95G [00:03<00:06, 187MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 34% 671M/1.95G [00:03<00:06, 189MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 36% 692M/1.95G [00:03<00:06, 193MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 37% 724M/1.95G [00:03<00:06, 204MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 38% 744M/1.95G [00:03<00:06, 179MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 39% 765M/1.95G [00:04<00:17, 66.1MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 41% 797M/1.95G [00:04<00:12, 89.9MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 42% 828M/1.95G [00:04<00:10, 108MB/s] \u001b[A\n","model-00001-of-00008.safetensors: 44% 849M/1.95G [00:05<00:12, 90.6MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 45% 870M/1.95G [00:05<00:12, 89.9MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 46% 902M/1.95G [00:05<00:09, 115MB/s] \u001b[A\n","model-00001-of-00008.safetensors: 48% 933M/1.95G [00:05<00:07, 
138MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 49% 965M/1.95G [00:05<00:06, 160MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 51% 996M/1.95G [00:05<00:05, 180MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 53% 1.03G/1.95G [00:06<00:04, 198MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 54% 1.06G/1.95G [00:06<00:04, 218MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 56% 1.09G/1.95G [00:06<00:04, 203MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 58% 1.12G/1.95G [00:06<00:03, 213MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 59% 1.15G/1.95G [00:06<00:03, 223MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 61% 1.18G/1.95G [00:06<00:03, 226MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 62% 1.22G/1.95G [00:06<00:03, 234MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 64% 1.25G/1.95G [00:06<00:02, 240MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 66% 1.28G/1.95G [00:07<00:02, 245MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 67% 1.31G/1.95G [00:07<00:02, 239MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 69% 1.34G/1.95G [00:07<00:02, 245MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 70% 1.37G/1.95G [00:07<00:02, 241MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 72% 1.41G/1.95G [00:07<00:02, 248MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 74% 1.44G/1.95G [00:07<00:01, 259MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 75% 1.47G/1.95G [00:07<00:01, 269MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 77% 1.50G/1.95G [00:07<00:01, 275MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 79% 1.53G/1.95G [00:08<00:01, 276MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 80% 1.56G/1.95G [00:08<00:01, 262MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 82% 1.59G/1.95G [00:08<00:01, 223MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 83% 1.63G/1.95G [00:08<00:01, 229MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 85% 1.66G/1.95G [00:10<00:07, 
40.0MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 87% 1.69G/1.95G [00:11<00:05, 49.9MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 88% 1.71G/1.95G [00:11<00:04, 55.5MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 89% 1.74G/1.95G [00:11<00:02, 75.0MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 91% 1.77G/1.95G [00:11<00:01, 97.8MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 93% 1.80G/1.95G [00:11<00:01, 121MB/s] \u001b[A\n","model-00001-of-00008.safetensors: 94% 1.84G/1.95G [00:11<00:00, 147MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 96% 1.87G/1.95G [00:11<00:00, 159MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 97% 1.90G/1.95G [00:12<00:00, 181MB/s]\u001b[A\n","model-00001-of-00008.safetensors: 100% 1.95G/1.95G [00:12<00:00, 159MB/s]\n","Downloading shards: 12% 1/8 [00:12<01:27, 12.52s/it]\n","model-00002-of-00008.safetensors: 0% 0.00/1.95G [00:00, ?B/s]\u001b[A\n","model-00002-of-00008.safetensors: 1% 21.0M/1.95G [00:00<00:14, 136MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 3% 52.4M/1.95G [00:00<00:10, 188MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 4% 83.9M/1.95G [00:00<00:08, 229MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 6% 115M/1.95G [00:00<00:08, 225MB/s] \u001b[A\n","model-00002-of-00008.safetensors: 8% 147M/1.95G [00:00<00:08, 216MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 9% 178M/1.95G [00:00<00:07, 234MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 11% 210M/1.95G [00:00<00:07, 243MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 12% 241M/1.95G [00:01<00:06, 247MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 14% 273M/1.95G [00:01<00:06, 250MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 16% 304M/1.95G [00:01<00:06, 253MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 17% 336M/1.95G [00:01<00:06, 246MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 19% 367M/1.95G [00:01<00:06, 255MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 20% 398M/1.95G [00:01<00:06, 
256MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 22% 430M/1.95G [00:01<00:05, 260MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 24% 461M/1.95G [00:01<00:05, 255MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 25% 493M/1.95G [00:02<00:06, 238MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 27% 524M/1.95G [00:02<00:05, 239MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 29% 556M/1.95G [00:02<00:05, 232MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 30% 587M/1.95G [00:02<00:06, 214MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 32% 619M/1.95G [00:02<00:07, 178MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 33% 640M/1.95G [00:02<00:07, 181MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 34% 661M/1.95G [00:03<00:07, 175MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 35% 682M/1.95G [00:03<00:07, 158MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 36% 703M/1.95G [00:03<00:07, 164MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 37% 724M/1.95G [00:03<00:07, 172MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 38% 744M/1.95G [00:03<00:06, 176MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 39% 765M/1.95G [00:03<00:06, 183MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 41% 797M/1.95G [00:03<00:05, 197MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 43% 828M/1.95G [00:03<00:05, 207MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 44% 860M/1.95G [00:04<00:05, 207MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 45% 881M/1.95G [00:04<00:05, 206MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 47% 912M/1.95G [00:04<00:04, 222MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 48% 944M/1.95G [00:04<00:05, 195MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 50% 965M/1.95G [00:04<00:05, 191MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 51% 996M/1.95G [00:04<00:04, 200MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 53% 1.03G/1.95G [00:04<00:04, 206MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 54% 
1.06G/1.95G [00:05<00:04, 210MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 56% 1.09G/1.95G [00:05<00:04, 208MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 58% 1.12G/1.95G [00:05<00:03, 212MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 59% 1.15G/1.95G [00:05<00:03, 219MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 61% 1.18G/1.95G [00:05<00:03, 227MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 62% 1.22G/1.95G [00:05<00:03, 228MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 64% 1.25G/1.95G [00:05<00:03, 212MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 66% 1.28G/1.95G [00:06<00:03, 193MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 67% 1.30G/1.95G [00:06<00:03, 193MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 68% 1.32G/1.95G [00:06<00:03, 190MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 70% 1.35G/1.95G [00:06<00:03, 197MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 71% 1.38G/1.95G [00:06<00:02, 201MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 72% 1.41G/1.95G [00:06<00:02, 201MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 74% 1.44G/1.95G [00:06<00:02, 207MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 75% 1.47G/1.95G [00:06<00:02, 217MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 77% 1.50G/1.95G [00:07<00:02, 223MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 79% 1.53G/1.95G [00:07<00:01, 230MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 80% 1.56G/1.95G [00:07<00:01, 231MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 82% 1.59G/1.95G [00:07<00:01, 234MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 84% 1.63G/1.95G [00:07<00:01, 241MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 85% 1.66G/1.95G [00:07<00:01, 240MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 87% 1.69G/1.95G [00:07<00:01, 243MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 88% 1.72G/1.95G [00:08<00:00, 240MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 90% 1.75G/1.95G [00:08<00:00, 
244MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 92% 1.78G/1.95G [00:08<00:00, 249MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 93% 1.81G/1.95G [00:08<00:00, 248MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 95% 1.85G/1.95G [00:08<00:00, 252MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 96% 1.88G/1.95G [00:08<00:00, 256MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 98% 1.91G/1.95G [00:08<00:00, 254MB/s]\u001b[A\n","model-00002-of-00008.safetensors: 100% 1.95G/1.95G [00:08<00:00, 218MB/s]\n","Downloading shards: 25% 2/8 [00:21<01:02, 10.50s/it]\n","model-00003-of-00008.safetensors: 0% 0.00/1.98G [00:00, ?B/s]\u001b[A\n","model-00003-of-00008.safetensors: 1% 21.0M/1.98G [00:00<00:14, 135MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 2% 41.9M/1.98G [00:01<01:17, 24.9MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 3% 62.9M/1.98G [00:01<00:46, 40.9MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 5% 94.4M/1.98G [00:01<00:27, 68.8MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 6% 126M/1.98G [00:01<00:18, 100MB/s] \u001b[A\n","model-00003-of-00008.safetensors: 8% 157M/1.98G [00:01<00:13, 132MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 10% 189M/1.98G [00:02<00:11, 152MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 11% 220M/1.98G [00:03<00:31, 55.2MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 12% 241M/1.98G [00:03<00:26, 66.6MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 14% 273M/1.98G [00:03<00:19, 87.9MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 15% 304M/1.98G [00:03<00:14, 113MB/s] \u001b[A\n","model-00003-of-00008.safetensors: 17% 336M/1.98G [00:03<00:12, 137MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 19% 367M/1.98G [00:04<00:10, 154MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 20% 398M/1.98G [00:04<00:08, 178MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 22% 430M/1.98G [00:04<00:07, 201MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 23% 461M/1.98G [00:04<00:07, 
216MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 25% 493M/1.98G [00:04<00:06, 219MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 26% 524M/1.98G [00:04<00:06, 231MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 28% 556M/1.98G [00:04<00:05, 237MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 30% 587M/1.98G [00:04<00:05, 248MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 31% 619M/1.98G [00:04<00:05, 257MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 33% 650M/1.98G [00:05<00:05, 264MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 34% 682M/1.98G [00:05<00:04, 260MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 36% 713M/1.98G [00:05<00:05, 250MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 38% 744M/1.98G [00:05<00:04, 253MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 39% 776M/1.98G [00:05<00:04, 252MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 41% 807M/1.98G [00:05<00:04, 249MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 42% 839M/1.98G [00:05<00:04, 253MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 44% 870M/1.98G [00:06<00:04, 241MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 46% 902M/1.98G [00:06<00:04, 243MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 47% 933M/1.98G [00:06<00:04, 246MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 49% 965M/1.98G [00:06<00:04, 251MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 50% 996M/1.98G [00:06<00:04, 235MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 52% 1.03G/1.98G [00:06<00:03, 243MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 53% 1.06G/1.98G [00:06<00:03, 248MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 55% 1.09G/1.98G [00:06<00:03, 249MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 57% 1.12G/1.98G [00:07<00:03, 249MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 58% 1.15G/1.98G [00:07<00:03, 246MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 60% 1.18G/1.98G [00:07<00:03, 256MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 61% 
1.22G/1.98G [00:07<00:02, 256MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 63% 1.25G/1.98G [00:07<00:02, 248MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 65% 1.28G/1.98G [00:07<00:02, 251MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 66% 1.31G/1.98G [00:07<00:02, 251MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 68% 1.34G/1.98G [00:07<00:02, 235MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 69% 1.37G/1.98G [00:08<00:02, 228MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 71% 1.41G/1.98G [00:08<00:03, 172MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 73% 1.44G/1.98G [00:08<00:02, 185MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 74% 1.47G/1.98G [00:08<00:02, 199MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 76% 1.50G/1.98G [00:08<00:02, 198MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 77% 1.52G/1.98G [00:09<00:02, 163MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 78% 1.54G/1.98G [00:09<00:03, 144MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 79% 1.57G/1.98G [00:09<00:02, 167MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 81% 1.60G/1.98G [00:09<00:01, 191MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 83% 1.64G/1.98G [00:09<00:01, 203MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 84% 1.67G/1.98G [00:09<00:01, 190MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 85% 1.69G/1.98G [00:09<00:01, 186MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 86% 1.71G/1.98G [00:09<00:01, 189MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 87% 1.73G/1.98G [00:10<00:01, 193MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 88% 1.75G/1.98G [00:10<00:01, 145MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 90% 1.77G/1.98G [00:10<00:01, 115MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 91% 1.79G/1.98G [00:10<00:01, 114MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 92% 1.81G/1.98G [00:10<00:01, 123MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 93% 1.84G/1.98G [00:11<00:01, 
128MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 94% 1.86G/1.98G [00:11<00:00, 135MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 95% 1.88G/1.98G [00:11<00:00, 143MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 96% 1.90G/1.98G [00:11<00:00, 154MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 97% 1.92G/1.98G [00:11<00:00, 135MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 98% 1.94G/1.98G [00:11<00:00, 149MB/s]\u001b[A\n","model-00003-of-00008.safetensors: 100% 1.98G/1.98G [00:14<00:00, 139MB/s] \n","Downloading shards: 38% 3/8 [00:35<01:01, 12.24s/it]\n","model-00004-of-00008.safetensors: 0% 0.00/1.95G [00:00, ?B/s]\u001b[A\n","model-00004-of-00008.safetensors: 1% 21.0M/1.95G [00:00<00:12, 154MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 2% 41.9M/1.95G [00:00<00:10, 178MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 4% 73.4M/1.95G [00:00<00:09, 203MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 5% 105M/1.95G [00:00<00:08, 210MB/s] \u001b[A\n","model-00004-of-00008.safetensors: 7% 136M/1.95G [00:00<00:08, 224MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 9% 168M/1.95G [00:00<00:07, 226MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 10% 199M/1.95G [00:00<00:07, 231MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 12% 231M/1.95G [00:01<00:07, 237MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 13% 262M/1.95G [00:01<00:06, 244MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 15% 294M/1.95G [00:01<00:06, 241MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 17% 325M/1.95G [00:01<00:06, 246MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 18% 357M/1.95G [00:01<00:06, 244MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 20% 388M/1.95G [00:01<00:06, 242MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 22% 419M/1.95G [00:01<00:06, 249MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 23% 451M/1.95G [00:01<00:05, 261MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 25% 482M/1.95G [00:02<00:05, 
270MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 26% 514M/1.95G [00:02<00:05, 278MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 28% 545M/1.95G [00:02<00:05, 277MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 30% 577M/1.95G [00:02<00:05, 232MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 31% 608M/1.95G [00:02<00:05, 236MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 33% 640M/1.95G [00:05<00:43, 29.9MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 34% 671M/1.95G [00:05<00:31, 41.0MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 36% 703M/1.95G [00:05<00:22, 55.3MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 38% 734M/1.95G [00:06<00:16, 72.9MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 39% 765M/1.95G [00:06<00:13, 90.8MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 41% 797M/1.95G [00:06<00:10, 111MB/s] \u001b[A\n","model-00004-of-00008.safetensors: 43% 828M/1.95G [00:06<00:08, 132MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 44% 860M/1.95G [00:06<00:07, 154MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 46% 891M/1.95G [00:06<00:06, 172MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 47% 923M/1.95G [00:06<00:05, 186MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 49% 954M/1.95G [00:06<00:04, 203MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 51% 986M/1.95G [00:07<00:04, 216MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 52% 1.02G/1.95G [00:07<00:04, 217MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 54% 1.05G/1.95G [00:07<00:03, 226MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 55% 1.08G/1.95G [00:07<00:03, 228MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 57% 1.11G/1.95G [00:07<00:03, 225MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 59% 1.14G/1.95G [00:07<00:03, 218MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 60% 1.17G/1.95G [00:07<00:03, 223MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 62% 1.21G/1.95G [00:08<00:03, 211MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 
64% 1.24G/1.95G [00:08<00:03, 220MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 65% 1.27G/1.95G [00:08<00:02, 229MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 67% 1.30G/1.95G [00:08<00:02, 240MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 68% 1.33G/1.95G [00:08<00:02, 224MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 70% 1.36G/1.95G [00:08<00:02, 212MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 72% 1.39G/1.95G [00:09<00:02, 190MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 73% 1.42G/1.95G [00:09<00:02, 189MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 74% 1.44G/1.95G [00:12<00:19, 26.6MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 75% 1.46G/1.95G [00:12<00:14, 33.5MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 77% 1.49G/1.95G [00:12<00:09, 48.9MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 78% 1.52G/1.95G [00:12<00:06, 67.9MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 80% 1.55G/1.95G [00:12<00:04, 89.1MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 81% 1.58G/1.95G [00:12<00:03, 108MB/s] \u001b[A\n","model-00004-of-00008.safetensors: 83% 1.61G/1.95G [00:12<00:02, 133MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 85% 1.65G/1.95G [00:12<00:01, 155MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 86% 1.68G/1.95G [00:13<00:01, 177MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 88% 1.71G/1.95G [00:13<00:01, 193MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 89% 1.74G/1.95G [00:13<00:00, 207MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 91% 1.77G/1.95G [00:13<00:00, 218MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 93% 1.80G/1.95G [00:13<00:00, 233MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 94% 1.84G/1.95G [00:13<00:00, 230MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 96% 1.87G/1.95G [00:13<00:00, 229MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 98% 1.90G/1.95G [00:13<00:00, 242MB/s]\u001b[A\n","model-00004-of-00008.safetensors: 100% 1.95G/1.95G [00:14<00:00, 
137MB/s]\n","Downloading shards: 50% 4/8 [00:50<00:52, 13.05s/it]\n","model-00005-of-00008.safetensors: 0% 0.00/1.98G [00:00, ?B/s]\u001b[A\n","model-00005-of-00008.safetensors: 1% 10.5M/1.98G [00:00<00:23, 83.9MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 2% 31.5M/1.98G [00:00<00:13, 141MB/s] \u001b[A\n","model-00005-of-00008.safetensors: 3% 62.9M/1.98G [00:00<00:09, 213MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 5% 105M/1.98G [00:00<00:07, 263MB/s] \u001b[A\n","model-00005-of-00008.safetensors: 7% 136M/1.98G [00:00<00:06, 275MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 8% 168M/1.98G [00:00<00:07, 255MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 10% 199M/1.98G [00:00<00:09, 196MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 12% 231M/1.98G [00:01<00:07, 221MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 13% 262M/1.98G [00:01<00:07, 233MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 15% 294M/1.98G [00:01<00:06, 248MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 16% 325M/1.98G [00:01<00:06, 260MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 18% 357M/1.98G [00:01<00:06, 259MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 20% 388M/1.98G [00:01<00:06, 261MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 21% 419M/1.98G [00:01<00:06, 242MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 23% 451M/1.98G [00:01<00:05, 258MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 24% 482M/1.98G [00:02<00:06, 248MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 26% 514M/1.98G [00:02<00:06, 225MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 28% 545M/1.98G [00:02<00:06, 235MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 29% 577M/1.98G [00:02<00:05, 254MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 31% 619M/1.98G [00:02<00:04, 278MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 33% 650M/1.98G [00:02<00:04, 279MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 34% 682M/1.98G [00:02<00:04, 
278MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 36% 713M/1.98G [00:02<00:05, 235MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 38% 744M/1.98G [00:03<00:05, 236MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 39% 776M/1.98G [00:03<00:05, 238MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 41% 807M/1.98G [00:03<00:04, 238MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 42% 839M/1.98G [00:03<00:04, 241MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 44% 870M/1.98G [00:03<00:04, 247MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 46% 912M/1.98G [00:03<00:03, 274MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 48% 944M/1.98G [00:03<00:03, 278MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 49% 975M/1.98G [00:03<00:03, 280MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 51% 1.01G/1.98G [00:04<00:03, 257MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 52% 1.04G/1.98G [00:04<00:04, 231MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 54% 1.07G/1.98G [00:04<00:04, 225MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 56% 1.10G/1.98G [00:04<00:04, 217MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 58% 1.14G/1.98G [00:04<00:03, 250MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 60% 1.18G/1.98G [00:04<00:02, 268MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 61% 1.22G/1.98G [00:04<00:02, 262MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 63% 1.25G/1.98G [00:05<00:02, 250MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 65% 1.28G/1.98G [00:05<00:02, 250MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 67% 1.32G/1.98G [00:05<00:02, 272MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 68% 1.35G/1.98G [00:05<00:02, 255MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 70% 1.38G/1.98G [00:05<00:02, 246MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 72% 1.42G/1.98G [00:05<00:02, 257MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 74% 1.46G/1.98G [00:05<00:01, 
276MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 75% 1.49G/1.98G [00:05<00:01, 268MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 77% 1.52G/1.98G [00:06<00:01, 275MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 78% 1.55G/1.98G [00:06<00:01, 271MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 81% 1.59G/1.98G [00:06<00:01, 280MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 82% 1.63G/1.98G [00:06<00:01, 253MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 84% 1.66G/1.98G [00:06<00:01, 241MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 85% 1.69G/1.98G [00:06<00:01, 237MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 87% 1.72G/1.98G [00:06<00:01, 250MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 88% 1.75G/1.98G [00:07<00:00, 249MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 90% 1.78G/1.98G [00:07<00:00, 251MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 92% 1.81G/1.98G [00:07<00:00, 236MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 93% 1.85G/1.98G [00:07<00:00, 226MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 95% 1.88G/1.98G [00:07<00:00, 239MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 96% 1.91G/1.98G [00:07<00:00, 229MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 98% 1.94G/1.98G [00:07<00:00, 225MB/s]\u001b[A\n","model-00005-of-00008.safetensors: 100% 1.98G/1.98G [00:08<00:00, 245MB/s]\n","Downloading shards: 62% 5/8 [00:58<00:33, 11.30s/it]\n","model-00006-of-00008.safetensors: 0% 0.00/1.95G [00:00, ?B/s]\u001b[A\n","model-00006-of-00008.safetensors: 1% 21.0M/1.95G [00:00<00:12, 160MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 2% 41.9M/1.95G [00:00<00:10, 185MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 4% 73.4M/1.95G [00:00<00:08, 216MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 5% 105M/1.95G [00:00<00:07, 248MB/s] \u001b[A\n","model-00006-of-00008.safetensors: 7% 136M/1.95G [00:00<00:07, 233MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 9% 168M/1.95G [00:00<00:08, 
209MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 10% 199M/1.95G [00:00<00:08, 207MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 12% 231M/1.95G [00:01<00:07, 225MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 13% 262M/1.95G [00:01<00:07, 226MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 15% 294M/1.95G [00:01<00:07, 222MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 17% 325M/1.95G [00:01<00:07, 224MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 18% 357M/1.95G [00:01<00:07, 223MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 20% 388M/1.95G [00:01<00:06, 231MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 22% 419M/1.95G [00:01<00:06, 233MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 23% 451M/1.95G [00:02<00:06, 230MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 25% 482M/1.95G [00:02<00:06, 238MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 26% 514M/1.95G [00:02<00:06, 221MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 28% 545M/1.95G [00:02<00:06, 233MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 30% 577M/1.95G [00:02<00:06, 228MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 31% 608M/1.95G [00:02<00:05, 227MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 33% 640M/1.95G [00:02<00:06, 215MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 34% 671M/1.95G [00:03<00:05, 223MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 36% 703M/1.95G [00:03<00:05, 229MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 38% 734M/1.95G [00:03<00:05, 232MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 39% 765M/1.95G [00:03<00:04, 248MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 41% 797M/1.95G [00:03<00:06, 174MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 43% 839M/1.95G [00:03<00:05, 210MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 45% 870M/1.95G [00:03<00:04, 231MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 46% 902M/1.95G [00:04<00:04, 247MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 48% 
933M/1.95G [00:04<00:04, 246MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 50% 965M/1.95G [00:04<00:03, 259MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 51% 996M/1.95G [00:04<00:03, 252MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 53% 1.03G/1.95G [00:04<00:03, 245MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 54% 1.06G/1.95G [00:04<00:03, 253MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 56% 1.09G/1.95G [00:04<00:03, 260MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 58% 1.12G/1.95G [00:04<00:03, 267MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 59% 1.15G/1.95G [00:04<00:02, 273MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 61% 1.18G/1.95G [00:05<00:02, 275MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 62% 1.22G/1.95G [00:05<00:02, 271MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 64% 1.25G/1.95G [00:05<00:02, 272MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 66% 1.28G/1.95G [00:05<00:02, 243MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 67% 1.31G/1.95G [00:05<00:02, 242MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 69% 1.34G/1.95G [00:05<00:02, 254MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 71% 1.37G/1.95G [00:05<00:02, 260MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 72% 1.41G/1.95G [00:05<00:01, 273MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 74% 1.45G/1.95G [00:06<00:01, 287MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 76% 1.48G/1.95G [00:06<00:01, 275MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 78% 1.52G/1.95G [00:06<00:01, 291MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 80% 1.56G/1.95G [00:06<00:01, 300MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 82% 1.60G/1.95G [00:06<00:01, 308MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 85% 1.65G/1.95G [00:06<00:00, 314MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 86% 1.68G/1.95G [00:06<00:01, 242MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 88% 1.71G/1.95G [00:09<00:06, 
36.1MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 90% 1.75G/1.95G [00:09<00:03, 51.5MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 92% 1.78G/1.95G [00:10<00:02, 64.6MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 93% 1.81G/1.95G [00:10<00:01, 78.0MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 95% 1.85G/1.95G [00:10<00:01, 78.0MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 96% 1.87G/1.95G [00:10<00:00, 83.9MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 98% 1.90G/1.95G [00:10<00:00, 108MB/s] \u001b[A\n","model-00006-of-00008.safetensors: 99% 1.92G/1.95G [00:11<00:00, 103MB/s]\u001b[A\n","model-00006-of-00008.safetensors: 100% 1.95G/1.95G [00:11<00:00, 167MB/s] \n","Downloading shards: 75% 6/8 [01:10<00:22, 11.45s/it]\n","model-00007-of-00008.safetensors: 0% 0.00/1.98G [00:00, ?B/s]\u001b[A\n","model-00007-of-00008.safetensors: 1% 10.5M/1.98G [00:00<00:29, 67.0MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 2% 31.5M/1.98G [00:00<00:16, 117MB/s] \u001b[A\n","model-00007-of-00008.safetensors: 3% 62.9M/1.98G [00:00<00:10, 184MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 5% 94.4M/1.98G [00:00<00:09, 208MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 6% 126M/1.98G [00:00<00:08, 231MB/s] \u001b[A\n","model-00007-of-00008.safetensors: 8% 157M/1.98G [00:00<00:07, 237MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 10% 189M/1.98G [00:00<00:07, 232MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 11% 220M/1.98G [00:01<00:07, 245MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 13% 252M/1.98G [00:01<00:10, 166MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 14% 283M/1.98G [00:01<00:09, 180MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 15% 304M/1.98G [00:01<00:09, 181MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 16% 325M/1.98G [00:01<00:09, 183MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 17% 346M/1.98G [00:01<00:09, 181MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 19% 377M/1.98G [00:01<00:08, 
191MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 20% 398M/1.98G [00:02<00:08, 188MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 21% 419M/1.98G [00:02<00:08, 188MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 23% 451M/1.98G [00:02<00:07, 201MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 24% 482M/1.98G [00:02<00:06, 214MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 26% 514M/1.98G [00:02<00:06, 211MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 28% 545M/1.98G [00:02<00:06, 221MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 29% 577M/1.98G [00:02<00:06, 225MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 31% 608M/1.98G [00:03<00:06, 228MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 32% 640M/1.98G [00:03<00:06, 212MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 34% 671M/1.98G [00:03<00:06, 195MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 35% 703M/1.98G [00:03<00:06, 210MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 37% 734M/1.98G [00:03<00:05, 219MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 39% 765M/1.98G [00:03<00:06, 200MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 40% 786M/1.98G [00:03<00:05, 199MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 41% 807M/1.98G [00:04<00:05, 199MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 42% 828M/1.98G [00:04<00:05, 200MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 43% 849M/1.98G [00:07<00:50, 22.5MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 44% 870M/1.98G [00:08<00:50, 21.9MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 46% 902M/1.98G [00:08<00:32, 33.3MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 47% 933M/1.98G [00:08<00:21, 48.1MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 49% 965M/1.98G [00:08<00:15, 66.5MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 50% 996M/1.98G [00:08<00:11, 85.4MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 52% 1.03G/1.98G [00:08<00:09, 105MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 53% 
1.06G/1.98G [00:09<00:07, 128MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 55% 1.09G/1.98G [00:09<00:05, 152MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 57% 1.12G/1.98G [00:09<00:04, 175MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 58% 1.15G/1.98G [00:09<00:04, 199MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 60% 1.18G/1.98G [00:09<00:03, 204MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 61% 1.22G/1.98G [00:09<00:03, 219MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 63% 1.25G/1.98G [00:09<00:03, 230MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 65% 1.28G/1.98G [00:09<00:02, 242MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 66% 1.31G/1.98G [00:10<00:02, 226MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 68% 1.34G/1.98G [00:10<00:04, 155MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 69% 1.36G/1.98G [00:10<00:04, 126MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 70% 1.38G/1.98G [00:10<00:04, 127MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 71% 1.41G/1.98G [00:11<00:04, 136MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 73% 1.44G/1.98G [00:11<00:03, 159MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 74% 1.47G/1.98G [00:11<00:02, 176MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 75% 1.49G/1.98G [00:11<00:02, 172MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 76% 1.51G/1.98G [00:11<00:02, 175MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 77% 1.53G/1.98G [00:11<00:02, 158MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 78% 1.55G/1.98G [00:11<00:02, 162MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 79% 1.57G/1.98G [00:12<00:02, 142MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 82% 1.61G/1.98G [00:12<00:01, 191MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 83% 1.64G/1.98G [00:12<00:02, 145MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 84% 1.66G/1.98G [00:12<00:02, 136MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 85% 1.69G/1.98G [00:12<00:01, 
155MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 86% 1.71G/1.98G [00:12<00:01, 148MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 88% 1.74G/1.98G [00:13<00:01, 178MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 90% 1.77G/1.98G [00:13<00:01, 204MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 91% 1.80G/1.98G [00:13<00:00, 225MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 93% 1.84G/1.98G [00:13<00:00, 225MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 94% 1.87G/1.98G [00:13<00:00, 240MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 96% 1.90G/1.98G [00:13<00:00, 243MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 98% 1.94G/1.98G [00:13<00:00, 266MB/s]\u001b[A\n","model-00007-of-00008.safetensors: 100% 1.98G/1.98G [00:16<00:00, 119MB/s] \n","Downloading shards: 88% 7/8 [01:26<00:13, 13.18s/it]\n","model-00008-of-00008.safetensors: 0% 0.00/1.75G [00:00, ?B/s]\u001b[A\n","model-00008-of-00008.safetensors: 1% 10.5M/1.75G [00:00<00:19, 90.9MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 2% 31.5M/1.75G [00:00<00:12, 139MB/s] \u001b[A\n","model-00008-of-00008.safetensors: 3% 52.4M/1.75G [00:00<00:10, 160MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 5% 83.9M/1.75G [00:00<00:09, 184MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 7% 115M/1.75G [00:00<00:08, 204MB/s] \u001b[A\n","model-00008-of-00008.safetensors: 8% 147M/1.75G [00:00<00:07, 225MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 10% 178M/1.75G [00:00<00:07, 201MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 12% 210M/1.75G [00:01<00:07, 212MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 14% 241M/1.75G [00:01<00:06, 221MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 16% 273M/1.75G [00:01<00:06, 227MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 17% 304M/1.75G [00:01<00:06, 233MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 19% 336M/1.75G [00:01<00:05, 247MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 21% 367M/1.75G [00:01<00:05, 
250MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 23% 398M/1.75G [00:01<00:05, 263MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 25% 430M/1.75G [00:01<00:04, 273MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 27% 472M/1.75G [00:02<00:04, 295MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 29% 514M/1.75G [00:02<00:04, 305MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 31% 545M/1.75G [00:02<00:04, 295MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 33% 577M/1.75G [00:02<00:04, 274MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 35% 608M/1.75G [00:02<00:04, 270MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 37% 640M/1.75G [00:02<00:04, 270MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 39% 682M/1.75G [00:02<00:03, 290MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 41% 713M/1.75G [00:06<00:33, 30.7MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 43% 755M/1.75G [00:06<00:22, 44.7MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 46% 797M/1.75G [00:06<00:15, 62.6MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 47% 828M/1.75G [00:06<00:11, 78.7MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 49% 860M/1.75G [00:06<00:09, 96.4MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 51% 891M/1.75G [00:06<00:07, 115MB/s] \u001b[A\n","model-00008-of-00008.safetensors: 53% 923M/1.75G [00:06<00:05, 139MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 55% 965M/1.75G [00:07<00:04, 170MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 57% 996M/1.75G [00:07<00:03, 191MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 59% 1.03G/1.75G [00:07<00:03, 210MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 61% 1.06G/1.75G [00:07<00:03, 223MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 62% 1.09G/1.75G [00:07<00:02, 238MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 65% 1.13G/1.75G [00:07<00:02, 266MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 67% 1.16G/1.75G [00:07<00:02, 253MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 
68% 1.20G/1.75G [00:07<00:02, 247MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 70% 1.23G/1.75G [00:08<00:02, 232MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 72% 1.26G/1.75G [00:08<00:02, 226MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 74% 1.29G/1.75G [00:08<00:02, 216MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 76% 1.32G/1.75G [00:08<00:02, 177MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 77% 1.34G/1.75G [00:12<00:16, 24.7MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 79% 1.37G/1.75G [00:12<00:10, 34.5MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 80% 1.39G/1.75G [00:12<00:08, 42.7MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 81% 1.42G/1.75G [00:12<00:06, 53.3MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 83% 1.45G/1.75G [00:12<00:04, 73.0MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 85% 1.48G/1.75G [00:12<00:02, 94.8MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 86% 1.51G/1.75G [00:12<00:02, 117MB/s] \u001b[A\n","model-00008-of-00008.safetensors: 88% 1.54G/1.75G [00:12<00:01, 138MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 90% 1.57G/1.75G [00:13<00:01, 161MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 92% 1.60G/1.75G [00:13<00:00, 178MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 94% 1.64G/1.75G [00:13<00:00, 186MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 95% 1.67G/1.75G [00:13<00:00, 190MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 97% 1.70G/1.75G [00:13<00:00, 198MB/s]\u001b[A\n","model-00008-of-00008.safetensors: 100% 1.75G/1.75G [00:13<00:00, 126MB/s]\n","Downloading shards: 100% 8/8 [01:40<00:00, 12.61s/it]\n","Loading checkpoint shards: 100% 8/8 [01:00<00:00, 7.58s/it]\n","generation_config.json: 100% 123/123 [00:00<00:00, 900kB/s]\n","Some parameters are on the meta device device because they were offloaded to the cpu.\n","(2) GPU = Tesla T4. 
Max memory = 14.748 GB.\n","12.084 GB of memory reserved.\n","loading train/test data files\n","Generating train split: 25000 examples [00:00, 29335.93 examples/s]\n","Generating test split: 3000 examples [00:00, 41850.13 examples/s]\n","Map: 100% 25000/25000 [00:01<00:00, 20627.51 examples/s]\n","Map: 100% 3000/3000 [00:00<00:00, 19699.28 examples/s]\n","DatasetDict({\n"," train: Dataset({\n"," features: ['text', 'label', 'answer', 'title', 'puzzle', 'truth', 'train_text', 'prompt'],\n"," num_rows: 25000\n"," })\n"," test: Dataset({\n"," features: ['text', 'label', 'answer', 'title', 'puzzle', 'truth', 'train_text', 'prompt'],\n"," num_rows: 3000\n"," })\n","})\n","--- evaluating 500 entries\n","--------------------------------------------------\n","text: 甄加索是自杀吗\n","--------------------------------------------------\n","label: 不是\n","--------------------------------------------------\n","answer: nan\n","--------------------------------------------------\n","title: 海岸之谜\n","--------------------------------------------------\n","puzzle: 在远离城市喧嚣的海边小屋,一天清晨,邻居发现甄加索僵卧在沙滩上,已无生命迹象。现场没有发现任何打斗的迹象。请问甄加索的死因是什么?\n","--------------------------------------------------\n","truth: 甄加索是一位热爱自然的画家,他每年都会来到这个海边小屋寻找灵感。在他生命的最后几天,他一直在创作一幅描绘海洋生物的画作。在画即将完成的前一天晚上,他骑着自行车外出,打算在海边观赏夜景。然而,他在沙滩上意外发现了一只搁浅的海豚,为了救助这只海豚,他耗费了极大的体力,最终成功将其送回海中。筋疲力尽的甄加索在沙滩上睡着了,由于他患有严重的心脏病,却未告知旁人,在寒冷的海风中,他的心脏停止了跳动。因此,警方在现场只发现了车轮痕迹和未完成的画作,而没有发现任何他杀的迹象。\n","--------------------------------------------------\n","train_text: <|im_start|>system\n","You are an expert in logical reasoning.<|im_end|>\n","<|im_start|>user\n","你是一个逻辑游戏的主持人。游戏规则如下:\n","\n","1. 参与者会得到一个谜题。\n","2. 参与者可以通过提问来获取线索,尝试解开谜题。\n","3. 对于每个问题,主持人将根据实际情况回答以下五个选项之一:是、不是、不重要、回答正确、问法错误。\n","4. 回答中不能添加任何其它信息,也不能省略选项中的任何一个字。例如,不可以把“不是”省略成“不”。\n","5. 
参与者需要根据回答来推理,并最终找出谜题的正确答案。\n","\n","请严格按照这些规则回答参与者提出的问题。\n","\n","谜题: 在远离城市喧嚣的海边小屋,一天清晨,邻居发现甄加索僵卧在沙滩上,已无生命迹象。现场没有发现任何打斗的迹象。请问甄加索的死因是什么?\n","\n","实际情况: 甄加索是一位热爱自然的画家,他每年都会来到这个海边小屋寻找灵感。在他生命的最后几天,他一直在创作一幅描绘海洋生物的画作。在画即将完成的前一天晚上,他骑着自行车外出,打算在海边观赏夜景。然而,他在沙滩上意外发现了一只搁浅的海豚,为了救助这只海豚,他耗费了极大的体力,最终成功将其送回海中。筋疲力尽的甄加索在沙滩上睡着了,由于他患有严重的心脏病,却未告知旁人,在寒冷的海风中,他的心脏停止了跳动。因此,警方在现场只发现了车轮痕迹和未完成的画作,而没有发现任何他杀的迹象。\n","\n","参与者提出的问题: 甄加索是自杀吗\n","<|im_end|>\n","<|im_start|>assistant\n","不是\n","--------------------------------------------------\n","prompt: <|im_start|>system\n","You are an expert in logical reasoning.<|im_end|>\n","<|im_start|>user\n","你是一个逻辑游戏的主持人。游戏规则如下:\n","\n","1. 参与者会得到一个谜题。\n","2. 参与者可以通过提问来获取线索,尝试解开谜题。\n","3. 对于每个问题,主持人将根据实际情况回答以下五个选项之一:是、不是、不重要、回答正确、问法错误。\n","4. 回答中不能添加任何其它信息,也不能省略选项中的任何一个字。例如,不可以把“不是”省略成“不”。\n","5. 参与者需要根据回答来推理,并最终找出谜题的正确答案。\n","\n","请严格按照这些规则回答参与者提出的问题。\n","\n","谜题: 在远离城市喧嚣的海边小屋,一天清晨,邻居发现甄加索僵卧在沙滩上,已无生命迹象。现场没有发现任何打斗的迹象。请问甄加索的死因是什么?\n","\n","实际情况: 甄加索是一位热爱自然的画家,他每年都会来到这个海边小屋寻找灵感。在他生命的最后几天,他一直在创作一幅描绘海洋生物的画作。在画即将完成的前一天晚上,他骑着自行车外出,打算在海边观赏夜景。然而,他在沙滩上意外发现了一只搁浅的海豚,为了救助这只海豚,他耗费了极大的体力,最终成功将其送回海中。筋疲力尽的甄加索在沙滩上睡着了,由于他患有严重的心脏病,却未告知旁人,在寒冷的海风中,他的心脏停止了跳动。因此,警方在现场只发现了车轮痕迹和未完成的画作,而没有发现任何他杀的迹象。\n","\n","参与者提出的问题: 甄加索是自杀吗\n","<|im_end|>\n","<|im_start|>assistant\n","\n","--------------------------------------------------\n","text: 它原本是人\n","--------------------------------------------------\n","label: 不是\n","--------------------------------------------------\n","answer: nan\n","--------------------------------------------------\n","title: 湖畔迷影\n","--------------------------------------------------\n","puzzle: 一个宁静的午后,湖边突然传来了惊叫声。人们跑过去发现,湖边石头上静静躺着一个打翻的背包和一张奇怪的纸条。纸条上写着:“它就在这里,但我无法带它回去。”人们搜寻了周围,但什么也没有发现,背包的主人也不知所踪。\n","--------------------------------------------------\n","truth: 原来,湖边是一个学校的生物研究小组经常进行野外考察的地方。背包的主人是一位对湖中生物充满好奇的学生。他在湖边发现了一只稀有的湖龟,但由于湖龟属于保护动物,他无法私自将其带回去。他在纸条上记录了自己的发现,并准备将这个消息告诉他的研究小组。然而,在他离开去寻找同组的伙伴时,不小心滑入湖中,因不会游泳而遭遇了不幸。而湖龟在他跌入水中时受到了惊吓,悄悄潜入了湖中深处。那张纸条和打翻的背包成为了这个谜团的唯一线索。 
\n","--------------------------------------------------\n","train_text: <|im_start|>system\n","You are an expert in logical reasoning.<|im_end|>\n","<|im_start|>user\n","你是一个逻辑游戏的主持人。游戏规则如下:\n","\n","1. 参与者会得到一个谜题。\n","2. 参与者可以通过提问来获取线索,尝试解开谜题。\n","3. 对于每个问题,主持人将根据实际情况回答以下五个选项之一:是、不是、不重要、回答正确、问法错误。\n","4. 回答中不能添加任何其它信息,也不能省略选项中的任何一个字。例如,不可以把“不是”省略成“不”。\n","5. 参与者需要根据回答来推理,并最终找出谜题的正确答案。\n","\n","请严格按照这些规则回答参与者提出的问题。\n","\n","谜题: 一个宁静的午后,湖边突然传来了惊叫声。人们跑过去发现,湖边石头上静静躺着一个打翻的背包和一张奇怪的纸条。纸条上写着:“它就在这里,但我无法带它回去。”人们搜寻了周围,但什么也没有发现,背包的主人也不知所踪。\n","\n","实际情况: 原来,湖边是一个学校的生物研究小组经常进行野外考察的地方。背包的主人是一位对湖中生物充满好奇的学生。他在湖边发现了一只稀有的湖龟,但由于湖龟属于保护动物,他无法私自将其带回去。他在纸条上记录了自己的发现,并准备将这个消息告诉他的研究小组。然而,在他离开去寻找同组的伙伴时,不小心滑入湖中,因不会游泳而遭遇了不幸。而湖龟在他跌入水中时受到了惊吓,悄悄潜入了湖中深处。那张纸条和打翻的背包成为了这个谜团的唯一线索。 \n","\n","参与者提出的问题: 它原本是人\n","<|im_end|>\n","<|im_start|>assistant\n","不是\n","--------------------------------------------------\n","prompt: <|im_start|>system\n","You are an expert in logical reasoning.<|im_end|>\n","<|im_start|>user\n","你是一个逻辑游戏的主持人。游戏规则如下:\n","\n","1. 参与者会得到一个谜题。\n","2. 参与者可以通过提问来获取线索,尝试解开谜题。\n","3. 对于每个问题,主持人将根据实际情况回答以下五个选项之一:是、不是、不重要、回答正确、问法错误。\n","4. 回答中不能添加任何其它信息,也不能省略选项中的任何一个字。例如,不可以把“不是”省略成“不”。\n","5. 
参与者需要根据回答来推理,并最终找出谜题的正确答案。\n","\n","请严格按照这些规则回答参与者提出的问题。\n","\n","谜题: 一个宁静的午后,湖边突然传来了惊叫声。人们跑过去发现,湖边石头上静静躺着一个打翻的背包和一张奇怪的纸条。纸条上写着:“它就在这里,但我无法带它回去。”人们搜寻了周围,但什么也没有发现,背包的主人也不知所踪。\n","\n","实际情况: 原来,湖边是一个学校的生物研究小组经常进行野外考察的地方。背包的主人是一位对湖中生物充满好奇的学生。他在湖边发现了一只稀有的湖龟,但由于湖龟属于保护动物,他无法私自将其带回去。他在纸条上记录了自己的发现,并准备将这个消息告诉他的研究小组。然而,在他离开去寻找同组的伙伴时,不小心滑入湖中,因不会游泳而遭遇了不幸。而湖龟在他跌入水中时受到了惊吓,悄悄潜入了湖中深处。那张纸条和打翻的背包成为了这个谜团的唯一线索。 \n","\n","参与者提出的问题: 它原本是人\n","<|im_end|>\n","<|im_start|>assistant\n","\n","Evaluating model: internlm/internlm2_5-7b-chat-1m\n"," 0% 0/500 [00:00, ?it/s]--------\n","step 1: 不是<|im_end|>\n","--------\n","step 2: 不是\n","--------\n","step 3: 不是\n","--------\n","step 4: 不是\n","--------\n","step 5: 不是\n"," 29% 147/500 [14:38<34:59, 5.95s/it]"]}],"source":["%%time\n","\n","evaluate_model_all_epochs(\"internlm/internlm2_5-7b-chat-1m\", 0, \"\", load_in_4bit=False, num_of_entries=500)"]}],"metadata":{"accelerator":"GPU","application/vnd.databricks.v1+notebook":{"dashboards":[],"environmentMetadata":null,"language":"python","notebookMetadata":{"mostRecentlyExecutedCommandWithImplicitDF":{"commandId":-1,"dataframes":["_sqldf"]},"pythonIndentUnit":4},"notebookName":"10_eval-lf-medium-py3.11","widgets":{}},"colab":{"gpuType":"T4","provenance":[]},"kernelspec":{"display_name":"Python 3","name":"python3"},"language_info":{"codemirror_mode":{"name":"ipython","version":3},"file_extension":".py","mimetype":"text/x-python","name":"python","nbconvert_exporter":"python","pygments_lexer":"ipython3","version":"3.11.9"}},"nbformat":4,"nbformat_minor":0}