hayas committed on
Commit
aad286b
·
1 Parent(s): d0d7843
.pre-commit-config.yaml CHANGED
@@ -13,18 +13,15 @@ repos:
13
  args: ["--fix=lf"]
14
  - id: requirements-txt-fixer
15
  - id: trailing-whitespace
16
- - repo: https://github.com/myint/docformatter
17
- rev: v1.7.5
18
  hooks:
19
- - id: docformatter
20
- args: ["--in-place"]
21
- - repo: https://github.com/pycqa/isort
22
- rev: 5.13.2
23
- hooks:
24
- - id: isort
25
- args: ["--profile", "black"]
26
  - repo: https://github.com/pre-commit/mirrors-mypy
27
- rev: v1.12.0
28
  hooks:
29
  - id: mypy
30
  args: ["--ignore-missing-imports"]
@@ -35,18 +32,8 @@ repos:
35
  "types-PyYAML",
36
  "types-pytz",
37
  ]
38
- - repo: https://github.com/psf/black
39
- rev: 24.10.0
40
- hooks:
41
- - id: black
42
- language_version: python3.10
43
- args: ["--line-length", "119"]
44
- - repo: https://github.com/charliermarsh/ruff-pre-commit
45
- rev: v0.7.0
46
- hooks:
47
- - id: ruff
48
  - repo: https://github.com/kynan/nbstripout
49
- rev: 0.7.1
50
  hooks:
51
  - id: nbstripout
52
  args:
@@ -55,7 +42,7 @@ repos:
55
  "metadata.interpreter metadata.kernelspec cell.metadata.pycharm",
56
  ]
57
  - repo: https://github.com/nbQA-dev/nbQA
58
- rev: 1.8.7
59
  hooks:
60
  - id: nbqa-black
61
  - id: nbqa-pyupgrade
 
13
  args: ["--fix=lf"]
14
  - id: requirements-txt-fixer
15
  - id: trailing-whitespace
16
+ - repo: https://github.com/astral-sh/ruff-pre-commit
17
+ rev: v0.8.4
18
  hooks:
19
+ - id: ruff
20
+ args: ["--fix"]
21
+ - id: ruff-format
22
+ args: ["--line-length", "119"]
 
 
 
23
  - repo: https://github.com/pre-commit/mirrors-mypy
24
+ rev: v1.14.0
25
  hooks:
26
  - id: mypy
27
  args: ["--ignore-missing-imports"]
 
32
  "types-PyYAML",
33
  "types-pytz",
34
  ]
 
 
 
 
 
 
 
 
 
 
35
  - repo: https://github.com/kynan/nbstripout
36
+ rev: 0.8.1
37
  hooks:
38
  - id: nbstripout
39
  args:
 
42
  "metadata.interpreter metadata.kernelspec cell.metadata.pycharm",
43
  ]
44
  - repo: https://github.com/nbQA-dev/nbQA
45
+ rev: 1.9.1
46
  hooks:
47
  - id: nbqa-black
48
  - id: nbqa-pyupgrade
.vscode/extensions.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "recommendations": [
3
+ "ms-python.python",
4
+ "charliermarsh.ruff",
5
+ "streetsidesoftware.code-spell-checker",
6
+ "tamasfe.even-better-toml"
7
+ ]
8
+ }
.vscode/settings.json CHANGED
@@ -2,25 +2,20 @@
2
  "editor.formatOnSave": true,
3
  "files.insertFinalNewline": false,
4
  "[python]": {
5
- "editor.defaultFormatter": "ms-python.black-formatter",
6
  "editor.formatOnType": true,
7
  "editor.codeActionsOnSave": {
 
8
  "source.organizeImports": "explicit"
9
  }
10
  },
11
  "[jupyter]": {
12
  "files.insertFinalNewline": false
13
  },
14
- "black-formatter.args": [
15
- "--line-length=119"
16
- ],
17
- "isort.args": ["--profile", "black"],
18
- "flake8.args": [
19
- "--max-line-length=119"
20
- ],
21
- "ruff.lint.args": [
22
- "--line-length=119"
23
- ],
24
  "notebook.output.scrolling": true,
25
- "notebook.formatOnCellExecution": true
 
 
 
 
26
  }
 
2
  "editor.formatOnSave": true,
3
  "files.insertFinalNewline": false,
4
  "[python]": {
5
+ "editor.defaultFormatter": "charliermarsh.ruff",
6
  "editor.formatOnType": true,
7
  "editor.codeActionsOnSave": {
8
+ "source.fixAll.ruff": "explicit",
9
  "source.organizeImports": "explicit"
10
  }
11
  },
12
  "[jupyter]": {
13
  "files.insertFinalNewline": false
14
  },
 
 
 
 
 
 
 
 
 
 
15
  "notebook.output.scrolling": true,
16
+ "notebook.formatOnCellExecution": true,
17
+ "notebook.formatOnSave.enabled": true,
18
+ "notebook.codeActionsOnSave": {
19
+ "source.organizeImports": "explicit"
20
+ }
21
  }
README.md CHANGED
@@ -4,7 +4,7 @@ emoji: 🐢
4
  colorFrom: purple
5
  colorTo: purple
6
  sdk: gradio
7
- sdk_version: 5.1.0
8
  app_file: app.py
9
  pinned: false
10
  ---
 
4
  colorFrom: purple
5
  colorTo: purple
6
  sdk: gradio
7
+ sdk_version: 5.9.1
8
  app_file: app.py
9
  pinned: false
10
  ---
app.py CHANGED
@@ -1,8 +1,8 @@
1
  #!/usr/bin/env python
2
 
3
  import os
 
4
  from threading import Thread
5
- from typing import Iterator
6
 
7
  import gradio as gr
8
  import spaces
@@ -46,23 +46,24 @@ PROMPT_DICT = {
46
 
47
 
48
  def create_prompt(instruction: str, input_text: str | None = None) -> str:
49
- """Generates a prompt based on the given instruction and an optional input.
 
50
  If input is provided, it uses the 'prompt_input' template from PROMPT_DICT.
51
  If no input is provided, it uses the 'prompt_no_input' template.
52
 
53
  Args:
54
  instruction (str): The instruction describing the task.
55
- input_text (str, optional): Additional input providing context for the task. Default is None.
56
 
57
  Returns:
58
  str: The generated prompt.
 
59
  """
60
  if input_text:
61
  # Use the 'prompt_input' template when additional input is provided
62
  return PROMPT_DICT["prompt_input"].format(instruction=instruction, input=input_text)
63
- else:
64
- # Use the 'prompt_no_input' template when no additional input is provided
65
- return PROMPT_DICT["prompt_no_input"].format(instruction=instruction)
66
 
67
 
68
  @spaces.GPU
@@ -80,7 +81,8 @@ def run(
80
  prompt = create_prompt(instruction, input_text)
81
  input_ids = tokenizer.encode(prompt, add_special_tokens=False, return_tensors="pt")
82
  if input_ids.shape[-1] > MAX_INPUT_TOKENS:
83
- raise gr.Error(f"Input exceeds maximum number of tokens ({MAX_INPUT_TOKENS})")
 
84
 
85
  streamer = TextIteratorStreamer(tokenizer, timeout=20.0, skip_prompt=True, skip_special_tokens=True)
86
  generate_kwargs = dict(
@@ -138,7 +140,7 @@ with gr.Blocks(css_paths="style.css") as demo:
138
  "以下のトピックに関する詳細な情報を提供してください。",
139
  "夢オチとは何かについて教えてください。",
140
  ],
141
- ["暴れん坊将軍って誰のことですか?", ""],
142
  ],
143
  inputs=[instruction, input_text],
144
  outputs=output,
 
1
  #!/usr/bin/env python
2
 
3
  import os
4
+ from collections.abc import Iterator
5
  from threading import Thread
 
6
 
7
  import gradio as gr
8
  import spaces
 
46
 
47
 
48
  def create_prompt(instruction: str, input_text: str | None = None) -> str:
49
+ """Generate a prompt based on the given instruction and an optional input.
50
+
51
  If input is provided, it uses the 'prompt_input' template from PROMPT_DICT.
52
  If no input is provided, it uses the 'prompt_no_input' template.
53
 
54
  Args:
55
  instruction (str): The instruction describing the task.
56
+ input_text (str | None): Additional input providing context for the task. Defaults to None.
57
 
58
  Returns:
59
  str: The generated prompt.
60
+
61
  """
62
  if input_text:
63
  # Use the 'prompt_input' template when additional input is provided
64
  return PROMPT_DICT["prompt_input"].format(instruction=instruction, input=input_text)
65
+ # Use the 'prompt_no_input' template when no additional input is provided
66
+ return PROMPT_DICT["prompt_no_input"].format(instruction=instruction)
 
67
 
68
 
69
  @spaces.GPU
 
81
  prompt = create_prompt(instruction, input_text)
82
  input_ids = tokenizer.encode(prompt, add_special_tokens=False, return_tensors="pt")
83
  if input_ids.shape[-1] > MAX_INPUT_TOKENS:
84
+ error_message = f"Input exceeds maximum number of tokens ({MAX_INPUT_TOKENS})"
85
+ raise gr.Error(error_message)
86
 
87
  streamer = TextIteratorStreamer(tokenizer, timeout=20.0, skip_prompt=True, skip_special_tokens=True)
88
  generate_kwargs = dict(
 
140
  "以下のトピックに関する詳細な情報を提供してください。",
141
  "夢オチとは何かについて教えてください。",
142
  ],
143
+ ["暴れん坊将軍って誰のことですか?", ""], # noqa: RUF001
144
  ],
145
  inputs=[instruction, input_text],
146
  outputs=output,
pyproject.toml CHANGED
@@ -5,16 +5,52 @@ description = ""
5
  readme = "README.md"
6
  requires-python = ">=3.10"
7
  dependencies = [
8
- "accelerate>=1.0.1",
9
- "bitsandbytes>=0.44.1",
10
  "blobfile>=3.0.0",
11
- "gradio>=5.1.0",
12
  "hf-transfer>=0.1.8",
13
- "protobuf>=5.28.2",
14
  "sentencepiece>=0.2.0",
15
- "setuptools>=75.2.0",
16
- "spaces>=0.30.4",
17
  "tiktoken>=0.8.0",
18
  "torch==2.4.0",
19
- "transformers>=4.45.2",
20
  ]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  readme = "README.md"
6
  requires-python = ">=3.10"
7
  dependencies = [
8
+ "accelerate>=1.2.1",
9
+ "bitsandbytes>=0.45.0",
10
  "blobfile>=3.0.0",
11
+ "gradio>=5.9.1",
12
  "hf-transfer>=0.1.8",
13
+ "protobuf>=5.29.2",
14
  "sentencepiece>=0.2.0",
15
+ "setuptools>=75.6.0",
16
+ "spaces>=0.31.1",
17
  "tiktoken>=0.8.0",
18
  "torch==2.4.0",
19
+ "transformers>=4.47.1",
20
  ]
21
+
22
+ [tool.ruff]
23
+ line-length = 119
24
+
25
+ [tool.ruff.lint]
26
+ select = ["ALL"]
27
+ ignore = [
28
+ "COM812", # missing-trailing-comma
29
+ "D203", # one-blank-line-before-class
30
+ "D213", # multi-line-summary-second-line
31
+ "E501", # line-too-long
32
+ "SIM117", # multiple-with-statements
33
+ ]
34
+ extend-ignore = [
35
+ "D100", # undocumented-public-module
36
+ "D101", # undocumented-public-class
37
+ "D102", # undocumented-public-method
38
+ "D103", # undocumented-public-function
39
+ "D104", # undocumented-public-package
40
+ "D105", # undocumented-magic-method
41
+ "D107", # undocumented-public-init
42
+ "EM101", # raw-string-in-exception
43
+ "FBT001", # boolean-type-hint-positional-argument
44
+ "FBT002", # boolean-default-value-positional-argument
45
+ "PD901", # pandas-df-variable-name
46
+ "PGH003", # blanket-type-ignore
47
+ "PLR0913", # too-many-arguments
48
+ "PLR0915", # too-many-statements
49
+ "TRY003", # raise-vanilla-args
50
+ ]
51
+ unfixable = [
52
+ "F401", # unused-import
53
+ ]
54
+
55
+ [tool.ruff.format]
56
+ docstring-code-format = true
requirements.txt CHANGED
@@ -1,36 +1,36 @@
1
  # This file was autogenerated by uv via the following command:
2
  # uv pip compile pyproject.toml -o requirements.txt
3
- accelerate==1.0.1
4
  # via swallow-13b-instruct (pyproject.toml)
5
  aiofiles==23.2.1
6
  # via gradio
7
  annotated-types==0.7.0
8
  # via pydantic
9
- anyio==4.6.2.post1
10
  # via
11
  # gradio
12
  # httpx
13
  # starlette
14
- bitsandbytes==0.44.1
15
  # via swallow-13b-instruct (pyproject.toml)
16
  blobfile==3.0.0
17
  # via swallow-13b-instruct (pyproject.toml)
18
- certifi==2024.8.30
19
  # via
20
  # httpcore
21
  # httpx
22
  # requests
23
- charset-normalizer==3.4.0
24
  # via requests
25
- click==8.1.7
26
  # via
27
  # typer
28
  # uvicorn
29
  exceptiongroup==1.2.2
30
  # via anyio
31
- fastapi==0.115.2
32
  # via gradio
33
- ffmpy==0.4.0
34
  # via gradio
35
  filelock==3.16.1
36
  # via
@@ -39,16 +39,16 @@ filelock==3.16.1
39
  # torch
40
  # transformers
41
  # triton
42
- fsspec==2024.9.0
43
  # via
44
  # gradio-client
45
  # huggingface-hub
46
  # torch
47
- gradio==5.1.0
48
  # via
49
  # swallow-13b-instruct (pyproject.toml)
50
  # spaces
51
- gradio-client==1.4.0
52
  # via gradio
53
  h11==0.14.0
54
  # via
@@ -56,14 +56,15 @@ h11==0.14.0
56
  # uvicorn
57
  hf-transfer==0.1.8
58
  # via swallow-13b-instruct (pyproject.toml)
59
- httpcore==1.0.6
60
  # via httpx
61
- httpx==0.27.2
62
  # via
63
  # gradio
64
  # gradio-client
 
65
  # spaces
66
- huggingface-hub==0.26.0
67
  # via
68
  # accelerate
69
  # gradio
@@ -75,7 +76,7 @@ idna==3.10
75
  # anyio
76
  # httpx
77
  # requests
78
- jinja2==3.1.4
79
  # via
80
  # gradio
81
  # torch
@@ -91,9 +92,9 @@ mdurl==0.1.2
91
  # via markdown-it-py
92
  mpmath==1.3.0
93
  # via sympy
94
- networkx==3.4.1
95
  # via torch
96
- numpy==2.1.2
97
  # via
98
  # accelerate
99
  # bitsandbytes
@@ -125,15 +126,15 @@ nvidia-cusparse-cu12==12.1.0.106
125
  # torch
126
  nvidia-nccl-cu12==2.20.5
127
  # via torch
128
- nvidia-nvjitlink-cu12==12.6.77
129
  # via
130
  # nvidia-cusolver-cu12
131
  # nvidia-cusparse-cu12
132
  nvidia-nvtx-cu12==12.1.105
133
  # via torch
134
- orjson==3.10.9
135
  # via gradio
136
- packaging==24.1
137
  # via
138
  # accelerate
139
  # gradio
@@ -143,9 +144,9 @@ packaging==24.1
143
  # transformers
144
  pandas==2.2.3
145
  # via gradio
146
- pillow==10.4.0
147
  # via gradio
148
- protobuf==5.28.2
149
  # via swallow-13b-instruct (pyproject.toml)
150
  psutil==5.9.8
151
  # via
@@ -153,12 +154,12 @@ psutil==5.9.8
153
  # spaces
154
  pycryptodomex==3.21.0
155
  # via blobfile
156
- pydantic==2.9.2
157
  # via
158
  # fastapi
159
  # gradio
160
  # spaces
161
- pydantic-core==2.23.4
162
  # via pydantic
163
  pydub==0.25.1
164
  # via gradio
@@ -166,7 +167,7 @@ pygments==2.18.0
166
  # via rich
167
  python-dateutil==2.9.0.post0
168
  # via pandas
169
- python-multipart==0.0.12
170
  # via gradio
171
  pytz==2024.2
172
  # via pandas
@@ -176,7 +177,7 @@ pyyaml==6.0.2
176
  # gradio
177
  # huggingface-hub
178
  # transformers
179
- regex==2024.9.11
180
  # via
181
  # tiktoken
182
  # transformers
@@ -186,9 +187,11 @@ requests==2.32.3
186
  # spaces
187
  # tiktoken
188
  # transformers
189
- rich==13.9.2
190
  # via typer
191
- ruff==0.7.0
 
 
192
  # via gradio
193
  safetensors==0.4.5
194
  # via
@@ -198,46 +201,47 @@ semantic-version==2.10.0
198
  # via gradio
199
  sentencepiece==0.2.0
200
  # via swallow-13b-instruct (pyproject.toml)
201
- setuptools==75.2.0
202
  # via swallow-13b-instruct (pyproject.toml)
203
  shellingham==1.5.4
204
  # via typer
205
- six==1.16.0
206
  # via python-dateutil
207
  sniffio==1.3.1
208
- # via
209
- # anyio
210
- # httpx
211
- spaces==0.30.4
212
  # via swallow-13b-instruct (pyproject.toml)
213
- starlette==0.40.0
214
- # via fastapi
 
 
215
  sympy==1.13.3
216
  # via torch
217
  tiktoken==0.8.0
218
  # via swallow-13b-instruct (pyproject.toml)
219
- tokenizers==0.20.1
220
  # via transformers
221
- tomlkit==0.12.0
222
  # via gradio
223
  torch==2.4.0
224
  # via
225
  # swallow-13b-instruct (pyproject.toml)
226
  # accelerate
227
  # bitsandbytes
228
- tqdm==4.66.5
229
  # via
230
  # huggingface-hub
231
  # transformers
232
- transformers==4.45.2
233
  # via swallow-13b-instruct (pyproject.toml)
234
  triton==3.0.0
235
  # via torch
236
- typer==0.12.5
237
  # via gradio
238
  typing-extensions==4.12.2
239
  # via
240
  # anyio
 
241
  # fastapi
242
  # gradio
243
  # gradio-client
@@ -251,11 +255,11 @@ typing-extensions==4.12.2
251
  # uvicorn
252
  tzdata==2024.2
253
  # via pandas
254
- urllib3==2.2.3
255
  # via
256
  # blobfile
257
  # requests
258
- uvicorn==0.32.0
259
  # via gradio
260
- websockets==12.0
261
  # via gradio-client
 
1
  # This file was autogenerated by uv via the following command:
2
  # uv pip compile pyproject.toml -o requirements.txt
3
+ accelerate==1.2.1
4
  # via swallow-13b-instruct (pyproject.toml)
5
  aiofiles==23.2.1
6
  # via gradio
7
  annotated-types==0.7.0
8
  # via pydantic
9
+ anyio==4.7.0
10
  # via
11
  # gradio
12
  # httpx
13
  # starlette
14
+ bitsandbytes==0.45.0
15
  # via swallow-13b-instruct (pyproject.toml)
16
  blobfile==3.0.0
17
  # via swallow-13b-instruct (pyproject.toml)
18
+ certifi==2024.12.14
19
  # via
20
  # httpcore
21
  # httpx
22
  # requests
23
+ charset-normalizer==3.4.1
24
  # via requests
25
+ click==8.1.8
26
  # via
27
  # typer
28
  # uvicorn
29
  exceptiongroup==1.2.2
30
  # via anyio
31
+ fastapi==0.115.6
32
  # via gradio
33
+ ffmpy==0.5.0
34
  # via gradio
35
  filelock==3.16.1
36
  # via
 
39
  # torch
40
  # transformers
41
  # triton
42
+ fsspec==2024.12.0
43
  # via
44
  # gradio-client
45
  # huggingface-hub
46
  # torch
47
+ gradio==5.9.1
48
  # via
49
  # swallow-13b-instruct (pyproject.toml)
50
  # spaces
51
+ gradio-client==1.5.2
52
  # via gradio
53
  h11==0.14.0
54
  # via
 
56
  # uvicorn
57
  hf-transfer==0.1.8
58
  # via swallow-13b-instruct (pyproject.toml)
59
+ httpcore==1.0.7
60
  # via httpx
61
+ httpx==0.28.1
62
  # via
63
  # gradio
64
  # gradio-client
65
+ # safehttpx
66
  # spaces
67
+ huggingface-hub==0.27.0
68
  # via
69
  # accelerate
70
  # gradio
 
76
  # anyio
77
  # httpx
78
  # requests
79
+ jinja2==3.1.5
80
  # via
81
  # gradio
82
  # torch
 
92
  # via markdown-it-py
93
  mpmath==1.3.0
94
  # via sympy
95
+ networkx==3.4.2
96
  # via torch
97
+ numpy==2.2.1
98
  # via
99
  # accelerate
100
  # bitsandbytes
 
126
  # torch
127
  nvidia-nccl-cu12==2.20.5
128
  # via torch
129
+ nvidia-nvjitlink-cu12==12.6.85
130
  # via
131
  # nvidia-cusolver-cu12
132
  # nvidia-cusparse-cu12
133
  nvidia-nvtx-cu12==12.1.105
134
  # via torch
135
+ orjson==3.10.13
136
  # via gradio
137
+ packaging==24.2
138
  # via
139
  # accelerate
140
  # gradio
 
144
  # transformers
145
  pandas==2.2.3
146
  # via gradio
147
+ pillow==11.1.0
148
  # via gradio
149
+ protobuf==5.29.2
150
  # via swallow-13b-instruct (pyproject.toml)
151
  psutil==5.9.8
152
  # via
 
154
  # spaces
155
  pycryptodomex==3.21.0
156
  # via blobfile
157
+ pydantic==2.10.4
158
  # via
159
  # fastapi
160
  # gradio
161
  # spaces
162
+ pydantic-core==2.27.2
163
  # via pydantic
164
  pydub==0.25.1
165
  # via gradio
 
167
  # via rich
168
  python-dateutil==2.9.0.post0
169
  # via pandas
170
+ python-multipart==0.0.20
171
  # via gradio
172
  pytz==2024.2
173
  # via pandas
 
177
  # gradio
178
  # huggingface-hub
179
  # transformers
180
+ regex==2024.11.6
181
  # via
182
  # tiktoken
183
  # transformers
 
187
  # spaces
188
  # tiktoken
189
  # transformers
190
+ rich==13.9.4
191
  # via typer
192
+ ruff==0.8.4
193
+ # via gradio
194
+ safehttpx==0.1.6
195
  # via gradio
196
  safetensors==0.4.5
197
  # via
 
201
  # via gradio
202
  sentencepiece==0.2.0
203
  # via swallow-13b-instruct (pyproject.toml)
204
+ setuptools==75.6.0
205
  # via swallow-13b-instruct (pyproject.toml)
206
  shellingham==1.5.4
207
  # via typer
208
+ six==1.17.0
209
  # via python-dateutil
210
  sniffio==1.3.1
211
+ # via anyio
212
+ spaces==0.31.1
 
 
213
  # via swallow-13b-instruct (pyproject.toml)
214
+ starlette==0.41.3
215
+ # via
216
+ # fastapi
217
+ # gradio
218
  sympy==1.13.3
219
  # via torch
220
  tiktoken==0.8.0
221
  # via swallow-13b-instruct (pyproject.toml)
222
+ tokenizers==0.21.0
223
  # via transformers
224
+ tomlkit==0.13.2
225
  # via gradio
226
  torch==2.4.0
227
  # via
228
  # swallow-13b-instruct (pyproject.toml)
229
  # accelerate
230
  # bitsandbytes
231
+ tqdm==4.67.1
232
  # via
233
  # huggingface-hub
234
  # transformers
235
+ transformers==4.47.1
236
  # via swallow-13b-instruct (pyproject.toml)
237
  triton==3.0.0
238
  # via torch
239
+ typer==0.15.1
240
  # via gradio
241
  typing-extensions==4.12.2
242
  # via
243
  # anyio
244
+ # bitsandbytes
245
  # fastapi
246
  # gradio
247
  # gradio-client
 
255
  # uvicorn
256
  tzdata==2024.2
257
  # via pandas
258
+ urllib3==2.3.0
259
  # via
260
  # blobfile
261
  # requests
262
+ uvicorn==0.34.0
263
  # via gradio
264
+ websockets==14.1
265
  # via gradio-client
uv.lock CHANGED
The diff for this file is too large to render. See raw diff