freddyaboulton (HF staff) committed on
Commit 3112b0d
1 Parent(s): 3c004fa
Files changed (4)
  1. README.md +1 -1
  2. app.py +68 -0
  3. requirements.in +4 -0
  4. requirements.txt +291 -0
README.md CHANGED
@@ -1,6 +1,6 @@
 ---
 title: Smollm Voice Code Editor
-emoji: 📊
+emoji: ⚡️
 colorFrom: pink
 colorTo: blue
 sdk: gradio
app.py ADDED
@@ -0,0 +1,68 @@
+from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
+import gradio as gr
+from gradio_webrtc import WebRTC, ReplyOnPause, AdditionalOutputs
+import numpy as np
+import os
+from twilio.rest import Client
+
+account_sid = os.environ.get("TWILIO_ACCOUNT_SID")
+auth_token = os.environ.get("TWILIO_AUTH_TOKEN")
+
+if account_sid and auth_token:
+    client = Client(account_sid, auth_token)
+
+    token = client.tokens.create()
+
+    rtc_configuration = {
+        "iceServers": token.ice_servers,
+        "iceTransportPolicy": "relay",
+    }
+else:
+    rtc_configuration = None
+
+checkpoint = "HuggingFaceTB/SmolLM2-1.7B-Instruct"
+
+device = "cuda"
+tokenizer = AutoTokenizer.from_pretrained(checkpoint)
+model = AutoModelForCausalLM.from_pretrained(checkpoint).to(device)
+
+whisper = pipeline(
+    model="openai/whisper-large-v3-turbo", device=device
+)
+
+system_prompt = "You are an AI coding assistant. Your task is to write single-file HTML applications based on a user's request. You may also be asked to edit your original response. Only return the code needed to fulfill the request."
+user_prompt = "Please write a single-file HTML application to fulfill the following request. Only return the necessary code. Include all necessary imports and styles.\nThe message:{user_message}\nCurrent code you have written:{code}"
+
+
+
+def generate(user_message: tuple[int, np.ndarray],
+             history: list[dict],
+             code: str):
+
+    msg_text = whisper({"array": user_message[1], "sampling_rate": user_message[0]})["text"]
+    history.append({"role": "user", "content": user_prompt.format(user_message=msg_text, code=code)})
+    input_text = tokenizer.apply_chat_template(history, tokenize=False)
+    inputs = tokenizer.encode(input_text, return_tensors="pt").to(device)
+    outputs = model.generate(inputs, max_new_tokens=500, temperature=0.2, top_p=0.9, do_sample=True)
+    response = tokenizer.decode(outputs[0])
+    output = response[response.rindex("<|im_start|>assistant\n") + len("<|im_start|>assistant\n"):]
+    history.append({"role": "assistant", "content": output})
+    yield AdditionalOutputs(history, output)
+
+
+with gr.Blocks() as demo:
+    history = gr.State([{"role": "system", "content": system_prompt}])
+    with gr.Row():
+        code = gr.Code(language="html")
+        sandbox = gr.HTML("")
+    with gr.Row():
+        webrtc = WebRTC(rtc_configuration=rtc_configuration, mode="send", modality="audio")
+    webrtc.stream(ReplyOnPause(generate),
+                  inputs=[webrtc, history, code],
+                  outputs=[webrtc], time_limit=90)
+    webrtc.on_additional_outputs(lambda history, code: (history, code),
+                                 outputs=[history, code])
+
+if __name__ == "__main__":
+    demo.launch()
+
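In generate, ReplyOnPause fires once the speaker pauses, Whisper transcribes the (sample_rate, array) tuple handed over by the WebRTC component, SmolLM2 is prompted for a single-file HTML app, and AdditionalOutputs routes the updated chat history and code back to the gr.State and gr.Code components via on_additional_outputs. A minimal sketch for smoke-testing the transcription step in isolation, before any WebRTC wiring; the CPU device and the synthetic silent clip are illustrative assumptions, not part of the commit:

    # Hypothetical smoke test (not part of the commit): run the same Whisper
    # pipeline app.py uses on a synthetic clip to confirm the
    # {"array", "sampling_rate"} input format it expects.
    import numpy as np
    from transformers import pipeline

    whisper = pipeline(model="openai/whisper-large-v3-turbo", device="cpu")  # assumption: no GPU

    sampling_rate = 16_000
    audio = np.zeros(sampling_rate, dtype=np.float32)  # one second of float32 silence

    text = whisper({"array": audio, "sampling_rate": sampling_rate})["text"]
    print(repr(text))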
requirements.in ADDED
@@ -0,0 +1,4 @@
+gradio_webrtc[vad]==0.0.12
+numba==0.60.0
+twilio
+transformers
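These four direct dependencies are the input to uv pip compile; the fully pinned requirements.txt below is generated from them, as its header comment records.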
requirements.txt ADDED
@@ -0,0 +1,291 @@
+# This file was autogenerated by uv via the following command:
+#    uv pip compile requirements.in -o requirements.txt
+aiofiles==23.2.1
+    # via gradio
+aiohappyeyeballs==2.4.3
+    # via aiohttp
+aiohttp==3.11.2
+    # via
+    #   aiohttp-retry
+    #   twilio
+aiohttp-retry==2.8.3
+    # via twilio
+aioice==0.9.0
+    # via aiortc
+aiortc==1.9.0
+    # via gradio-webrtc
+aiosignal==1.3.1
+    # via aiohttp
+annotated-types==0.7.0
+    # via pydantic
+anyio==4.6.2.post1
+    # via
+    #   gradio
+    #   httpx
+    #   starlette
+attrs==24.2.0
+    # via aiohttp
+audioread==3.0.1
+    # via librosa
+av==12.3.0
+    # via aiortc
+certifi==2024.8.30
+    # via
+    #   httpcore
+    #   httpx
+    #   requests
+cffi==1.17.1
+    # via
+    #   aiortc
+    #   cryptography
+    #   pylibsrtp
+    #   soundfile
+charset-normalizer==3.4.0
+    # via requests
+click==8.1.7
+    # via
+    #   typer
+    #   uvicorn
+coloredlogs==15.0.1
+    # via onnxruntime
+cryptography==43.0.3
+    # via
+    #   aiortc
+    #   pyopenssl
+decorator==5.1.1
+    # via librosa
+dnspython==2.7.0
+    # via aioice
+fastapi==0.115.5
+    # via gradio
+ffmpy==0.4.0
+    # via gradio
+filelock==3.16.1
+    # via
+    #   huggingface-hub
+    #   transformers
+flatbuffers==24.3.25
+    # via onnxruntime
+frozenlist==1.5.0
+    # via
+    #   aiohttp
+    #   aiosignal
+fsspec==2024.10.0
+    # via
+    #   gradio-client
+    #   huggingface-hub
+google-crc32c==1.6.0
+    # via aiortc
+gradio==5.6.0
+    # via gradio-webrtc
+gradio-client==1.4.3
+    # via gradio
+gradio-webrtc==0.0.12
+    # via -r requirements.in
+h11==0.14.0
+    # via
+    #   httpcore
+    #   uvicorn
+httpcore==1.0.7
+    # via httpx
+httpx==0.27.2
+    # via
+    #   gradio
+    #   gradio-client
+    #   safehttpx
+huggingface-hub==0.26.2
+    # via
+    #   gradio
+    #   gradio-client
+    #   tokenizers
+    #   transformers
+humanfriendly==10.0
+    # via coloredlogs
+idna==3.10
+    # via
+    #   anyio
+    #   httpx
+    #   requests
+    #   yarl
+ifaddr==0.2.0
+    # via aioice
+jinja2==3.1.4
+    # via gradio
+joblib==1.4.2
+    # via
+    #   librosa
+    #   scikit-learn
+lazy-loader==0.4
+    # via librosa
+librosa==0.10.2.post1
+    # via gradio-webrtc
+llvmlite==0.43.0
+    # via numba
+markdown-it-py==3.0.0
+    # via rich
+markupsafe==2.1.5
+    # via
+    #   gradio
+    #   jinja2
+mdurl==0.1.2
+    # via markdown-it-py
+mpmath==1.3.0
+    # via sympy
+msgpack==1.1.0
+    # via librosa
+multidict==6.1.0
+    # via
+    #   aiohttp
+    #   yarl
+numba==0.60.0
+    # via
+    #   -r requirements.in
+    #   librosa
+numpy==2.0.2
+    # via
+    #   gradio
+    #   librosa
+    #   numba
+    #   onnxruntime
+    #   pandas
+    #   scikit-learn
+    #   scipy
+    #   soxr
+    #   transformers
+onnxruntime==1.20.0
+    # via gradio-webrtc
+orjson==3.10.11
+    # via gradio
+packaging==24.2
+    # via
+    #   gradio
+    #   gradio-client
+    #   huggingface-hub
+    #   lazy-loader
+    #   onnxruntime
+    #   pooch
+    #   transformers
+pandas==2.2.3
+    # via gradio
+pillow==11.0.0
+    # via gradio
+platformdirs==4.3.6
+    # via pooch
+pooch==1.8.2
+    # via librosa
+propcache==0.2.0
+    # via
+    #   aiohttp
+    #   yarl
+protobuf==5.28.3
+    # via onnxruntime
+pycparser==2.22
+    # via cffi
+pydantic==2.9.2
+    # via
+    #   fastapi
+    #   gradio
+pydantic-core==2.23.4
+    # via pydantic
+pydub==0.25.1
+    # via gradio
+pyee==12.1.1
+    # via aiortc
+pygments==2.18.0
+    # via rich
+pyjwt==2.10.0
+    # via twilio
+pylibsrtp==0.10.0
+    # via aiortc
+pyopenssl==24.2.1
+    # via aiortc
+python-dateutil==2.9.0.post0
+    # via pandas
+python-multipart==0.0.12
+    # via gradio
+pytz==2024.2
+    # via pandas
+pyyaml==6.0.2
+    # via
+    #   gradio
+    #   huggingface-hub
+    #   transformers
+regex==2024.11.6
+    # via transformers
+requests==2.32.3
+    # via
+    #   huggingface-hub
+    #   pooch
+    #   transformers
+    #   twilio
+rich==13.9.4
+    # via typer
+ruff==0.7.4
+    # via gradio
+safehttpx==0.1.1
+    # via gradio
+safetensors==0.4.5
+    # via transformers
+scikit-learn==1.5.2
+    # via librosa
+scipy==1.14.1
+    # via
+    #   librosa
+    #   scikit-learn
+semantic-version==2.10.0
+    # via gradio
+shellingham==1.5.4
+    # via typer
+six==1.16.0
+    # via python-dateutil
+sniffio==1.3.1
+    # via
+    #   anyio
+    #   httpx
+soundfile==0.12.1
+    # via librosa
+soxr==0.5.0.post1
+    # via librosa
+starlette==0.41.3
+    # via
+    #   fastapi
+    #   gradio
+sympy==1.13.3
+    # via onnxruntime
+threadpoolctl==3.5.0
+    # via scikit-learn
+tokenizers==0.20.3
+    # via transformers
+tomlkit==0.12.0
+    # via gradio
+tqdm==4.67.0
+    # via
+    #   huggingface-hub
+    #   transformers
+transformers==4.46.2
+    # via -r requirements.in
+twilio==9.3.7
+    # via -r requirements.in
+typer==0.13.0
+    # via gradio
+typing-extensions==4.12.2
+    # via
+    #   fastapi
+    #   gradio
+    #   gradio-client
+    #   huggingface-hub
+    #   librosa
+    #   pydantic
+    #   pydantic-core
+    #   pyee
+    #   typer
+tzdata==2024.2
+    # via pandas
+urllib3==2.2.3
+    # via requests
+uvicorn==0.32.0
+    # via gradio
+websockets==12.0
+    # via gradio-client
+yarl==1.17.2
+    # via aiohttp
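Since the Space depends on exact pins (notably gradio-webrtc 0.0.12 against gradio 5.6.0), a drifted environment is a likely source of breakage. A small sanity check one might run after installing; this is a hypothetical helper, not part of the commit:

    # Hypothetical check (not part of the commit): compare a few installed
    # versions against the pins in requirements.txt above. Assumes a modern
    # Python (3.10+), where importlib.metadata normalizes dashes/underscores
    # in distribution names.
    from importlib.metadata import version

    expected = {
        "gradio": "5.6.0",
        "gradio-webrtc": "0.0.12",
        "transformers": "4.46.2",
        "twilio": "9.3.7",
        "numba": "0.60.0",
    }

    for name, pin in expected.items():
        installed = version(name)
        status = "ok" if installed == pin else f"MISMATCH (pinned {pin})"
        print(f"{name}=={installed}  {status}")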