|
import logging |
|
import os |
|
import re |
|
import warnings |
|
|
|
import gradio as gr |
|
import requests |
|
import torch |
|
from transformers import AutoModelForSpeechSeq2Seq, AutoProcessor, pipeline, Pipeline |
|
|
|
from templates import starting_app_code, update_iframe_js, copy_snippet_js, download_code_js, load_js, DemoType |
|
|
|
|
|
warnings.filterwarnings("ignore", message='Trying to convert audio automatically from int32 to 16-bit int format') |
|
|
|
logging.basicConfig( |
|
level=logging.INFO, |
|
format="%(asctime)s - %(message)s", |
|
datefmt="%Y-%m-%d %H:%M:%S", |
|
) |
|
|
|
logger = logging.getLogger("my_logger") |
|
|
|
HF_TOKEN = os.getenv("HF_TOKEN") |
|
|
|
if not HF_TOKEN: |
|
raise Exception("HF_TOKEN environment variable is required to call remote API.") |
|
|
|
API_URL = "https://api-inference.huggingface.co/models/HuggingFaceH4/zephyr-7b-beta" |
|
headers = {"Authorization": f"Bearer {HF_TOKEN}"} |
|
|
|
|
|
def init_speech_to_text_model() -> Pipeline: |
|
device = "cuda:0" if torch.cuda.is_available() else "cpu" |
|
torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32 |
|
|
|
model_id = "distil-whisper/distil-medium.en" |
|
model = AutoModelForSpeechSeq2Seq.from_pretrained( |
|
model_id, torch_dtype=torch_dtype, low_cpu_mem_usage=True, use_safetensors=True |
|
) |
|
model.to(device) |
|
processor = AutoProcessor.from_pretrained(model_id) |
|
return pipeline( |
|
"automatic-speech-recognition", |
|
model=model, |
|
tokenizer=processor.tokenizer, |
|
feature_extractor=processor.feature_extractor, |
|
max_new_tokens=128, |
|
torch_dtype=torch_dtype, |
|
device=device, |
|
) |
|
|
|
|
|
whisper_pipe = init_speech_to_text_model() |
|
|
|
code_pattern = re.compile(r'```python\n(.*?)```', re.DOTALL) |
|
|
|
|
|
def query(payload: dict): |
|
response = requests.post(API_URL, headers=headers, json=payload) |
|
return response.json() |
|
|
|
|
|
def generate_text(code: str, prompt: str) -> (str, str, str): |
|
logger.info(f"Calling API with prompt:\n{prompt}") |
|
prompt = f"```python\n{code}```\nGiven the code above return only updated code for the following request:\n{prompt}\n<|assistant|>" |
|
params = {"max_new_tokens": 512} |
|
output = query({"inputs": prompt, "parameters": params}) |
|
if 'error' in output: |
|
logger.warning(f'Language model call failed: {output["error"]}') |
|
raise gr.Warning(f'Language model call failed: {output["error"]}') |
|
logger.info(f'API RESPONSE\n{output[0]["generated_text"]}') |
|
assistant_reply = output[0]["generated_text"].split('<|assistant|>')[1] |
|
match = re.search(code_pattern, assistant_reply) |
|
if not match: |
|
return assistant_reply, code, None |
|
new_code = match.group(1) |
|
logger.info(f'NEW CODE:\nnew_code') |
|
return assistant_reply, new_code, None |
|
|
|
|
|
def transcribe(audio: str) -> (str, str): |
|
result = whisper_pipe(audio) |
|
return result["text"], None |
|
|
|
|
|
def copy_notify(code): |
|
gr.Info("App code snippet copied!") |
|
|
|
|
|
def add_hotkeys() -> str: |
|
return """() => { |
|
function gradioApp() { |
|
const elems = document.getElementsByTagName('gradio-app'); |
|
const elem = elems.length == 0 ? document : elems[0]; |
|
|
|
if (elem !== document) { |
|
elem.getElementById = function(id) { |
|
return document.getElementById(id); |
|
}; |
|
} |
|
return elem.shadowRoot ? elem.shadowRoot : elem; |
|
} |
|
window.addEventListener('keydown', (e) => { |
|
if (e.keyCode == 192 && e.ctrlKey) { // CTRL + ` key |
|
const recordButton = gradioApp().querySelector("div.mic-wrap > button"); |
|
console.log(recordButton); |
|
recordButton.click(); |
|
} |
|
}); |
|
} |
|
""" |
|
|
|
|
|
with gr.Blocks() as demo: |
|
gr.Markdown("<h1 id=\"TEST\" align=\"center\">KiteWind πͺπ</h1>") |
|
gr.Markdown( |
|
"<h4 align=\"center\">Chat-assisted web app creator by <a href=\"https://huggingface.co/gstaff\">@gstaff</a></h4>") |
|
selectedTab = gr.State(value='stlite') |
|
with gr.Tab('Streamlit (stlite)') as stlite_tab: |
|
with gr.Row(): |
|
with gr.Column(): |
|
gr.Markdown("## 1. Run your app in the browser!") |
|
gr.HTML(value='<div id="stliteDemoDiv"></div>') |
|
gr.Markdown("## 2. Customize using voice requests!") |
|
with gr.Row(): |
|
with gr.Column(): |
|
with gr.Group(): |
|
in_audio = gr.Audio(label="Record a voice request (click or press ctrl + ` to start/stop)", source='microphone', type='filepath') |
|
in_prompt = gr.Textbox(label="Or type a text request and press Enter", |
|
placeholder="Need an idea? Try one of these:\n- Add a button to reverse the name\n- Change the greeting to Spanish\n- Make the button primary") |
|
out_text = gr.TextArea(label="Chat Assistant Response") |
|
clear_btn = gr.ClearButton([in_prompt, in_audio, out_text]) |
|
with gr.Column(): |
|
code_area = gr.Code(label="App Code - You can also edit directly and then click Update App", |
|
language='python', value=starting_app_code(DemoType.STREAMLIT)) |
|
update_btn = gr.Button("Update App", variant="primary") |
|
code_update_params = {'fn': None, 'inputs': code_area, 'outputs': None, |
|
'_js': update_iframe_js(DemoType.STREAMLIT)} |
|
gen_text_params = {'fn': generate_text, 'inputs': [code_area, in_prompt], |
|
'outputs': [out_text, code_area]} |
|
transcribe_params = {'fn': transcribe, 'inputs': [in_audio], 'outputs': [in_prompt, in_audio]} |
|
update_btn.click(**code_update_params) |
|
in_prompt.submit(**gen_text_params).then(**code_update_params) |
|
in_audio.stop_recording(**transcribe_params).then(**gen_text_params).then(**code_update_params) |
|
with gr.Row(): |
|
with gr.Column(): |
|
gr.Markdown("## 3. Export your app to share!") |
|
copy_snippet_btn = gr.Button("Copy app snippet to paste in another page") |
|
copy_snippet_btn.click(copy_notify, code_area, None, _js=copy_snippet_js(DemoType.STREAMLIT)) |
|
download_btn = gr.Button("Download app as a standalone file") |
|
download_btn.click(None, code_area, None, _js=download_code_js(DemoType.STREAMLIT)) |
|
with gr.Row(): |
|
with gr.Column(): |
|
gr.Markdown("## Current limitations") |
|
with gr.Accordion("Click to view", open=False): |
|
gr.Markdown( |
|
"- Only Streamlit apps using libraries available in pyodide are supported\n- The chat hasn't been tuned on Streamlit library data; it may make mistakes") |
|
with gr.Tab('Gradio (gradio-lite)') as gradio_lite_tab: |
|
with gr.Row(): |
|
with gr.Column(): |
|
gr.Markdown("## 1. Run your app in the browser!") |
|
gr.HTML(value='<div id="gradioDemoDiv"></div>') |
|
gr.Markdown("## 2. Customize using voice requests!") |
|
with gr.Row(): |
|
with gr.Column(): |
|
with gr.Group(): |
|
in_audio = gr.Audio(label="Record a voice request (click or press ctrl + ` to start/stop)", source='microphone', type='filepath') |
|
in_prompt = gr.Textbox(label="Or type a text request and press Enter", |
|
placeholder="Need an idea? Try one of these:\n- Add a button to reverse the name\n- Change the greeting to Hola\n- Put the reversed name output into a separate textbox\n- Change the theme from monochrome to soft") |
|
out_text = gr.TextArea(label="Chat Assistant Response") |
|
clear = gr.ClearButton([in_prompt, in_audio, out_text]) |
|
with gr.Column(): |
|
code_area = gr.Code(label="App Code - You can also edit directly and then click Update App", |
|
language='python', value=starting_app_code(DemoType.GRADIO)) |
|
update_btn = gr.Button("Update App", variant="primary") |
|
code_update_params = {'fn': None, 'inputs': code_area, 'outputs': None, |
|
'_js': update_iframe_js(DemoType.GRADIO)} |
|
gen_text_params = {'fn': generate_text, 'inputs': [code_area, in_prompt], |
|
'outputs': [out_text, code_area]} |
|
transcribe_params = {'fn': transcribe, 'inputs': [in_audio], 'outputs': [in_prompt, in_audio]} |
|
update_btn.click(**code_update_params) |
|
in_prompt.submit(**gen_text_params).then(**code_update_params) |
|
in_audio.stop_recording(**transcribe_params).then(**gen_text_params).then(**code_update_params) |
|
with gr.Row(): |
|
with gr.Column(): |
|
gr.Markdown("## 3. Export your app to share!") |
|
copy_snippet_btn = gr.Button("Copy app snippet to paste in another page") |
|
copy_snippet_btn.click(copy_notify, code_area, None, _js=copy_snippet_js(DemoType.GRADIO)) |
|
download_btn = gr.Button("Download app as a standalone file") |
|
download_btn.click(None, code_area, None, _js=download_code_js(DemoType.GRADIO)) |
|
with gr.Row(): |
|
with gr.Column(): |
|
gr.Markdown("## Current limitations") |
|
with gr.Accordion("Click to view", open=False): |
|
gr.Markdown( |
|
"- Only gradio-lite apps using the python standard libraries and gradio are supported\n- The chat hasn't been tuned on gradio library data; it may make mistakes\n- The app needs to fully reload each time it is changed") |
|
|
|
stlite_tab.select(lambda: "stlite", None, selectedTab).then(None, None, None, _js=load_js(DemoType.STREAMLIT)) |
|
gradio_lite_tab.select(lambda: "gradio-lite", None, selectedTab).then(None, None, None, |
|
_js=load_js(DemoType.GRADIO)) |
|
demo.load(None, None, None, _js=load_js(DemoType.STREAMLIT)) |
|
demo.load(None, None, None, _js=add_hotkeys()) |
|
demo.css = "footer {visibility: hidden}" |
|
|
|
if __name__ == "__main__": |
|
demo.queue().launch() |
|
|