nguyenbh committed
Commit 5f2dccf · Parent(s): d00bdd7

Add penalty control
Files changed (1): app.py (+37, −13)

app.py CHANGED
@@ -29,6 +29,8 @@ except Exception as e:
 default_temperature = 0.7
 default_max_tokens = 4096
 default_top_p = 0.1
+default_presence_penalty = 0.0
+default_frequency_penalty = 0.0
 
 # Example prompts that users can try
 example_prompts = [
@@ -39,7 +41,7 @@ example_prompts = [
     "I have $20,000 in my savings account, where I receive a 4% profit per year and payments twice a year. Can you please tell me how long it will take for me to become a millionaire?",
 ]
 
-def get_azure_response(message, chat_history, temperature, max_tokens, top_p):
+def get_azure_response(message, chat_history, temperature, max_tokens, top_p, presence_penalty, frequency_penalty):
     """
     Function to get a response from the Azure Phi-4 model
     """
@@ -61,8 +63,8 @@ def get_azure_response(message, chat_history, temperature, max_tokens, top_p):
         "max_tokens": max_tokens,
         "temperature": temperature,
         "top_p": top_p,
-        "presence_penalty": 0,
-        "frequency_penalty": 0,
+        "presence_penalty": presence_penalty,
+        "frequency_penalty": frequency_penalty,
         "stream": True
     }
 
@@ -277,6 +279,10 @@ with gr.Blocks(css=custom_css, title="Phi-4-mini Playground") as demo:
     # Header section
     with gr.Column(elem_classes="header"):
         gr.Markdown("# Phi-4-mini Playground")
+        gr.Markdown("""This demo allows you to interact with the [Phi-4-Mini](https://aka.ms/phi-4-multimodal/techreport).
+        Other demos include [Thoughts Organizer](https://microsoft-thoughtsorganizer.hf.space/),
+        [Stories Come Alive](https://microsoft-storiescomealive.hf.space/),
+        [Phine Speech Translator](https://microsoft-phinespeechtranslator.hf.space/)""")
 
     # Main content with side-by-side layout
     with gr.Row():
@@ -343,18 +349,36 @@ with gr.Blocks(css=custom_css, title="Phi-4-mini Playground") as demo:
                     label="Max Tokens",
                     info="Maximum length of response"
                 )
+
+                # New sliders for presence and frequency penalty
+                presence_penalty_slider = gr.Slider(
+                    minimum=-2.0,
+                    maximum=2.0,
+                    value=default_presence_penalty,
+                    step=0.1,
+                    label="Presence Penalty",
+                    info="Positive values increase likelihood to talk about new topics"
+                )
+                frequency_penalty_slider = gr.Slider(
+                    minimum=-2.0,
+                    maximum=2.0,
+                    value=default_frequency_penalty,
+                    step=0.1,
+                    label="Frequency Penalty",
+                    info="Positive values decrease likelihood to repeat the same text"
+                )
 
     # Footer
     with gr.Column(elem_classes="footer"):
         gr.Markdown("Powered by Microsoft [Phi-4 mini model](https://aka.ms/phi-4-mini/azure) on Azure AI. © 2025")
 
     # Simplified chat function that handles both sending and receiving messages
-    def chat(message, history, temperature, max_tokens, top_p):
+    def chat(message, history, temperature, max_tokens, top_p, presence_penalty, frequency_penalty):
         if not message.strip():
             return "", history
 
         # Get response from Azure
-        response = get_azure_response(message, history, temperature, max_tokens, top_p)
+        response = get_azure_response(message, history, temperature, max_tokens, top_p, presence_penalty, frequency_penalty)
 
         # Add the exchange to history
         history.append((message, ""))
@@ -387,10 +411,10 @@ with gr.Blocks(css=custom_css, title="Phi-4-mini Playground") as demo:
 
     # Function to clear the conversation
     def clear_conversation():
-        return [], default_temperature, default_max_tokens, default_top_p
+        return [], default_temperature, default_max_tokens, default_top_p, default_presence_penalty, default_frequency_penalty
 
     # Function to regenerate the last response
-    def regenerate_response(history, temperature, max_tokens, top_p):
+    def regenerate_response(history, temperature, max_tokens, top_p, presence_penalty, frequency_penalty):
         if not history:
             return history
 
@@ -399,7 +423,7 @@ with gr.Blocks(css=custom_css, title="Phi-4-mini Playground") as demo:
         history = history[:-1]
 
         # Get new response
-        response = get_azure_response(last_user_message, history, temperature, max_tokens, top_p)
+        response = get_azure_response(last_user_message, history, temperature, max_tokens, top_p, presence_penalty, frequency_penalty)
 
         # Add the exchange to history
         history.append((last_user_message, ""))
@@ -423,10 +447,10 @@ with gr.Blocks(css=custom_css, title="Phi-4-mini Playground") as demo:
         return history
 
     # Set up event handlers
-    msg.submit(chat, [msg, chatbot, temp_slider, max_tokens_slider, top_p_slider], [msg, chatbot])
-    send_btn.click(chat, [msg, chatbot, temp_slider, max_tokens_slider, top_p_slider], [msg, chatbot])
-    clear.click(clear_conversation, None, [chatbot, temp_slider, max_tokens_slider, top_p_slider])
-    regenerate.click(regenerate_response, [chatbot, temp_slider, max_tokens_slider, top_p_slider], [chatbot])
+    msg.submit(chat, [msg, chatbot, temp_slider, max_tokens_slider, top_p_slider, presence_penalty_slider, frequency_penalty_slider], [msg, chatbot])
+    send_btn.click(chat, [msg, chatbot, temp_slider, max_tokens_slider, top_p_slider, presence_penalty_slider, frequency_penalty_slider], [msg, chatbot])
+    clear.click(clear_conversation, None, [chatbot, temp_slider, max_tokens_slider, top_p_slider, presence_penalty_slider, frequency_penalty_slider])
+    regenerate.click(regenerate_response, [chatbot, temp_slider, max_tokens_slider, top_p_slider, presence_penalty_slider, frequency_penalty_slider], [chatbot])
 
 # Launch the app
-demo.launch(share=True)  # Set share=True to generate a public URL for testing# Launch the app
+demo.launch(share=True)  # Set share=True to generate a public URL for testing
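
For reference, below is a minimal, hypothetical sketch (not part of the commit) of the streamed request that the updated get_azure_response now builds, with the two new penalty fields included in the payload. Only the payload keys come from this diff; the endpoint URL, API key, header names, and the use of the requests library are assumptions for illustration.

# Hypothetical standalone example: sends the same payload shape that
# get_azure_response builds, with the new penalty fields wired in.
import requests

endpoint = "https://<your-deployment>.inference.ai.azure.com/v1/chat/completions"  # placeholder, assumed URL shape
api_key = "<your-api-key>"  # placeholder

payload = {
    "messages": [{"role": "user", "content": "Write a two-line poem about the sea."}],
    "max_tokens": 4096,           # default_max_tokens
    "temperature": 0.7,           # default_temperature
    "top_p": 0.1,                 # default_top_p
    "presence_penalty": 0.0,      # now taken from presence_penalty_slider
    "frequency_penalty": 0.0,     # now taken from frequency_penalty_slider
    "stream": True,
}

with requests.post(
    endpoint,
    headers={"Authorization": f"Bearer {api_key}", "Content-Type": "application/json"},
    json=payload,
    stream=True,
) as response:
    response.raise_for_status()
    for line in response.iter_lines():
        if line:
            # Each non-empty line is a server-sent-events chunk ("data: {...}");
            # a real client would parse the JSON and accumulate the streamed deltas.
            print(line.decode("utf-8"))

As the new slider descriptions note, a positive presence_penalty nudges the model toward new topics, while a positive frequency_penalty discourages repeating the same text.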