Spaces:

jiangjiechen
/

tiktoken_count

Running

jiangjiechen committed on Nov 16, 2024

Commit

ede8cb5

1 Parent(s): f7048ce

init

Files changed (2) hide show

app.py ADDED Viewed

+import gradio as gr
+import tiktoken
+def count_tokens(text):
+    """
+    Calculate the number of tokens in the input text using tiktoken.
+    Args:
+        text (str): The input text to be tokenized.
+    Returns:
+        int: The number of tokens in the input text.
+    """
+    # Choose the encoding based on the model you are targeting.
+    # Here, we use 'gpt-3.5-turbo' as an example.
+    encoding = tiktoken.encoding_for_model("gpt-4")
+    # Encode the input text to get the list of token IDs
+    tokens = encoding.encode(text)
+    # Return the number of tokens
+    return len(tokens)
+# Define the Gradio interface
+iface = gr.Interface(
+    fn=count_tokens,                   # The function to call
+    inputs=gr.Textbox(lines=10, placeholder="Enter your text here..."),  # Input component
+    outputs="number",                  # Output component
+    title="Token Counter with tiktoken",
+    description="Enter text below to calculate the number of tokens using the tiktoken library.",
+    examples=[
+        ["Hello, how are you doing today?"],
+        ["Gradio makes it easy to create web apps for machine learning models."],
+        ["OpenAI's GPT models are powerful tools for natural language processing tasks."]
+    ],
+    theme="default"
+)
+# Launch the app
+if __name__ == "__main__":
+    iface.launch()

requirements.txt ADDED Viewed