Spaces:

luminoussg
/

token_counter

Sleeping

luminoussg committed on Oct 16, 2024

Commit

169e43b

verified ·

1 Parent(s): ececca0

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,6 +1,7 @@
 import gradio as gr
 import tiktoken
 import json
 # Function to count tokens in the dataset based on the "messages" field
 def count_tokens(json_file, encoding_name):
@@ -58,6 +59,15 @@ with gr.Blocks() as app:
         json_input = gr.File(label="Upload JSON/JSONL File")
         encoding_dropdown = gr.Dropdown(choices=encoding_options, label="Select Encoding", value="o200k_base (gpt-4o, gpt-4o-mini)")
     # Output for individual conversation token counts
     conversation_output = gr.JSON(label="Token Counts per Conversation")

 import gradio as gr
 import tiktoken
 import json
+import os
 # Function to count tokens in the dataset based on the "messages" field
 def count_tokens(json_file, encoding_name):
         json_input = gr.File(label="Upload JSON/JSONL File")
         encoding_dropdown = gr.Dropdown(choices=encoding_options, label="Select Encoding", value="o200k_base (gpt-4o, gpt-4o-mini)")
+    # Example file (this will automatically upload when clicked)
+    example_file_path = "keivalyaMedQuad-MedicalQnADataset_valid.jsonl"
+    if os.path.exists(example_file_path):
+        example = gr.Examples(
+            examples=[example_file_path],
+            inputs=json_input,
+            label="Click here to load the example file"
+        )
     # Output for individual conversation token counts
     conversation_output = gr.JSON(label="Token Counts per Conversation")