Spaces:

Koshti10
/

LLMCalc

Running

App Files Community

carbonnnnn committed on Oct 7, 2024

Commit

d8f251a

1 Parent(s): bbae640

update fetching

Browse files

Files changed (3) hide show

app.py +2 -10
src/__pycache__/pricing.cpython-310.pyc +0 -0
src/pricing.py +29 -60

app.py CHANGED Viewed

@@ -2,10 +2,10 @@ import pandas as pd
 import gradio as gr
 import asyncio  # Ensure asyncio is imported
-from src.pricing import get_pricing_df
-text_leaderboard = get_pricing_df()
 llm_calc_app = gr.Blocks()
 with llm_calc_app:
@@ -18,13 +18,5 @@ with llm_calc_app:
                         )
     llm_calc_app.load()
-# # Ensure the app runs in an asyncio event loop
-# async def main():
-#     llm_calc_app.queue()
-#     await llm_calc_app.launch()
-# Run the async main function
-# asyncio.run(main())
 llm_calc_app.queue()
 llm_calc_app.launch()

 import gradio as gr
 import asyncio  # Ensure asyncio is imported
+from src.pricing import fetch_prices
+text_leaderboard = fetch_prices()
 llm_calc_app = gr.Blocks()
 with llm_calc_app:
                         )
     llm_calc_app.load()
 llm_calc_app.queue()
 llm_calc_app.launch()

src/__pycache__/pricing.cpython-310.pyc CHANGED Viewed

Binary files a/src/__pycache__/pricing.cpython-310.pyc and b/src/__pycache__/pricing.cpython-310.pyc differ

src/pricing.py CHANGED Viewed

@@ -1,61 +1,30 @@
-import asyncio
-from pyppeteer import launch
-from bs4 import BeautifulSoup
-import pandas as pd  # Add this import for DataFrame functionality
-async def main():
-    # Launch the browser in headless mode
-    browser = await launch(headless=True)
-    page = await browser.newPage()
-    # Find the table in the HTML
-    await page.goto('https://llm-price.com/')
-    await page.waitForSelector('#tableBody')
-    content = await page.content()
-    soup = BeautifulSoup(content, 'html.parser')
-    table = soup.find('table')
-    # Check if the table is found
-    if table:
-        model_names = []
-        # providers = [] # Skip providers, only uses .svg logos on the website, use sources (col4) instead
-        input_tokens = []
-        output_tokens = []
-        sources = []
-        updated_times = []
-        # Iterate through the rows of the table
-        for row in table.find_all('tr')[1:]:  # Skip the header row
-            cols = row.find_all('td')
-            if len(cols) > 0:
-                model_names.append(cols[0].text.strip())
-                # providers.append(cols[1].text.strip())
-                input_tokens.append(cols[2].text.strip())
-                output_tokens.append(cols[3].text.strip())
-                sources.append(cols[4].text.strip())
-                updated_times.append(cols[5].text.strip())
-        # Create a DataFrame from the collected data
-        data = {
-            'Model Name': model_names,
-            # 'Providers': providers,
-            '1 M Input Tokens': input_tokens,
-            '1 M Output Tokens': output_tokens,
-            'Source': sources,
-            'Updated Time': updated_times
-        }
-        df = pd.DataFrame(data)
-        return df
     else:
-        print("Table not found.")
-    # Close the browser
-    await browser.close()
-# Run the main function
-def get_pricing_df():
-    price_df = asyncio.get_event_loop().run_until_complete(main())
-    return price_df

+import pandas as pd
+import requests
def fetch_prices(url="https://llm-price.huhuhang.workers.dev/", timeout=10):
    """Download LLM pricing records and return them as a DataFrame.

    The endpoint is expected to return a JSON array in which every element
    carries a ``fields`` mapping holding the pricing attributes.

    Args:
        url: Endpoint serving the pricing JSON. Defaults to the public
            llm-price worker.
        timeout: Seconds to wait for the server before giving up. Without a
            timeout ``requests`` may block forever, which would stall
            application start-up.

    Returns:
        A ``pandas.DataFrame`` with the columns ``output_tokens``,
        ``provider``, ``model_name``, ``url``, ``input_tokens`` and
        ``update_time`` (in that order), or ``None`` when the data could not
        be retrieved or decoded. Attributes missing from a record are stored
        as ``None`` rather than aborting the whole fetch.
    """
    # Column order mirrors the key order of the original record dict.
    columns = [
        "output_tokens",
        "provider",
        "model_name",
        "url",
        "input_tokens",
        "update_time",
    ]

    try:
        response = requests.get(url, timeout=timeout)
    except requests.RequestException as exc:
        # Connection failures and timeouts follow the same "return None"
        # contract as an HTTP error status instead of raising.
        print(f"Failed to retrieve data: {exc}")
        return None

    if response.status_code != 200:
        print(f"Failed to retrieve data: {response.status_code}")
        return None

    try:
        data = response.json()
    except ValueError as exc:
        # A 200 response with a non-JSON body is still a failed retrieval.
        print(f"Failed to retrieve data: {exc}")
        return None

    # Tolerate records that lack "fields" or individual attributes.
    records = (entry.get("fields", {}) for entry in data)
    rows = [{name: fields.get(name) for name in columns} for fields in records]

    # Passing `columns` keeps the schema stable even for an empty payload.
    return pd.DataFrame(rows, columns=columns)