Spaces:

root-sajjan
/

backend_image_detection

Running

App Files Files Community

root-sajjan committed on Nov 28, 2024

Commit

4e10dac

verified ·

1 Parent(s): ecaf31c

llm

Browse files

Files changed (3) hide show

llm/fridge.JPG +0 -0
llm/inference.py +110 -0
llm/upload_image.py +39 -0

llm/fridge.JPG ADDED Viewed

llm/inference.py ADDED Viewed

	@@ -0,0 +1,110 @@

+from huggingface_hub import InferenceClient
+import nltk
+import re
+import requests
import os

# Download the NLTK data packages at import time, exactly as before; the
# tokenizer and part-of-speech tagger calls in extract_product_info
# (nltk.word_tokenize / nltk.pos_tag) are the consumers in this file.
nltk.download('punkt')
nltk.download('punkt_tab')
nltk.download('averaged_perceptron_tagger')

# Shared Hugging Face inference client used by get_name.
# The token is read from the HF_TOKEN environment variable when it is set, so
# a real credential never has to live in the source; the "xyz" placeholder is
# kept as the fallback so behaviour is unchanged when the variable is absent.
client = InferenceClient(api_key=os.environ.get("HF_TOKEN", "xyz"))
def extract_product_info(text):
    """Heuristically split a product blurb into brand, model, description and price.

    The first dollar amount found in *text* becomes the price (returned as a
    string with the "$" and thousands separators removed) and is cut out of
    the text. The remaining text is tokenized and POS-tagged with NLTK; the
    first token accepted by the brand/model test becomes the brand, later
    accepted tokens form the model, and rejected tokens form the description.

    :param text: Free-form text describing a product.
    :return: dict with keys "brand", "model", "description" and "price".
             "brand", "model" and "price" stay None when nothing was found;
             "description" is always a string (possibly empty).
    """
    result = {"brand": None, "model": None, "description": None, "price": None}

    # Price: "$", optional space, then either a comma-grouped number (1,299)
    # or a plain run of digits (1299), with optional two-digit cents.
    # The plain-digit alternative matters: a pattern of only
    # \d{1,3}(?:,\d{3})* stops after three digits, so "$1299.99" would be
    # read as "129" and "9.99" would leak into the brand/model tokens.
    price_match = re.search(r'\$\s?(?:\d{1,3}(?:,\d{3})+|\d+)(?:\.\d{2})?', text)
    if price_match:
        result["price"] = price_match.group().replace("$", "").replace(",", "").strip()
        # Drop the price so it cannot be mistaken for a brand/model token.
        text = text.replace(price_match.group(), "").strip()

    # Nothing left to analyse (e.g. the input was only a price): skip the
    # tokenizer and tagger entirely; the result is the same empty token list.
    pos_tags = nltk.pos_tag(nltk.word_tokenize(text)) if text.strip() else []

    brand_parts = []
    model_parts = []
    description_parts = []
    for word, tag in pos_tags:
        # NOTE(review): re.match only anchors at the start, so this pattern
        # accepts any token that begins with a letter, digit or hyphen. In
        # practice nearly every word lands in brand/model and only
        # punctuation reaches the description. Left unchanged because the
        # intended heuristic is not clear from this file; confirm and tighten.
        if tag == 'NNP' or re.match(r'[A-Za-z0-9-]+', word):
            if not brand_parts:
                # The first accepted token is assumed to be the brand.
                brand_parts.append(word)
            else:
                # Everything accepted after the brand is treated as the model.
                model_parts.append(word)
        else:
            description_parts.append(word)

    if brand_parts:
        result["brand"] = " ".join(brand_parts)
    if model_parts:
        result["model"] = " ".join(model_parts)
    # Joined even when empty, so "description" is "" rather than None.
    result["description"] = " ".join(description_parts)
    return result
def extract_info(text):
    """Ask the hosted google/flan-t5-large model to extract product fields from *text*.

    Posts a prompt to the Hugging Face Inference API requesting the brand
    name, model number, description and price as a Python dictionary, prints
    the raw response object and the decoded body, and returns the decoded
    body.

    :param text: Text to extract the product information from.
    :return: The JSON-decoded response body, exactly as the API returned it.
    """
    # Local import keeps this function self-contained without touching the
    # file-level import block.
    import os

    API_URL = "https://api-inference.huggingface.co/models/google/flan-t5-large"
    # Prefer a token from the environment over the hard-coded placeholder;
    # the placeholder remains the fallback so behaviour is unchanged when
    # HF_TOKEN is not set.
    token = os.environ.get("HF_TOKEN", "hf_xyz")
    headers = {"Authorization": f"Bearer {token}"}
    payload = {"inputs": f"From the given text, extract brand name, model number, description about it, and its average price in today's market. Give me back a python dictionary with keys as brand_name, model_number, desc, price. The text is {text}.",}
    # Without a timeout a stalled connection would block the caller forever.
    response = requests.post(API_URL, headers=headers, json=payload, timeout=60)
    print('GOOGLEE LLM OUTPUTTTTTTT\n\n', response)
    output = response.json()
    print(output)
    # Previously the decoded output was printed and then discarded, so
    # callers always received None.
    return output
def get_name(url, object):
    """Identify the product shown in an image and return its parsed details.

    Sends one user message (a text question mentioning *object* plus the
    image at *url*) to the Llama 3.2 vision model through the module-level
    ``client``, prints the model's reply, and runs the reply through
    ``extract_product_info``.

    :param url: URL of the image to analyse.
    :param object: Name of the thing the image is expected to show; it is
                   interpolated into the question sent to the model.
    :return: The dictionary produced by ``extract_product_info`` for the
             model's reply.
    """
    question_part = {
        "type": "text",
        "text": f"Is this a {object}?. Can you guess what it is and give me the closest brand it resembles to? or a model number? And give me its average price in today's market in USD. In output, give me its normal name, model name, model number and price. separated by commas. No description is needed."
    }
    image_part = {"type": "image_url", "image_url": {"url": url}}
    conversation = [{"role": "user", "content": [question_part, image_part]}]

    reply = client.chat.completions.create(
        model="meta-llama/Llama-3.2-11B-Vision-Instruct",
        messages=conversation,
        max_tokens=500
    )

    # Echo the raw model answer between two banner lines.
    print(f'\n\nNow output of LLM:\n')
    answer = reply.choices[0].message['content']
    print(answer)
    print(f'\n\nThat is the output')

    # Turn the free-form answer into the brand/model/description/price dict.
    product = extract_product_info(answer)
    print(f'\n\nResult brand and price:{product}')
    return product
+# url = "https://i.ibb.co/mNYvqDL/crop_39.jpg"
+# object="fridge"
+# get_name(url, object)

llm/upload_image.py ADDED Viewed

	@@ -0,0 +1,39 @@

+import requests
def upload_image_to_imgbb(image_path, api_key="0e7fb6d183b8db925812dee230f71079"):
    """
    Uploads an image to ImgBB and returns the URL.

    :param image_path: Path to the local image
    :param api_key: ImgBB API key
    :return: URL of the uploaded image on success. On any failure (file
             cannot be opened, request error, non-200 status, unexpected
             response body) the error message is returned as a string
             instead; no exception propagates to the caller.
    """
    # NOTE(review): the default api_key is a credential embedded in source;
    # it is kept only so existing callers keep working. Consider passing the
    # key explicitly and rotating this one.
    url = "https://api.imgbb.com/1/upload"
    try:
        # Open the image in binary mode and send it as a multipart upload.
        with open(image_path, "rb") as image_file:
            response = requests.post(
                url,
                data={"key": api_key},
                files={"image": image_file},
                # Without a timeout a stalled upload would block forever.
                timeout=30,
            )
        if response.status_code != 200:
            # Same message the caller received before, returned directly
            # instead of being raised and caught a few lines below.
            return f"Error uploading image: {response.status_code}, {response.text}"
        data = response.json()
        print(f'Uploaded to {data["data"]["url"]}')
        return data["data"]["url"]
    except Exception as e:
        # Deliberate best-effort contract: report the failure as text.
        return str(e)
+# # Replace with your local image path and ImgBB API key
+# image_path = "fridge.JPG"  # Replace this with your local image path
+# api_key = "0e7fb6d183b8db925812dee230f71079"         # Get your API key from https://api.imgbb.com/
+# uploaded_url = upload_image_to_imgbb(image_path, api_key)
+# print(f"Uploaded image URL: {uploaded_url}")