Spaces:
Running
Running
File size: 5,109 Bytes
8ffbf51 c73a6b4 6e2e0c5 c3cdb5e 7c56b7b 2e0de3d d84dbbc c73a6b4 c32572d c73a6b4 c3cdb5e 0a161b7 c3cdb5e 0a161b7 c3cdb5e 9358231 c3cdb5e 32036ce c3cdb5e 32036ce c3cdb5e 32036ce c3cdb5e 32036ce c3cdb5e c73a6b4 c3cdb5e c73a6b4 6a2375b c73a6b4 a93e14b 97260f9 a93e14b 8ffbf51 97260f9 c73a6b4 a93e14b c73a6b4 7c56b7b 99dbe33 6e2e0c5 6a2375b a93e14b c3cdb5e 6e2e0c5 c3cdb5e 6e2e0c5 0a161b7 c3cdb5e 32036ce c3cdb5e 6e63bb6 f855041 c3cdb5e fc4d401 99dbe33 d6030a5 4eeda08 d84dbbc 99dbe33 c73a6b4 fc4d401 c73a6b4 c3cdb5e 2e0de3d f855041 0510f64 2e0de3d |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 |
import streamlit as st
import requests
import os
import base64
from PIL import Image
from io import BytesIO
# Set page title and layout
st.set_page_config(page_title="Image Caption Generator", layout="wide")
# API key from environment variable
API_KEY = os.environ.get("NEBIUS_API_KEY")
if not API_KEY:
st.error("API key not found. Please set the `NEBIUS_API_KEY` environment variable.")
# Function to resize the image
def resize_image(image, max_width=300):
"""
Resize the image to a fixed width (300) while maintaining the aspect ratio.
"""
width_percent = max_width / float(image.size[0])
new_height = int((float(image.size[1]) * float(width_percent)))
resized_image = image.resize((max_width, new_height), Image.Resampling.LANCZOS)
return resized_image
# Function to compress the image before converting to Base64
def compress_image(image, quality=70):
"""
Compress the image to reduce the size before Base64 encoding.
"""
buffered = BytesIO()
image.save(buffered, format="JPEG", quality=quality) # Save as JPEG with compression
return buffered.getvalue()
# Function to convert image to Base64
def convert_to_base64(image_data):
"""
Convert the compressed image to Base64 encoding.
"""
image_base64 = base64.b64encode(image_data).decode()
return image_base64
# Function to call Nebius API
def generate_caption(image_base64, api_key):
"""
Calls the Nebius API with the Base64-encoded image and generates a caption.
"""
api_url = "https://api.studio.nebius.ai/v1/chat/completions"
headers = {"Authorization": f"Bearer {api_key}"}
payload = {
"model": "llava-hf/llava-1.5-13b-hf",
"messages": [
{
"role": "system",
"content": """observe each and every detail of the image and craft a detailed prompt under 75 words in this format: [image content/subject, description of action, state, and mood], [art form, style], [artist/photographer reference if needed], [additional settings such as camera and lens settings, lighting, colors, effects, texture, background, rendering].""",
},
{
"role": "user",
"content": [
{"type": "text", "text": "Describe This Image In Detail"},
{"type": "image_url", "image_url": {"url": f"data:image/png;base64,{image_base64}"}},
],
},
],
"temperature": 0,
}
try:
response = requests.post(api_url, json=payload, headers=headers)
if response.status_code == 200:
return response.json()
else:
st.error(f"API Error: {response.status_code}, {response.text}")
return {"error": response.text}
except Exception as e:
st.error(f"An exception occurred: {e}")
return {"error": str(e)}
uploaded_image = st.file_uploader("Upload an image", type=["jpg", "jpeg", "png"])
if uploaded_image:
# Load the uploaded image
original_image = Image.open(uploaded_image)
# Resize the image to a fixed width of 300px
resized_image = resize_image(original_image)
# Display the resized image
st.image(resized_image, caption="Resized Image", use_container_width=True)
# Compress the image before converting to Base64
compressed_image_data = compress_image(resized_image)
# Convert compressed image to Base64
base64_string = convert_to_base64(compressed_image_data)
# Call the Nebius API to generate a caption
if st.button("Generate Prompt", use_container_width=True):
st.write("Generating Prompt...")
result = generate_caption(base64_string, API_KEY)
# Display the generated caption
if "error" in result:
st.error(f"Error: {result['error']}")
else:
try:
caption = (
result.get("choices", [{}])[0]
.get("message", {})
.get("content", "No caption generated.")
)
st.text_area("Prompt Generated", caption, height=200, key="caption_output")
except Exception as e:
st.error(f"Error processing the response: {e}")
else:
if not API_KEY:
st.warning("Please set the `NEBIUS_API_KEY` environment variable.")
else:
st.info("Please upload an image.")
# Style adjustments
st.markdown(
"""
<style>
.css-1d391kg {text-align: center;}
.css-1v3fvcr {justify-content: center; display: flex;}
.css-1y4ccs5 {margin: 0 auto;}
.css-1aumxhk {display: flex; justify-content: center;}
.css-1k6kn8p {justify-content: center; align-items: center; display: flex;}
.css-ffhzg6 {text-align: center;}
textarea {
color: white !important;
background-color: #262626 !important;
}
textarea {
color: white !important;
background-color: #262626 !important;
}
</style>
""", unsafe_allow_html=True
)
|