File size: 5,109 Bytes
8ffbf51
c73a6b4
 
 
6e2e0c5
c3cdb5e
7c56b7b
2e0de3d
d84dbbc
c73a6b4
c32572d
 
 
 
 
c73a6b4
c3cdb5e
0a161b7
c3cdb5e
0a161b7
c3cdb5e
 
 
9358231
c3cdb5e
 
32036ce
 
 
 
 
 
 
 
 
c3cdb5e
32036ce
c3cdb5e
32036ce
c3cdb5e
32036ce
c3cdb5e
 
c73a6b4
 
c3cdb5e
 
 
c73a6b4
 
 
6a2375b
c73a6b4
a93e14b
 
97260f9
a93e14b
 
 
8ffbf51
97260f9
c73a6b4
 
 
a93e14b
c73a6b4
 
7c56b7b
99dbe33
 
 
 
 
 
 
 
 
 
6e2e0c5
6a2375b
a93e14b
c3cdb5e
6e2e0c5
c3cdb5e
 
 
6e2e0c5
0a161b7
 
c3cdb5e
 
 
 
32036ce
 
 
 
 
c3cdb5e
 
6e63bb6
f855041
c3cdb5e
 
 
fc4d401
 
 
99dbe33
d6030a5
 
 
 
 
4eeda08
d84dbbc
99dbe33
 
c73a6b4
fc4d401
 
 
 
c73a6b4
c3cdb5e
2e0de3d
 
 
f855041
 
 
 
 
 
 
 
 
 
 
 
0510f64
 
 
 
2e0de3d
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
import streamlit as st
import requests
import os
import base64
from PIL import Image
from io import BytesIO

# Set page title and layout
st.set_page_config(page_title="Image Caption Generator", layout="wide")

# API key from environment variable
API_KEY = os.environ.get("NEBIUS_API_KEY")

if not API_KEY:
    st.error("API key not found. Please set the `NEBIUS_API_KEY` environment variable.")

# Function to resize the image
def resize_image(image, max_width=300):
    """
    Resize the image to a fixed width (300) while maintaining the aspect ratio.
    """
    width_percent = max_width / float(image.size[0])
    new_height = int((float(image.size[1]) * float(width_percent)))
    resized_image = image.resize((max_width, new_height), Image.Resampling.LANCZOS)
    return resized_image

# Function to compress the image before converting to Base64
def compress_image(image, quality=70):
    """
    Compress the image to reduce the size before Base64 encoding.
    """
    buffered = BytesIO()
    image.save(buffered, format="JPEG", quality=quality)  # Save as JPEG with compression
    return buffered.getvalue()

# Function to convert image to Base64
def convert_to_base64(image_data):
    """
    Convert the compressed image to Base64 encoding.
    """
    image_base64 = base64.b64encode(image_data).decode()
    return image_base64

# Function to call Nebius API
def generate_caption(image_base64, api_key):
    """
    Calls the Nebius API with the Base64-encoded image and generates a caption.
    """
    api_url = "https://api.studio.nebius.ai/v1/chat/completions"
    headers = {"Authorization": f"Bearer {api_key}"}
    payload = {
        "model": "llava-hf/llava-1.5-13b-hf",
        "messages": [
            {
                "role": "system",
                "content": """observe each and every detail of the image and craft a detailed prompt under 75 words in this format: [image content/subject, description of action, state, and mood], [art form, style], [artist/photographer reference if needed], [additional settings such as camera and lens settings, lighting, colors, effects, texture, background, rendering].""",
            },
            {
                "role": "user",
                "content": [
                    {"type": "text", "text": "Describe This Image In Detail"},
                    {"type": "image_url", "image_url": {"url": f"data:image/png;base64,{image_base64}"}},
                ],
            },
        ],
        "temperature": 0,
    }

    try:
        response = requests.post(api_url, json=payload, headers=headers)
        if response.status_code == 200:
            return response.json()
        else:
            st.error(f"API Error: {response.status_code}, {response.text}")
            return {"error": response.text}
    except Exception as e:
        st.error(f"An exception occurred: {e}")
        return {"error": str(e)}



uploaded_image = st.file_uploader("Upload an image", type=["jpg", "jpeg", "png"])

if uploaded_image:
    # Load the uploaded image
    original_image = Image.open(uploaded_image)

    # Resize the image to a fixed width of 300px
    resized_image = resize_image(original_image)

    # Display the resized image
    st.image(resized_image, caption="Resized Image", use_container_width=True)

    # Compress the image before converting to Base64
    compressed_image_data = compress_image(resized_image)

    # Convert compressed image to Base64
    base64_string = convert_to_base64(compressed_image_data)

    # Call the Nebius API to generate a caption
    if st.button("Generate Prompt", use_container_width=True):
        st.write("Generating Prompt...")
        result = generate_caption(base64_string, API_KEY)

        # Display the generated caption
        if "error" in result:
            st.error(f"Error: {result['error']}")
        else:
            try:
                caption = (
                    result.get("choices", [{}])[0]
                    .get("message", {})
                    .get("content", "No caption generated.")
                )
                
                st.text_area("Prompt Generated", caption, height=200, key="caption_output")
            except Exception as e:
                st.error(f"Error processing the response: {e}")
else:
    if not API_KEY:
        st.warning("Please set the `NEBIUS_API_KEY` environment variable.")
    else:
        st.info("Please upload an image.")

# Style adjustments
st.markdown(
    """
    <style>
     
        .css-1d391kg {text-align: center;}
        .css-1v3fvcr {justify-content: center; display: flex;}
        .css-1y4ccs5 {margin: 0 auto;}
        .css-1aumxhk {display: flex; justify-content: center;}
        .css-1k6kn8p {justify-content: center; align-items: center; display: flex;}
        .css-ffhzg6 {text-align: center;}
        textarea {
            color: white !important;
            background-color: #262626 !important;
        }
    
        textarea {
            color: white !important;
            background-color: #262626 !important;
        }
    </style>
    """, unsafe_allow_html=True
)