Im-prmpt-im

Running

App Files Files Community

Im-prmpt-im / app.py

mrbeliever

Update app.py

99dbe33 verified about 1 year ago

raw

history blame

3.88 kB

	import streamlit as st
	import requests
	import os
	import base64
	from PIL import Image
	from io import BytesIO # Correctly import BytesIO from the io module

	# Page metadata: browser-tab title and a centered layout
	APP_TITLE = "Image Caption Generator"
	st.set_page_config(page_title=APP_TITLE, layout="centered")

	# Nebius credential, read from the environment (None when the variable is unset)
	API_KEY = os.getenv("NEBIUS_API_KEY")

	# Heading and one-line introduction shown at the top of the page
	st.title(APP_TITLE)
	intro_text = "Upload an image, and this app will generate a detailed caption for it using the Nebius AI API."
	st.write(intro_text)

	# Report a missing or empty key up front
	if not API_KEY:
	    st.error("API key not found. Please set the `NEBIUS_API_KEY` environment variable.")

	# Function to call Nebius API
	def generate_caption(image_base64, api_key, timeout=60):
	    """Ask the Nebius chat-completions endpoint to describe an image.

	    Args:
	        image_base64: Base64 text of the image. It is embedded in a
	            ``data:image/png;base64,...`` URL inside the user message.
	        api_key: Token sent as ``Authorization: Bearer <api_key>``.
	        timeout: Seconds to wait for the HTTP request before giving up.
	            Without a timeout a stalled connection would block the app
	            indefinitely.

	    Returns:
	        The decoded JSON body when the API answers with HTTP 200;
	        otherwise ``{"error": <message>}``. Every failure is also shown
	        on the page through ``st.error``.
	    """
	    api_url = "https://api.studio.nebius.ai/v1/chat/completions"
	    headers = {"Authorization": f"Bearer {api_key}"}
	    payload = {
	        "model": "Qwen/Qwen2-VL-72B-Instruct",
	        "messages": [
	            {
	                "role": "system",
	                "content": """You are an image to prompt converter. Your work is to observe each and every detail of the image and craft a detailed prompt under 75 words in this format: [image content/subject, description of action, state, and mood], [art form, style], [artist/photographer reference if needed], [additional settings such as camera and lens settings, lighting, colors, effects, texture, background, rendering].""",
	            },
	            {
	                "role": "user",
	                "content": [
	                    {"type": "text", "text": "Write a caption for this image"},
	                    {"type": "image_url", "image_url": {"url": f"data:image/png;base64,{image_base64}"}},
	                ],
	            },
	        ],
	        "temperature": 0,
	    }

	    try:
	        response = requests.post(api_url, json=payload, headers=headers, timeout=timeout)
	        if response.status_code != 200:
	            st.error(f"API Error: {response.status_code}, {response.text}")
	            return {"error": response.text}
	        st.write("API response received successfully.")  # Debugging message
	        return response.json()
	    except (requests.RequestException, ValueError) as e:
	        # RequestException covers connection problems and timeouts;
	        # ValueError covers a 200 response whose body is not valid JSON.
	        st.error(f"An exception occurred: {e}")
	        return {"error": str(e)}

	# File uploader for image
	uploaded_image = st.file_uploader("Upload an image", type=["png", "jpg", "jpeg"])

	if uploaded_image and API_KEY:
	    # Decode the upload and re-encode it as base64 PNG, because the request
	    # built by generate_caption labels the payload as image/png.
	    image_base64 = None
	    try:
	        image = Image.open(uploaded_image)
	        # PNG cannot store every Pillow mode (a CMYK JPEG, for example),
	        # so convert anything outside the writable set to RGB first.
	        if image.mode not in ("1", "L", "LA", "I", "I;16", "P", "RGB", "RGBA"):
	            image = image.convert("RGB")
	        buffered = BytesIO()  # In-memory target for the PNG bytes
	        image.save(buffered, format="PNG")
	        image_base64 = base64.b64encode(buffered.getvalue()).decode()
	    except (OSError, ValueError) as e:
	        # Corrupt, truncated or unrecognised files end up here instead of
	        # aborting the script with a traceback.
	        st.error(f"Could not read the uploaded image: {e}")

	    if image_base64 is not None:
	        # Show the uploaded image
	        st.image(image, caption="Uploaded Image", use_column_width=True)

	        # Add a button to trigger caption generation
	        if st.button("Generate Caption"):
	            st.write("Generating caption...")
	            result = generate_caption(image_base64, API_KEY)

	            # Debug: Display the full API response
	            st.write("Full API Response:")
	            st.json(result)

	            # Display the result
	            if "error" in result:
	                st.error(f"Error: {result['error']}")
	            else:
	                # Walk choices[0].message.content; any unexpected shape
	                # (empty list, non-dict entries) is reported, not raised.
	                try:
	                    messages = result.get("choices", [{}])[0].get("message", {}).get("content", "")
	                except (AttributeError, IndexError, KeyError, TypeError) as e:
	                    st.error(f"Error processing the response: {e}")
	                else:
	                    if messages:
	                        st.subheader("Generated Caption")
	                        st.write(messages)
	                    else:
	                        st.error("No caption generated. The response structure might have changed.")
	else:
	    # Explain which prerequisite is still missing
	    if not API_KEY:
	        st.warning("Please set the `NEBIUS_API_KEY` environment variable.")
	    else:
	        st.info("Please upload an image.")

	st.sidebar.write("Built with ❤️ by OpenAI GPT-4")