switching to gpt-3.5-turbo
Browse files- app.py +11 -11
- requirements.txt +1 -0
app.py
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
import os
|
| 2 |
-
from langchain.llms import OpenAI
|
| 3 |
|
| 4 |
os.system("pip install -U gradio")
|
| 5 |
|
|
@@ -80,8 +80,8 @@ session_token = os.environ.get("SessionToken")
|
|
| 80 |
|
| 81 |
def generate_caption(object_list_str, api_key, temperature):
|
| 82 |
query = f"You are an intelligent image captioner. I will hand you the objects and their position, and you should give me a detailed description for the photo. In this photo we have the following objects\n{object_list_str}"
|
| 83 |
-
llm =
|
| 84 |
-
model_name="
|
| 85 |
)
|
| 86 |
|
| 87 |
try:
|
|
@@ -142,13 +142,13 @@ def inference(img, vocabulary, api_key, temperature):
|
|
| 142 |
|
| 143 |
with gr.Blocks() as demo:
|
| 144 |
with gr.Column():
|
| 145 |
-
gr.Markdown("# Image Captioning using LangChain
|
| 146 |
gr.Markdown(
|
| 147 |
-
"Use Detic to detect objects in an image and then use
|
| 148 |
)
|
| 149 |
|
| 150 |
-
with gr.
|
| 151 |
-
with gr.
|
| 152 |
inp = gr.Image(label="Input Image", type="filepath")
|
| 153 |
with gr.Column():
|
| 154 |
openai_api_key_textbox = gr.Textbox(
|
|
@@ -164,10 +164,10 @@ with gr.Blocks() as demo:
|
|
| 164 |
value="lvis",
|
| 165 |
)
|
| 166 |
|
| 167 |
-
|
| 168 |
-
|
| 169 |
-
|
| 170 |
-
|
| 171 |
|
| 172 |
btn_detic.click(
|
| 173 |
fn=inference,
|
|
|
|
| 1 |
import os
|
| 2 |
+
from langchain.llms import OpenAI, OpenAIChat
|
| 3 |
|
| 4 |
os.system("pip install -U gradio")
|
| 5 |
|
|
|
|
| 80 |
|
| 81 |
def generate_caption(object_list_str, api_key, temperature):
|
| 82 |
query = f"You are an intelligent image captioner. I will hand you the objects and their position, and you should give me a detailed description for the photo. In this photo we have the following objects\n{object_list_str}"
|
| 83 |
+
llm = OpenAIChat(
|
| 84 |
+
model_name="gpt-3.5-turbo", openai_api_key=api_key, temperature=temperature
|
| 85 |
)
|
| 86 |
|
| 87 |
try:
|
|
|
|
| 142 |
|
| 143 |
with gr.Blocks() as demo:
|
| 144 |
with gr.Column():
|
| 145 |
+
gr.Markdown("# Image Captioning using Detic and ChatGPT with LangChain 🦜️🔗")
|
| 146 |
gr.Markdown(
|
| 147 |
+
"Use Detic to detect objects in an image and then use `gpt-3.5-turbo` to describe the image."
|
| 148 |
)
|
| 149 |
|
| 150 |
+
with gr.Row():
|
| 151 |
+
with gr.Column():
|
| 152 |
inp = gr.Image(label="Input Image", type="filepath")
|
| 153 |
with gr.Column():
|
| 154 |
openai_api_key_textbox = gr.Textbox(
|
|
|
|
| 164 |
value="lvis",
|
| 165 |
)
|
| 166 |
|
| 167 |
+
btn_detic = gr.Button("Run Detic and ChatGPT")
|
| 168 |
+
with gr.Column():
|
| 169 |
+
output_desc = gr.Textbox(label="Description", lines=5)
|
| 170 |
+
outviz = gr.Image(label="Visualization", type="pil")
|
| 171 |
|
| 172 |
btn_detic.click(
|
| 173 |
fn=inference,
|
requirements.txt
CHANGED
|
@@ -35,5 +35,6 @@ nltk
|
|
| 35 |
|
| 36 |
git+https://github.com/openai/CLIP.git
|
| 37 |
|
|
|
|
| 38 |
openai
|
| 39 |
langchain
|
|
|
|
| 35 |
|
| 36 |
git+https://github.com/openai/CLIP.git
|
| 37 |
|
| 38 |
+
|
| 39 |
openai
|
| 40 |
langchain
|