Spaces:

ChandraP12330
/

Surveillance-Image-Caption-2024

Sleeping

App Files Community

ChandraP12330 committed on Apr 27, 2024

Commit

bacdfba

verified ·

1 Parent(s): 6a1305b

Update app.py

Browse files

Files changed (1) hide show

app.py +35 -2

app.py CHANGED Viewed

@@ -55,8 +55,41 @@ context_raw= scene_labels[probs.argmax(-1)]
 context= 'the image is depicting scene of '+ context_raw
 ##LLM
 # Generate the caption
 if st.button("Generate Caption"):
-    st.write()

 context= 'the image is depicting scene of '+ context_raw
 ##LLM
+GOOGLE_API_KEY = st.text_input("Please enter your GOOGLE GEMINI API KEY", type="password")
+os.environ['GOOGLE_API_KEY'] = GOOGLE_API_KEY
+from langchain_google_genai import ChatGoogleGenerativeAI
+from langchain.prompts import PromptTemplate
+from google.generativeai.types.safety_types import HarmBlockThreshold, HarmCategory
+llm = ChatGoogleGenerativeAI(model="gemini-1.0-pro-latest", google_api_key=GOOGLE_API_KEY, temperature=0.2, top_p=1, top_k=1,
+                             safety_settings={
+        HarmCategory.HARM_CATEGORY_DANGEROUS_CONTENT: HarmBlockThreshold.BLOCK_NONE,
+        HarmCategory.HARM_CATEGORY_HARASSMENT: HarmBlockThreshold.BLOCK_NONE,
+        HarmCategory.HARM_CATEGORY_HATE_SPEECH: HarmBlockThreshold.BLOCK_NONE,
+        HarmCategory.HARM_CATEGORY_SEXUALLY_EXPLICIT: HarmBlockThreshold.BLOCK_NONE,
+    },
+      )
+template="""You are an advanced image captioning AI assistant for surveillance related images.
+Your task is to refine and improve an initial image caption using relevant contextual information provided.
+You will receive two inputs:
+Input 1: {initial_caption} - This is the initial caption for the image, most likely grammatically incorrect
+and incomplete sentence, generated by a separate not so good image captioning model.
+Input 2: {context} - This is the contextual information that provides more details about the background
+Your goal is to take the initial caption and the additional context, and produce a new, refined caption that
+incorporates the contextual details.
+Please do not speculate things which are not provided. The final caption should be grammatically correct.
+Please output only the final caption."""
+prompt_template = PromptTemplate(
+    template=template,
+    input_variables=["initial_caption", "context"],
+)
+prompt=prompt_template.format(initial_caption=initial_caption, context=context)
+response = llm.invoke(prompt)
+final_caption = response.content
 # Generate the caption
 if st.button("Generate Caption"):
+    st.write(final_caption)