Merge pull request #51 from ks6088ts-labs/feature/issue-50_camera-input

ks6088ts · web-flow · commit 0b95894e1de7 · 2024-08-12T08:55:29.000+09:00
add camera Q&A example
diff --git a/apps/99_streamlit_examples/README.md b/apps/99_streamlit_examples/README.md
@@ -37,13 +37,13 @@ Access to http://localhost:8501 and select the sample you want to run from the s
 
 ![File Q&A](../../docs/images/99_streamlit_examples.fileqa.png)
 
-#### 2. Speech to Text
+#### 2. Image Q&A
 
-![Speech to Text](../../docs/images/99_streamlit_examples.stt.png)
+![Image Q&A](../../docs/images/99_streamlit_examples.imageqa.png)
 
-#### 3. Image Q&A
+#### 3. Camera Q&A
 
-![Image Q&A](../../docs/images/99_streamlit_examples.imageqa.png)
+![Camera Q&A](../../docs/images/99_streamlit_examples.cameraqa.png)
 
 #### 4. Translate text
 
@@ -53,6 +53,10 @@ Access to http://localhost:8501 and select the sample you want to run from the s
 
 ![Explain data](../../docs/images/99_streamlit_examples.explaindata.png)
 
+#### 6. Speech to Text
+
+![Speech to Text](../../docs/images/99_streamlit_examples.stt.png)
+
 ## References
 
 - [🎈 Streamlit + LLM Examples App](https://github.com/streamlit/llm-examples)
diff --git a/apps/99_streamlit_examples/pages/2_Image_Q&A.py b/apps/99_streamlit_examples/pages/2_Image_Q&A.py
@@ -33,7 +33,7 @@
     )
     "[Azure Portal](https://portal.azure.com/)"
     "[Azure OpenAI Studio](https://oai.azure.com/resource/overview)"
-    "[View the source code](https://github.com/ks6088ts-labs/workshop-azure-openai/blob/main/apps/99_streamlit_examples/pages/3_Image_Q&A.py)"
+    "[View the source code](https://github.com/ks6088ts-labs/workshop-azure-openai/blob/main/apps/99_streamlit_examples/pages/2_Image_Q&A.py)"
 
 st.title("Image Q&A")
 
diff --git a/apps/99_streamlit_examples/pages/3_Camera_Q&A.py b/apps/99_streamlit_examples/pages/3_Camera_Q&A.py
@@ -0,0 +1,95 @@
+# Streamlit page: capture a photo with the camera and ask Azure OpenAI a question about it.
+import base64
+from os import getenv
+
+import streamlit as st
+from dotenv import load_dotenv
+from openai import AzureOpenAI
+
+# Load variables from a .env file so getenv() can pre-fill the sidebar fields below.
+load_dotenv()
+
+with st.sidebar:
+    azure_openai_endpoint = st.text_input(
+        label="AZURE_OPENAI_ENDPOINT",
+        value=getenv("AZURE_OPENAI_ENDPOINT"),
+        key="AZURE_OPENAI_ENDPOINT",
+        type="default",
+    )
+    # The API key field is not pre-filled from the environment; it has to be typed in.
+    azure_openai_api_key = st.text_input(
+        label="AZURE_OPENAI_API_KEY",
+        key="AZURE_OPENAI_API_KEY",
+        type="password",
+    )
+    azure_openai_api_version = st.text_input(
+        label="AZURE_OPENAI_API_VERSION",
+        value=getenv("AZURE_OPENAI_API_VERSION"),
+        key="AZURE_OPENAI_API_VERSION",
+        type="default",
+    )
+    azure_openai_gpt_model = st.text_input(
+        label="AZURE_OPENAI_GPT_MODEL",
+        value=getenv("AZURE_OPENAI_GPT_MODEL"),
+        key="AZURE_OPENAI_GPT_MODEL",
+        type="default",
+    )
+    # Bare string literals are rendered by Streamlit "magic" as Markdown links.
+    "[Azure Portal](https://portal.azure.com/)"
+    "[Azure OpenAI Studio](https://oai.azure.com/resource/overview)"
+    "[View the source code](https://github.com/ks6088ts-labs/workshop-azure-openai/blob/main/apps/99_streamlit_examples/pages/3_Camera_Q&A.py)"
+
+st.title("Camera Q&A")
+
+# Stop rendering the page until every connection setting has a value.
+if not azure_openai_api_key or not azure_openai_endpoint or not azure_openai_api_version or not azure_openai_gpt_model:
+    st.warning("Please fill in the required fields at the sidebar.")
+    st.stop()
+
+st.info("Take a picture and ask a question. AI will answer the question.")
+
+img_file_buffer = st.camera_input("Take a picture")
+# The question box stays disabled until a picture has been taken.
+question = st.text_input(
+    "Ask a question about the captured image",
+    placeholder="Please describe the content of the image",
+    disabled=not img_file_buffer,
+)
+
+if img_file_buffer and question:
+    # Embed the captured image in the request as a base64 data URL.
+    encoded_image = base64.b64encode(img_file_buffer.getvalue()).decode()
+
+    client = AzureOpenAI(
+        api_key=azure_openai_api_key,
+        api_version=azure_openai_api_version,
+        azure_endpoint=azure_openai_endpoint,
+    )
+
+    with st.spinner("Thinking..."):
+        response = client.chat.completions.create(
+            model=azure_openai_gpt_model,
+            messages=[
+                {
+                    "role": "system",
+                    "content": "You are a professional image analyst. Describe the image.",
+                },
+                {
+                    "role": "user",
+                    "content": [
+                        {
+                            "type": "image_url",
+                            "image_url": {"url": f"data:image/jpeg;base64,{encoded_image}"},
+                        },
+                        {
+                            "type": "text",
+                            # Text content parts carry their payload under the "text" key.
+                            "text": question,
+                        },
+                    ],
+                },
+            ],
+        )
+    msg = response.choices[0].message.content
+    st.write("### Answer")
+    st.chat_message("assistant").write(msg)
diff --git a/apps/99_streamlit_examples/pages/6_Speech_to_text.py b/apps/99_streamlit_examples/pages/6_Speech_to_text.py
@@ -33,7 +33,7 @@
     )
     "[Azure Portal](https://portal.azure.com/)"
     "[Azure OpenAI Studio](https://oai.azure.com/resource/overview)"
-    "[View the source code](https://github.com/ks6088ts-labs/workshop-azure-openai/blob/main/apps/99_streamlit_examples/pages/2_Speech_to_text.py)"
+    "[View the source code](https://github.com/ks6088ts-labs/workshop-azure-openai/blob/main/apps/99_streamlit_examples/pages/6_Speech_to_text.py)"
 
 st.title("Speech to text")
 
diff --git a/docs/images/99_streamlit_examples.cameraqa.png b/docs/images/99_streamlit_examples.cameraqa.png

Original file line number	Diff line number	Diff line change
`@@ -33,7 +33,7 @@`
`33`	`33`	`)`
`34`	`34`	`"[Azure Portal](https://portal.azure.com/)"`
`35`	`35`	`"[Azure OpenAI Studio](https://oai.azure.com/resource/overview)"`
`36`		`- "[View the source code](https://github.com/ks6088ts-labs/workshop-azure-openai/blob/main/apps/99_streamlit_examples/pages/3_Image_Q&A.py)"`
	`36`	`+ "[View the source code](https://github.com/ks6088ts-labs/workshop-azure-openai/blob/main/apps/99_streamlit_examples/pages/2_Image_Q&A.py)"`
`37`	`37`
`38`	`38`	`st.title("Image Q&A")`
`39`	`39`