first commit

2023-11-07 10:27:35 -05:00 · 2023-11-07 10:27:35 -05:00 · 091f066859
commit 091f066859
8 changed files with 157 additions and 0 deletions
--- a/.gitignore
+++ b/.gitignore
@ -0,0 +1,3 @@
+.env
+/venv
+/frames
--- a/assets/stop_slouching.mp3
+++ b/assets/stop_slouching.mp3
--- a/assets/stop_slouching.wav
+++ b/assets/stop_slouching.wav
--- a/assets/wonderful_posture.mp3
+++ b/assets/wonderful_posture.mp3
--- a/assets/wonderful_posture.wav
+++ b/assets/wonderful_posture.wav
--- a/capture.py
+++ b/capture.py
@ -0,0 +1,32 @@
+import os
+import time
+
+import cv2
+
+# Folder the latest frame is written to. It is git-ignored, so it may not
+# exist on a fresh checkout.
+folder = "frames"
+
+# Seconds to pause between two captures
+capture_interval = 2
+
+# cv2.imwrite does not create missing directories (it just returns False),
+# so make sure the output folder exists before the first write.
+os.makedirs(folder, exist_ok=True)
+
+# Initialize the webcam
+cap = cv2.VideoCapture(0)
+
+# Check if the webcam is opened correctly
+if not cap.isOpened():
+    raise IOError("Cannot open webcam")
+
+# Wait for the camera to initialize and adjust light levels
+time.sleep(2)
+
+path = f"{folder}/frame.jpg"
+# The temporary name keeps a .jpg suffix because imwrite chooses the encoder
+# from the file extension.
+tmp_path = f"{folder}/frame.tmp.jpg"
+
+try:
+    while True:
+        ret, frame = cap.read()
+        if ret:
+            print("📸 Say cheese! Saving frame.")
+            # Write to a temporary file and swap it in atomically so a
+            # concurrent reader never sees a half-written JPEG.
+            if cv2.imwrite(tmp_path, frame):
+                os.replace(tmp_path, path)
+            else:
+                print("Failed to save image")
+        else:
+            print("Failed to capture image")
+
+        # Wait before grabbing the next frame
+        time.sleep(capture_interval)
+except KeyboardInterrupt:
+    # Ctrl+C is the only way out of the loop; fall through to the cleanup.
+    pass
+finally:
+    # Release the camera and close all windows
+    cap.release()
+    cv2.destroyAllWindows()
--- a/judge.py
+++ b/judge.py
@ -0,0 +1,103 @@
+import os
+from openai import OpenAI
+import base64
+import json
+import time
+import simpleaudio as sa
+
+# Shared OpenAI API client used by the request helpers in this module.
+# NOTE(review): constructed with no arguments, so credentials presumably come
+# from the environment (e.g. OPENAI_API_KEY) — confirm.
+client = OpenAI()
+
+def encode_image(image_path):
+    """Return the contents of the file at ``image_path`` as a base64 string."""
+    with open(image_path, "rb") as fh:
+        raw_bytes = fh.read()
+    encoded = base64.b64encode(raw_bytes)
+    return encoded.decode('utf-8')
+
+
+def play_audio(file_path):
+    """Play the WAV file at ``file_path`` and block until playback is done."""
+    playback = sa.WaveObject.from_wave_file(file_path).play()
+    playback.wait_done()
+
+
+def analyze_posture(base64_image):
+    """Ask the vision model for a free-text assessment of the pictured posture.
+
+    Args:
+        base64_image: Base64-encoded JPEG data without any ``data:`` prefix;
+            it is wrapped in a ``data:image/jpeg;base64,...`` URL for the
+            request.
+
+    Returns:
+        The message content of the first choice in the model's response.
+    """
+    response = client.chat.completions.create(
+        model="gpt-4-vision-preview",
+        messages=[
+            {
+                "role": "system",
+                "content": """
+                You are a posture rater.
+                I send you a profile photo of a person and you tell me roughly how their posture is.
+                It's ok if you can't see the side view of the person.
+                """,
+            },
+            {
+                "role": "user",
+                "content": [
+                    {"type": "text", "text": "How is my posture?"},
+                    {
+                        "type": "image_url",
+                        # The Chat Completions API documents this part as an
+                        # object with a "url" key, not a bare string.
+                        "image_url": {
+                            "url": f"data:image/jpeg;base64,{base64_image}",
+                        },
+                    },
+                ],
+            }
+        ],
+        max_tokens=300,
+    )
+    return response.choices[0].message.content
+
+
+def summarize_analysis(analysis):
+    """Condense a free-text posture analysis into a JSON verdict.
+
+    Sends ``analysis`` to the chat model in JSON response mode and returns
+    the raw message content of the first choice. The prompt asks for the
+    keys "rating", "reason" and "conclusive".
+    """
+    system_message = {
+        "role": "system",
+        "content": """
+                You are a posture rater.
+                You received an analysis of someone's posture, and you have to summarize it with a numerical rating 1-10.
+                It's okay if you can't see the side view of the person, or if the analysis is inconclusive. You must give a 1-10 rating.
+
+                Respond in JSON, with a "rating": 1-10, "reason": "...", and "conclusive": true/false (whether or not the analysis was conclusive)
+                """,
+    }
+    user_message = {"role": "user", "content": analysis}
+
+    completion = client.chat.completions.create(
+        model="gpt-4-1106-preview",
+        response_format={"type": "json_object"},
+        messages=[system_message, user_message],
+        max_tokens=300,
+    )
+    first_choice = completion.choices[0]
+    return first_choice.message.content
+
+
+def _judge_once(image_path):
+    """Rate the frame at ``image_path`` once and play the matching audio clip."""
+    print("🧘 Judging posture...")
+
+    # getting the base64 encoding
+    try:
+        base64_image = encode_image(image_path)
+    except FileNotFoundError:
+        # The capture script may not have written its first frame yet.
+        print(f"No frame found at {image_path}; skipping this round.")
+        return
+
+    # analyze posture
+    analysis = analyze_posture(base64_image)
+
+    # summarize analysis
+    result = summarize_analysis(analysis)
+    try:
+        result_json = json.loads(result)
+    except (TypeError, json.JSONDecodeError):
+        # TypeError covers a response whose content is None.
+        print(f"Could not parse summary as JSON: {result!r}")
+        return
+
+    print(result_json)
+
+    rating = result_json.get('rating') if isinstance(result_json, dict) else None
+    if isinstance(rating, bool) or not isinstance(rating, (int, float)):
+        print("Summary has no numeric rating; skipping audio.")
+        return
+
+    # play appropriate audio file based on rating
+    if rating <= 5:
+        play_audio('./assets/stop_slouching.wav')
+    else:
+        play_audio('./assets/wonderful_posture.wav')
+
+
+def main():
+    """Repeatedly rate the most recent captured frame and play audio feedback.
+
+    Each cycle reads ``frames/frame.jpg`` under the current working
+    directory, has it analyzed and summarized into a JSON rating, then plays
+    the "stop slouching" clip for ratings of 5 or lower and the "wonderful
+    posture" clip otherwise. A cycle is skipped (instead of crashing the
+    loop) when the frame file is missing or the summary has no usable
+    numeric rating. Runs until the process is interrupted.
+    """
+    # path to your image
+    image_path = os.path.join(os.getcwd(), "frames", "frame.jpg")
+
+    while True:
+        _judge_once(image_path)
+
+        # wait for 5 seconds
+        time.sleep(5)
+
+# Start the judging loop only when this file is run as a script.
+if __name__ == "__main__":
+    main()
--- a/requirements.txt
+++ b/requirements.txt
@ -0,0 +1,19 @@
+annotated-types==0.6.0
+anyio==3.7.1
+certifi==2023.7.22
+charset-normalizer==3.3.2
+distro==1.8.0
+h11==0.14.0
+httpcore==1.0.1
+httpx==0.25.1
+idna==3.4
+numpy==1.26.1
+openai==1.1.1
+opencv-python==4.8.1.78
+pydantic==2.4.2
+pydantic_core==2.10.1
+requests==2.31.0
+simpleaudio==1.0.4
+sniffio==1.3.0
+tqdm==4.66.1
+typing_extensions==4.8.0
+urllib3==2.0.7