first commit

2023-08-26 03:14:09 +08:00
commit d81021e2ee
6 changed files with 177 additions and 0 deletions
--- a/.gitignore
+++ b/.gitignore
@ -0,0 +1,2 @@
+# ignore folder env
+env/
--- a/main.py
+++ b/main.py
@ -0,0 +1,84 @@
+import cv2
+import mediapipe as mp
+import os
+import numpy as np
+
+# Create the assets directory if it doesn't exist
+if not os.path.exists('assets'):
+    os.makedirs('assets')
+
+# Load the pose detection model
+with mp.solutions.pose.Pose(min_detection_confidence=0.5, min_tracking_confidence=0.5) as pose:
+    # Get the index of the last saved pose dataset image
+    count = len([name for name in os.listdir('assets') if name.endswith('.jpg')])
+    # Capture frames from the webcam
+    cap = cv2.VideoCapture(0)
+    
+    # Load saved pose images and store their landmarks and filenames
+    saved_landmarks = []
+    saved_filenames = []
+    for i in range(count):
+        filename = f'assets/pose_{i}.jpg'
+        image = cv2.imread(filename)
+        if image is not None:
+            image_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+            results = pose.process(image_rgb)
+            if results.pose_landmarks:
+                landmarks = np.array([[landmark.x, landmark.y, landmark.z] for landmark in results.pose_landmarks.landmark])
+                saved_landmarks.append(landmarks)
+                saved_filenames.append(filename)
+
+    while True:
+        ret, frame = cap.read()
+        if not ret:
+            break
+        # Convert the image to RGB
+        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
+        # Process the image and find the landmarks
+        results = pose.process(image)
+        # Draw the landmarks on the image
+        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
+        mp.solutions.drawing_utils.draw_landmarks(image, results.pose_landmarks, mp.solutions.pose.POSE_CONNECTIONS)
+        
+        # Compare the pose with saved pose dataset images
+        highest_similarity = -1
+        most_similar_filename = ""
+        if results.pose_landmarks:
+            detected_landmarks = np.array([[landmark.x, landmark.y, landmark.z] for landmark in results.pose_landmarks.landmark])
+            
+            for i, saved_landmark in enumerate(saved_landmarks):
+                # Calculate cosine similarity between the landmarks
+                similarity = np.dot(detected_landmarks.flatten(), saved_landmark.flatten()) / (np.linalg.norm(detected_landmarks) * np.linalg.norm(saved_landmark))
+                
+                if similarity > highest_similarity:
+                    highest_similarity = similarity
+                    most_similar_filename = saved_filenames[i]
+        
+        # Calculate similarity percentage
+        similarity_percentage = round(highest_similarity * 100, 2)
+        
+        # Display the most similar filename and similarity percentage if similarity is above 96%
+        if similarity_percentage > 94.6:
+            text = f"Most Similar: {most_similar_filename} - Similarity: {similarity_percentage}%"
+            cv2.putText(image, text, (10, image.shape[0] - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0, 255, 0), 2)
+        
+        # Display the image
+        cv2.imshow('Pose Detection', image)
+
+        # Save the image if the 'q' key is pressed
+        if cv2.waitKey(1) & 0xFF == ord('q'):
+            filename = f'assets/pose_{count}.jpg'
+            # Check if the file already exists and increment the count if it does
+            while os.path.exists(filename):
+                count += 1
+                filename = f'assets/pose_{count}.jpg'
+            cv2.imwrite(filename, image)
+            print(f'Saved pose dataset image: {filename}')
+            count += 1
+        # Exit the loop if the 'ESC' key is pressed
+        if cv2.waitKey(1) == 27:
+            break
+
+    # Release the capture and destroy the window
+    cap.release()
+    cv2.destroyAllWindows()
--- a/main2.py
+++ b/main2.py
@ -0,0 +1,50 @@
+import cv2
+import mediapipe as mp
+import os
+import time
+
+# Create the assets directory if it doesn't exist
+if not os.path.exists('assets'):
+    os.makedirs('assets')
+
+# Get the index of the last saved pose dataset image
+count = len([name for name in os.listdir('assets') if name.endswith('.jpg')])
+
+with mp.solutions.pose.Pose(min_detection_confidence=0.5, min_tracking_confidence=0.5) as pose:
+    cap = cv2.VideoCapture(0)
+    start_time = time.time()
+    while True:
+        ret, frame = cap.read()
+        if not ret:
+            break
+        # Convert the image to RGB
+        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
+        # To improve performance, optionally mark the image as not writeable to pass by reference.
+        image.flags.writeable = False
+        # Process the image and find the landmarks
+        results = pose.process(image)
+        # Draw the landmarks on the image
+        image.flags.writeable = True
+        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
+        mp.solutions.drawing_utils.draw_landmarks(image, results.pose_landmarks, mp.solutions.pose.POSE_CONNECTIONS)
+        # Display the image in a window
+        cv2.imshow('Pose Detection', image)
+        # Save the image and close the window if 5 seconds have passed
+        if time.time() - start_time > 5:
+            filename = f'assets/pose_{count}.jpg'
+            # Check if the file already exists and increment the count if it does
+            while os.path.exists(filename):
+                count += 1
+                filename = f'assets/pose_{count}.jpg'
+            cv2.imwrite(filename, image)
+            print(f'Saved pose dataset image: {filename}')
+            count += 1
+            # Close the window
+            cv2.destroyAllWindows()
+            break
+        # Exit the loop if the 'ESC' key is pressed
+        if cv2.waitKey(1) == 27:
+            break
+    # Release the capture and destroy the window
+    cap.release()
+    cv2.destroyAllWindows()
--- a/requirements.txt
+++ b/requirements.txt
@ -0,0 +1,30 @@
+absl-py==1.4.0
+attrs==23.1.0
+blinker==1.6.2
+cffi==1.15.1
+click==8.1.7
+contourpy==1.1.0
+cycler==0.11.0
+Flask==2.3.3
+flatbuffers==23.5.26
+fonttools==4.42.1
+importlib-metadata==6.8.0
+importlib-resources==6.0.1
+itsdangerous==2.1.2
+Jinja2==3.1.2
+kiwisolver==1.4.5
+MarkupSafe==2.1.3
+matplotlib==3.7.2
+mediapipe==0.10.3
+numpy==1.25.2
+opencv-contrib-python==4.8.0.76
+packaging==23.1
+Pillow==10.0.0
+protobuf==3.20.3
+pycparser==2.21
+pyparsing==3.0.9
+python-dateutil==2.8.2
+six==1.16.0
+sounddevice==0.4.6
+Werkzeug==2.3.7
+zipp==3.16.2
--- a/runtime.txt
+++ b/runtime.txt
@ -0,0 +1 @@
+python-3.9.10
--- a/templates/index.html
+++ b/templates/index.html
@ -0,0 +1,10 @@
+<!DOCTYPE html>
+<html lang="en">
+  <head>
+    <title>Pose Detection</title>
+  </head>
+  <body>
+    <h1>Pose Detection</h1>
+    <img src="{{ url_for('video_feed') }}" width="640" height="480" alt="Pose detection video feed">
+  </body>
+</html>