Pratyush101 committed
Commit e11ad06 · verified · 1 Parent(s): 6b85062

Update app.py

Reverted the code to the previous version, i.e. hand detection only.
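For context, here is a minimal, self-contained sketch of the detection-only callback this commit restores. The names `detector` and `result_queue` mirror app.py; the `HandDetector` settings, the `queue.Queue` result channel, and the `webrtc_streamer(..., video_frame_callback=...)` wiring are illustrative assumptions, not necessarily the app's exact configuration.

import queue

import av
import cv2
from cvzone.HandTrackingModule import HandDetector
from streamlit_webrtc import webrtc_streamer

detector = HandDetector(maxHands=2)   # assumed settings; app.py may configure this differently
result_queue = queue.Queue()          # drained by the Streamlit side to display detections

def video_frame_callback(frame: av.VideoFrame) -> av.VideoFrame:
    # Decode the incoming WebRTC frame to a BGR image
    img = frame.to_ndarray(format="bgr24")
    # cvzone detects hands and draws its landmarks onto img
    hands, img = detector.findHands(img, flipType=False)
    if hands:
        # Outline the first detected hand with its bounding box
        x, y, w, h = hands[0]["bbox"]
        cv2.rectangle(img, (x, y), (x + w, y + h), (255, 0, 0), 2)
    result_queue.put(hands)
    # Return the annotated frame so streamlit-webrtc can render it
    return av.VideoFrame.from_ndarray(img, format="bgr24")

webrtc_streamer(key="virtual-keyboard", video_frame_callback=video_frame_callback)

The queue is used because the callback runs on a worker thread, so handing results to the Streamlit script through a thread-safe queue is generally safer than writing to st.session_state from inside the callback.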

Files changed (1)
  1. app.py +60 -40
app.py CHANGED
@@ -248,51 +248,71 @@ output_text = ""
 if "output_text" not in st.session_state:
     st.session_state["output_text"] = ""
 
-def video_frame_callback(frame: av.VideoFrame) -> av.VideoFrame:
-    global indexImg, output_text
-
+
+def video_frame_callback(frame: av.VideoFrame) -> av.VideoFrame:
     img = frame.to_ndarray(format="bgr24")
-    imgOut = segmentor.removeBG(img, imgList[indexImg])
-    hands, imgOut = detector.findHands(imgOut, flipType=False)
-
-    buttonList = [Button([30 + col * 105, 30 + row * 120], key) for row, line in enumerate(keys) for col, key in enumerate(line)]
-
-    detections = []
+    hands, img = detector.findHands(img, flipType=False)
+
+    # Render hand detection results
+
     if hands:
-        for i, hand in enumerate(hands):
-            lmList = hand['lmList']
-            bbox = hand['bbox']
-            label = "Hand"
-            score = hand['score']
-            box = np.array([bbox[0], bbox[1], bbox[0] + bbox[2], bbox[1] + bbox[3]])
-            detections.append(Detection(label=label, score=score, box=box))
-
-            if lmList:
-                x4, y4 = lmList[4][0], lmList[4][1]
-                x8, y8 = lmList[8][0], lmList[8][1]
-                distance = np.sqrt((x8 - x4) ** 2 + (y8 - y4) ** 2)
-                click_threshold = 10
-
-                for button in buttonList:
-                    x, y = button.pos
-                    w, h = button.size
-                    if x < x8 < x + w and y < y8 < y + h:
-                        cv2.rectangle(imgOut, button.pos, (x + w, y + h), (0, 255, 160), -1)
-                        cv2.putText(imgOut, button.text, (x + 20, y + 70), cv2.FONT_HERSHEY_PLAIN, 5, (255, 255, 255), 3)
-
-                        if (distance / np.sqrt(bbox[2] ** 2 + bbox[3] ** 2)) * 100 < click_threshold:
-                            if time.time() - prev_key_time[i] > 2:
-                                prev_key_time[i] = time.time()
-                                if button.text != 'BS' and button.text != 'SPACE':
-                                    output_text += button.text
-                                elif button.text == 'BS':
-                                    output_text = output_text[:-1]
-                                else:
-                                    output_text += ' '
-
-    result_queue.put(detections)
-    st.session_state["output_text"] = output_text
-    return av.VideoFrame.from_ndarray(imgOut, format="bgr24")
+        hand = hands[0]
+        bbox = hand["bbox"]
+        cv2.rectangle(img, (bbox[0], bbox[1]), (bbox[0] + bbox[2], bbox[1] + bbox[3]), (255, 0, 0), 2)
+
+        cv2.putText(img, 'OpenCV', (50, 50), cv2.FONT_HERSHEY_SIMPLEX, 2, (255, 255, 255), 1, cv2.LINE_AA)
+
+    result_queue.put(hands)
+    # The callback must hand the processed frame back to streamlit-webrtc
+    return av.VideoFrame.from_ndarray(img, format="bgr24")
+
+# def video_frame_callback(frame: av.VideoFrame) -> av.VideoFrame:
+#     global indexImg, output_text
+#
+#     img = frame.to_ndarray(format="bgr24")
+#     imgOut = segmentor.removeBG(img, imgList[indexImg])
+#     hands, imgOut = detector.findHands(imgOut, flipType=False)
+#
+#     buttonList = [Button([30 + col * 105, 30 + row * 120], key) for row, line in enumerate(keys) for col, key in enumerate(line)]
+#
+#     detections = []
+#     if hands:
+#         for i, hand in enumerate(hands):
+#             lmList = hand['lmList']
+#             bbox = hand['bbox']
+#             label = "Hand"
+#             score = hand['score']
+#             box = np.array([bbox[0], bbox[1], bbox[0] + bbox[2], bbox[1] + bbox[3]])
+#             detections.append(Detection(label=label, score=score, box=box))
+#
+#             if lmList:
+#                 x4, y4 = lmList[4][0], lmList[4][1]
+#                 x8, y8 = lmList[8][0], lmList[8][1]
+#                 distance = np.sqrt((x8 - x4) ** 2 + (y8 - y4) ** 2)
+#                 click_threshold = 10
+#
+#                 for button in buttonList:
+#                     x, y = button.pos
+#                     w, h = button.size
+#                     if x < x8 < x + w and y < y8 < y + h:
+#                         cv2.rectangle(imgOut, button.pos, (x + w, y + h), (0, 255, 160), -1)
+#                         cv2.putText(imgOut, button.text, (x + 20, y + 70), cv2.FONT_HERSHEY_PLAIN, 5, (255, 255, 255), 3)
+#
+#                         if (distance / np.sqrt(bbox[2] ** 2 + bbox[3] ** 2)) * 100 < click_threshold:
+#                             if time.time() - prev_key_time[i] > 2:
+#                                 prev_key_time[i] = time.time()
+#                                 if button.text != 'BS' and button.text != 'SPACE':
+#                                     output_text += button.text
+#                                 elif button.text == 'BS':
+#                                     output_text = output_text[:-1]
+#                                 else:
+#                                     output_text += ' '
+#
+#     result_queue.put(detections)
+#     st.session_state["output_text"] = output_text
+#     return av.VideoFrame.from_ndarray(imgOut, format="bgr24")
+
+
 
 webrtc_streamer(
     key="virtual-keyboard",