Update pages/Camera.py
pages/Camera.py  CHANGED  (+29 -29)
@@ -9,7 +9,6 @@ from streamlit_webrtc import WebRtcMode, webrtc_streamer, RTCConfiguration
 
 from utils import SLInference
 
-
 logger = logging.getLogger(__name__)
 
 RTC_CONFIGURATION = RTCConfiguration({
@@ -17,9 +16,7 @@ RTC_CONFIGURATION = RTCConfiguration({
 })
 
 def main():
-    """
-    Main function of the app.
-    """
+    # Model configuration
     config = {
         "path_to_model": "S3D.onnx",
         "threshold": 0.3,
@@ -29,37 +26,35 @@ def main():
         "provider": "OpenVINOExecutionProvider"
     }
 
-    #
+    # Temporary config file
     with tempfile.NamedTemporaryFile(delete=False, mode='w', suffix='.json') as config_file:
         json.dump(config, config_file)
         config_file_path = config_file.name
 
+    # Start inference
     inference_thread = SLInference(config_file_path)
     inference_thread.start()
 
+    # --- Camera header in the brand style ---
+    st.markdown("""
+        <div class="upload-section">
+            <h3>📷 Live Camera Recognition</h3>
+            <p>Enable your webcam and see real-time gesture detection powered by AI.</p>
+        </div>
+    """, unsafe_allow_html=True)
+
+    # Start WebRTC
     webrtc_ctx = webrtc_streamer(
-        key="
+        key="gesture-stream",
         mode=WebRtcMode.SENDONLY,
         rtc_configuration=RTC_CONFIGURATION,
         media_stream_constraints={"video": True, "audio": False},
     )
 
     gestures_deque = deque(maxlen=5)
-
-    # Set up Streamlit interface
-    st.title("Sign Language Recognition Demo")
     image_place = st.empty()
     text_output = st.empty()
-
-    st.markdown(
-        """
-        This application is designed to recognize sign language using a webcam feed.
-        The model has been trained to recognize various sign language gestures and display the corresponding text in real-time.
-
-
-        The project is open for collaboration. If you have any suggestions or want to contribute, please feel free to reach out.
-        """
-    )
+    last_5_output = st.empty()
 
     while True:
         if webrtc_ctx.video_receiver:
@@ -70,22 +65,27 @@ def main():
                 continue
 
             img_rgb = video_frame.to_ndarray(format="rgb24")
-            image_place.image(img_rgb)
-            inference_thread.input_queue.append(video_frame.reformat(224, 224).to_ndarray(format="rgb24"))
+            image_place.image(img_rgb, caption="📸 Live Feed", use_column_width=True)
 
+            # Frame inference
+            inference_thread.input_queue.append(video_frame.reformat(224, 224).to_ndarray(format="rgb24"))
             gesture = inference_thread.pred
+
             if gesture not in ['no', '']:
-                if not gestures_deque:
-                    gestures_deque.append(gesture)
-                elif gesture != gestures_deque[-1]:
+                if not gestures_deque or gesture != gestures_deque[-1]:
                     gestures_deque.append(gesture)
 
-
-
-
-
-
+            # Display the output
+            text_output.markdown(
+                f'<div class="section"><p style="font-size:22px">🖐️ Current gesture: <b>{gesture}</b></p></div>',
+                unsafe_allow_html=True
+            )
+            last_5_output.markdown(
+                f'<div class="section"><p style="font-size:18px">🧠 Last 5 gestures: <span style="color:#6a1b9a;">{" | ".join(gestures_deque)}</span></p></div>',
+                unsafe_allow_html=True
+            )
 
 if __name__ == "__main__":
     main()
 
+
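
Note: utils.SLInference is not part of this diff. For orientation, here is a minimal sketch of the interface the page relies on (start(), input_queue, pred); every internal detail below is a hypothetical stand-in, not the Space's actual implementation:

# Hypothetical sketch of the SLInference interface assumed by pages/Camera.py.
# Only the members used above are mirrored; the ONNX call is a placeholder.
import json
import threading
import time
from collections import deque

class SLInference(threading.Thread):
    def __init__(self, config_path: str):
        super().__init__(daemon=True)
        with open(config_path) as f:
            self.config = json.load(f)       # reads the temp JSON config
        self.input_queue = deque(maxlen=32)  # frames pushed by the UI loop (maxlen is a guess)
        self.pred = ""                       # latest gesture label, polled by the UI

    def run(self):
        while True:
            if self.input_queue:
                frame = self.input_queue.popleft()
                self.pred = self._infer(frame)  # S3D.onnx inference would go here
            else:
                time.sleep(0.01)                # avoid a busy-wait

    def _infer(self, frame) -> str:
        return ""  # placeholder; the real class runs the ONNX model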
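Because the temp file is created with delete=False, the JSON config stays on disk for the life of the Space. If SLInference parses the file eagerly in its constructor (an assumption, consistent with the sketch above), it could be removed right after the thread starts:

# Possible cleanup, assuming SLInference loads the config in __init__:
import os

inference_thread = SLInference(config_file_path)
inference_thread.start()
os.unlink(config_file_path)  # config already parsed; drop the temp file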
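The frame-fetch lines between the last two hunks are elided from the diff. They very likely follow the stock streamlit-webrtc SENDONLY polling pattern; a sketch of that context inside main(), assuming the library's standard video_receiver API:

# Sketch of the elided frame fetch (runs after webrtc_streamer() above):
import queue

while True:
    if webrtc_ctx.video_receiver:
        try:
            # block up to 1 s waiting for the next frame from the browser
            video_frame = webrtc_ctx.video_receiver.get_frame(timeout=1)
        except queue.Empty:
            logger.warning("Queue is empty. Abort.")
            continue
        # ...frame handling continues as shown in the diff above...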