Spaces:

ake178178
/

beyoureyes

Runtime error

App Files Files Community

ake178178 commited on Sep 18

Commit

d2b41a1

•

1 Parent(s): 928afff

Update app.py

Browse files

Files changed (1) hide show

app.py +39 -33

app.py CHANGED Viewed

@@ -6,6 +6,9 @@ from gtts import gTTS
 import os
 import time
 # 加载 Hugging Face 模型
 @st.cache_resource
 def load_model():
@@ -25,42 +28,45 @@ run = st.button('打开摄像头并开始识别')
 if run:
     st.text("正在打开摄像头，请稍等...")
     camera = cv2.VideoCapture(0)
-    while True:
-        ret, frame = camera.read()
-        if not ret:
-            st.error("无法读取摄像头")
-            break
-        # 显示摄像头画面
-        st.image(frame, channels="BGR")
-        # 每10秒进行一次拍照
-        time.sleep(10)
-        # 保存照片
-        img_path = "captured_image.jpg"
-        cv2.imwrite(img_path, frame)
-        # 读取图像并转换为模型输入
-        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
-        inputs = processor(images=image, return_tensors="pt")
-        # 进行物体识别
-        with torch.no_grad():
-            outputs = model(**inputs)
-            logits = outputs.logits
-            predicted_label = torch.argmax(logits, dim=1).item()
-        # 获取识别到的物体标签
-        label = model.config.id2label[predicted_label]
-        st.write(f"识别到的物体: {label}")
-        # 将标签转化为语音
-        tts = gTTS(text=f"The object detected is {label}", lang='en')
-        tts.save("output.mp3")
-        os.system("mpg321 output.mp3")  # 播放语音
-    # 释放摄像头
-    camera.release()

 import os
 import time
+# 提示用户手动检查权限
+st.warning("请确保已允许应用访问您的摄像头。对于 Windows 用户，请检查 [设置 -> 隐私 -> 摄像头]。对于 macOS/iOS 用户，请检查 [系统偏好设置 -> 安全性与隐私 -> 摄像头]。")
 # 加载 Hugging Face 模型
 @st.cache_resource
 def load_model():
 if run:
     st.text("正在打开摄像头，请稍等...")
     camera = cv2.VideoCapture(0)
+    # 检查摄像头是否成功打开
+    if not camera.isOpened():
+        st.error("无法打开摄像头，请检查摄像头权限设置")
+    else:
+        while True:
+            ret, frame = camera.read()
+            if not ret:
+                st.error("无法读取摄像头画面")
+                break
+            # 显示摄像头画面
+            st.image(frame, channels="BGR")
+            # 每10秒进行一次拍照
+            time.sleep(10)
+            # 保存照片
+            img_path = "captured_image.jpg"
+            cv2.imwrite(img_path, frame)
+            # 读取图像并转换为模型输入
+            image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
+            inputs = processor(images=image, return_tensors="pt")
+            # 进行物体识别
+            with torch.no_grad():
+                outputs = model(**inputs)
+                logits = outputs.logits
+                predicted_label = torch.argmax(logits, dim=1).item()
+            # 获取识别到的物体标签
+            label = model.config.id2label[predicted_label]
+            st.write(f"识别到的物体: {label}")
+            # 将标签转化为语音
+            tts = gTTS(text=f"The object detected is {label}", lang='en')
+            tts.save("output.mp3")
+            os.system("mpg321 output.mp3")  # 播放语音
+        # 释放摄像头
+        camera.release()