Jul 18, 2024
pip install opencv-contrib-python
pip install cvlib
pip install gtts
pip install playsound
pip3 install pyobjc
# Installing pyobjc lets playsound run more efficiently.
import cv2
import cvlib as cv
from cvlib.object_detection import draw_bbox
from gtts import gTTS
from playsound import playsound
# Open the capture device and run detection on each frame until 'q' is
# pressed or a frame can no longer be read.
video = cv2.VideoCapture(1)  # or use index 0 for default camera

# Labels detected in the most recent successfully processed frame. Starts
# empty so the sentence-building code below still works if no frame is read.
label = []

try:
    while True:
        ret, frame = video.read()  # Unpack each frame
        if not ret:
            # The read failed (camera missing or stream ended): stop rather
            # than hand an invalid frame to the detector.
            break
        bbox, label, conf = cv.detect_common_objects(frame)
        output_image = draw_bbox(frame, bbox, label, conf)
        cv2.imshow('Object Detection', output_image)
        # Mask to the low byte so the key comparison works across platforms.
        if cv2.waitKey(1) & 0xFF == ord('q'):
            break
finally:
    # Always give the camera back and close the preview window, even if
    # detection raised.
    video.release()
    cv2.destroyAllWindows()

# NOTE(review): the sentence is built from the detections of the last
# processed frame only, which is how the statements read in order; confirm
# that accumulating labels across all frames was not intended.

# Unique labels in first-seen order (dicts preserve insertion order).
labels = list(dict.fromkeys(label))

# The first label gets the "I found a ..." lead-in; the rest are appended
# verbatim. A distinct loop name avoids clobbering the `label` list above.
new_sentence = [
    f'I found a {name},' if i == 0 else name
    for i, name in enumerate(labels)
]
sentence = ' '.join(new_sentence)
def speech(text):
    """Print ``text`` and play it back as synthesized speech.

    The audio is generated with gTTS (English, normal speed), saved to
    ``sounds/output.mp3`` and then played with playsound.

    Args:
        text: The sentence to announce. Empty or whitespace-only text is
            printed but not synthesized, since there is nothing to speak.

    Returns:
        None.
    """
    import os  # local import so this function does not rely on file-level edits

    print(text)
    if not text or not text.strip():
        # Nothing was detected; skip synthesis instead of failing in gTTS.
        return

    language = 'en'
    audio_path = 'sounds/output.mp3'
    # Saving fails with FileNotFoundError if the target directory is missing.
    os.makedirs(os.path.dirname(audio_path), exist_ok=True)
    output = gTTS(text=text, lang=language, slow=False)
    output.save(audio_path)
    playsound(audio_path)
# Announce the sentence assembled above: it is printed, then spoken aloud.
speech(sentence)