dmateos · January 8, 2024 23:29
diff --git a/voice.py b/voice.py
 import cv2
 import os
 from PIL import Image
 from torchvision.models.detection import fasterrcnn_resnet50_fpn_v2, FasterRCNN_ResNet50_FPN_V2_Weights
 from torchvision.transforms.functional import pil_to_tensor

 cap = cv2.VideoCapture(0)
 cap.set(cv2.CAP_PROP_FRAME_WIDTH, 640)  # width
 cap.set(cv2.CAP_PROP_FRAME_HEIGHT, 480)  # height
 cap.set(cv2.CAP_PROP_FPS, 30)  # frame rate

 last_label = None

 while True:
    ret, frame = cap.read()
    if cv2.waitKey(1) & 0xFF == ord("q"):
        break
    else:
        pass

    img = Image.fromarray(frame)
    img = pil_to_tensor(img)

    weights = FasterRCNN_ResNet50_FPN_V2_Weights.DEFAULT
    model = fasterrcnn_resnet50_fpn_v2(weights=weights, box_score_thresh=0.8)
    model.eval()

    preprocess = weights.transforms()
    batch = [preprocess(img)]

    prediction = model(batch)[0]
    labels = [weights.meta["categories"][i] for i in prediction["labels"]]

    # check if none
    if len(labels) == 0:
        continue

    label = labels[prediction["scores"].argmax()]
    if label != last_label:
        os.system(f"say {label}")
        last_label = label
	import cv2
	import os
	from PIL import Image
	from torchvision.models.detection import fasterrcnn_resnet50_fpn_v2, FasterRCNN_ResNet50_FPN_V2_Weights
	from torchvision.transforms.functional import pil_to_tensor

	cap = cv2.VideoCapture(0)
	cap.set(cv2.CAP_PROP_FRAME_WIDTH, 640) # width
	cap.set(cv2.CAP_PROP_FRAME_HEIGHT, 480) # height
	cap.set(cv2.CAP_PROP_FPS, 30) # frame rate

	last_label = None

	while True:
	ret, frame = cap.read()
	if cv2.waitKey(1) & 0xFF == ord("q"):
	break
	else:
	pass

	img = Image.fromarray(frame)
	img = pil_to_tensor(img)

	weights = FasterRCNN_ResNet50_FPN_V2_Weights.DEFAULT
	model = fasterrcnn_resnet50_fpn_v2(weights=weights, box_score_thresh=0.8)
	model.eval()

	preprocess = weights.transforms()
	batch = [preprocess(img)]

	prediction = model(batch)[0]
	labels = [weights.meta["categories"][i] for i in prediction["labels"]]

	# check if none
	if len(labels) == 0:
	continue

	label = labels[prediction["scores"].argmax()]
	if label != last_label:
	os.system(f"say {label}")
	last_label = label