Detection of Head Nods using OpenCV in Python
import math

import cv2
import numpy as np

#video writer for the annotated output
fourcc = cv2.VideoWriter_fourcc(*'XVID')
out = cv2.VideoWriter('/home/sm/Desktop/nodcontrol.avi', fourcc, 20.0, (640, 480))

#distance function (only used by the commented-out debug print in the main loop)
def distance(x, y):
    return math.sqrt((x[0] - y[0])**2 + (x[1] - y[1])**2)
#capture source video (webcam at index 0)
cap = cv2.VideoCapture(0)

#params for Shi-Tomasi corner detection
feature_params = dict(maxCorners=100,
                      qualityLevel=0.3,
                      minDistance=7,
                      blockSize=7)

#params for Lucas-Kanade optical flow
lk_params = dict(winSize=(15, 15),
                 maxLevel=2,
                 criteria=(cv2.TERM_CRITERIA_EPS | cv2.TERM_CRITERIA_COUNT, 10, 0.03))

#path to face cascade
face_cascade = cv2.CascadeClassifier('haarcascade_frontalface_alt.xml')
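#Note: the path above assumes haarcascade_frontalface_alt.xml sits in the working
#directory. If it does not, the copy bundled with the opencv-python wheels can be
#used instead, e.g.:
#face_cascade = cv2.CascadeClassifier(cv2.data.haarcascades + 'haarcascade_frontalface_alt.xml')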
#function to get integer (x, y) coordinates from a tracked point array
def get_coords(p1):
    try:
        return int(p1[0][0][0]), int(p1[0][0][1])
    except (IndexError, TypeError):
        return int(p1[0][0]), int(p1[0][1])

#define font and text color
font = cv2.FONT_HERSHEY_SIMPLEX

#define movement thresholds
max_head_movement = 20
movement_threshold = 50
gesture_threshold = 175

#find the face in the image
face_found = False
frame_num = 0
while not face_found:
    #take a frame and look for a face in it
    frame_num += 1
    ret, frame = cap.read()
    frame_gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
    faces = face_cascade.detectMultiScale(frame_gray, 1.3, 5)
    for (x, y, w, h) in faces:
        cv2.rectangle(frame, (x, y), (x + w, y + h), (255, 0, 0), 2)
        face_found = True
    cv2.imshow('image', frame)
    out.write(frame)
    cv2.waitKey(1)

#seed the tracker with a single point inside the last detected face box
face_center = x + w / 2, y + h / 3
p0 = np.array([[face_center]], np.float32)
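#This point (roughly between the eyes) is tracked frame to frame with
#Lucas-Kanade optical flow. Horizontal and vertical displacement are accumulated;
#enough vertical movement is read as a nod ('Yes'), enough horizontal movement as
#a shake ('No').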
gesture = False
x_movement = 0
y_movement = 0
gesture_show = 60 #number of frames a gesture is shown

while True:
    ret, frame = cap.read()
    old_gray = frame_gray.copy()
    frame_gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)

    #track the point from the previous frame into the current one
    p1, st, err = cv2.calcOpticalFlowPyrLK(old_gray, frame_gray, p0, None, **lk_params)
    cv2.circle(frame, get_coords(p1), 4, (0, 0, 255), -1)
    cv2.circle(frame, get_coords(p0), 4, (255, 0, 0))

    #get the xy coordinates for points p0 and p1
    a, b = get_coords(p0), get_coords(p1)
    x_movement += abs(a[0] - b[0])
    y_movement += abs(a[1] - b[1])

    text = 'x_movement: ' + str(x_movement)
    if not gesture: cv2.putText(frame, text, (50, 50), font, 0.8, (0, 0, 255), 2)
    text = 'y_movement: ' + str(y_movement)
    if not gesture: cv2.putText(frame, text, (50, 100), font, 0.8, (0, 0, 255), 2)

    if x_movement > gesture_threshold:
        gesture = 'No'
    if y_movement > gesture_threshold:
        gesture = 'Yes'
    if gesture and gesture_show > 0:
        cv2.putText(frame, 'Gesture Detected: ' + gesture, (50, 50), font, 1.2, (0, 0, 255), 3)
        gesture_show -= 1
    if gesture_show == 0:
        gesture = False
        x_movement = 0
        y_movement = 0
        gesture_show = 60 #number of frames a gesture is shown

    #print(distance(get_coords(p0), get_coords(p1)))

    p0 = p1

    cv2.imshow('image', frame)
    out.write(frame)
    #press Esc to quit, so the cleanup below is actually reached
    if cv2.waitKey(1) & 0xFF == 27:
        break

cv2.destroyAllWindows()
cap.release()
out.release()
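To run the script as written, you need a webcam at index 0 and haarcascade_frontalface_alt.xml reachable from the working directory (or via the bundled path noted above). The annotated video is also written to the hard-coded path /home/sm/Desktop/nodcontrol.avi, which you will likely want to change for your own machine.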