detect_numbers_webcam.py

#############################################
# Universidad Tecnica Particular de Loja    #
#############################################
# Professor:                                #
# Rodrigo Barba        lrbarba@utpl.edu.ec  #
#############################################
# Students:                                 #
# Marcelo Bravo        mdbravo4@utpl.edu.ec #
# Galo Celly           gscelly@utpl.edu.ec  #
# Nicholas Earley      nearley@utpl.edu.ec  #
#############################################
# python detect_numbers_webcam.py --model models/svm.cpickle

# import the necessary packages
from pyimagesearch.hog import HOG
from pyimagesearch import dataset
from pyimagesearch import imutils
import argparse
import cPickle
import mahotas
import cv2
#import os
#uncomment for use audio
import mask as msk
import numpy as np


# construct the argument parse and parse the arguments
ap = argparse.ArgumentParser()
ap.add_argument("-m", "--model", required = True,
	help = "path to where the model will be stored")
ap.add_argument("-v", "--video",
    help = "path to the video file")
ap.add_argument("-i", "--image",
                help = "path to the video file")
args = vars(ap.parse_args())

# call web cam
if not args.get("video", False):
    camera= cv2.VideoCapture(0)


while True:
    

    (grabbed, frame) = camera.read()
    if args.get("video") and not grabbed:
        break
    
    # take a picture (press 'q')
    frame = imutils.resize(frame, width = 500)
    frameClone = frame.copy()
    mask = np.zeros(frame.shape[:2], dtype = "uint8")
    (cX, cY) = (frame.shape[1] / 2, frame.shape[0] / 2)
    cv2.rectangle(frameClone,(cX - 134, cY - 74), (cX + 102 , cY - 40), (0,0,255), 1)
    cv2.imshow("Toma 1", frameClone)
    cv2.imwrite("images/newimage.png", frame)

    if cv2.waitKey(1) == ord("q"):
        break
#load the model
model = open(args["model"]).read()
model = cPickle.loads(model)

# initialize the HOG descriptor
hog = HOG(orientations = 18, pixelsPerCell = (9,9 ),
          cellsPerBlock = (1, 1), normalize = True)

#load the image captured
image = cv2.imread("images/newimage.png")

# apply filters (Added, subtracted,bitwise Or)
M = np.ones(image.shape, dtype = "uint8") * 10
added = cv2.add(image, M)
M = np.ones(image.shape, dtype = "uint8") * 20
subtracted = cv2.subtract(image, M)
cv2.imshow("Subtracted", subtracted)
gray = cv2.cvtColor(subtracted, cv2.COLOR_BGR2GRAY)

bitwise_Or = cv2.bitwise_not(added,subtracted)
cv2.imshow("not", bitwise_Or)

# Convert image to gray scale
gray=cv2.cvtColor(bitwise_Or, cv2.COLOR_BGR2GRAY)

# location you recognize (using a mask)
mask = np.zeros(bitwise_Or.shape[:2], dtype = "uint8")
(cX, cY) = (gray.shape[1] / 2, gray.shape[0] / 2)
cv2.rectangle(mask, (cX - 134, cY - 74), (cX + 102 , cY - 40), 255, 1)
masked = cv2.bitwise_and(gray, gray, mask = mask)
cv2.imshow("Mask Applied to Image", masked)

# blur the image, find edges, and then find contours along
# the edged regions
blurred = cv2.GaussianBlur(masked, (5, 5), 0)
edged = cv2.Canny(blurred, 30, 150)
(cnts, _) = cv2.findContours(edged.copy(), cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)

# sort the contours by their x-axis position, ensuring
# that we read the numbers from left to right
cnts = sorted([(c, cv2.boundingRect(c)[0]) for c in cnts], key = lambda x: x[1])

numeros=[]

# loop over the contours
for (c, _) in cnts:
    # compute the bounding box for the rectangle
    (x, y, w, h) = cv2.boundingRect(c)

    # if the width is at least 7 pixels and the height
    # is at least 20 pixels, the contour is likely a digit
    if w >= 7 and h >= 28:
        
        # crop the ROI and then threshold the grayscale
        # ROI to reveal the digit
        # apply filer
        roi = gray[y:y + h, x:x + w]
        thresh = roi.copy()
        T = mahotas.thresholding.otsu(roi)
        thresh[thresh > T] = 255
        thresh = cv2.bitwise_not(thresh)
        
        # deskew the image center its extent
        thresh = dataset.deskew(thresh, 20)
        thresh = dataset.center_extent(thresh, (20, 20))
                
        cv2.imshow("thresh", thresh)
        
        # extract features from the image and classify it
        hist = hog.describe(thresh)
        digit = model.predict(hist)[0]
        print "Creo que el numero es: %d" % (digit)
        numeros.append(digit)
        
        # draw a rectangle around the digit, the show what the
        # digit was classified as
        cv2.rectangle(image, (x, y), (x + w, y + h), 255, 1)
        cv2.putText(image, str(digit), (x - 5, y - 5),
            cv2.FONT_HERSHEY_SIMPLEX, 1, (0, 0, 255), 2)
        cv2.imshow("image", image)
        # prees a key to continue
        cv2.waitKey(0)

print numeros

# call web cam

if not args.get("video", False):
    camera= cv2.VideoCapture(0)


while True:
    
    
    (grabbed, frame) = camera.read()
    if args.get("video") and not grabbed:
        break
    # take a picture (press 'q')
    frame = imutils.resize(frame, width = 500)
    frameClone = frame.copy()
    mask = np.zeros(frame.shape[:2], dtype = "uint8")
    (cX, cY) = (frame.shape[1] / 2, frame.shape[0] / 2)
    cv2.rectangle(frameClone,(cX - 100, cY - 100), (cX + 100 , cY - 0), (0,0,255), 1)
    cv2.imshow("Toma 2", frameClone)
    cv2.imwrite("images/newimage2.png", frame)

    if cv2.waitKey(1) == ord("q"):
        break

# Load the model
model = open(args["model"]).read()
model = cPickle.loads(model)

# initialize the HOG descriptor
hog = HOG(orientations = 18, pixelsPerCell = (10, 10),
          cellsPerBlock = (1, 1), normalize = True)

#load the image captured
image = cv2.imread("images/newimage2.png")

# apply filters (Added, subtracted,bitwise Or)
M = np.ones(image.shape, dtype = "uint8") * 10
added = cv2.add(image, M)
M = np.ones(image.shape, dtype = "uint8") * 20
subtracted = cv2.subtract(image, M)
cv2.imshow("Subtracted", subtracted)
gray = cv2.cvtColor(subtracted, cv2.COLOR_BGR2GRAY)

bitwise_Or2 = image

# Convert image to gray scale
gray2=cv2.cvtColor(bitwise_Or2, cv2.COLOR_BGR2GRAY)

# location you recognize (using a mask)
mask = np.zeros(bitwise_Or2.shape[:2], dtype = "uint8")
(cX, cY) = (gray2.shape[1] / 2, gray2.shape[0] / 2)
cv2.rectangle(mask, (cX - 100, cY - 100), (cX + 100 , cY - 0), 255, -1)
masked = cv2.bitwise_and(gray2, gray2, mask = mask)
cv2.imshow("Mask Applied to Image", masked)

# blur the image, find edges, and then find contours along
# the edged regions
blurred = cv2.GaussianBlur(masked, (5, 5), 0)
edged = cv2.Canny(blurred, 30, 150)
(cnts, _) = cv2.findContours(edged.copy(), cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)

# sort the contours by their x-axis position, ensuring
# that we read the numbers from left to right
cnts = sorted([(c, cv2.boundingRect(c)[0]) for c in cnts], key = lambda x: x[1])

numeros2=[]

# loop over the contours
for (c, _) in cnts:
    # compute the bounding box for the rectangle
    (x, y, w, h) = cv2.boundingRect(c)
    
    # if the width is at least 7 pixels and the height
    # is at least 20 pixels, the contour is likely a digit
    if w >= 7 and h >= 28:
        
        # crop the ROI and then threshold the grayscale
        # ROI to reveal the digit
        # apply filer
        roi = gray2[y:y + h, x:x + w]
        thresh = roi.copy()
        T = mahotas.thresholding.otsu(roi)
        thresh[thresh > T] = 255
        thresh = cv2.bitwise_not(thresh)
        
        # deskew the image center its extent
        thresh = dataset.deskew(thresh, 20)
        thresh = dataset.center_extent(thresh, (20, 20))
        
        cv2.imshow("thresh", thresh)
        
        # extract features from the image and classify it
        hist = hog.describe(thresh)
        digit = model.predict(hist)[0]
        print "Creo que el numero es: %d" % (digit)
        numeros2.append(digit)
        
        # draw a rectangle around the digit, the show what the
        # digit was classified as
        cv2.rectangle(image, (x, y), (x + w, y + h), (0, 0, 255), 1)
        cv2.putText(image, str(digit), (x - 5, y - 5),
            cv2.FONT_HERSHEY_SIMPLEX, 1, (0, 0, 255), 2)
        cv2.imshow("image", image)
        #uncommetn for use audio
        #os.system ("say Match")
        # prees a key to continue
        cv2.waitKey(0)

print numeros2


#To use sounds
#Audio (Just for OSX)
#os.system ("say Coincide")
#
#Audio (Other Systems)
#os.system("../sound/si.wav")