smeschke · April 16, 2023 23:11
diff --git a/deep_cat.py b/deep_cat.py
 from mrcnn.config import Config
 from mrcnn import model as modellib
 from mrcnn import visualize
 import cv2, os, numpy as np

 # Make Model: https://github.com/matterport/Mask_RCNN/blob/master/samples/demo.ipynb
 class Config(Config):
 	NAME = "deep_segment"
 	GPU_COUNT = 1
 	IMAGES_PER_GPU = 1
 	NUM_CLASSES = 81
 config = Config()
 model = modellib.MaskRCNN(mode="inference", model_dir=os.getcwd(), config=config)
 model.load_weights('mask_rcnn_coco.h5', by_name=True) # https://github.com/matterport/Mask_RCNN/releases

 img_path = '/home/stephen/Desktop/6.jpg'
 img = cv2.imread(img_path)
 src = img.copy()
 img_rgb = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
 h,w, _ = img.shape
 dl_size = 512
 dl_scale = w/dl_size

 # Function to get mask from MRCNN
 def get_deep_mask(img):
        img_dl_size = cv2.resize(img, (dl_size, int(h/dl_scale)))
        # Use DL to get a mask
        deep_mask = np.zeros_like(img_dl_size)
        results = model.detect([img_dl_size], verbose=1)
        r = results[0]
        mask = r["masks"][:, :, 0]        
        for i in range(0, len(r["scores"])):
                # Get the mask for this object
                mask = r["masks"][:,:,i]
                # Get the bounding box for this object
                roi = r["rois"][i]
                # If the object has a cat
                if r["class_ids"][i] == 16:
                        #Line 72 - https://github.com/matterport/Mask_RCNN/blob/master/mrcnn/visualize.py
                        deep_mask = visualize.apply_mask(deep_mask, mask, (255,255,255), alpha=.1)
                        # Stop after only one cat
                        break
        # Make things black and white
        _, deep_mask = cv2.threshold(deep_mask, 12, 255, cv2.THRESH_BINARY)
        return deep_mask, roi

 # Get the mask and roi from the image
 deep_mask, (y1,x1,y2,x2) = get_deep_mask(img_rgb)
 # Scale ROI values to the source image size
 y1,x1,y2,x2 = np.array((y1*dl_scale,x1*dl_scale,y2*dl_scale,x2*dl_scale), int)
 print("ROI VALUES: ", y1,x1,y2,x2)
 # Add a buffer of 50 px
 buffer = 150
 if y1-buffer >= 0: y1-= buffer
 else: y1 = 0
 if y2+buffer <= h: y2+= buffer
 else: y2 = h
 if x1-buffer >= 0: x1-=buffer
 else: x1 = 0
 if x2+buffer <= w: x2+=buffer
 else: x2 = w
 # Crop out the relevant part of the image
 img = img[y1:y2, x1:x2]
 img_rgb = img_rgb[y1:y2, x1:x2]
 h,w,_ = img.shape
 # Get the mask again, this time using only the roi
 deep_mask, (y1,x1,y2,x2) = get_deep_mask(img_rgb)

 print("APPLYING GRABCUT...............")
 deep_mask = cv2.cvtColor(deep_mask, cv2.COLOR_BGR2GRAY)
 deep_mask = cv2.resize(deep_mask, (w,h))
 mask = np.zeros(img.shape[:2],np.uint8)
 white_background = (255 - mask.copy())

 # Initialize parameters for the GrabCut algorithm
 bgdModel = np.zeros((1,65),np.float64)
 fgdModel = np.zeros((1,65),np.float64)
 iters, size = 4, int(h*w/124321)
 print("Using a kernel size of: ", size)
 kernel = np.ones((size,size),np.uint8)
 big_kernel = np.ones((2*size,2*size),np.uint8)
 huge_kernel = np.ones((4*size,4*size),np.uint8)
 # Dilate the mask to make sure the whole object is covered by the mask
 dilation = cv2.dilate(deep_mask, big_kernel, iterations = iters)
 # Start with a white background and subtract 
 sure_background = white_background - dilation

 # Erode to find the sure foreground
 sure_foreground = cv2.erode(deep_mask, kernel, iterations = iters)

 # Change the values on the mask so that:
 #    2 - unsure pixels
 #    1 - sure foreground pixels
 #    0 - sure background pixels
 mask[:] = 2
 mask[sure_background == 255] = 0
 mask[sure_foreground == 255] = 1

 # Apply GrabCut
 out_mask = mask.copy()
 out_mask, _, _ = cv2.grabCut(img,out_mask,None,bgdModel,fgdModel,4,cv2.GC_INIT_WITH_MASK)
 out_mask = np.where((out_mask==2)|(out_mask==0),0,1).astype('uint8')
 # Open the mask to fill in the holes
 out_img = img*out_mask[:,:,np.newaxis]

 # Plot with Matplotlib
 import matplotlib.pyplot as plt
 import matplotlib.image as mpimg

 # Create image that shows foreground and background
 def create_labeled_image(src_image, foreground, background):
        for i in range(4):
                bg = np.zeros_like(img)
                bg[background == 0] = (255,255,255)
                bg = cv2.cvtColor(bg, cv2.COLOR_BGR2GRAY)
                _,thresh = cv2.threshold(bg,1,255,cv2.THRESH_BINARY)
                contours,hierarchy = cv2.findContours(thresh,cv2.RETR_EXTERNAL,cv2.CHAIN_APPROX_SIMPLE)
                src_image=cv2.drawContours(src_image, contours, -1, (0,255,255), 5-i)
                background = cv2.erode(background, huge_kernel, iterations = 1)
        for i in range(4):
                bg = np.zeros_like(img)
                bg[:,:,:] = 255,255,255
                bg[foreground == 0] = (0,0,0)
                bg = cv2.cvtColor(bg, cv2.COLOR_BGR2GRAY)
                _,thresh = cv2.threshold(bg,1,255,cv2.THRESH_BINARY)
                contours,hierarchy = cv2.findContours(thresh,cv2.RETR_EXTERNAL,cv2.CHAIN_APPROX_SIMPLE)
                src_image=cv2.drawContours(src_image, contours, -1, (255,255,0), 5-i)
                foreground = cv2.erode(foreground, huge_kernel, iterations = 1)
        return src_image


 # Create a multi plot
 f, axarr = plt.subplots(2,3, sharex=True)
 # Show source image in the top left
 src_h, src_w, _ = src.shape
 scale_w = int(w/3)
 scale_h = int(scale_w * (src_h/src_w))
 src = cv2.resize(src, (scale_w, scale_h))
 comp_image = img.copy()
 comp_image[:scale_h,:scale_w] = src
 axarr[0,0].imshow(comp_image)
 # Show deep mask in the top middle
 axarr[0,1].imshow(deep_mask)
 # Show deep mask of source image in the top right
 deep_mask_of_source = img.copy()
 deep_mask_of_source[deep_mask == 0] = 0,0,0
 axarr[0,2].imshow(deep_mask_of_source)
 # Show the sure foreground and the sure background in the bottom left
 labeled_image = create_labeled_image(img, sure_foreground, sure_background)
 axarr[1,0].imshow(labeled_image)
 # Show the GrabCut mask in the bottom middle
 axarr[1,1].imshow(out_mask)
 # Show the GrabCut image in the bottom right
 axarr[1,2].imshow(out_img)

 # Add titles
 text = 'Source Image: '+str(src_w)+'x'+str(src_h)+' px'+' and ROI: '+str(w)+'x'+str(h)+' px'
 axarr[0,0].set_title(text)
 axarr[0,1].set_title('Mask from DL')
 axarr[0,2].set_title('DL Mask Image: 512x512 px')
 axarr[1,0].set_title('Sure Foreground and Sure Background')
 axarr[1,1].set_title('GrabCut Mask')
 axarr[1,2].set_title('GrabCut Mask Image')
 # Clean up and show
 axarr[0,0].axis('off')
 axarr[0,1].axis('off')
 axarr[1,0].axis('off')
 axarr[1,1].axis('off')
 axarr[1,2].axis('off')
 axarr[0,2].axis('off')
 plt.show()
	from mrcnn.config import Config
	from mrcnn import model as modellib
	from mrcnn import visualize
	import cv2, os, numpy as np

	# Make Model: https://github.com/matterport/Mask_RCNN/blob/master/samples/demo.ipynb
	class Config(Config):
	NAME = "deep_segment"
	GPU_COUNT = 1
	IMAGES_PER_GPU = 1
	NUM_CLASSES = 81
	config = Config()
	model = modellib.MaskRCNN(mode="inference", model_dir=os.getcwd(), config=config)
	model.load_weights('mask_rcnn_coco.h5', by_name=True) # https://github.com/matterport/Mask_RCNN/releases

	img_path = '/home/stephen/Desktop/6.jpg'
	img = cv2.imread(img_path)
	src = img.copy()
	img_rgb = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
	h,w, _ = img.shape
	dl_size = 512
	dl_scale = w/dl_size

	# Function to get mask from MRCNN
	def get_deep_mask(img):
	img_dl_size = cv2.resize(img, (dl_size, int(h/dl_scale)))
	# Use DL to get a mask
	deep_mask = np.zeros_like(img_dl_size)
	results = model.detect([img_dl_size], verbose=1)
	r = results[0]
	mask = r["masks"][:, :, 0]
	for i in range(0, len(r["scores"])):
	# Get the mask for this object
	mask = r["masks"][:,:,i]
	# Get the bounding box for this object
	roi = r["rois"][i]
	# If the object has a cat
	if r["class_ids"][i] == 16:
	#Line 72 - https://github.com/matterport/Mask_RCNN/blob/master/mrcnn/visualize.py
	deep_mask = visualize.apply_mask(deep_mask, mask, (255,255,255), alpha=.1)
	# Stop after only one cat
	break
	# Make things black and white
	_, deep_mask = cv2.threshold(deep_mask, 12, 255, cv2.THRESH_BINARY)
	return deep_mask, roi

	# Get the mask and roi from the image
	deep_mask, (y1,x1,y2,x2) = get_deep_mask(img_rgb)
	# Scale ROI values to the source image size
	y1,x1,y2,x2 = np.array((y1dl_scale,x1dl_scale,y2dl_scale,x2dl_scale), int)
	print("ROI VALUES: ", y1,x1,y2,x2)
	# Add a buffer of 50 px
	buffer = 150
	if y1-buffer >= 0: y1-= buffer
	else: y1 = 0
	if y2+buffer <= h: y2+= buffer
	else: y2 = h
	if x1-buffer >= 0: x1-=buffer
	else: x1 = 0
	if x2+buffer <= w: x2+=buffer
	else: x2 = w
	# Crop out the relevant part of the image
	img = img[y1:y2, x1:x2]
	img_rgb = img_rgb[y1:y2, x1:x2]
	h,w,_ = img.shape
	# Get the mask again, this time using only the roi
	deep_mask, (y1,x1,y2,x2) = get_deep_mask(img_rgb)

	print("APPLYING GRABCUT...............")
	deep_mask = cv2.cvtColor(deep_mask, cv2.COLOR_BGR2GRAY)
	deep_mask = cv2.resize(deep_mask, (w,h))
	mask = np.zeros(img.shape[:2],np.uint8)
	white_background = (255 - mask.copy())

	# Initialize parameters for the GrabCut algorithm
	bgdModel = np.zeros((1,65),np.float64)
	fgdModel = np.zeros((1,65),np.float64)
	iters, size = 4, int(h*w/124321)
	print("Using a kernel size of: ", size)
	kernel = np.ones((size,size),np.uint8)
	big_kernel = np.ones((2size,2size),np.uint8)
	huge_kernel = np.ones((4size,4size),np.uint8)
	# Dilate the mask to make sure the whole object is covered by the mask
	dilation = cv2.dilate(deep_mask, big_kernel, iterations = iters)
	# Start with a white background and subtract
	sure_background = white_background - dilation

	# Erode to find the sure foreground
	sure_foreground = cv2.erode(deep_mask, kernel, iterations = iters)

	# Change the values on the mask so that:
	# 2 - unsure pixels
	# 1 - sure foreground pixels
	# 0 - sure background pixels
	mask[:] = 2
	mask[sure_background == 255] = 0
	mask[sure_foreground == 255] = 1

	# Apply GrabCut
	out_mask = mask.copy()
	out_mask, _, _ = cv2.grabCut(img,out_mask,None,bgdModel,fgdModel,4,cv2.GC_INIT_WITH_MASK)
	out_mask = np.where((out_mask==2)\|(out_mask==0),0,1).astype('uint8')
	# Open the mask to fill in the holes
	out_img = img*out_mask[:,:,np.newaxis]

	# Plot with Matplotlib
	import matplotlib.pyplot as plt
	import matplotlib.image as mpimg

	# Create image that shows foreground and background
	def create_labeled_image(src_image, foreground, background):
	for i in range(4):
	bg = np.zeros_like(img)
	bg[background == 0] = (255,255,255)
	bg = cv2.cvtColor(bg, cv2.COLOR_BGR2GRAY)
	_,thresh = cv2.threshold(bg,1,255,cv2.THRESH_BINARY)
	contours,hierarchy = cv2.findContours(thresh,cv2.RETR_EXTERNAL,cv2.CHAIN_APPROX_SIMPLE)
	src_image=cv2.drawContours(src_image, contours, -1, (0,255,255), 5-i)
	background = cv2.erode(background, huge_kernel, iterations = 1)
	for i in range(4):
	bg = np.zeros_like(img)
	bg[:,:,:] = 255,255,255
	bg[foreground == 0] = (0,0,0)
	bg = cv2.cvtColor(bg, cv2.COLOR_BGR2GRAY)
	_,thresh = cv2.threshold(bg,1,255,cv2.THRESH_BINARY)
	contours,hierarchy = cv2.findContours(thresh,cv2.RETR_EXTERNAL,cv2.CHAIN_APPROX_SIMPLE)
	src_image=cv2.drawContours(src_image, contours, -1, (255,255,0), 5-i)
	foreground = cv2.erode(foreground, huge_kernel, iterations = 1)
	return src_image


	# Create a multi plot
	f, axarr = plt.subplots(2,3, sharex=True)
	# Show source image in the top left
	src_h, src_w, _ = src.shape
	scale_w = int(w/3)
	scale_h = int(scale_w * (src_h/src_w))
	src = cv2.resize(src, (scale_w, scale_h))
	comp_image = img.copy()
	comp_image[:scale_h,:scale_w] = src
	axarr[0,0].imshow(comp_image)
	# Show deep mask in the top middle
	axarr[0,1].imshow(deep_mask)
	# Show deep mask of source image in the top right
	deep_mask_of_source = img.copy()
	deep_mask_of_source[deep_mask == 0] = 0,0,0
	axarr[0,2].imshow(deep_mask_of_source)
	# Show the sure foreground and the sure background in the bottom left
	labeled_image = create_labeled_image(img, sure_foreground, sure_background)
	axarr[1,0].imshow(labeled_image)
	# Show the GrabCut mask in the bottom middle
	axarr[1,1].imshow(out_mask)
	# Show the GrabCut image in the bottom right
	axarr[1,2].imshow(out_img)

	# Add titles
	text = 'Source Image: '+str(src_w)+'x'+str(src_h)+' px'+' and ROI: '+str(w)+'x'+str(h)+' px'
	axarr[0,0].set_title(text)
	axarr[0,1].set_title('Mask from DL')
	axarr[0,2].set_title('DL Mask Image: 512x512 px')
	axarr[1,0].set_title('Sure Foreground and Sure Background')
	axarr[1,1].set_title('GrabCut Mask')
	axarr[1,2].set_title('GrabCut Mask Image')
	# Clean up and show
	axarr[0,0].axis('off')
	axarr[0,1].axis('off')
	axarr[1,0].axis('off')
	axarr[1,1].axis('off')
	axarr[1,2].axis('off')
	axarr[0,2].axis('off')
	plt.show()