# primary.py

# Project Monocle: Automated Image Cropping for Books and Textbooks
# primary.py: Main System and Operations

# Eiza Stanford "charkybarky" 2022

# ===== ===== ===== ===== ===== ===== ===== ===== ===== =====
# >>> >>> >>> IMPORTS AND MODULES <<< <<< <<<
from PIL import Image
import time
import interface

# ===== ===== ===== ===== ===== ===== ===== ===== ===== =====
# ===== ===== ===== ===== ===== ===== ===== ===== ===== =====


# ===== ===== ===== ===== ===== ===== ===== ===== ===== =====
# >>> >>> >>> GLOBAL FUNCTIONS <<< <<< <<<

def imageBoundsCheck(image, x, y):
	"""Report whether the pixel coordinate (x, y) lies inside the image.
	
	The result is True only when both of these hold, and False otherwise:
		0 <= x < image.size[0] (the horizontal resolution)
		0 <= y < image.size[1] (the vertical resolution)
	"""
	
	horizontalRes = image.size[0]
	verticalRes = image.size[1]
	
	return 0 <= x < horizontalRes and 0 <= y < verticalRes


def imageBoundsCheckRadius(image, x, y, radius):
	"""Report whether (x, y), extended by radius in every direction, stays inside the image.
	
	The result is True only when all of these hold, and False otherwise:
		x - radius >= 0 and y - radius >= 0
		x < image.size[0] - radius and y < image.size[1] - radius
	"""
	
	# the left/top side of the radius must not fall below zero
	if x - radius < 0 or y - radius < 0:
		return False
	
	# the right/bottom side must stay strictly below the resolution
	limitX = image.size[0] - radius
	limitY = image.size[1] - radius
	
	return x < limitX and y < limitY


def redBackgroundCheck(color):
	"""Decide whether a color counts as the (red) background, i.e. a spot not occupied by the book.
	
	Only the first three components of color are read, as R(ed), G(reen) and B(lue).
	
	A color is "red" when both of these hold:
		the larger of G and B is at most 130
		R is at least that larger value plus a gap that grows with it
	
	Note that a color whose G and B are both 0 needs no gap at all, so (0, 0, 0) passes the check.
	"""
	
	redVal = color[0]
	
	# >>> the stronger of the two non-red channels drives every threshold below
	strongestOther = max(color[1], color[2])
	
	# >>> colors with a strong G or B channel are never the background
	otherCeiling = 130
	if strongestOther > otherCeiling:
		return False
	
	# >>> generalized tuning number: the GREATER it is, the GREATER the required gap between R and the other channels
	gapScale = 160
	
	# >>> the required gap scales with the brightness of the strongest non-red channel and is capped at 255
	requiredGap = min(int(gapScale * (strongestOther / 255)), 255)
	
	return redVal >= strongestOther + requiredGap

# ===== ===== ===== ===== ===== ===== ===== ===== ===== =====
# ===== ===== ===== ===== ===== ===== ===== ===== ===== =====


# ===== ===== ===== ===== ===== ===== ===== ===== ===== =====
# >>> >>> >>> CLASS: REGIONCHUNK <<< <<< <<<

class RegionChunk:
	"""A grid of Regions (a "chunk") laid out over one rectangular area of an image.
	
	Attributes:
		imageObject:	The image object; in this class it is only handed to imageBoundsCheckRadius and to each Region.
		imageLoaded:	The pixel-access object; it is handed to each Region created by the chunk.
		regionList:		The Regions of the chunk, stored row by row (left to right, then top to bottom).
	"""
	
	def __init__(self, imageObject, imageLoaded):
		self.imageObject = imageObject
		self.imageLoaded = imageLoaded
		self.regionList = []
	
	
	def chunkDefineExact(self, startPos, jump, regionNum, regionRadius, posByCorner=False, jumpByRadius=False):
		"""Chunk definition: rebuild the chunk with an exact number of Regions horizontally and vertically.
		
		Returns True if the chunk was rebuilt. Returns False, leaving the chunk empty, if the FIRST Region
		does not pass imageBoundsCheckRadius; the remaining Regions are not checked against the image.
		
		Parameters:
			startPos:		2D tuple of integers (x, y); the position of the first, top-most and left-most Region.
			jump:			2D tuple of integers (x, y); the amount of pixels between the position of each Region.
							This considers the POSITION, not both the position and the radius.
			regionNum:		2D tuple of integers (x, y); the number of Regions per row and per column.
			regionRadius:	Integer radius given to every Region.
			posByCorner:	If True, then the startPos is the top left corner of a Region instead of its center.
			jumpByRadius:	If True, "jump" is ignored and (regionRadius, regionRadius) is used instead.
		"""
		self.regionList = []
		
		if jumpByRadius:
			jump = (regionRadius, regionRadius)
		
		# a corner position is shifted by the radius to obtain the center of the first Region
		cornerShift = regionRadius if posByCorner else 0
		firstX = startPos[0] + cornerShift
		firstY = startPos[1] + cornerShift
		
		if not imageBoundsCheckRadius(self.imageObject, firstX, firstY, regionRadius):
			return False
		
		for row in range(regionNum[1]):
			centerY = firstY + row * jump[1]
			
			for col in range(regionNum[0]):
				centerX = firstX + col * jump[0]
				self.regionList.append(Region(self.imageObject, self.imageLoaded, (centerX, centerY), regionRadius))
		
		return True
	
	
	def chunkDefinePack(self, topLeftCorner, bottomRightCorner, regionNum, useMax=False):
		"""Chunk definition: rebuild the chunk with a fixed count of Regions packed between two corners.
		
		More specifically, the function will attempt to fit "regionNum" number of regions in both the vertical
		and horizontal direction between the 2D int tuple "topLeftCorner" (topmost, leftmost pixel) and the
		2D int tuple "bottomRightCorner" (bottommost, rightmost pixel).
		
		Regions cannot have arbitrary widths or heights; they MUST conform to one radius. The radius is the
		SMALLER of (width / horizontal count) and (height / vertical count), or the GREATER of the two
		if boolean "useMax" is True.
		
		Returns the result of chunkDefineExact, or False (with an empty chunk) if either count in
		regionNum is zero or negative.
		
		NOTE(review): the Regions are spaced one radius apart, so "n" Regions span (n + 1) * radius pixels
		from the top left corner; with the radius computed here that can extend past bottomRightCorner.
		Confirm whether this is intended.
		"""
		self.regionList = []
		
		# nothing can be packed with a non-positive count, and a zero count would divide by zero below
		if regionNum[0] <= 0 or regionNum[1] <= 0:
			return False
		
		width = bottomRightCorner[0] - topLeftCorner[0]
		height = bottomRightCorner[1] - topLeftCorner[1]
		
		radiusCalc = (int(width / regionNum[0]), int(height / regionNum[1]))
		radius = max(radiusCalc) if useMax else min(radiusCalc)
		
		return self.chunkDefineExact(topLeftCorner, (0, 0), regionNum, radius, True, True)
	
	
	def chunkDefinePackAuto(self, topLeftCorner, bottomRightCorner, regionRadius):
		"""Chunk definition: rebuild the chunk with Regions of a fixed radius packed between two corners.
		
		More specifically, the function will attempt to fit as many regions as possible in both the vertical and
		horizontal direction with a given, fixed radius between the 2D int tuple "topLeftCorner" (topmost, leftmost
		pixel) and the 2D int tuple "bottomRightCorner" (bottommost, rightmost pixel).
		
		Returns the result of chunkDefineExact, or False (with an empty chunk) if regionRadius is zero or negative.
		
		It is RECOMMENDED to use this function over chunkDefinePack.
		"""
		self.regionList = []
		
		# a zero radius would divide by zero below; a negative one cannot describe a Region
		if regionRadius <= 0:
			return False
		
		width = bottomRightCorner[0] - topLeftCorner[0]
		height = bottomRightCorner[1] - topLeftCorner[1]
		
		# >>> Regions are spaced one radius apart but are two radii wide, so "n" Regions need (n + 1) * radius pixels;
		# >>> hence one less than (length / radius) Regions fit, and never fewer than zero
		regionNumHorz = max(int(width / regionRadius) - 1, 0)
		regionNumVert = max(int(height / regionRadius) - 1, 0)
		
		return self.chunkDefineExact(topLeftCorner, (0, 0), (regionNumHorz, regionNumVert), regionRadius, True, True)
	
	
	def chunkFillColorAverage(self):
		"""Fill every Region of the chunk with its own average color (MODIFIES the image)."""
		for region in self.regionList:
			region.imageFillRegion(region.getRegionPixelAverage())
	
	
	def chunkLabelRedDetectRegions(self):
		"""Fill every Region that is detected as background/red with (255, 0, 255) (MODIFIES the image)."""
		for region in self.regionList:
			if region.isRegionRed():
				region.imageFillRegion((255, 0, 255))
	
	
	def chunkFillColor(self, color):
		"""Fill every Region of the chunk with the given color (MODIFIES the image)."""
		for region in self.regionList:
			region.imageFillRegion(color)
	
	
	def chunkRedDetectRegions(self, outlierThresh, filterBoundOutliers=True, strictFilter=False, label=False, verboseDebug=False):
		"""Returns a dict with the list of Regions detected as the background or "red", with additional information.
		
		A "bound" may include the "topmost" y-value, the "bottommost" y-value, the "leftmost" x-value, and the "rightmost" x-value.
		Each directional bound (e.g. topmost) is NOT recorded as a tuple or coordinate pair, but as a single number,
		taken from the "pixBounds" of the Regions (the side CLOSEST to that direction, NOT the center alone).
		
		The "farthest bounds" are essentially the topmost, bottommost, leftmost, and rightmost values that contain
		background/red Regions. Every direction is filtered and averaged independently of the other three.
		
		Parameters:
			outlierThresh:			For each direction, if the bound of an iterated red Region differs from the running
									average of that direction by MORE than outlierThresh, then it will NOT update the
									farthest bound, sum or average of that direction (considered an "outlier").
			filterBoundOutliers:	If True, then the function will attempt to filter out and not include outlier Regions.
			strictFilter:			If True, then the function will filter outliers with the average bound values only.
									If False, a Region is also accepted when it is within outlierThresh of the bound
									of the previous red Region in the list.
			label:					If True, MODIFY the image by coloring in all Regions that were considered as red.
			verboseDebug:			If True, print debug info (and pause between prints).
		
		Returns:
			None if no Region of the chunk is red; otherwise a dict with the keys
				'regionList':		list of all red Regions (outliers included)
				'boundFarthest':	dict of the farthest accepted bound per direction
				'boundSum':			dict of the sum of accepted bounds per direction
				'boundAverage':		dict of the average of accepted bounds per direction
		"""
		
		regionRedDetect = [region for region in self.regionList if region.isRegionRed()]
		
		if not regionRedDetect:
			return None
		
		# every Region has been classified above, so painting here cannot influence the detection of this chunk
		if label:
			for region in regionRedDetect:
				region.imageFillRegion((255, 0, 255))
		
		boundDirs = ['top', 'bottom', 'left', 'right']
		
		# for left and top, find the minimum value; for right and bottom, find the maximum value
		dirLessThan = ('left', 'top')
		
		# the FIRST Region in the list of "red" Regions seeds every statistic
		regionFirstBounds = regionRedDetect[0].pixBounds
		
		boundFarthest = {d: regionFirstBounds[d] for d in boundDirs}
		boundSum = boundFarthest.copy()
		boundAverage = boundFarthest.copy()
		
		# number of bounds added into boundSum per direction; the first Region is already included
		boundCount = {d: 1 for d in boundDirs}
		
		regionPrevBounds = regionFirstBounds
		
		if verboseDebug:
			print('FIRST REGION BOUND: %s' % str(boundFarthest))
			time.sleep(3)
		
		for region in regionRedDetect[1:]:
			bounds = region.pixBounds
			
			# PERSONAL NOTES:
			# situation A: there is only ONE OUTLIER region very far away from the rest
			# situation B: there is a GROUP OF OUTLIERS far away from the MAJORITY
			
			# using diffAvg alone is BEST for SITUATION B, as it will STRICTLY ignore ANY NUMBER OF REGIONS that are far away from the rest
			# using both diffAvg and diffPrev is BEST for accurate "boundFarthest" results, BUT can be tricked by a small group of outlier regions
			# 		(a small group, as in, consecutive regions in the list: one after the other)
			
			for b in boundDirs:
				diffAvg = abs(bounds[b] - boundAverage[b])
				diffPrev = diffAvg if strictFilter else abs(bounds[b] - regionPrevBounds[b])
				
				accepted = (not filterBoundOutliers) or diffAvg <= outlierThresh or diffPrev <= outlierThresh
				if not accepted:
					continue
				
				boundCount[b] += 1
				boundSum[b] += bounds[b]
				boundAverage[b] = boundSum[b] / boundCount[b]
				
				if b in dirLessThan:
					if bounds[b] < boundFarthest[b]:
						boundFarthest[b] = bounds[b]
				elif bounds[b] > boundFarthest[b]:
					boundFarthest[b] = bounds[b]
			
			# the "previous" Region is the previous red Region, whether or not it was an outlier
			regionPrevBounds = bounds
			
			if verboseDebug:
				print('-----')
				print('\nPOS: %s' % str(region.pixLocation))
				print('\nAVG')
				
				for d in boundDirs:
					print('\tDIR: %s\tVALUE: %s' % (d, int(boundAverage[d])))
				
				time.sleep(0.1)
		
		return {
			'regionList' : regionRedDetect,
			'boundFarthest' : boundFarthest,
			'boundSum' : boundSum,
			'boundAverage' : boundAverage
		}

# ===== ===== ===== ===== ===== ===== ===== ===== ===== =====
# ===== ===== ===== ===== ===== ===== ===== ===== ===== =====


# ===== ===== ===== ===== ===== ===== ===== ===== ===== =====
# >>> >>> >>> CLASS: REGION <<< <<< <<<

class Region:
	"""A square sample area of an image, defined by a center pixel and a radius.
	
	With a radius r greater than 0 the Region covers, on both axes, the pixels from (center - r) inclusive
	up to (center + r) exclusive. With a radius of 0 it covers only the center pixel.
	
	Attributes:
		imageObject:	The image object the Region belongs to (stored, not used by the methods of this class).
		imageLoaded:	The pixel-access object, indexed as imageLoaded[x, y] for both reading and writing.
		pixLocation:	2D tuple of integers (x, y); the center of the Region.
		pixRadius:		Integer radius of the Region in pixels.
		pixBounds:		Dict with the keys 'top', 'bottom', 'left' and 'right': the center minus the radius
						for 'top'/'left' and the center plus the radius for 'bottom'/'right'.
	"""
	
	def __init__(self, imageObject, imageLoaded, pixLocation, pixRadius=1):
		# PIL object of image with Image.open()
		self.imageObject = imageObject
		
		# PIL object of image with load()
		self.imageLoaded = imageLoaded
		
		# 2D tuple integer location of the center of the region
		self.pixLocation = pixLocation
		
		# integer radius of the region in pixels
		self.pixRadius = pixRadius
		
		# the topmost, bottommost, leftmost, and rightmost x/y values
		centerX = pixLocation[0]
		centerY = pixLocation[1]
		
		self.pixBounds = {
			'top': centerY - pixRadius,
			'bottom': centerY + pixRadius,
			'left': centerX - pixRadius,
			'right': centerX + pixRadius
		}
	
	
	def _pixelCoordinates(self):
		"""Yield the (x, y) coordinate of every pixel covered by the Region, column by column."""
		centerX = self.pixLocation[0]
		centerY = self.pixLocation[1]
		radius = self.pixRadius
		
		# a radius of 0 would produce empty ranges below, so the center pixel is handled on its own
		if radius == 0:
			yield (centerX, centerY)
			return
		
		# NOTE: the upper end of both ranges is exclusive. The original author observed that adding +1 to it
		# raises an index out-of-bounds error in an image with a resolution IDENTICAL to the region size.
		for x in range(centerX - radius, centerX + radius):
			for y in range(centerY - radius, centerY + radius):
				yield (x, y)
	
	
	def isRegionRed(self):
		"""Return True if the average color of the Region passes redBackgroundCheck; False otherwise."""
		return redBackgroundCheck(self.getRegionPixelAverage())
	
	
	def imageFillRegion(self, color):
		"""Write color into every pixel covered by the Region (MODIFIES the image through imageLoaded)."""
		for coordinate in self._pixelCoordinates():
			self.imageLoaded[coordinate] = color
	
	
	def getRegionPixelList(self):
		"""Return a list with the color of every pixel covered by the Region, column by column."""
		return [self.imageLoaded[coordinate] for coordinate in self._pixelCoordinates()]
	
	
	def getRegionPixelAverage(self):
		"""Return the average color of the Region as a tuple (R, G, B) of integers.
		
		Only the first three components of each pixel are read; each average is truncated to an integer.
		"""
		pixelList = self.getRegionPixelList()
		pixelCount = len(pixelList)
		
		# sum of all the individual color values (RGB)
		redSum = sum(color[0] for color in pixelList)
		greenSum = sum(color[1] for color in pixelList)
		blueSum = sum(color[2] for color in pixelList)
		
		return (int(redSum / pixelCount), int(greenSum / pixelCount), int(blueSum / pixelCount))

# ===== ===== ===== ===== ===== ===== ===== ===== ===== =====
# ===== ===== ===== ===== ===== ===== ===== ===== ===== =====


# ===== ===== ===== ===== ===== ===== ===== ===== ===== =====
# >>> >>> >>> CLASS: CROPPER <<< <<< <<<

class Cropper:
	"""Detects the background/red area around a book with four RegionChunks and crops it away.
	
	Attributes:
		imageObject:		The image object; its "size" and "crop" are used by this class.
		imageLoaded:		The pixel-access object handed to every RegionChunk.
		chunkSides:			The names of the four chunks: 'top', 'bottom', 'left', 'right'.
		chunkDict:			Dict that maps each name in chunkSides to its RegionChunk.
		fillColorSamples:	The colors used by chunkFillColor to tell the chunks apart.
	"""
	
	def __init__(self, imageObject, imageLoaded):
		# the eight colors built from 0/255 per channel, without black, white and red;
		# what remains, in order: blue, green, cyan, magenta, yellow
		excludedSamples = ((0, 0, 0), (255, 255, 255), (255, 0, 0))
		
		self.fillColorSamples = []
		
		for red in range(0, 2):
			for green in range(0, 2):
				for blue in range(0, 2):
					sample = (red * 255, green * 255, blue * 255)
					
					if sample not in excludedSamples:
						self.fillColorSamples.append(sample)
		
		self.chunkSides = [
			'top',
			'bottom',
			'left',
			'right'
		]
		
		self.imageObject = imageObject
		self.imageLoaded = imageLoaded
		
		self.chunkDict = {}
		
		for side in self.chunkSides:
			self.chunkDict[side] = RegionChunk(imageObject, imageLoaded)
	
	
	@staticmethod
	def _orientationFromCounts(leftCount, rightCount):
		"""Return 'right' or 'left' for whichever count is greater, or 'both' if the counts are equal."""
		if rightCount > leftCount:
			return 'right'
		
		if leftCount > rightCount:
			return 'left'
		
		return 'both'
	
	
	def chunkSetup(self, outerBox, innerBox, regionRadius):
		"""Sets up the topmost, bottommost, leftmost, and rightmost chunks around the book based on an inner and outer box.
		
		The boxes are 4-element integer tuples of horizontal and vertical pixel coordinates: (left, upper, right, lower).
		
		The top and bottom chunks span the width of the inner box; the left and right chunks span the height of the outer box.
		"""
		self.chunkDict['top'].chunkDefinePackAuto((innerBox[0], outerBox[1]), (innerBox[2], innerBox[1]), regionRadius)
		self.chunkDict['bottom'].chunkDefinePackAuto((innerBox[0], innerBox[3]), (innerBox[2], outerBox[3]), regionRadius)
		self.chunkDict['left'].chunkDefinePackAuto((outerBox[0], outerBox[1]), (innerBox[0], outerBox[3]), regionRadius)
		self.chunkDict['right'].chunkDefinePackAuto((innerBox[2], outerBox[1]), (outerBox[2], outerBox[3]), regionRadius)
	
	
	def chunkFillColor(self):
		"""Fill each chunk with one of the fillColorSamples, cycling through the samples (MODIFIES the image)."""
		colorIndex = 0
		
		for side in self.chunkSides:
			self.chunkDict[side].chunkFillColor(self.fillColorSamples[colorIndex])
			
			colorIndex = (colorIndex + 1) % len(self.fillColorSamples)
	
	
	def chunkFillRedDetect(self, outlierThresh, filterBoundOutliers=True, strictFilter=False, forceOrientation=False):
		"""Run the red detection of every chunk with labelling switched on (MODIFIES the image).
		
		The parameter forceOrientation is accepted but not used.
		"""
		for side in self.chunkSides:
			chunk = self.chunkDict[side]
			chunk.chunkRedDetectRegions(outlierThresh, filterBoundOutliers, strictFilter, True, False)
	
	
	def chunkSetupTextbook(self, distanceUntilTripod, leftRightChunkWidth, topBottomChunkHeight, regionRadius):
		"""Sets up the chunks based on the sample images in the repository.
		
		The outer box spans the full image width and the rows from 0 to distanceUntilTripod; the inner box
		is the outer box shrunk by leftRightChunkWidth horizontally and topBottomChunkHeight vertically.
		"""
		
		imageWidth = self.imageObject.size[0]
		
		outerBox = (0, 0, imageWidth, distanceUntilTripod)
		innerBox = (leftRightChunkWidth, topBottomChunkHeight, imageWidth - leftRightChunkWidth, distanceUntilTripod - topBottomChunkHeight)
		
		self.chunkSetup(outerBox, innerBox, regionRadius)
	
	
	def orientationDetect(self, outlierThresh, filterBoundOutliers=True, strictFilter=False):
		"""Return the orientation of the book based on the amount of background/red detection on the left and right chunk.
		
		Return "right" if there are more red Regions in the right chunk than the left chunk.
		Return "left" if there are more red Regions in the left chunk than the right chunk.
		Return "both" if there are an equal number of red Regions in the left chunk and the right chunk.
		Return None if chunkDict is empty.
		
		A chunk without any red Region counts as zero.
		"""
		
		# if chunks not set up yet
		if not self.chunkDict:
			return None
		
		leftResults = self.chunkDict['left'].chunkRedDetectRegions(outlierThresh, filterBoundOutliers, strictFilter)
		rightResults = self.chunkDict['right'].chunkRedDetectRegions(outlierThresh, filterBoundOutliers, strictFilter)
		
		# the detection reports "no red Region at all" as None instead of a dict
		leftCount = len(leftResults['regionList']) if leftResults else 0
		rightCount = len(rightResults['regionList']) if rightResults else 0
		
		return self._orientationFromCounts(leftCount, rightCount)
	
	
	def crop(self, cropMarginPixel, outlierThresh, filterBoundOutliers=True, strictFilter=False, forceOrientation=False, debug=False):
		"""Detects the background/red Regions in all four chunks and returns a new image object with the background cropped out.
		
		More specifically, it determines the "bounds" (bottommost, topmost, leftmost, and rightmost pixels) of the
		book or subject itself that EXCLUDE the background/red Regions and crops the image to be fit within those bounds.
		A side whose chunk has no red Region keeps the edge of the image as its bound, and no bound is allowed
		to leave the image.
		
		Returns None if chunkDict is empty.
		
		Parameters:
			(many parameters borrowed from RegionChunk chunkRedDetectRegions)
			cropMarginPixel:	The amount of pixels that extends past the crop bounds (e.g. if it is 10, then extend
								10 pixels above the topmost crop bound, 10 pixels below the bottommost crop bound, etc.).
								Used to make the cropping less "greedy" and likely to crop away actual book/subject content.
			forceOrientation:	If True, then the cropping system will crop only EITHER the left or right side of the
								book/subject, not both; if False, then both the left and right side will be considered and cropped.
								It is useful to set this to True for very large books/subjects where only either the left
								or right side is visible in the picture frame.
			debug:				If True, print the final crop bounds; it is also passed to the chunks as their "label" flag.
		"""
		
		# if chunks not set up yet
		if not self.chunkDict:
			return None
		
		imageWidth = self.imageObject.size[0]
		imageHeight = self.imageObject.size[1]
		
		defaultCropValues = {
			'top':0,
			'bottom':imageHeight,
			'left':0,
			'right':imageWidth
		}
		
		# each side has a list with the following values:
			# 0 = for a particular side of chunk, this is the side of THAT chunk OPPOSITE to its side
			# 1 = determines whether to subtract (-1) or add (1) the margin
		cropSettings = {
			'top':['bottom', -1],
			'bottom':['top', 1],
			'left':['right', -1],
			'right':['left', 1]
		}
		
		chunkSideRegionRedCount = {
			'top':0,
			'bottom':0,
			'left':0,
			'right':0
		}
		
		cropValues = defaultCropValues.copy()
		
		for side in self.chunkSides:
			oppositeSide, marginSign = cropSettings[side]
			
			# debug is passed in the "label" position, so a debug run also paints the detected Regions
			results = self.chunkDict[side].chunkRedDetectRegions(outlierThresh, filterBoundOutliers, strictFilter, debug, False)
			
			if results:
				cropValues[side] = results['boundFarthest'][oppositeSide] + cropMarginPixel * marginSign
				chunkSideRegionRedCount[side] = len(results['regionList'])
		
		if forceOrientation:
			orientation = self._orientationFromCounts(chunkSideRegionRedCount['left'], chunkSideRegionRedCount['right'])
			
			# the side with fewer red Regions is not cropped; if both, assume to crop both left and right
			if orientation == 'left':
				cropValues['right'] = defaultCropValues['right']
			elif orientation == 'right':
				cropValues['left'] = defaultCropValues['left']
		
		# the margin may push a bound past the edge of the image; keep the crop box inside the image
		cropTop = min(max(cropValues['top'], 0), imageHeight)
		cropBottom = min(max(cropValues['bottom'], 0), imageHeight)
		cropLeft = min(max(cropValues['left'], 0), imageWidth)
		cropRight = min(max(cropValues['right'], 0), imageWidth)
		
		if debug:
			print('top: %d, bottom: %d, left: %d, right %d' % (cropTop, cropBottom, cropLeft, cropRight))
		
		# crop (left, upper, right, lower) tuple box
		return self.imageObject.crop((cropLeft, cropTop, cropRight, cropBottom))


# Script entry point: when this file is run directly, control is handed to the interface module.
if __name__ == "__main__":
	interface.main()