video.py

#trackbar and buttons https://stackoverflow.com/questions/54674343/how-do-we-create-a-trackbar-in-open-cv-so-that-i-can-use-it-to-skip-to-specific
#https://stackoverflow.com/questions/38314933/how-to-make-buttons-in-opencv-3-1-using-cv2-createbutton
import sys
import cv2
import time
import math
import ntpath
import numpy as np
from operatingSystem import screen
from loguru import logger as log
from collections import namedtuple, deque

class Const:
    FIRST_LIST_ELEMENT = 0
    SECOND_LIST_ELEMENT = 1
    # MOUSE_HOVER_SPLIT_MAX_VIDEO = 4 #If MAX_SIMULTANEOUS_VIDEO_DISPLAY exceeds MOUSE_HOVER_SPLIT_MAX_VIDEO, the mouse hover (which dynamically alters the video split position) capability won't be available
    MAX_SIMULTANEOUS_VIDEO_DISPLAY = 8 #maximum number of videos that can be shown at once (feel free to increase this number as per the hardware capability of your computer). 
    RGB_VIDEO_DIMENSION_LEN = 3       

class VideoSplit:
    NONE = None #There's only one video or none
    HORIZONTAL = 0 #videos will be split horizontally. To show 6 videos, there will be 5 splits horizontally. Video split position can change on mouse hover only if there are 2 videos.
    VERTICAL = 1 #videos will be split vertically. So to show 8 videos, there will be 7 vertical splits. Video split position can change on mouse hover only if there are 2 videos.
    MIN_NUMBER_OF_PIXELS_SHOWN = 5 #When videos are split, at least 5 pixels of each video should be visible. This is used to determine the maximum number of videos that can be shown simultaneously

class KeyCodes: #https://progtpoint.blogspot.com/2017/06/key-board-ascii-key-code.html
    ESC = 27
    SPACEBAR = 32
    UP_ARROW = 82
    DOWN_ARROW = 84
    LEFT_ARROW = 81
    RIGHT_ARROW = 83
    SPLIT_DIRECTION = 'A'
    SHOW_LINE_SPLITTER = 'L'
    SHOW_NAME = 'N'
    PLUS = 61
    NUMPAD_PLUS = 43
    MINUS = 45
    CYCLE_BACK = 91 # the key for {[
    CYCLE_FORWARD = 93 # the key for ]}

class VideoFile:
    """ Stores properties of the video """
    def __init__(self, videoNameWithPath) -> None:
        self.videoName = videoNameWithPath
        self.videoFileName = ntpath.basename(self.videoName)
        self.video = cv2.VideoCapture(self.videoName)
        self.height = int(self.video.get(cv2.CAP_PROP_FRAME_HEIGHT))
        self.width = int(self.video.get(cv2.CAP_PROP_FRAME_WIDTH))
        self.maxFrames = int(self.video.get(cv2.CAP_PROP_FRAME_COUNT))
        self.fps = self.video.get(cv2.CAP_PROP_FPS)        
        log.info(f"Video: {self.video}, height: {self.height}, width: {self.width}, fps: {self.fps}, name: {videoNameWithPath}")
        self.sliceStart = None
        self.sliceEnd = None
        self.padding = namedtuple('Padding', 'top bottom left right')
        self.setPadding(0, 0, 0, 0)
        self.textPosition = None
        self.frames = []
    
    def setPadding(self, top, bottom, left, right):
        self.padding.top = top; self.padding.bottom = bottom; self.padding.left = left; self.padding.right = right


#Note: It's not necessary that all videos will have the same dimensions, codec or framerate
class VideoProcessor:
    """ Performs various calculations on the videos """
    def __init__(self) -> None:
        #self.videos = videos
        self.videoSplitType = VideoSplit.NONE
        self.videoOrder = []
        self.allowMouseHover = False
        self.drawLineSeparatingVideos = True
        self.showFilename = False
        self.splitLineColor = (255, 255, 255) #TODO: Draw half the line as black and half as white (or contrast it based on background pixel color)
        self.lineThickness = 1
        self.lineType = cv2.LINE_AA
        self.font = cv2.FONT_HERSHEY_SIMPLEX
        self.fontThickness = 1
        self.fontScale = 0.4
        self.fontLineType = cv2.LINE_AA
        self.fontColor = (100, 100, 100)  
        self.filenameVerticalOffset = 10                     
        self.filenameHorizontalOffset = 2

    def determineVideoSplitType(self, videos):
        if len(videos) > 1 and self.videoSplitType == VideoSplit.NONE: #if the videoSplitType has never neen assigned based on the number of videos (when there are more than 1 video)
            self.videoSplitType = VideoSplit.VERTICAL #the default

    def toggleSplitAxis(self, videos):
        if self.videoSplitType == VideoSplit.NONE: log.error(f"No split type has been set yet. You can only set it after any valid video is detected. Also, there's no point setting a split type when there's only one video.")
        else:
            if self.videoSplitType == VideoSplit.HORIZONTAL: self.videoSplitType = VideoSplit.VERTICAL
            else:
                if self.videoSplitType == VideoSplit.VERTICAL: self.videoSplitType = VideoSplit.HORIZONTAL
        self.calculateSplitDimensionsAndPaddings(videos)
    
    def hideLineSeparatorIfOnlyOneVideoPresent(self, videos):
        if len(videos) == 1:
            self.drawLineSeparatingVideos = False

    def toggleLineSeparator(self, videos):        
        if self.drawLineSeparatingVideos: self.drawLineSeparatingVideos = False
        else: self.drawLineSeparatingVideos = True            
        self.hideLineSeparatorIfOnlyOneVideoPresent(videos)

    def toggleFileNameDisplay(self):
        if self.showFilename: self.showFilename = False
        else: self.showFilename = True
                
    def calculateSplitDimensionsAndPaddings(self, videos):#if videos are of different sizes, to join pieces of their frames, you need to pad the remaining space with zeroes
        #Note: videos is a dict {video object reference: video frame}. The frame is a numpy array (videoHeight, videoWidth, rgb axis)
        self.determineVideoSplitType(videos)
        self.hideLineSeparatorIfOnlyOneVideoPresent(videos)
        widths = set([video.width for video in videos])
        heights = set([video.height for video in videos])
        self.maxWidth = max(widths)#; minWidth = min(widths)
        self.maxHeight = max(heights)#; minHeight = min(heights)        
        #---find coordinates to split each video into and the padding it needs
        splitPercentage = 1 / len(videos)
        ordinal = 0
        for video in videos:            
            topPadding = 0; bottomPadding = self.maxHeight - video.height; leftPadding = 0; rightPadding = 0 #padding values
            if self.videoSplitType == VideoSplit.VERTICAL:
                video.sliceStart = math.floor(ordinal * (video.width * splitPercentage))
                video.sliceEnd = math.floor(video.sliceStart + (video.width * splitPercentage))
                #---padding calculation
                if video.height != self.maxHeight: #video.makePaddingEmptyArray() #no need of padding, since the video is as big as the largest video
                    bottomPadding = self.maxHeight - video.height                    
            if self.videoSplitType == VideoSplit.HORIZONTAL:   
                video.sliceStart = math.floor(ordinal * (video.height * splitPercentage))
                video.sliceEnd = math.floor(video.sliceStart + (video.height * splitPercentage))                       
                #---padding calculation
                if video.width != self.maxWidth: #video.makePaddingEmptyArray() #no need of padding, since the video is as big as the largest video
                    rightPadding = self.maxWidth - video.width
            video.setPadding(topPadding, bottomPadding, leftPadding, rightPadding)
            #---generate numpy array with padding
            ordinal += 1                

    def splitAndArrangeVideoPieces(self, videos, mouseX=0, mouseY=0):#videos is a dict {VideoFile object: video frame}
        if self.videoOrder != list(videos.keys()):#check if keys are in the exact same order (to ensure that the User did not change anything and to ensure that all video frames are the same as they were previously, because sometimes a video may run out of frames while the other videos continue playing)
            self.calculateSplitDimensionsAndPaddings(videos)
            self.videoOrder = list(videos.keys())
        #---join the various video slices
        joined = np.array(None); EMPTY_ARRAY = 1   
        linePosition = 0; linePositions = []; previousStartPosition = 0
        for video in videos:
            #---apply padding
            videos[video] = cv2.copyMakeBorder(videos[video], video.padding.top, video.padding.bottom, video.padding.left, video.padding.right, cv2.BORDER_CONSTANT)
            newFrame = videos[video]
            #---cut desired portion of frame
            if self.videoSplitType == VideoSplit.VERTICAL:
                newFrame = videos[video][Const.FIRST_LIST_ELEMENT:self.maxHeight, video.sliceStart:video.sliceEnd] #select region to be displayed
            if self.videoSplitType == VideoSplit.HORIZONTAL:
                newFrame = videos[video][video.sliceStart:video.sliceEnd, Const.FIRST_LIST_ELEMENT:self.maxWidth] #select region to be displayed
            #---join the padded video slice with the other video slices
            if joined.size == EMPTY_ARRAY: joined = newFrame
            else: joined = np.concatenate((joined, newFrame), axis=self.videoSplitType)
            #---gather the positions required to draw a line separating the videos                          
            if self.videoSplitType == VideoSplit.VERTICAL: linePosition = linePosition + newFrame.shape[Const.SECOND_LIST_ELEMENT] #needs to be calculated for filename text position
            if self.videoSplitType == VideoSplit.HORIZONTAL: linePosition = linePosition + newFrame.shape[Const.FIRST_LIST_ELEMENT] #needs to be calculated for filename text position
            if self.drawLineSeparatingVideos:                     
                linePositions.append(linePosition)    # TODO: modify this to make it calculate positions only during calculateSplitDimensionsAndPaddings
            if self.showFilename:
                if self.videoSplitType == VideoSplit.VERTICAL: video.textPosition = (previousStartPosition + self.filenameHorizontalOffset, self.maxHeight - self.filenameVerticalOffset)
                if self.videoSplitType == VideoSplit.HORIZONTAL: video.textPosition = (0 + self.filenameHorizontalOffset, previousStartPosition + self.filenameVerticalOffset)
                cv2.putText(img=joined, text=video.videoFileName, org=video.textPosition, fontFace=self.font, fontScale=self.fontScale, color=self.fontColor, thickness=self.fontThickness, lineType=cv2.LINE_AA)                    
            previousStartPosition = linePosition         
        #---draw a line separating the videos
        if self.drawLineSeparatingVideos:     
            for pos in linePositions:                       
                if self.videoSplitType == VideoSplit.VERTICAL:
                    point1 = (pos, 0); point2 = (pos, self.maxHeight)                 
                if self.videoSplitType == VideoSplit.HORIZONTAL:
                    point1 = (0, pos); point2 = (self.maxWidth, pos)                                    
                cv2.line(img=joined, pt1=point1, pt2=point2, color=self.splitLineColor, thickness=self.lineThickness, lineType=self.lineType, shift=0)
        return joined


class DisplayVideos:
    """ Receives video frames and displays videos together """
    def __init__(self, videoLocations) -> None:
        self.videos = deque()
        for videoFile in videoLocations:
            self.videos.append(VideoFile(videoFile))
        self.checkMaxSupportedVideos()
        self.framerate = self.findMaxFramerate()
        if self.framerate <= 0: log.error(f"Framerate can't be {self.framerate}")
        self.width, self.height = self.findMaxDisplaySize()
        self.maxFramerate = int(self.framerate)  
        self.processor = VideoProcessor()
        self.delayBetweenFrames = self.maxFramerate
        self.maxDelayBetweenFrames = 1000
        self.frameTrackbarName = "Frame"
        self.delayTrackbarName = "Delay"
        #self.delayGranularity = int(self.maxFramerate / 5)
        #if self.delayGranularity <= 0: self.delayGranularity = 1  
        self.seekGranularity = self.maxFramerate   
        self.maxFramesAvailable = 0 
        self.currentFrame = 0 
        self.preCachingEnabled = True

    def preCacheVideos(self):  
        print(f"Please wait while frames are cached for {len(self.videos)} videos (this is necessary to overcome a seek bug in the video processing base library). All videos will be loaded into RAM (the efficiency of this data storage depends on how Python manages memory).")
        self.preCachingEnabled = True
        noMoreFrames = False
        while not noMoreFrames:
            noMoreFrames = True
            for video in self.videos:
                if video.video.isOpened():
                    gotValidFrame, videoFrame = video.video.read() #frame is a numpy nd array
                    if gotValidFrame:
                        noMoreFrames = False
                        video.frames.append(videoFrame) #caching it to be able to move backward when needed
        self.maxFramesAvailable = max([len(video.frames) for video in self.videos])
        print(f"Pre-caching completed.")

    def doNotPreCacheVideos(self):
        self.preCachingEnabled = False
        self.maxFramesAvailable = max([video.maxFrames for video in self.videos])
        print("Proceeding without pre-caching...")        

    def getThisFrame(self, trackbarValue):
        self.currentFrame = trackbarValue

    def setSpeed(self, trackbarValue):
        self.delayBetweenFrames = max(trackbarValue, 1) #allowing the value to go less than 1 freezes the video and does not allow resumption

    def display(self):
        print(f"The video with maximum number of frames has {self.maxFramesAvailable} frames.")
        #Concatenate images: https://stackoverflow.com/questions/7589012/combining-two-images-with-opencv
        self.currentFrame = 0
        self.windowName = 'Comparing Videos'
        cv2.namedWindow(self.windowName, cv2.WINDOW_NORMAL)
        cv2.resizeWindow(self.windowName, self.width, self.height)  
        cv2.createTrackbar(self.frameTrackbarName, self.windowName, 0, self.maxFramesAvailable, self.getThisFrame)
        cv2.createTrackbar(self.delayTrackbarName, self.windowName, self.delayBetweenFrames, self.maxDelayBetweenFrames, self.setSpeed)                 
        while True:
            if self.currentFrame >= self.maxFramesAvailable:
                self.currentFrame = 0 #looping to the front of the video
            #---iterate videos assuming that one of them might stop supplying frames eariler than the others
            cv2.setTrackbarPos(self.frameTrackbarName, self.windowName, self.currentFrame) 
            activeVideos = dict()    
            for video in self.videos:
                if self.preCachingEnabled:
                    if self.currentFrame < len(video.frames):
                        activeVideos[video] = video.frames[self.currentFrame]
                else:
                    if self.currentFrame < video.maxFrames:
                        video.video.set(cv2.CAP_PROP_POS_FRAMES, self.currentFrame - 1) #-1 because CAP_PROP_POS_FRAMES sets it at index of the frame to be decoded/captured next.
                        if video.video.isOpened():#TODO: check if this operation is necessary
                            gotValidFrame, videoFrame = video.video.read() #frame is a numpy nd array
                            if gotValidFrame:
                                activeVideos[video] = videoFrame

            self.currentFrame = self.currentFrame + 1
            if not activeVideos:#if there are no active videos remaining
                break #exit while            
            joined = self.processor.splitAndArrangeVideoPieces(activeVideos)            
            cv2.imshow(self.windowName, joined) 
            keyCode = cv2.waitKey(self.delayBetweenFrames) & 0xFF #https://stackoverflow.com/questions/57690899/how-cv2-waitkey1-0xff-ordq-works            
            if keyCode == KeyCodes.ESC: break #exit the program
            if keyCode == KeyCodes.SPACEBAR: time.sleep(1) #pause the video for a while
            if keyCode == KeyCodes.CYCLE_BACK: self.videos.rotate(-1) #switch positions of the videos up if horizontal splits, and backward if vertical splits
            if keyCode == KeyCodes.CYCLE_FORWARD: self.videos.rotate(1) #switch positions of videos down if horizontal splits, and forward if vertical splits
            if keyCode == KeyCodes.LEFT_ARROW: #for either seeking backward cached frames
                self.currentFrame -= self.seekGranularity
                if self.currentFrame < 0: self.currentFrame = 0 
            if keyCode == KeyCodes.RIGHT_ARROW: #for either seeking forward cached frames
                self.currentFrame += self.seekGranularity
                if self.currentFrame >= self.maxFramesAvailable: self.currentFrame = self.maxFramesAvailable - 1
            # if keyCode == KeyCodes.UP_ARROW: #speed increase by decreasing the delay between frames
            #     self.delayBetweenFrames -= int(self.maxFramerate / 2)
            #     if self.delayBetweenFrames < 0: self.delayBetweenFrames = 1
            # if keyCode == KeyCodes.DOWN_ARROW: #speed decrease by increasing the delay between frames
            #     self.delayBetweenFrames += int(self.maxFramerate / 2)
            #if keyCode == KeyCodes.DOWN_ARROW or keyCode == KeyCodes.UP_ARROW: log.info(f"Delay between frames: {self.delayBetweenFrames}")
            if keyCode == ord(KeyCodes.SPLIT_DIRECTION) or keyCode == ord(KeyCodes.SPLIT_DIRECTION.lower()):#to split the video horizontally or vertically
                self.processor.toggleSplitAxis(activeVideos)            
            if keyCode == ord(KeyCodes.SHOW_LINE_SPLITTER) or keyCode == ord(KeyCodes.SHOW_LINE_SPLITTER.lower()):#to show a line where the video is separated from other videos (no line is shown if only one video is present)
                self.processor.toggleLineSeparator(activeVideos)
            if keyCode == ord(KeyCodes.SHOW_NAME) or keyCode == ord(KeyCodes.SHOW_NAME.lower()):#to show a line where the video is separated from other videos (no line is shown if only one video is present)
                self.processor.toggleFileNameDisplay()              
        self.close()

    def close(self):
        """ Clear resources """
        for video in self.videos:
            video.video.release()
        cv2.destroyAllWindows()

    def findMaxDisplaySize(self):
        """ Returns the maximum width of any video and maximum height of any video in the list of videos """
        monitor = screen.MonitorInfo()
        monitorWidth, monitorHeight = monitor.getMonitorDimensions()
        width = max([video.width for video in self.videos])
        height = max([video.height for video in self.videos])
        if width > monitorWidth or height > monitorHeight:
            log.warning(f"\n\nYour primary monitor width {monitorWidth} and height {monitorHeight} are less than the video width {width} and height {height}.")
        return width, height

    def checkMaxSupportedVideos(self):
        """ Checks if the number of pixels in the videos supplied can be displayed in split format """
        width = min([video.width for video in self.videos])
        height = min([video.height for video in self.videos])
        maxVideosAllowed = min([width, height]) / VideoSplit.MIN_NUMBER_OF_PIXELS_SHOWN 
        log.info(f"{len(self.videos)} videos supplied. {maxVideosAllowed} videos supported. Each video should show a minimum of {VideoSplit.MIN_NUMBER_OF_PIXELS_SHOWN} pixels") 
        if len(self.videos) > maxVideosAllowed:
            log.error(f"Either you are trying to play video formats that aren't supported, or you supplied {len(self.videos)} videos, but only {maxVideosAllowed} videos are supported because at least {VideoSplit.MIN_NUMBER_OF_PIXELS_SHOWN} pixels of each video needs to be visible when split")
            sys.exit()

    def findMaxFramerate(self):
        """ Returns the maximum framerate among all videos """
        return max(set([video.fps for video in self.videos]))