continuous.py


from argparse import Namespace
import cv2
import numpy as np
import os
import glob
import sys
import time
import ast
import random
import time

default_cave_order = "Emergence Cave,Emergence Cave,Hole of Beasts,Hole of Beasts,Hole of Beasts,Hole of Beasts,Hole of Beasts,White Flower Garden,White Flower Garden,White Flower Garden,White Flower Garden,White Flower Garden,Snagret Hole,Snagret Hole,Snagret Hole,Snagret Hole,Snagret Hole,Snagret Hole,Snagret Hole,Bulblax Kingdom,Bulblax Kingdom,Bulblax Kingdom,Bulblax Kingdom,Bulblax Kingdom,Bulblax Kingdom,Bulblax Kingdom,Subterranean Complex,Subterranean Complex,Subterranean Complex,Subterranean Complex,Subterranean Complex,Subterranean Complex,Subterranean Complex,Subterranean Complex,Frontier Cavern,Frontier Cavern,Frontier Cavern,Frontier Cavern,Frontier Cavern,Frontier Cavern,Frontier Cavern,Citadel of Spiders,Citadel of Spiders,Citadel of Spiders,Citadel of Spiders,Citadel of Spiders,Glutton's Kitchen,Glutton's Kitchen,Glutton's Kitchen,Glutton's Kitchen,Glutton's Kitchen,Glutton's Kitchen".split(",")
default_cave_index = 0

with open("config_use.txt" if os.path.exists("config_use.txt") else "config.txt", "r") as f:
    config_args_string = f.read()
    config_args_string = config_args_string[0:config_args_string.index("#####")]
    config_args_string = "\n".join([x[0:x.index("#")] if "#" in x else x for x in config_args_string.split("\n")])
    config_args_string = config_args_string.replace("\\","\\\\")
    args = Namespace(**ast.literal_eval(config_args_string))
print(args)

try:
    os.mkdir(args.templates)
except FileExistsError:
    pass
try:
    os.mkdir("output/")
except FileExistsError:
    pass
try:
    os.mkdir("output/!im/")
except FileExistsError:
    pass
try:
    os.mkdir("output/!im/chars/")
except FileExistsError:
    pass

videoFile=args.camera
if videoFile == 'find':
    list_of_files = glob.glob(args.video_path + "*")
    videoFile = max(list_of_files, key=os.path.getctime)
    print("Using: %s" % videoFile)
if not isinstance(args.camera, int) and "/" not in videoFile and "\\" not in videoFile:
    videoFile = args.video_path + args.camera
cap = cv2.VideoCapture(videoFile)
if isinstance(args.camera, int):
    cap.set(cv2.CAP_PROP_FRAME_WIDTH, 1280)
    cap.set(cv2.CAP_PROP_FRAME_HEIGHT, 720)
    #cap.set(cv2.CAP_PROP_FPS, 30)
    #print(cap.get(cv2.CAP_PROP_FPS))

if (cap.isOpened() == False): 
    print("Failure - error opening video stream")
    print("make sure virtual cam is setup correctly")
    sys.exit(0)

### generate template numbers

templates = []

if True:
    for i in range(10):
        temp = cv2.imread(args.templates + str(i) + ".png",cv2.IMREAD_UNCHANGED)
        templates.append(temp)
    templates.append(cv2.imread(args.templates + "_.png",cv2.IMREAD_UNCHANGED))
        
### generate template letters

letters_raw_arr = "u3044_u3051_u3060_u306e_u307e_u3082_u308a_u30ac_u30af_u30b7_u30b9_u30c0_u30c7_u30d3_u30d8_u30de_u30e0_u30e1_u30e2_u30e3_u30e9_u30eb_u30ef_u30fc_u4e0b_u4e2d_u53f0_u56fd_u5712_u5730_u57ce_u57fa_u5883_u5922_u59cb_u5bc6_u6226_u6240_u6839_u6c34_u6c8c_u6d1e_u6df7_u738b_u767d_u767e_u78e8_u795e_u79d8_u7a74_u7a9f_u82b1_u8fba_u932c_u98df_u9b54".split("_") + [i for i in 'abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ']

letters = {}
letters_height = {}
letters_yoff = {}
letters_width = {}
letters_xoff = {}
letters_y_addn = {}

for l in letters_raw_arr:
    img = cv2.imread('files/templates/letters/' + (l+l if l.isupper() else l) + ".png")
    img = cv2.resize(img, (int(img.shape[1]*args.letters_xscale), int(img.shape[0]*args.letters_yscale) ), interpolation=cv2.INTER_LINEAR_EXACT)
    letters[l] = np.uint8(img)
    #cv2.imwrite("output/!im/debug_"+(l+l if l.isupper() else l)+".png",letters[l])
    row_mean = letters[l].max(axis=2).max(axis=1)
    min_idx = 1000
    max_idx = 0
    for i in range(len(row_mean)):
        if row_mean[i] > 70:
            min_idx = min(min_idx,i)
            max_idx = max(max_idx,i)
    letters_height[l] = max_idx-min_idx+1
    letters_yoff[l] = min_idx
    shape_penalty = int((letters[l].shape[0] - letters['u3044'].shape[0])*args.letters_yscale + 0.5)
    letters_y_addn[l] = -shape_penalty+letters[l].shape[0]-letters_height[l]-letters_yoff[l] # important. todo: how should height affect it? could switch letters[l] to letters['u3044'] to get the consensus size
    
    col_mean = letters[l].max(axis=2).max(axis=0)
    min_idx = 1000
    max_idx = 0
    for i in range(len(col_mean)):
        if col_mean[i] > 70:
            min_idx = min(min_idx,i)
            max_idx = max(max_idx,i)
    letters_width[l] = max_idx-min_idx+1
    letters_xoff[l] = min_idx
    #if l == 'l':
    #    #print(l + " " + str(row_mean))
    #print(l + " " + str(img.shape) + " h" + str(letters_height[l]) + " y" + str(letters_yoff[l]) + " w" + str(letters_width[l]) + " x" + str(letters_xoff[l]))
#print(letters_y_addn)
other_letters_w = {" ": args.space_mult, "'": args.apostrophe_mult}

### find and read the digits of a single frame

def read_digits_on_frame(image):

    if args.images:
        comp_img = np.zeros((11*args.digits_height,5*args.digits_width,3), np.uint8)
    output_digits = []
    
    for i in range(5):
        img = image[args.digits_y:args.digits_y+args.digits_height, args.digits_x+args.digits_spacing*i:args.digits_x+args.digits_spacing*i+args.digits_width, :]
        img = img.copy()
        #blur = cv2.GaussianBlur(img,(139,139),0) # this is too slow
        blur = np.zeros(img.shape, np.uint8)
        blur[:,:] = frame.mean(axis=0).mean(axis=0)
        diff = cv2.subtract(128 + cv2.subtract(img,blur),cv2.subtract(blur,img))
        diff = cv2.cvtColor(diff, cv2.COLOR_BGR2GRAY)

        score = []
        #score_addn = [-0.02, 0.015, 0, 0.01, 0,  0, 0, 0.015, 0, 0,  0.07]
        score_addn = [0,0.01,0,0.01,0, 0,0,0,0,0, 0.03]
        for j in range(11):
            template = templates[j]
            res = cv2.matchTemplate(diff,template,cv2.TM_SQDIFF_NORMED)
            score.append((j,res.min(axis=0).min(axis=0) + score_addn[j]))

        score = sorted(score, key=lambda x: x[1])
        pred = score[0][0] if score[0][1] < 0.18 else 10

        #if args.verbose:
        #    print(",".join(["%d %.3f" % x for x in score]))
        if args.images:
            for j in range(11):
                temp_height,temp_width = templates[j].shape[:2]
                temp_x = i*args.digits_width+(args.digits_width-temp_width)//2
                temp_y = j*args.digits_height+(args.digits_height-temp_height)//2
                comp_img[j*args.digits_height:j*args.digits_height+args.digits_height, i*args.digits_width:i*args.digits_width+args.digits_width, 0] = diff
                comp_img[j*args.digits_height:j*args.digits_height+args.digits_height, i*args.digits_width:i*args.digits_width+args.digits_width, 1] = (0 if pred==j else diff)
                comp_img[j*args.digits_height:j*args.digits_height+args.digits_height, i*args.digits_width:i*args.digits_width+args.digits_width, 2] = 128
                comp_img[temp_y:temp_y+temp_height, temp_x:temp_x+temp_width, 2] = templates[j]
        
        output_digits.append(pred)

    # sss = "files/digits6/" + str(count) + "-" + "".join([str(i) if i < 10 else '_' for i in output_digits]) + ".png"
    # print(sss)
    # cv2.imwrite(sss, image)

    print("digits " + "".join([str(i) if i < 10 else '_' for i in output_digits]), flush=True)
    # if args.images:
    #     cv2.imshow('Digit', comp_img)
    #     cv2.waitKey(500)

### check for frames of the challenge mode result screen

# # https://stackoverflow.com/questions/50899692/most-dominant-color-in-rgb-image-opencv-numpy-python
# def bincount_app(a):
#     a2D = a.reshape(-1,a.shape[-1])
#     a2D = np.floor_divide(a2D,64)
#     col_range = (4, 4, 4) # generically : a2D.max(0)+1
#     a1D = np.ravel_multi_index(a2D.T, col_range)
#     return np.unravel_index(np.bincount(a1D).argmax(), col_range)
    
# def is_chresult_screen(frame):
#     height,width = frame.shape[:2]
#     x = width//8
#     y = height//25
#     window = frame[0:y, 3*x:5*x, :]
#     b,g,r = window.mean(axis=0).mean(axis=0)
#     #print("frame: %d %d %d" % (b,g,r))
#     return abs(b-252) + abs(g-11) + abs(r-1) < 15 or abs(b-128) + abs(g-0) + abs(r-0) < 5
#     # b,g,r = bincount_app(frame)
#     # if args.verbose:
#     # return b==3 and g==2 and r==2

# def is_fadeout_screen(frame):
#     average = frame.mean(axis=0).mean(axis=0)
#     return average[0] < 5 and average[1] < 5 and average[2] < 5

def get_screen_type(frame):
    if frame.max(axis=0).max(axis=0).max(axis=0) < args.fadeout_frame_intensity:
        return "fadeout"
    height,width = frame.shape[:2]

    # look for challenge mode result screen
    x = width//8
    y = height//100
    window_top = frame[y:4*y, 3*x:5*x, :]
    b,g,r = window_top.mean(axis=0).mean(axis=0)
    if abs(b-args.chresult_color_b) < 20 and abs(g-args.chresult_color_g) + abs(r-args.chresult_color_r) < 20:
        bM,gM,rM = window_top.max(axis=0).max(axis=0)
        bm,gm,rm = window_top.min(axis=0).min(axis=0)
        if bM-bm < 35 and gM-gm+rM-rm < 25:
            return "chresult"
    
    x = width
    y = height//20
    window1 = frame[0:4*y, 0:x, :]
    window2 = frame[4*y:8*y, 0:x, :]
    window3 = frame[8*y:10*y, 0:x, :]
    window4 = frame[10*y:13*y, x//4:3*x//4, :]
    window5 = frame[13*y:height, 0:x, :]
    average1 = window1.mean(axis=0).mean(axis=0)
    average2 = window2.mean(axis=0).mean(axis=0)
    average3 = window3.mean(axis=0).mean(axis=0)
    average4 = window4.mean(axis=0).mean(axis=0)
    average5 = window5.max(axis=0).max(axis=0)

    # check for rough brightness levels
    f = args.fadeout_frame_intensity
    a = 15
    b = 45
    if max(average5) >= f+a:
        return None
    if not (average1[0] < 2*f+a and average1[1] < 2*f+a and average1[2] < 2*f+a and \
        average2[0] < 2*f+b and average2[1] < 2*f+b and \
        average3[0] < 2*f+a and average3[1] < 2*f+a and average3[2] < 2*f+a and \
        average4[0] < 2*f+b and average4[1] < 2*f+b and average4[2] < 2*f+b):
        return None

    # look for the word sublevel on the screen
    window4 = frame[10*y:13*y, 0:x, :]
    col_max = window4.max(axis=2).max(axis=0)
    black_space = []
    white_space = []
    count = 0
    white = True
    for i in range(len(col_max)):
        if col_max[i] > args.fadeout_frame_intensity+10 and i > width/40 and i < width*39/40:
            if not white:
                black_space.append(count)
                count = 0
            white = True
            count += 1
        else:
            if white and count > 0:
                white_space.append(count)
                count = 0
            white = False
            count += 1
    black_space.append(count)
    #print(col_max)
    
    if len(white_space) >= 3 and sum([1 if x>width*10/960 else 0 for x in white_space]) <= 12 \
        and max(white_space) > width * 25/960 and max(white_space) < width * 90/960 \
        and black_space[0] > width/6 and black_space[-1] > width/6 \
        and black_space[0] < width*7/16 and black_space[-1] < width*7/16 \
        and sum(white_space) > width * 100/960 \
        and (black_space[-2] > min(white_space[0:3])/2 or black_space[-3] > min(white_space[0:3])/2):
        # word sublevel is found

        # check for yellow text
        window3 = frame[8*y:10*y, width//4:3*width//4, :]
        average3 = window3.mean(axis=0).mean(axis=0)
        if average3[2]-average3[0] and average3[1]-average3[0] > args.chenter_redness:
            return "areaenter"

        # check for red bg.
        window2 = frame[4*y:8*y, width//4:3*width//4, :]
        average2 = window2.mean(axis=0).mean(axis=0)
        if average2[2]-average2[0] > args.chenter_redness:
            return "chenter"
        else:
            return "storyenter"
    else:
        if args.verbose and False and len(white_space) > 1:
            print(white_space)
            if not len(white_space) >= 3:
                print("whitespace too short")
            if not sum([1 if x>width*10/960 else 0 for x in white_space]) <= 12:
                print("whitespace too long")
            if not max(white_space) > width * 25/960:
                print("whitespace too thin")
            if not max(white_space) < width * 150/960:
                print("whitespace too thick")
            if not black_space[0] > width/6:
                print("blackspace 0 too thin")
            if not black_space[-1] > width/6:
                print("blackspace -1 too thin")
            if not black_space[0] < width*7/16:
                print("blackspace 0 too thick")
            if not black_space[-1] < width*7/16:
                print("blackspace -1 too thick") 
            if not sum(white_space) > width * 100/960:
                print("sum whitespace too thin " + str(sum(white_space))) 
            if not (black_space[-2] > min(white_space[0:3])/2 or black_space[-3] > min(white_space[0:3])/2):
                print("blackspace gap too thin")

    return "nearfadeout"


# def generate_new_templates(image):

#     copy = image.copy()
    
#     for i in range(5):
#         img = image[args.y:args.y+args.height, args.x+args.spacing*i:args.x+args.spacing*i+args.width, :]
#         img = img.copy()
#         #blur = cv2.GaussianBlur(img,(139,139),0)
#         blur = np.zeros(img.shape, np.uint8)
#         blur[:,:] = frame.mean(axis=0).mean(axis=0)
#         diff = cv2.subtract(128 + cv2.subtract(img,blur),cv2.subtract(blur,img))
#         diff = cv2.cvtColor(diff, cv2.COLOR_BGR2GRAY)

#         cv2.imwrite(args.templates + str(count) + "-" + str(i) + ".png", diff)

#         if i % 2 == 0:
#             copy[args.y:args.y+args.height, args.x+args.spacing*i:args.x+args.spacing*i+args.width, 2] = 200
#         else:
#             copy[args.y:args.y+args.height, args.x+args.spacing*i:args.x+args.spacing*i+args.width, 1] = 200
    
#     cv2.imshow('Digit', copy)
#     cv2.waitKey(args.template_wait)

#     with open("files/continuous_config.txt", "r") as f:
#         updated = Namespace(**ast.literal_eval(f.read()))
#         args.x = updated.x
#         args.y = updated.y
#         args.spacing = updated.spacing
#         args.width = updated.width
#         args.height = updated.height
    
falling_img = None
union_img = None
frames_since_first_story = 10000
frames_since_last_story = 10000
story_frames = []
story_frames_processed = False
num_letters_info = 0

def process_story_frames_name_known():
    print("processing story frames with name known")

    # find the cave name
    cave_name = ""

    global default_cave_index
    global num_letters_info
    global falling_img
    read_from_cave_name_file = False
    try:
        with open("files/cave_name.txt") as f:
            cave_name = f.readline().strip()
    except:
        pass
    if cave_name == "":
        cave_name = default_cave_order[default_cave_index]
        default_cave_index += 1
    else:
        read_from_cave_name_file = True
    #print("cave=" + cave_name)
    cave_name_string = cave_name
    cave_name = cave_name.split("_")[1:] if cave_name[0]=="_" else [i for i in cave_name.replace("_"," ")]
            

    height,width = story_frames[0].shape[:2]

    #print(height)
    #print(width)

    # compute the average image after the letters have stopped moving
    if args.images:
        num_avg = 25
        sum_img = story_frames[0].copy()
        sum_img[:,:,:] = 0
        for frame in story_frames[-num_avg:]:
            sum_img = sum_img + frame / num_avg
        _,avg_thresh_img = cv2.threshold(sum_img,75,255,cv2.THRESH_BINARY)

    # important params
    max_for_falling = args.max_for_falling # IMPORTANT PARAM
    max_row_for_falling = int(height*max_for_falling)

    # find the expected with of the image
    temp_w = 0
    temp_h = 0
    for l in cave_name:
        if l in letters:
            img = letters[l]
            temp_h = max(temp_h, img.shape[0])
            temp_w += img.shape[1]
        else:
            temp_w += letters['l'].shape[1] * other_letters_w[l]

    # compute the letters postions, scrunching if necesary
    xs0 = []
    xs1 = []
    x_off = int(width/2 - temp_w/2 + int(args.letters_xoffset*width))
    y_off = int(height*args.letters_yoffset)
    x_scrunch = 1
    x_scrunch_limit = args.x_scrunch_limit
    if temp_w > x_scrunch_limit * width:
        x_scrunch = x_scrunch_limit * width/temp_w
        x_off = int(width * (1-x_scrunch_limit)//2)+int(args.letters_xoffset*width)
        #print("x scr " + str(x_scrunch))
    if args.images:
        sum_img[:,:,0]=0
        sum_img[:,int(width*(1-x_scrunch_limit)//2)+int(args.letters_xoffset*width),0] = 255
        sum_img[:,int(width-width*(1-x_scrunch_limit)//2)+int(args.letters_xoffset*width),0] = 255
    for l in cave_name:
        xs0.append(int(x_off))
        if l in letters:
            if args.images:
                img = letters[l].copy()
                img[:,:,1:2] = 0
                img = cv2.resize(img, (int(img.shape[1]*x_scrunch), img.shape[0] ), interpolation=cv2.INTER_NEAREST)
                sum_img[y_off:y_off+img.shape[0], int(x_off):int(x_off)+img.shape[1], :] = sum_img[y_off:y_off+img.shape[0], int(x_off):int(x_off)+img.shape[1], :] + img
            x_off += letters[l].shape[1]*x_scrunch
        else:
            x_off += letters['l'].shape[1] * other_letters_w[l] * x_scrunch
        xs1.append(int(x_off))
    
    # determine vertical cutoffs to use
    xs0_use = []
    xs1_use = []
    spacing_needed = int(width * 0.008)
    #print("sp " + str(spacing_needed))
    for i,l in enumerate(cave_name):
        if l not in letters:
            xs0_use.append(xs0[i])
            xs1_use.append(xs1[i])
            continue
        x0 = max(xs0[i]+1, xs1[i-1]-int((letters[cave_name[i-1]].shape[1]-letters_xoff[cave_name[i-1]]-letters_width[cave_name[i-1]])*x_scrunch)+spacing_needed if i>0 and cave_name[i-1] in letters else 0)
        x1 = min(xs1[i]-1, xs0[i+1]+int(letters_xoff[cave_name[i+1]]*x_scrunch)-spacing_needed if i+1<len(xs0) and cave_name[i+1] in letters else width)
        if i+1<len(xs0) and cave_name[i+1]=="'":
            x1 -= spacing_needed
        if x0 + 4 >= x1:
            diff = (x0 + 4 - x1) // 2
            x0 -= diff
            x1 += diff
        xs0_use.append(x0)
        xs1_use.append(x1)
        if args.images:
            sum_img[0:height//2,x0,0] = 255
            sum_img[0:height//2,x1,0] = 255

    
    # for each frame with a falling letter, compute the location of the falling letter
    locs = np.zeros((len(cave_name), 48))
    for story_frame_count,frame in enumerate(story_frames[0:48]):
        #cv2.imwrite("output/!im/debug_a" + str(story_frame_count)+".png",frame)

        #print("storyenter " + str(story_frame_count), flush=True)
        #_,img = cv2.threshold(frame,13,255,cv2.THRESH_BINARY) # may need to change this for wii
        for i,l in enumerate(cave_name):
            if l not in letters: continue
            #print(f"{l} {xs0_use[i]} {xs1_use[i]} {img.shape}")
            section_img = frame[0:max_row_for_falling,xs0_use[i]:xs1_use[i],:]
            if section_img.max(axis=2).max(axis=1).max(axis=0) < args.fadeout_frame_intensity:
                continue
            section_img_blur = cv2.blur(section_img, (25,25))
            section_img = cv2.subtract(section_img, section_img_blur)
            #if args.images and num_letters_info == 0:
                #cv2.imwrite("output/!im/chars/section_" + str(num_letters_info) + " " + str(i) + "_" + str(story_frame_count) + ".png", section_img)
                #cv2.imwrite("output/!im/chars/section_" + str(num_letters_info) + " " + str(i) + "_" + str(story_frame_count) + "b.png", section_img_blur)
            row_means = section_img.max(axis=2).max(axis=1)
            #print(row_means)
            first_nonzero = -1
            last_nonzero = -1
            num_rows_with_stuff = 0
            for j,r in enumerate(row_means):
                if r > args.letter_intensity_thresh:
                    if first_nonzero == -1:
                        first_nonzero = j
                    num_rows_with_stuff += 1
                    last_nonzero = j
            if last_nonzero >= 4 and last_nonzero < max_row_for_falling-1 and num_rows_with_stuff > min(last_nonzero*.75, letters_height[l]*.75):
                # print(str(i) + " " + str(story_frame_count))
                # obs_means = section_img.max(axis=2).max(axis=1)
                # temp_means = letters[l].max(axis=2).max(axis=1)
                # print(",".join([str(int(x)) for x in obs_means]))
                # print(",".join([str(int(x)) for x in temp_means]))
                # obs_shift = []
                # temp_shift = []
                # for j in range(5, -letters_height[l] - 5, -1):
                #     idx = last_nonzero + j
                #     obs_shift.append(int(obs_means[idx]) if idx >= 0 and idx < len(obs_means) else -1)
                #     idx = len(temp_means) - letters_y_addn[l] + j - 1
                #     temp_shift.append(int(temp_means[idx]) if idx >= 0 and idx < len(temp_means) else -1)
                # print(" ".join(["%3d" % x for x in obs_shift]))
                # print(" ".join(["%3d" % x for x in temp_shift]))
                #if first_nonzero > 0:
                #    print(str(i) + " " + str(last_nonzero-first_nonzero) + " " + str(letters_height[l]))
                locs[i][story_frame_count] = last_nonzero 
                #print(str(i//2) + " " + str(last_nonzero))
                #info_string.append(str(i//2+spaces_between[i//2])+","+str(last_nonzero)+",")
                #union_img[last_nonzero,xs0_use[i]:xs1_use[i],:]=0
                #union_img[last_nonzero,xs0_use[i]:xs1_use[i],2]=255
                if args.images:
                    falling_img[last_nonzero,xs0_use[i]:xs1_use[i],:]=0
                    falling_img[last_nonzero,xs0_use[i]:xs1_use[i],2]=255
                    #img[last_nonzero,whitespace[i]:whitespace[i+1],:]=0
                    #img[last_nonzero,whitespace[i]:whitespace[i+1],2]=255
                    if num_letters_info == 0:
                        ims = frame[0:max_row_for_falling,xs0_use[i]:xs1_use[i],2]
                        imgs = ims.copy()
                        imgs[last_nonzero,::5] = 255
                        if first_nonzero > 0:
                            imgs[first_nonzero,::5] = 255
                        cv2.imwrite("output/!im/chars/section_" + str(num_letters_info) + "_" + str(i) + "_" + str(story_frame_count) + "c.png", imgs)
                
        if args.images:
            falling_img = falling_img + frame/5
            #cv2.imwrite("output/!im/debug_" + str(count) + "s" + str(story_frame_count) + ".png", img)
        #info_string.append(";")

    # if args.verbose:
    #     for x in locs:
    #         print(x)

    # try to do some sanity checking on the output...
    # each non space char should have 3-6 entries, all consecutive, and the diffs should be around a certain value
    # otherwise, zero out
    num_bad_char = 0
    num_good_char = 0
    for i,l in enumerate(cave_name):
        nonzero = []
        nonzero_idx = []
        for j,y in enumerate(locs[i]):
            if y>0:
                nonzero.append(y)
                nonzero_idx.append(j)
        if len(nonzero) == 0: 
            if not (l==" " or l =="'"):
                num_bad_char += 1
            continue
        good = len(nonzero) >= 3 and len(nonzero) <= 7 and nonzero_idx[-1]-nonzero_idx[0] == len(nonzero)-1
        for j in range(len(nonzero)-1):
            diff = nonzero[j+1]-nonzero[j]
            if diff/height < 10/720 or diff/height > 35/720:
                good=False
        if not good:
            num_bad_char += 1
            locs[i,:] = 0
        else:
            num_good_char += 1

    # if still good, create the info string. If bad but still seems like a cave entry, write out an empty infostring
    # otherwise, do nothing (this case shouldn't be hit hopefully)

    if num_bad_char > num_good_char and num_good_char < 4:
        print("storyfailed good:"+str(num_good_char)+" bad:"+str(num_bad_char))
    else:
        num_letters_info += 1
        if num_bad_char > len(cave_name)/4 and False: #disable this now that we have a timeout
            print("lettersinfo,,100,0;;;", flush=True)
        else:
            # compute & write out the info string...
            info_string = []
            offset_info = []
            for i,l in enumerate(cave_name):
                if l in letters:
                    offset_info.append(str(letters_y_addn[l]))
                else:
                    offset_info.append(str(-1))

            for j in range(len(locs[0])):
                s = ""
                for i in range(len(locs)):
                    if locs[i][j] > 0:
                        s += str(i) + "," + str(int(locs[i][j])) + ","
                s += ";"
                info_string.append(s)

            print("lettersinfo," + cave_name_string.replace(" ","_") + "," + str(height) 
                + "," + str(len(cave_name)) + "," + ",".join(offset_info) + ";" + "".join(info_string), flush=True) 
        
        if read_from_cave_name_file:
            with open('files/cave_name.txt', 'r') as fin:
                data = fin.read().splitlines(True)
            with open('files/cave_name.txt', 'w') as fout:
                fout.writelines(data[1:])   
        
    if args.images:
        min_row_for_columns = 26*height//100
        max_row_for_columns = 35*height//100
        sum_img[min_row_for_columns,:,:] = 255
        sum_img[max_row_for_columns,:,:] = 255
        # union_img[max_row_for_falling,:,:] = 0 
        # union_img[max_row_for_falling,:,0] = 155
        falling_img[max_row_for_falling,:,:] = 0 
        falling_img[max_row_for_falling,:,0] = 155


        cv2.imwrite("output/!im/debug_" + str(count) + "!avg" + ".png", sum_img)
        cv2.imwrite("output/!im/debug_" + str(count) + "!union_p" + ".png", falling_img)

    # if args.verbose:
    #     for x in locs:
    #         print(x)


def random_colorize(img):
    ret = img.copy()
    ret[:,:,0] = img[:,:,2]*(random.randint(100,255)/255)
    ret[:,:,1] = img[:,:,2]*(random.randint(100,255)/255)
    ret[:,:,2] = img[:,:,2]*(random.randint(100,255)/255)
    return ret

def adjust_gamma(image, gamma=1.0):
	# build a lookup table mapping the pixel values [0, 255] to
	# their adjusted gamma values
	invGamma = 1.0 / gamma
	table = np.array([((i / 255.0) ** invGamma) * 255
		for i in np.arange(0, 256)]).astype("uint8")
	# apply gamma correction using the lookup table
	return cv2.LUT(image, table)

    
### watch the video, find frames of the challenge mode result screen, and read the digits  
skip = 0
count = 0
last_frame_was_digit = False
last_perf_time = time.perf_counter()

ring_buffer_size = 10
ring_buffer_idx = 0
ring_buffer = [None for i in range(ring_buffer_size)]

# frame_for_save_count = 0
# frames_to_output_anyways = 0
# save_to_im_save = False

# while True:
#     frame_for_save_count += 1
#     frame = cv2.imread('im_save/' + str(frame_for_save_count) + '.png', cv2.IMREAD_COLOR)
#     ret = True

while(cap.isOpened()):
    ret, frame = cap.read()

    count += 1
    frames_since_first_story += 1
    frames_since_last_story += 1
    
    if not ret:
        break
    if skip > 0:
        skip -= 1
        continue

    if count == 1 and not isinstance(args.camera, int): # skip ahead
        try:
            if args.skip_seconds > 0:
                cap.set(cv2.CAP_PROP_POS_FRAMES, cap.get(cv2.CAP_PROP_POS_FRAMES)+args.skip_seconds*30)
                continue
        except:
            pass
 
    height,width = frame.shape[:2]
    if count == 1:
        print(f"height {height} width {width}")
    if (height != args.resize_y or width != args.resize_x) and args.resize:
        frame = cv2.resize(frame, (args.resize_x,args.resize_y), interpolation=cv2.INTER_NEAREST)
        height,width = frame.shape[:2]
    if args.crop:
        frame = frame[args.crop_y1:args.crop_y2,args.crop_x1:args.crop_x2,:]
    if args.gamma != 1:
        frame = adjust_gamma(frame, args.gamma)
    
    # ring_buffer[ring_buffer_idx] = frame
    # ring_buffer_idx = (ring_buffer_idx + 1) % ring_buffer_size
    # print(ring_buffer_idx)

    frame_type = get_screen_type(frame)
    
    if frame_type == 'fadeout':
        print("fadeout " + str(count),flush=True)
    elif frame_type == 'chenter':
        print("chlevelenter", flush=True)
    elif frame_type == 'areaenter':
        print("areaenter", flush=True)
    elif frame_type == 'storyenter':
        print("storyenter " + str(count), flush=True)
        #cv2.imwrite("output/!im/debug_" + str(count) + "test.png",frame)
        img = frame.copy()
        story_frames.append(img)
        #_,img = cv2.threshold(img,args.letter_intensity_thresh,255,cv2.THRESH_BINARY)
        #kernel = np.ones((3, 3), np.uint8) 
        #img = cv2.erode(img, kernel) 
        if frames_since_last_story > 80:
            print("resetting storyenter")
            falling_img = np.zeros(frame.shape)
            union_img = np.zeros(frame.shape)
            frames_since_first_story = 0
            story_frames = []
            story_frames.append(img)
            story_frames_processed = False
        frames_since_last_story = 0
        # frames_to_output_anyways = 40

        if frames_since_first_story >= 48 and len(story_frames) >= 48:
            if not story_frames_processed:
                story_frames_processed = True
                process_story_frames_name_known()
    elif frames_since_last_story >= 5 and not story_frames_processed and len(story_frames) >= 15:
        print("shortened storyenter " + str(len(story_frames)))
        story_frames_processed = True
        process_story_frames_name_known()

    elif frame_type == 'chresult':
        read_digits_on_frame(frame)
        last_frame_was_digit = True
    else:
        if last_frame_was_digit:
            print("donedigit",flush=True)
        elif frame_type == "nearfadeout":
            print("nearfadeout " + str(count),flush=True)
        elif frames_since_last_story > 60:
            skip = 0 if isinstance(args.camera, int) else 10
            #cap.set(cv2.CAP_PROP_POS_FRAMES, cap.get(cv2.CAP_PROP_POS_FRAMES)+10)
        last_frame_was_digit = False

    # if frames_to_output_anyways > 0 and save_to_im_save and args.images:
    #     frames_to_output_anyways -= 1
    #     frame_for_save_count += 1
    #     cv2.imwrite("im_save/" + str(frame_for_save_count) + ".png", frame)
    #     if frames_to_output_anyways == 0:
    #         for jjj in range(40):
    #             jjjj = frame.copy()
    #             jjjj[:,:,:]=0
    #             frame_for_save_count += 1
    #             cv2.imwrite("im_save/" + str(frame_for_save_count) + ".png", jjjj)

    
    if args.playback:
        cv2.imshow('Frame',frame)
        key_press = cv2.waitKey(1)
        if key_press & 0xFF == ord('q'):
            break

    this_time = time.perf_counter()
    if args.verbose and count<10:
        print(f"timer: {this_time-last_perf_time:.4f}")
    last_perf_time = this_time

cap.release()
cv2.destroyAllWindows()
print("exit")