convert.py

import cv2
import numpy as np
import time
import multiprocessing
from joblib import Parallel, delayed

aspect_ratio = 16 / 9

#Dimensions of the output in terminal characters
width = 80
height = int(width / (2 * aspect_ratio))

# Framerate of the source and output video
src_FPS = 30
dest_FPS = 15


num_cores = multiprocessing.cpu_count()

cap = cv2.VideoCapture('vid.mp4')
frames = []


#Our characters, and their approximate brightness values
charSet = " ,(S#g@"
levels = [0.000, 1.060, 2.167, 3.036, 3.977, 4.730, 6.000]
numChrs = len(charSet)


# Converts a greyscale video frame into a dithered 7-color frame
def processFrame(scaled):
  reduced = scaled * 6. / 255
  
  out = np.zeros((height, width), dtype= np.int8)
  
  line = ''
  for y in range(height):
    for x in range(width):
      level = min(6, max(0, int(reduced[y, x])))
      
      error = reduced[y, x] - levels[level]
  
      err16 = error / 16
  
      if (x + 1) < width:
        reduced[y    , x + 1] += 7 * err16
      if (y + 1) < height:
        reduced[y + 1, x    ] += 5 * err16
  
        if (x + 1) < width:
          reduced[y + 1, x + 1] += 1 * err16
        if (x - 1) > 0:
          reduced[y + 1, x - 1] += 3 * err16
      
      out[y, x] = level

  return out

# Prints out a frame in ASCII
def toStr(frame):
  line = ''
  
  for y in range(height):
    for x in range(width):
      line += charSet[frame[y, x]]
    line += '\n'
  
  return line

# Compute the prediction matrix for each character combination
# Each row in this matrix corresponds with a character, and lists
# in decreasing order, the next most likely character to follow this one
#
# We also convert the provided frame to this new markov encoding, and provide
# the count of each prediction rank to be passed to the huffman encoding
def computeMarkov(frame):
  mat = np.zeros((numChrs, numChrs)).astype(np.uint16)

  h, w = frame.shape

  prevChar = 0

  for y in range(h):
    for x in range(w):
      char = frame[y, x]

      mat[prevChar, char] += 1

      prevChar = char
  
  ranks = np.zeros((numChrs, numChrs)).astype(np.uint16)
  for i in range(numChrs):
    ranks[i][mat[i].argsort()] = 6 - np.arange(numChrs)

  cnt = np.zeros(numChrs).astype(np.uint16)

  out = np.zeros_like(frame)
  prevChar = 0
  for y in range(h):
    for x in range(w):
      char = frame[y, x]

      out[y, x] = ranks[prevChar, char]
      cnt[out[y, x]] += 1

      prevChar = char
  
  return out, ranks, cnt

# Computes Huffman encodings based on the counts of each number in the frame
def computeHuffman(cnts):
  codes = []
  sizes = []
  tree = []
  for i in range(len(cnts)):
    codes.append('')
    sizes.append((cnts[i], [i], i))
    tree.append((i, i))

  sizes = sorted(sizes, reverse = True)

  while(len(sizes) > 1):
    # Take the two least frequent entries
    right = sizes.pop()
    left  = sizes.pop()

    (lnum, lchars, ltree) = left
    (rnum, rchars, rtree) = right

    # Add a new tree node
    tree.append((ltree, rtree))

    # Update the encodings
    for char in lchars:
      codes[char] = '0' + codes[char]
    for char in rchars:
      codes[char] = '1' + codes[char]

    # Merge these entries
    new = (lnum + rnum, lchars + rchars, len(tree) - 1)

    # Find the position in the list to inser these entries
    for insertPos in range(len(sizes) + 1):
      # Append if we hit the end of the list
      if(insertPos == len(sizes)):
        sizes.append(new)
        break
        
      cnt, _, _ = sizes[insertPos]
      
      if(cnt <= lnum + rnum):
        sizes.insert(insertPos, new)
        break

  return codes, tree

# Take a markov frame and an array of huffman encodings, and create an array of
# bytes corresponding to the compressed frame
def convertHuffman(markovFrame, codes):
  out = ''

  h, w = frame.shape

  for y in range(h):
    for x in range(w):
      out = out + codes[markovFrame[y, x]]
  
  # Pad this bit-string to be byte-aligned
  padding = (8 - (len(out) % 8)) % 8
  out += ("0" * padding)

  # Convert each octet to a char
  compressed = []
  for i in range(0, len(out), 8):
    byte = out[i:i+8]
    char = 0
    for bit in range(8):
      char *= 2
      if byte[bit] == "1":
        char += 1

    compressed.append(char)

  return compressed

# Converts a rank matrix into a binary format to be stored in the output file
def encodeMatrix(ranks):
  out = []

  for row in ranks:
    encoding = 0

    fact = 1
    idxs = list(range(len(charSet)))

    for rank in range(len(charSet)):
      rank = list(row).index(rank)
      encoding += idxs.index(rank) * fact

      fact *= len(idxs)
      idxs.remove(rank)
    
    low_byte = int(encoding) % 256
    high_byte = (encoding - low_byte) // 256
    
    out.append(high_byte)
    out.append(low_byte)

  return out

# Converts the huffman tree into a binary format to be stored in the output file
def encodeTree(tree):
  tree = tree[len(charSet):]

  out = []

  for (l, r) in tree:
    out.append(l * 16 + r)

  return out

# Load all frames into memory, then convert them to greyscale and resize them to
# our terminal dimensions
vidFrames = []
while(cap.isOpened()):
  if (len(vidFrames) % 500) == 0:
    print('Loading frame %i' % len(vidFrames))
  
  # Skip frames to reach target framerate
  for i in range(int(src_FPS / dest_FPS)):
    ret, frame = cap.read()
  
  if frame is None:
    break
  
  gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
  scaled = cv2.resize(gray, (width, height))
  
  vidFrames.append(scaled)

# Compute dithering for all frames in parallel
print('Dithering Frames')
frames = Parallel(n_jobs=num_cores)(delayed(processFrame)(i) for i in vidFrames)

# Compute markov and huffman encoding for all frames
print('Encoding Frames')
out = ''
size = 0

with open('data', 'wb') as filehandle:
  for frame in frames:
    markovFrame, ranks, cnts = computeMarkov(frame)

    codes, tree = computeHuffman(cnts)
    chars = convertHuffman(markovFrame, codes)

    matrixData = encodeMatrix(ranks)
    treeData = encodeTree(tree)

    filehandle.write(bytearray(matrixData))
    filehandle.write(bytearray(treeData))
    filehandle.write(bytearray(chars))

    size += len(matrixData) + len(treeData) + len(chars)

# Print the size of the output file in human-readable form
if size > 1048576:
  print('%.1f MB' % (size / 1048576))
elif size > 1024:
  print('%.1f KB' % (size / 1024))
else:
  print('%i B' % (size))