ii-pix/dither_apply.pyx
2021-01-11 23:54:00 +00:00

147 lines
5.1 KiB
Cython

# cython: infer_types=True
cimport cython
import numpy as np
# from cython.parallel import prange
# from cython.view cimport array as cvarray
# from libc.stdlib cimport malloc, free
@cython.boundscheck(False)
@cython.wraparound(False)
cdef float clip(float a, float min_value, float max_value) nogil:
return min(max(a, min_value), max_value)
@cython.boundscheck(False)
@cython.wraparound(False)
cdef void apply_one_line(float[:, :, ::1] pattern, int xl, int xr, float[:, ::1] image, float[] quant_error) nogil:
cdef int i, j
cdef float error
for i in range(xr - xl):
for j in range(3):
error = pattern[0, i, 0] * quant_error[j]
image[xl+i, j] = clip(image[xl + i, j] + error, 0, 255)
@cython.boundscheck(False)
@cython.wraparound(False)
def apply(dither, screen, int x, int y, float [:, :, ::1]image, float[::1] quant_error):
cdef int i, j, k
# XXX only need 2 dimensions now
cdef float[:, :, ::1] pattern = dither.PATTERN
cdef int yt, yb, xl, xr
yt, yb = y_dither_bounds(pattern, dither.ORIGIN[0], screen.Y_RES, y)
xl, xr = x_dither_bounds(pattern, dither.ORIGIN[1], screen.X_RES, x)
cdef float error
# We could avoid clipping here, i.e. allow RGB values to extend beyond
# 0..255 to capture a larger range of residual error. This is faster
# but seems to reduce image quality.
for i in range(yb - yt):
for j in range(xr - xl):
for k in range(3):
error = pattern[i, j, 0] * quant_error[k]
image[yt+i, xl+j, k] = clip(image[yt+i, xl+j, k] + error, 0, 255)
@cython.boundscheck(False)
@cython.wraparound(False)
cdef x_dither_bounds(float [:, :, ::1] pattern, int x_origin, int x_res, int x):
cdef int el = max(x_origin - x, 0)
cdef int er = min(pattern.shape[1], x_res - 1 - x)
cdef int xl = x - x_origin + el
cdef int xr = x - x_origin + er
return xl, xr
@cython.boundscheck(False)
@cython.wraparound(False)
cdef y_dither_bounds(float [:, :, ::1] pattern, int y_origin, int y_res, int y):
pshape = pattern.shape
et = max(y_origin - y, 0)
eb = min(pshape[0], y_res - 1 - y)
yt = y - y_origin + et
yb = y - y_origin + eb
return yt, yb
@cython.boundscheck(False)
@cython.wraparound(False)
def dither_lookahead(
screen, float[:,:,::1] image_rgb, dither, differ, int x, int y, char[:, ::1] options_4bit,
float[:, :, ::1] options_rgb, int lookahead):
cdef float[:, :, ::1] pattern = dither.PATTERN
cdef int x_res = screen.X_RES
cdef int dither_x_origin = dither.ORIGIN[1]
cdef int xl, xr
xl, xr = x_dither_bounds(pattern, dither_x_origin, x_res, x)
# X coord value of larger of dither bounding box or lookahead horizon
cdef int xxr = min(max(x + lookahead, xr), x_res)
cdef int i, j, k, l
cdef float[:, :, ::1] lah_image_rgb = np.empty(
(2 ** lookahead, lookahead + xr - xl, 3), dtype=np.float32)
for i in range(2**lookahead):
# Copies of input pixels so we can dither in bulk
for j in range(xxr - x):
for k in range(3):
lah_image_rgb[i, j, k] = image_rgb[y, x+j, k]
# lah_image_rgb[:, 0:xxr - x, :] = image_rgb[y, x:xxr, :]
# Leave enough space at right of image so we can dither the last of our lookahead pixels.
for j in range(xxr - x, lookahead + xr - xl):
for k in range(3):
lah_image_rgb[i, j, k] = 0
cdef float[3] quant_error
# Iterating by row then column is faster for some reason?
for i in range(xxr - x):
xl, xr = x_dither_bounds(pattern, dither_x_origin, x_res, i)
for j in range(2 ** lookahead):
# Don't update the input at position x (since we've already chosen
# fixed outputs), but do propagate quantization errors to positions >x
# so we can compensate for how good/bad these choices were
# options_rgb choices are fixed, but we can still distribute
# quantization error from having made these choices, in order to compute
# the total error
for k in range(3):
quant_error[k] = lah_image_rgb[j, i, k] - options_rgb[j, i, k]
apply_one_line(pattern, xl, xr, lah_image_rgb[j, :, :], quant_error)
cdef int best
cdef int best_error = 2**31-1
cdef int total_error
cdef long flat, dist, bit4
cdef long r, g, b
cdef (unsigned char)[:, ::1] distances = differ._distances
for i in range(2**lookahead):
total_error = 0
for j in range(lookahead):
# Clip lah_image_rgb into 0..255 range to prepare for computing colour distance
r = long(clip(lah_image_rgb[i, j, 0], 0, 255))
g = long(clip(lah_image_rgb[i, j, 1], 0, 255))
b = long(clip(lah_image_rgb[i, j, 2], 0, 255))
flat = (r << 16) + (g << 8) + b
bit4 = options_4bit[i, j]
dist = distances[flat, bit4]
total_error += dist ** 2
if total_error >= best_error:
break
if total_error < best_error:
best_error = total_error
best = i
return options_4bit[best, 0], options_rgb[best, 0, :]