ii-pix/dither.pyx

257 lines
9.5 KiB
Cython
Raw Normal View History

2021-01-10 22:12:14 +00:00
# cython: infer_types=True
2021-02-04 23:00:10 +00:00
# cython: profile=True
2021-01-10 22:12:14 +00:00
cimport cython
2021-01-15 22:58:01 +00:00
import functools
2021-01-10 22:12:14 +00:00
import numpy as np
2021-02-05 00:08:14 +00:00
# cimport numpy as np
2021-01-12 10:00:56 +00:00
from cython.view cimport array as cvarray
2021-01-12 10:21:31 +00:00
from libc.stdlib cimport malloc, free
2021-01-10 22:12:14 +00:00
2021-01-22 22:26:10 +00:00
2021-01-22 22:06:25 +00:00
# TODO: use a cdef class
# C-level description of an error-diffusion pattern.
cdef struct Dither:
    # Pattern weights flattened row by row: the weight for pattern row r and
    # column c lives at pattern[r * x_shape + c].
    float* pattern
    # Number of pattern columns.
    int x_shape
    # Number of pattern rows.
    int y_shape
    # Column offset of the pattern origin (subtracted from x when locating
    # the pattern over the image).
    int x_origin
    # Row offset of the pattern origin (subtracted from y in the same way).
    int y_origin
2021-01-22 22:19:48 +00:00
# C-level view of an image stored as one contiguous float buffer.
cdef struct Image:
    # Image samples flattened into a single C array.
    float* flat
    # Extent of the first image axis.
    int shape0
    # Extent of the second image axis.
    int shape1
    # Extent of the third image axis.
    int shape2
2021-01-10 22:12:14 +00:00
cdef float clip(float a, float min_value, float max_value) nogil:
    # Clamp a to the range [min_value, max_value].
    cdef float bounded = a
    # Apply the lower bound first and the upper bound second, so that the
    # upper bound wins if the two bounds are ever passed in the wrong order.
    if min_value > bounded:
        bounded = min_value
    if max_value < bounded:
        bounded = max_value
    return bounded
2021-02-04 23:00:10 +00:00
cdef int dither_bounds_xl(Dither *dither, int x) nogil:
    # Leftmost column covered by the pattern when it is positioned at column
    # x: x shifted left by the pattern origin, but never below column 0.
    cdef int left = x - dither.x_origin
    if left < 0:
        left = 0
    return left
2021-01-11 23:41:04 +00:00
2021-01-22 22:26:10 +00:00
2021-02-04 23:00:10 +00:00
cdef int dither_bounds_xr(Dither *dither, int x_res, int x) nogil:
    # Right-hand column bound for the pattern positioned at column x. The
    # pattern width is limited to the number of columns remaining between x
    # and x_res before being offset by the pattern origin.
    cdef int width = dither.x_shape
    cdef int remaining = x_res - x
    if remaining < width:
        width = remaining
    return x - dither.x_origin + width
2021-01-11 23:41:04 +00:00
2021-01-22 22:26:10 +00:00
2021-02-04 23:00:10 +00:00
cdef int dither_bounds_yt(Dither *dither, int y) nogil:
    # Topmost row covered by the pattern when it is positioned at row y:
    # y shifted up by the pattern origin, but never above row 0.
    cdef int top = y - dither.y_origin
    if top < 0:
        top = 0
    return top
2021-02-04 23:00:10 +00:00
cdef int dither_bounds_yb(Dither *dither, int y_res, int y) nogil:
    # Bottom row bound for the pattern positioned at row y. The pattern
    # height is limited to the number of rows remaining between y and y_res
    # before being offset by the pattern origin.
    cdef int height = dither.y_shape
    cdef int remaining = y_res - y
    if remaining < height:
        height = remaining
    return y - dither.y_origin + height
2021-01-22 22:26:10 +00:00
@cython.boundscheck(False)
@cython.wraparound(False)
@functools.lru_cache(None)
def lookahead_options(screen, lookahead, last_pixel_4bit, x):
    """Enumerate every combination of palette choices for upcoming pixels.

    For each combination index i in range(2 ** lookahead), bit j of i selects
    entry 0 or 1 of the options returned by
    screen.pixel_palette_options(previous_pixel, x + j). The chosen value is
    then used as the previous pixel for position j + 1.

    Results are memoised with functools.lru_cache, so every argument must be
    hashable and the returned arrays are shared between calls with equal
    arguments; callers should treat them as read-only.

    Args:
        screen: object providing pixel_palette_options(last_pixel, x).
        lookahead: number of pixels to enumerate choices for.
        last_pixel_4bit: value of the pixel preceding position x.
        x: position of the first pixel, as understood by
            screen.pixel_palette_options.

    Returns:
        Tuple (options_4bit, options_rgb): a uint8 array of shape
        (2 ** lookahead, lookahead) and a float32 array of shape
        (2 ** lookahead, lookahead, 3).
    """
    options_4bit = np.empty((2 ** lookahead, lookahead), dtype=np.uint8)
    options_rgb = np.empty((2 ** lookahead, lookahead, 3), dtype=np.float32)
    for i in range(2 ** lookahead):
        # Every combination starts from the same preceding pixel.
        output_pixel_4bit = last_pixel_4bit
        for j in range(lookahead):
            xx = x + j
            palette_choices_4bit, palette_choices_rgb = \
                screen.pixel_palette_options(output_pixel_4bit, xx)
            # Bit j of the combination index picks the option for pixel j.
            choice = (i >> j) & 1
            output_pixel_4bit = palette_choices_4bit[choice]
            options_4bit[i, j] = output_pixel_4bit
            options_rgb[i, j, :] = np.asarray(palette_choices_rgb[choice])
    return options_4bit, options_rgb
2021-01-22 22:26:10 +00:00
2021-01-21 23:23:19 +00:00
@cython.boundscheck(False)
@cython.wraparound(False)
cdef int dither_lookahead(Dither* dither,
        float[:, :, ::1] image_rgb, int x, int y, unsigned char[:, ::1] options_4bit,
        float[:, :, ::1] options_rgb, int lookahead, unsigned char[:, ::1] distances, int x_res):
    # Pick the combination of upcoming pixel choices with the lowest total
    # error and return its row index into options_4bit / options_rgb.
    #
    # For every candidate row, the pixels of image row y starting at column x
    # are copied into a scratch line, the quantization error of each fixed
    # choice is diffused along that line, and the squared distances looked up
    # in `distances` are summed. image_rgb itself is only read.
    cdef int i, j, k
    cdef int xl, xr
    # Don't bother dithering past the lookahead horizon or edge of screen.
    cdef int xxr = min(x + lookahead, x_res)
    cdef int lah_shape1 = xxr - x
    cdef int lah_shape2 = 3
    # NOTE(review): the malloc result is not checked for NULL.
    cdef float *lah_image_rgb = <float *> malloc(lah_shape1 * lah_shape2 * sizeof(float))

    cdef float[3] quant_error
    cdef unsigned char bit4
    # Default to the first candidate so the return value is always defined.
    cdef int best = 0
    cdef int best_error = 2**31-1
    cdef int total_error
    cdef long flat, dist
    cdef long r, g, b

    for i in range(1 << lookahead):
        # Working copy of input pixels
        for j in range(lah_shape1):
            for k in range(3):
                lah_image_rgb[j * lah_shape2 + k] = image_rgb[y, x+j, k]

        total_error = 0
        for j in range(lah_shape1):
            xl = dither_bounds_xl(dither, j)
            xr = dither_bounds_xr(dither, lah_shape1, j)
            # We don't update the input at position x (since we've already chosen
            # fixed outputs), but we do propagate quantization errors to positions >x
            # so we can compensate for how good/bad these choices were. i.e. the
            # options_rgb choices are fixed, but we can still distribute quantization error
            # from having made these choices, in order to compute the total error.
            for k in range(3):
                quant_error[k] = lah_image_rgb[j * lah_shape2 + k] - options_rgb[i, j, k]
            apply_one_line(dither, xl, xr, j, lah_image_rgb, lah_shape2, quant_error)
            r = <long>lah_image_rgb[j * lah_shape2 + 0]
            g = <long>lah_image_rgb[j * lah_shape2 + 1]
            b = <long>lah_image_rgb[j * lah_shape2 + 2]

            # Pack the truncated channels into the row index of `distances`.
            flat = (r << 16) + (g << 8) + b
            bit4 = options_4bit[i, j]
            dist = distances[flat, bit4]
            total_error += dist * dist
            # This candidate can no longer beat the best one found so far.
            if total_error >= best_error:
                break
        if total_error < best_error:
            best_error = total_error
            best = i
    free(lah_image_rgb)
    return best
2021-01-12 10:00:56 +00:00
2021-02-04 23:00:10 +00:00
cdef void apply_one_line(Dither* dither, int xl, int xr, int x, float[] image, int image_shape1, float[] quant_error) nogil:
    # Diffuse quant_error along a single flattened line of pixels.
    #
    # `image` holds image_shape1 floats per pixel. Columns xl..xr-1 each get
    # the error scaled by the pattern weight for their offset from column x,
    # and the result is clipped to 0..255.
    cdef int col, channel, base
    cdef float weight, delta

    for col in range(xl, xr):
        # The weight depends only on the column, not on the channel.
        weight = dither.pattern[col - x + dither.x_origin]
        base = col * image_shape1
        for channel in range(3):
            delta = weight * quant_error[channel]
            image[base + channel] = clip(image[base + channel] + delta, 0, 255)
2021-02-05 00:48:01 +00:00
@cython.boundscheck(False)
@cython.wraparound(False)
cdef void apply(Dither* dither, int x_res, int y_res, int x, int y, float[:,:,::1] image, float[] quant_error):
    # Diffuse quant_error from pixel (x, y) into the surrounding pixels of
    # `image`, which is modified in place. The affected region is given by
    # the dither_bounds_* helpers.
    cdef int row, col, channel
    cdef int top = dither_bounds_yt(dither, y)
    cdef int bottom = dither_bounds_yb(dither, y_res, y)
    cdef int left = dither_bounds_xl(dither, x)
    cdef int right = dither_bounds_xr(dither, x_res, x)

    cdef float weight, delta
    # We could avoid clipping here, i.e. allow RGB values to extend beyond
    # 0..255 to capture a larger range of residual error. This is faster
    # but seems to reduce image quality.
    # TODO: is this still true?
    for row in range(top, bottom):
        for col in range(left, right):
            # The pattern weight is shared by all three channels of a pixel.
            weight = dither.pattern[(row - y) * dither.x_shape + col - x + dither.x_origin]
            for channel in range(3):
                delta = weight * quant_error[channel]
                image[row, col, channel] = clip(image[row, col, channel] + delta, 0, 255)
2021-01-12 10:00:56 +00:00
2021-01-15 22:58:01 +00:00
@cython.boundscheck(False)
@cython.wraparound(False)
def find_nearest_colour(float[::1] pixel_rgb, unsigned char[::1] options_4bit, unsigned char[:, ::1] options_rgb, unsigned char[:, ::1] distances):
    """Return the palette option with the smallest distance to pixel_rgb.

    The three channels of pixel_rgb are truncated to integers and packed as
    (r << 16) + (g << 8) + b to form the row index into `distances`; the
    column index is the candidate value from options_4bit. On ties the
    earliest option wins.

    Args:
        pixel_rgb: the three channel values of the pixel to match.
        options_4bit: candidate values, used as column indices of
            `distances`.
        options_rgb: one row of channel values per candidate.
        distances: lookup table indexed [packed_rgb, candidate].

    Returns:
        Tuple (options_4bit[best], options_rgb[best, :]).

    Raises:
        ValueError: if options_4bit is empty.
    """
    cdef int i, dist
    cdef int best = 0
    cdef unsigned char bit4
    # Larger than any unsigned char distance, so the first option always wins
    # the first comparison.
    cdef int best_dist = 2**8
    cdef long flat
    if options_4bit.shape[0] == 0:
        raise ValueError("find_nearest_colour requires at least one option")
    # The packed pixel value is the same for every candidate.
    flat = (<long>pixel_rgb[0] << 16) + (<long>pixel_rgb[1] << 8) + <long>pixel_rgb[2]
    for i in range(options_4bit.shape[0]):
        bit4 = options_4bit[i]
        dist = distances[flat, bit4]
        if dist < best_dist:
            best_dist = dist
            best = i
    return options_4bit[best], options_rgb[best, :]
2021-01-15 22:58:01 +00:00
2021-01-12 10:00:56 +00:00
@cython.boundscheck(False)
@cython.wraparound(False)
def dither_image(screen, float[:, :, ::1] image_rgb, dither, int lookahead, unsigned char verbose):
    """Dither image_rgb to the palette choices offered by `screen`.

    Pixels are processed row by row, left to right. For each pixel an output
    value is chosen (via lookahead_options/dither_lookahead when `lookahead`
    is non-zero, otherwise via find_nearest_colour), and the quantization
    error is diffused into image_rgb using the dither pattern.

    Args:
        screen: object providing X_RES, Y_RES, palette.distances and
            pixel_palette_options(last_pixel, x).
        image_rgb: image to dither, indexed [y, x, channel]. It is modified
            in place.
        dither: object providing PATTERN (indexed [row, column, 0]) and
            ORIGIN (row, column).
        lookahead: number of pixels to look ahead; 0 disables lookahead.
        verbose: when non-zero, print progress for every row.

    Returns:
        Tuple (image_nbit, rgb): the chosen output value per pixel, and a
        numpy copy of the modified image_rgb.

    Raises:
        MemoryError: if the dither pattern buffer cannot be allocated.
    """
    cdef (unsigned char)[:, ::1] image_nbit = np.empty(
        (image_rgb.shape[0], image_rgb.shape[1]), dtype=np.uint8)
    cdef int yres = screen.Y_RES
    cdef int xres = screen.X_RES
    cdef int y, x, i, j
    cdef int best_idx
    cdef float[3] quant_error
    cdef unsigned char output_pixel_nbit
    cdef float[3] input_pixel_rgb
    cdef (unsigned char)[:, ::1] distances = screen.palette.distances

    # Flatten python dither pattern array for more efficient access
    cdef Dither cdither
    cdither.y_shape = dither.PATTERN.shape[0]
    cdither.x_shape = dither.PATTERN.shape[1]
    cdither.y_origin = dither.ORIGIN[0]
    cdither.x_origin = dither.ORIGIN[1]
    # Convert dither.PATTERN to a malloced array which is faster to access
    cdither.pattern = <float *> malloc(cdither.x_shape * cdither.y_shape * sizeof(float))
    if cdither.pattern == NULL:
        raise MemoryError()

    # try/finally guarantees the pattern buffer is released even if one of
    # the Python-level calls below raises.
    try:
        for i in range(cdither.y_shape):
            for j in range(cdither.x_shape):
                cdither.pattern[i * cdither.x_shape + j] = dither.PATTERN[i, j, 0]

        for y in range(yres):
            if verbose:
                print("%d/%d" % (y, yres))
            # Each row starts from pixel value 0 as its left neighbour.
            output_pixel_nbit = 0
            for x in range(xres):
                for i in range(3):
                    input_pixel_rgb[i] = image_rgb[y, x, i]
                if lookahead:
                    palette_choices_4bit, palette_choices_rgb = lookahead_options(
                        screen, lookahead, output_pixel_nbit, x % 4)
                    best_idx = dither_lookahead(
                        &cdither, image_rgb, x, y, palette_choices_4bit, palette_choices_rgb, lookahead, distances, xres)
                    # Only the first pixel of the best sequence is committed.
                    output_pixel_nbit = palette_choices_4bit[best_idx, 0]
                    output_pixel_rgb = palette_choices_rgb[best_idx, 0, :]
                else:
                    palette_choices_4bit, palette_choices_rgb = screen.pixel_palette_options(output_pixel_nbit, x)
                    output_pixel_nbit, output_pixel_rgb = \
                        find_nearest_colour(input_pixel_rgb, palette_choices_4bit, palette_choices_rgb, distances)
                for i in range(3):
                    quant_error[i] = input_pixel_rgb[i] - output_pixel_rgb[i]
                image_nbit[y, x] = output_pixel_nbit
                apply(&cdither, xres, yres, x, y, image_rgb, quant_error)
                # Store the chosen colour after the error has been diffused.
                for i in range(3):
                    image_rgb[y, x, i] = output_pixel_rgb[i]
    finally:
        free(cdither.pattern)
    return image_nbit, np.array(image_rgb)