mirror of
https://github.com/pruten/shoebill.git
synced 2025-01-14 10:32:49 +00:00
76f2b35170
- Fixed inst_ext, which was completely broken since last commit, whoops! - Added a bunch of __builtin_expect()s in all the critical paths, and now Marathon runs quite noticeably faster. - Fixed (I think) all the SDL makefiles
452 lines
15 KiB
C
452 lines
15 KiB
C
/*
|
|
* Copyright (c) 2013, Peter Rutenbar <pruten@gmail.com>
|
|
* All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions are met:
|
|
*
|
|
* 1. Redistributions of source code must retain the above copyright notice, this
|
|
* list of conditions and the following disclaimer.
|
|
* 2. Redistributions in binary form must reproduce the above copyright notice,
|
|
* this list of conditions and the following disclaimer in the documentation
|
|
* and/or other materials provided with the distribution.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
|
|
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
|
|
* WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
|
|
* DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
|
|
* ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
|
|
* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
|
|
* LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
|
|
* ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
|
* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
*/
|
|
|
|
#include <assert.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include "shoebill.h"
|
|
|
|
#include "video_rom/rom.c"
|
|
|
|
typedef struct __attribute__ ((__packed__)) {
|
|
uint32_t structure_size;
|
|
uint32_t offset_to_ram;
|
|
|
|
uint16_t line_width; // the number of byten is a scan line
|
|
uint16_t top;
|
|
uint16_t left;
|
|
uint16_t bottom;
|
|
uint16_t right;
|
|
uint16_t version;
|
|
uint16_t pack_type;
|
|
|
|
uint32_t pack_size;
|
|
uint32_t hres;
|
|
uint32_t vres;
|
|
|
|
uint16_t pixel_type;
|
|
uint16_t pixel_size;
|
|
uint16_t num_comp;
|
|
uint16_t comp_size;
|
|
|
|
uint32_t plane_bytes;
|
|
} video_params_t;
|
|
|
|
static uint32_t compute_nubus_crc(uint8_t *rom, uint32_t len)
|
|
{
|
|
uint32_t i, sum = 0;
|
|
|
|
for (i=0; i<len; i++) {
|
|
uint8_t byte = rom[i];
|
|
|
|
if (i==(len-9) || i==(len-10) || i==(len-11) || i==(len-12))
|
|
byte = 0;
|
|
|
|
sum = (sum << 1) + (sum >> 31) + byte;
|
|
}
|
|
|
|
rom[len-9] = sum & 0xff;
|
|
rom[len-10] = (sum >> 8) & 0xff;
|
|
rom[len-11] = (sum >> 16) & 0xff;
|
|
rom[len-12] = (sum >> 24) & 0xff;
|
|
|
|
return sum;
|
|
}
|
|
|
|
static void _switch_depth(shoebill_card_video_t *ctx, uint32_t depth)
|
|
{
|
|
ctx->depth = depth;
|
|
}
|
|
|
|
void nubus_video_init(void *_ctx, uint8_t slotnum,
|
|
uint16_t width, uint16_t height, uint16_t scanline_width)
|
|
{
|
|
shoebill_card_video_t *ctx = (shoebill_card_video_t*)_ctx;
|
|
ctx->width = width;
|
|
ctx->height = height;
|
|
ctx->scanline_width = scanline_width;
|
|
ctx->pixels = scanline_width * height;
|
|
ctx->line_offset = 0;
|
|
|
|
ctx->direct_buf = p_alloc(shoe.pool, (ctx->pixels+4) * sizeof(video_ctx_color_t));
|
|
ctx->temp_buf = p_alloc(shoe.pool, (ctx->pixels+4) * sizeof(video_ctx_color_t));
|
|
|
|
ctx->clut = p_alloc(shoe.pool, 256 * sizeof(video_ctx_color_t));
|
|
ctx->rom = p_alloc(shoe.pool, 4096);
|
|
|
|
// Set the depth and clut for B&W
|
|
_switch_depth(ctx, 1);
|
|
memset(ctx->clut, 0, 256 * 4);
|
|
ctx->clut[0].r = 0xff;
|
|
ctx->clut[0].g = 0xff;
|
|
ctx->clut[0].b = 0xff;
|
|
|
|
memcpy(ctx->rom, _video_rom, 4096);
|
|
|
|
video_params_t *params = (video_params_t*)ctx->rom;
|
|
|
|
// Load our chosen width/height into all the paramater blocks in the video rom
|
|
params[0].line_width = htons(scanline_width / 8);
|
|
params[0].right = htons(width);
|
|
params[0].bottom = htons(height);
|
|
|
|
params[1].line_width = htons(scanline_width / 4);
|
|
params[1].right = htons(width);
|
|
params[1].bottom = htons(height);
|
|
|
|
params[2].line_width = htons(scanline_width / 2);
|
|
params[2].right = htons(width);
|
|
params[2].bottom = htons(height);
|
|
|
|
params[3].line_width = htons(scanline_width);
|
|
params[3].right = htons(width);
|
|
params[3].bottom = htons(height);
|
|
|
|
params[4].line_width = htons(scanline_width * 2);
|
|
params[4].right = htons(width);
|
|
params[4].bottom = htons(height);
|
|
|
|
params[5].line_width = htons(scanline_width * 4);
|
|
params[5].right = htons(width);
|
|
params[5].bottom = htons(height);
|
|
|
|
// Recompute the rom crc
|
|
compute_nubus_crc(ctx->rom, 4096);
|
|
|
|
shoe.slots[slotnum].ctx = ctx;
|
|
}
|
|
|
|
uint32_t nubus_video_read_func(const uint32_t rawaddr, const uint32_t size,
|
|
const uint8_t slotnum)
|
|
{
|
|
shoebill_card_video_t *ctx = (shoebill_card_video_t*)shoe.slots[slotnum].ctx;
|
|
const uint32_t addr = rawaddr & 0x00ffffff;
|
|
|
|
// ROM and control registers
|
|
if sunlikely((addr >> 20) == 0xf) {
|
|
|
|
slog("nubus_video_read_func: got a read to 0x%08x sz=%u\n", rawaddr, size);
|
|
|
|
// ROM (0xFsFFxxxx)
|
|
if ((addr >> 16) == 0xff) {
|
|
if (addr & 3) // Respond to lane 1 only
|
|
return 0;
|
|
return ctx->rom[(addr >> 2) % 4096];
|
|
}
|
|
|
|
// CLUT table (0xFsFE0xxx)
|
|
|
|
// Control registers (0xFsF0xxxx)
|
|
if ((addr >> 16) == 0xf0) {
|
|
switch ((addr & 0x0000ffff) >> 2) {
|
|
// case 0: // clear interrupt flag (write-only)
|
|
|
|
}
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
// Else, this is video ram
|
|
|
|
uint32_t i, result = 0;
|
|
if slikely(addr < (ctx->pixels * 4)) {
|
|
for (i=0; i<size; i++)
|
|
result = (result << 8) | ((uint8_t*)ctx->direct_buf)[addr + i];
|
|
}
|
|
|
|
return result;
|
|
}
|
|
|
|
void _gray_page(shoebill_card_video_t *ctx)
|
|
{
|
|
uint32_t h, w, i;
|
|
|
|
if (ctx->depth <= 8) {
|
|
uint16_t pat;
|
|
uint8_t *ptr = ctx->direct_buf;
|
|
uint32_t width_bytes = (ctx->depth * ctx->scanline_width) / 8;
|
|
switch (ctx->depth) {
|
|
case 1:
|
|
pat = 0xaaaa;
|
|
break;
|
|
case 2:
|
|
pat = 0xcccc;
|
|
break;
|
|
case 4:
|
|
pat = 0xf0f0;
|
|
break;
|
|
case 8:
|
|
pat = 0x00ff;
|
|
break;
|
|
}
|
|
|
|
for (h=0; h<ctx->height; h++) {
|
|
for (w=0; w < width_bytes; w++)
|
|
ptr[w] = pat >> ((w&1)*8);
|
|
ptr += width_bytes;
|
|
pat ^= 0xffff;
|
|
}
|
|
}
|
|
else if (ctx->depth == 16) {
|
|
const uint16_t fill_word = htons(0x4210);
|
|
uint16_t *ptr = (uint16_t*)ctx->direct_buf;
|
|
for (i=0; i < (ctx->width * ctx->height); i++)
|
|
ptr[i] = fill_word;
|
|
}
|
|
else if (ctx->depth == 32) {
|
|
const uint32_t fill_long = htonl(0x00808080);
|
|
uint32_t *ptr = (uint32_t*)ctx->direct_buf;
|
|
for (i=0; i < (ctx->width * ctx->height); i++)
|
|
ptr[i] = fill_long;
|
|
}
|
|
else
|
|
assert(!"unknown depth");
|
|
}
|
|
|
|
void nubus_video_write_func(const uint32_t rawaddr, const uint32_t size,
|
|
const uint32_t data, const uint8_t slotnum)
|
|
{
|
|
shoebill_card_video_t *ctx = (shoebill_card_video_t*)shoe.slots[slotnum].ctx;
|
|
const uint32_t addr = rawaddr & 0x00ffffff;
|
|
uint32_t i;
|
|
|
|
// ROM and control registers
|
|
if sunlikely((addr >> 20) == 0xf) {
|
|
|
|
slog("nubus_video_write_func: got a write to 0x%08x sz=%u data=0x%x\n", rawaddr, size, data);
|
|
|
|
// ROM (0xFsFFxxxx)
|
|
if ((addr >> 16) == 0xff)
|
|
return ; // can't write to rom
|
|
|
|
// CLUT table (0xFsFE0xxx)
|
|
|
|
// Control registers (0xFsF0xxxx)
|
|
if ((addr >> 16) == 0xf0) {
|
|
switch ((addr & 0x0000ffff) >> 2) {
|
|
case 0: {// Clear interrupt flag
|
|
shoe.via[1].rega_input |= (1 << (slotnum - 9));
|
|
break;
|
|
}
|
|
case 1: { // Set depth
|
|
uint32_t newdepth;
|
|
switch (data) {
|
|
case 128:
|
|
newdepth = 1;
|
|
break;
|
|
case 129:
|
|
newdepth = 2;
|
|
break;
|
|
case 130:
|
|
newdepth = 4;
|
|
break;
|
|
case 131:
|
|
newdepth = 8;
|
|
break;
|
|
case 132:
|
|
newdepth = 16;
|
|
break;
|
|
case 133:
|
|
newdepth = 32;
|
|
break;
|
|
default:
|
|
assert(!"driver tried to set bogus depth");
|
|
}
|
|
_switch_depth(ctx, newdepth);
|
|
slog("nubus_magic: set depth = %u\n", ctx->depth);
|
|
break;
|
|
}
|
|
case 2: { // Gray out screen buffer
|
|
|
|
_gray_page(ctx);
|
|
|
|
slog("nubus_magic: grey screen\n");
|
|
break;
|
|
}
|
|
case 3: { // Set clut index
|
|
ctx->clut_idx = data & 0xff;
|
|
// assert(ctx->clut_idx < 256);
|
|
slog("nubus_magic: set clut_idx = %u\n", ctx->clut_idx);
|
|
break;
|
|
}
|
|
case 4: { // Set red component of clut
|
|
ctx->clut[ctx->clut_idx].r = (data >> 8) & 0xff;
|
|
slog("nubus_magic: set %u.red = 0x%04x\n", ctx->clut_idx, data);
|
|
break;
|
|
}
|
|
case 5: { // Set green component of clut
|
|
ctx->clut[ctx->clut_idx].g = (data >> 8) & 0xff;
|
|
slog("nubus_magic: set %u.green = 0x%04x\n", ctx->clut_idx, data);
|
|
break;
|
|
}
|
|
case 6: { // Set blue component of clut
|
|
ctx->clut[ctx->clut_idx].b = (data >> 8) & 0xff;
|
|
slog("nubus_magic: set %u.blue = 0x%04x\n", ctx->clut_idx, data);
|
|
break;
|
|
}
|
|
case 7: { // Set interrupts
|
|
shoe.slots[slotnum].interrupts_enabled = (data != 0);
|
|
slog("nubus_magic: interrupts_enabled = %u\n",
|
|
shoe.slots[slotnum].interrupts_enabled);
|
|
break;
|
|
}
|
|
case 8: { // Debug
|
|
slog("video_debug: 0x%08x\n", data);
|
|
break;
|
|
}
|
|
case 9: { // Gray out CLUT
|
|
if (!data) break;
|
|
for (i=0; i<256; i++) {
|
|
ctx->clut[i].r = 0x80;
|
|
ctx->clut[i].g = 0x80;
|
|
ctx->clut[i].b = 0x80;
|
|
}
|
|
break;
|
|
}
|
|
case 10: { // Use luminance (a.k.a. setGray)
|
|
slog("nubus_magic: use_luminance = %u\n", data);
|
|
// FIXME: not implemented
|
|
break;
|
|
}
|
|
|
|
}
|
|
}
|
|
|
|
return ;
|
|
}
|
|
|
|
// Else, this is video ram
|
|
|
|
if slikely(addr < (ctx->pixels * 4)) {
|
|
uint32_t mydata, myaddr;
|
|
for (myaddr = addr + size, mydata = data; addr < myaddr; ) {
|
|
((uint8_t*)ctx->direct_buf)[--myaddr] = mydata & 0xff;
|
|
mydata >>= 8;
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
static void _do_clut_translation(shoebill_card_video_t *ctx)
|
|
{
|
|
uint32_t i;
|
|
|
|
switch (ctx->depth) {
|
|
case 1: {
|
|
for (i=0; i < ctx->pixels/8; i++) {
|
|
const uint8_t byte = ctx->direct_buf[i];
|
|
ctx->temp_buf[i * 8 + 0] = ctx->clut[(byte >> 7) & 1];
|
|
ctx->temp_buf[i * 8 + 1] = ctx->clut[(byte >> 6) & 1];
|
|
ctx->temp_buf[i * 8 + 2] = ctx->clut[(byte >> 5) & 1];
|
|
ctx->temp_buf[i * 8 + 3] = ctx->clut[(byte >> 4) & 1];
|
|
ctx->temp_buf[i * 8 + 4] = ctx->clut[(byte >> 3) & 1];
|
|
ctx->temp_buf[i * 8 + 5] = ctx->clut[(byte >> 2) & 1];
|
|
ctx->temp_buf[i * 8 + 6] = ctx->clut[(byte >> 1) & 1];
|
|
ctx->temp_buf[i * 8 + 7] = ctx->clut[(byte >> 0) & 1];
|
|
}
|
|
break;
|
|
}
|
|
case 2: {
|
|
for (i=0; i < ctx->pixels/4; i++) {
|
|
const uint8_t byte = ctx->direct_buf[i];
|
|
ctx->temp_buf[i * 4 + 0] = ctx->clut[(byte >> 6) & 3];
|
|
ctx->temp_buf[i * 4 + 1] = ctx->clut[(byte >> 4) & 3];
|
|
ctx->temp_buf[i * 4 + 2] = ctx->clut[(byte >> 2) & 3];
|
|
ctx->temp_buf[i * 4 + 3] = ctx->clut[(byte >> 0) & 3];
|
|
}
|
|
break;
|
|
}
|
|
case 4: {
|
|
for (i=0; i < ctx->pixels/2; i++) {
|
|
const uint8_t byte = ctx->direct_buf[i];
|
|
ctx->temp_buf[i * 2 + 0] = ctx->clut[(byte >> 4) & 0xf];
|
|
ctx->temp_buf[i * 2 + 1] = ctx->clut[(byte >> 0) & 0xf];
|
|
}
|
|
break;
|
|
}
|
|
case 8: {
|
|
for (i=0; i < ctx->pixels; i++)
|
|
ctx->temp_buf[i] = ctx->clut[ctx->direct_buf[i]];
|
|
break;
|
|
}
|
|
case 16: {
|
|
uint16_t *direct = (uint16_t*)ctx->direct_buf;
|
|
for (i=0; i < ctx->pixels; i++) {
|
|
const uint16_t p = ntohs(direct[i]);
|
|
video_ctx_color_t tmp;
|
|
tmp.r = ((p >> 10) & 31);
|
|
tmp.g = (p >> 5) & 31;
|
|
tmp.b = (p >> 0) & 31;
|
|
|
|
ctx->temp_buf[i].r = (tmp.r << 3) | (tmp.r >> 2);
|
|
ctx->temp_buf[i].g = (tmp.g << 3) | (tmp.g >> 2);
|
|
ctx->temp_buf[i].b = (tmp.b << 3) | (tmp.b >> 2);
|
|
|
|
}
|
|
break;
|
|
}
|
|
|
|
case 32: {
|
|
uint32_t *direct = (uint32_t*)ctx->direct_buf, *tmp = (uint32_t*)ctx->temp_buf;
|
|
for (i=0; i < ctx->pixels; i++)
|
|
tmp[i] = direct[i] >> 8;
|
|
|
|
|
|
// OpenGL wants RGBA
|
|
// Apple must be ARGB (which is BGRA, when dereferenced)
|
|
break;
|
|
}
|
|
|
|
default:
|
|
assert(!"unsupported depth");
|
|
|
|
}
|
|
}
|
|
|
|
shoebill_video_frame_info_t nubus_video_get_frame(shoebill_card_video_t *ctx,
|
|
_Bool just_params)
|
|
{
|
|
shoebill_video_frame_info_t result;
|
|
|
|
result.width = ctx->width;
|
|
result.height = ctx->height;
|
|
result.scan_width = ctx->scanline_width;
|
|
result.depth = ctx->depth;
|
|
|
|
// If caller just wants video parameters...
|
|
if (just_params)
|
|
return result;
|
|
|
|
_do_clut_translation(ctx);
|
|
result.buf = (uint8_t*)ctx->temp_buf;
|
|
return result;
|
|
}
|
|
|
|
|
|
|
|
|
|
|