/*
 * Apple // emulator for *ix
 *
 * This software package is subject to the GNU General Public License
 * version 3 or later (your choice) as published by the Free Software
 * Foundation.
 *
 * Copyright 2013-2015 Aaron Culliney
 *
 */

/*
 * 65c02 CPU timing support. Source inspired/derived from AppleWin.
 *
 * Simplified timing loop for each execution period:
 *
 * ..{...+....[....|..................|.........]....^....|....^....^....}......
 *   ti MBB       CHK                CHK            MBE  CHX  SPK  MBX   tj  ZZZ
 *
 *      - ti  : timing sample begin (lock out interface thread)
 *      - tj  : timing sample end (unlock interface thread)
 *      -  [  : cpu65_run()
 *      -  ]  : cpu65_run() finished
 *      - CHK : incoming timing_checkpoint_cycles() call from IO (bumps cycles_count_total)
 *      - CHX : update remainder of timing_checkpoint_cycles() for execution period
 *      - MBB : Mockingboard begin
 *      - MBE : Mockingboard end/flush (output)
 *      - MBX : Mockingboard end video frame (output)
 *      - SPK : Speaker output
 *      - ZZZ : housekeeping+sleep (or not)
 *
 */

#include "common.h"

// Change the trailing 0 to 1 to print timing stats (this is never active when NDEBUG is defined).
//
// This is spelled as a conditional that defines DEBUG_TIMING to 0 or 1 because a `defined` operator that appears as
// the result of macro expansion inside #if has undefined behavior (C11 6.10.1p4), which is what the previous
// `#define DEBUG_TIMING (!defined(NDEBUG) && 0)` relied upon.
#if !defined(NDEBUG) && 0
#   define DEBUG_TIMING 1
#else
#   define DEBUG_TIMING 0
#endif

#if DEBUG_TIMING
#   define TIMING_LOG(...) LOG(__VA_ARGS__)
#else
#   define TIMING_LOG(...)
#endif

#define DISK_MOTOR_QUIET_NSECS 2000000 // 2 milliseconds

// VBL constants?
#define uCyclesPerLine 65 // 25 cycles of HBL & 40 cycles of HBL' #define uVisibleLinesPerFrame (64*3) // 192 #define uLinesPerFrame (262) // 64 in each third of the screen & 70 in VBL #define dwClksPerFrame (uCyclesPerLine * uLinesPerFrame) // 17030 // cycle counting double cycles_persec_target = CLK_6502; unsigned long cycles_count_total = 0; // Running at spec ~1MHz, this will approach overflow in ~4000secs (for 32bit architectures) int cycles_speaker_feedback = 0; int32_t cpu65_cycles_to_execute = 0; // cycles-to-execute by cpu65_run() int32_t cpu65_cycle_count = 0; // cycles currently excuted by cpu65_run() int32_t irqCheckTimeout = IRQ_CHECK_CYCLES; static int32_t cycles_checkpoint_count = 0; static unsigned int g_dwCyclesThisFrame = 0; // scaling and speed adjustments #if !MOBILE_DEVICE static bool auto_adjust_speed = true; #endif static bool is_paused = false; static unsigned long _pause_spinLock = 0; double cpu_scale_factor = 1.0; double cpu_altscale_factor = 1.0; bool is_fullspeed = false; bool alt_speed_enabled = false; // misc volatile uint8_t emul_reinitialize = 1; static bool emul_reinitialize_audio = false; static bool emul_pause_audio = false; static bool emul_resume_audio = false; static bool cpu_shutting_down = false; pthread_t cpu_thread_id = 0; pthread_mutex_t interface_mutex = PTHREAD_MUTEX_INITIALIZER; pthread_cond_t dbg_thread_cond = PTHREAD_COND_INITIALIZER; pthread_cond_t cpu_thread_cond = PTHREAD_COND_INITIALIZER; // ----------------------------------------------------------------------------- struct timespec timespec_diff(struct timespec start, struct timespec end, bool *negative) { struct timespec t; if (negative) { *negative = false; } // if start > end, swizzle... if ( (start.tv_sec > end.tv_sec) || ((start.tv_sec == end.tv_sec) && (start.tv_nsec > end.tv_nsec)) ) { t=start; start=end; end=t; if (negative) { *negative = true; } } // assuming time_t is signed ... 
if (end.tv_nsec < start.tv_nsec) { t.tv_sec = end.tv_sec - start.tv_sec - 1; t.tv_nsec = 1000000000 + end.tv_nsec - start.tv_nsec; } else { t.tv_sec = end.tv_sec - start.tv_sec; t.tv_nsec = end.tv_nsec - start.tv_nsec; } return t; } struct timespec timespec_add(struct timespec start, unsigned long nsecs) { start.tv_nsec += nsecs; if (start.tv_nsec > NANOSECONDS_PER_SECOND) { start.tv_sec += (start.tv_nsec / NANOSECONDS_PER_SECOND); start.tv_nsec %= NANOSECONDS_PER_SECOND; } return start; } static void _timing_initialize(double scale) { is_fullspeed = (scale > CPU_SCALE_FASTEST_PIVOT); if (!is_fullspeed) { cycles_persec_target = CLK_6502 * scale; } speaker_reset(); //TIMING_LOG("ClockRate:%0.2lf ClockCyclesPerSpeakerSample:%0.2lf", cycles_persec_target, speaker_cyclesPerSample()); } #if !TESTING static #endif void reinitialize(void) { #if !TESTING assert(pthread_self() == cpu_thread_id); #endif cycles_count_total = 0; g_dwCyclesThisFrame = 0; irqCheckTimeout = IRQ_CHECK_CYCLES; #if TESTING extern unsigned long (*testing_getCyclesCount)(void); if (testing_getCyclesCount) { cycles_count_total = testing_getCyclesCount(); } #endif vm_initialize(); softswitches = SS_TEXT | SS_IOUDIS | SS_C3ROM | SS_LCWRT | SS_LCSEC; video_setDirty(A2_DIRTY_FLAG); cpu65_init(); timing_initialize(); MB_Reset(); } void timing_initialize(void) { #if !TESTING # ifdef __APPLE__ # warning FIXME TODO : this assert is firing on iOS port ... but the assert is valid ... fix soon # else assert(cpu_isPaused() || (pthread_self() == cpu_thread_id)); # endif #endif _timing_initialize(alt_speed_enabled ? 
cpu_altscale_factor : cpu_scale_factor); } void timing_toggleCPUSpeed(void) { assert(cpu_isPaused() || (pthread_self() == cpu_thread_id)); alt_speed_enabled = !alt_speed_enabled; timing_initialize(); } static void timing_reinitializeAudio(void) { SPINLOCK_ACQUIRE(&_pause_spinLock); assert(pthread_self() != cpu_thread_id); #if !TESTING assert(cpu_isPaused()); #endif emul_reinitialize_audio = true; emul_pause_audio = false; emul_resume_audio = false; SPINLOCK_RELINQUISH(&_pause_spinLock); } void cpu_pause(void) { assert(pthread_self() != cpu_thread_id); SPINLOCK_ACQUIRE(&_pause_spinLock); do { if (is_paused) { break; } // CPU thread will be paused when it next tries to acquire interface_mutex LOG("PAUSING CPU..."); if (!emul_reinitialize_audio) { emul_pause_audio = true; } pthread_mutex_lock(&interface_mutex); is_paused = true; } while (0); SPINLOCK_RELINQUISH(&_pause_spinLock); } void cpu_resume(void) { assert(pthread_self() != cpu_thread_id); SPINLOCK_ACQUIRE(&_pause_spinLock); do { if (!is_paused) { break; } // CPU thread will be unblocked to acquire interface_mutex if (!emul_reinitialize_audio) { emul_resume_audio = true; } LOG("RESUMING CPU..."); pthread_mutex_unlock(&interface_mutex); is_paused = false; } while (0); SPINLOCK_RELINQUISH(&_pause_spinLock); } bool cpu_isPaused(void) { return is_paused; } #if !MOBILE_DEVICE bool timing_shouldAutoAdjustSpeed(void) { double speed = alt_speed_enabled ? 
cpu_altscale_factor : cpu_scale_factor; return auto_adjust_speed && (speed <= CPU_SCALE_FASTEST_PIVOT); } #endif static void *cpu_thread(void *dummyptr) { assert(pthread_self() == cpu_thread_id); LOG("cpu_thread : initialized..."); struct timespec deltat = { 0 }; #if !MOBILE_DEVICE struct timespec disk_motor_time = { 0 }; #endif struct timespec t0 = { 0 }; // the target timer struct timespec ti = { 0 }; // actual before time sample struct timespec tj = { 0 }; // actual after time sample bool negative = false; long drift_adj_nsecs = 0; // generic drift adjustment between target and actual int debugging_cycles = 0; unsigned long dbg_ticks = 0; #if DEBUG_TIMING int speaker_neg_feedback = 0; int speaker_pos_feedback = 0; unsigned long dbg_cycles_executed = 0; #endif audio_init(); speaker_init(); MB_Initialize(); cpu_runloop: do { LOG("CPUTHREAD %lu LOCKING FOR MAYBE INITIALIZING AUDIO ...", cpu_thread_id); pthread_mutex_lock(&interface_mutex); if (emul_reinitialize_audio) { emul_reinitialize_audio = false; speaker_destroy(); extern void MB_SoftDestroy(void); MB_SoftDestroy(); audio_shutdown(); audio_init(); speaker_init(); extern void MB_SoftInitialize(void); MB_SoftInitialize(); } pthread_mutex_unlock(&interface_mutex); LOG("UNLOCKING FOR MAYBE INITIALIZING AUDIO ..."); if (emul_reinitialize) { reinitialize(); } LOG("cpu_thread : begin main loop ..."); clock_gettime(CLOCK_MONOTONIC, &t0); do { SCOPE_TRACE_CPU("CPU mainloop"); // -LOCK----------------------------------------------------------------------------------------- SAMPLE ti if (UNLIKELY(emul_pause_audio)) { emul_pause_audio = false; audio_pause(); } pthread_mutex_lock(&interface_mutex); if (UNLIKELY(emul_resume_audio)) { emul_resume_audio = false; audio_resume(); } clock_gettime(CLOCK_MONOTONIC, &ti); deltat = timespec_diff(t0, ti, &negative); if (deltat.tv_sec) { if (!is_fullspeed) { TIMING_LOG("NOTE : serious divergence from target time ..."); } t0 = ti; deltat = timespec_diff(t0, ti, &negative); } t0 = 
timespec_add(t0, EXECUTION_PERIOD_NSECS); // expected interval drift_adj_nsecs = negative ? ~deltat.tv_nsec : deltat.tv_nsec; // set up increment & decrement counters cpu65_cycles_to_execute = (cycles_persec_target / 1000); // cycles_persec_target * EXECUTION_PERIOD_NSECS / NANOSECONDS_PER_SECOND if (!is_fullspeed) { cpu65_cycles_to_execute += cycles_speaker_feedback; } if (cpu65_cycles_to_execute < 0) { cpu65_cycles_to_execute = 0; } MB_StartOfCpuExecute(); if (is_debugging) { debugging_cycles = cpu65_cycles_to_execute; } do { if (is_debugging) { cpu65_cycles_to_execute = 1; } cpu65_cycle_count = 0; cycles_checkpoint_count = 0; cpu65_run(); // run emulation for cpu65_cycles_to_execute cycles ... #if DEBUG_TIMING dbg_cycles_executed += cpu65_cycle_count; #endif g_dwCyclesThisFrame += cpu65_cycle_count; if (is_debugging) { debugging_cycles -= cpu65_cycle_count; timing_checkpoint_cycles(); if (c_debugger_should_break() || (debugging_cycles <= 0)) { int err = 0; if ((err = pthread_cond_signal(&dbg_thread_cond))) { ERRLOG("pthread_cond_signal : %d", err); } if ((err = pthread_cond_wait(&cpu_thread_cond, &interface_mutex))) { ERRLOG("pthread_cond_wait : %d", err); } if (debugging_cycles <= 0) { break; } } if (emul_reinitialize) { pthread_mutex_unlock(&interface_mutex); goto cpu_runloop; } } } while (is_debugging); MB_UpdateCycles(); timing_checkpoint_cycles(); speaker_flush(); // play audio if (g_dwCyclesThisFrame >= dwClksPerFrame) { g_dwCyclesThisFrame -= dwClksPerFrame; MB_EndOfVideoFrame(); } clock_gettime(CLOCK_MONOTONIC, &tj); pthread_mutex_unlock(&interface_mutex); // -UNLOCK--------------------------------------------------------------------------------------- SAMPLE tj #if !MOBILE_DEVICE if (timing_shouldAutoAdjustSpeed()) { disk_motor_time = timespec_diff(disk6.motor_time, tj, &negative); assert(!negative); if (!is_fullspeed && !speaker_isActive() && !video_isDirty(A2_DIRTY_FLAG) && (!disk6.motor_off && (disk_motor_time.tv_sec || disk_motor_time.tv_nsec > 
DISK_MOTOR_QUIET_NSECS)) ) { TIMING_LOG("auto switching to full speed"); _timing_initialize(CPU_SCALE_FASTEST); } } #endif if (!is_fullspeed) { deltat = timespec_diff(ti, tj, &negative); if (negative) { // 2016/05/05 : crash report from the wild on Android if we assert(!negative) LOG("WHOA... time went backwards! Did you just cross a timezone?"); deltat.tv_sec = 1; } long sleepfor = 0; if (LIKELY(!deltat.tv_sec)) { sleepfor = EXECUTION_PERIOD_NSECS - drift_adj_nsecs - deltat.tv_nsec; } if (sleepfor <= 0) { // lagging ... static time_t throttle_warning = 0; if (t0.tv_sec - throttle_warning > 0) { TIMING_LOG("not sleeping to catch up ... %ld . %ld", deltat.tv_sec, deltat.tv_nsec); throttle_warning = t0.tv_sec; } } else { deltat.tv_sec = 0; deltat.tv_nsec = sleepfor; TRACE_CPU_BEGIN("sleep"); nanosleep(&deltat, NULL); TRACE_CPU_END(); } dbg_ticks += EXECUTION_PERIOD_NSECS; if ((dbg_ticks % (NANOSECONDS_PER_SECOND>>1)) == 0) { video_flashText(); // TODO FIXME : proper FLASH timing ... } #if DEBUG_TIMING // collect timing statistics if (speaker_neg_feedback > cycles_speaker_feedback) { speaker_neg_feedback = cycles_speaker_feedback; } if (speaker_pos_feedback < cycles_speaker_feedback) { speaker_pos_feedback = cycles_speaker_feedback; } if ((dbg_ticks % NANOSECONDS_PER_SECOND) == 0) { TIMING_LOG("tick:(%ld.%ld) real:(%ld.%ld) cycles exe: %d ... speaker feedback: %d/%d", t0.tv_sec, t0.tv_nsec, ti.tv_sec, ti.tv_nsec, dbg_cycles_executed, speaker_neg_feedback, speaker_pos_feedback); dbg_cycles_executed = 0; speaker_neg_feedback = 0; speaker_pos_feedback = 0; } #endif if ((dbg_ticks % NANOSECONDS_PER_SECOND) == 0) { dbg_ticks = 0; } } #if !MOBILE_DEVICE if (timing_shouldAutoAdjustSpeed()) { if (is_fullspeed && ( speaker_isActive() || video_isDirty(A2_DIRTY_FLAG) || (disk6.motor_off && (disk_motor_time.tv_sec || disk_motor_time.tv_nsec > DISK_MOTOR_QUIET_NSECS))) ) { double speed = alt_speed_enabled ? 
cpu_altscale_factor : cpu_scale_factor; if (speed <= CPU_SCALE_FASTEST_PIVOT) { TIMING_LOG("auto switching to configured speed"); _timing_initialize(speed); } } } #endif if (UNLIKELY(emul_reinitialize)) { break; } if (UNLIKELY(emul_reinitialize_audio)) { break; } if (UNLIKELY(cpu_shutting_down)) { break; } } while (1); if (UNLIKELY(cpu_shutting_down)) { break; } } while (1); speaker_destroy(); MB_Destroy(); audio_shutdown(); cpu_thread_id = 0; cpu_pause(); disk6_eject(0); disk6_eject(1); return NULL; } void timing_startCPU(void) { cpu_shutting_down = false; int err = TEMP_FAILURE_RETRY(pthread_create(&cpu_thread_id, NULL, (void *)&cpu_thread, (void *)NULL)); if (err) { RELEASE_ERRLOG("pthread_create failed!"); RELEASE_BREAK(); } } void timing_stopCPU(void) { cpu_shutting_down = true; LOG("Emulator waiting for CPU thread clean up..."); if (pthread_join(cpu_thread_id, NULL)) { ERRLOG("OOPS: pthread_join of CPU thread ..."); } } unsigned int CpuGetCyclesThisVideoFrame(void) { assert(pthread_self() == cpu_thread_id); timing_checkpoint_cycles(); return g_dwCyclesThisFrame + cycles_checkpoint_count; } // Called when an IO-reg is accessed & accurate global cycle count info is needed void timing_checkpoint_cycles(void) { assert(pthread_self() == cpu_thread_id); const int32_t d = cpu65_cycle_count - cycles_checkpoint_count; assert(d >= 0); #if !TESTING cycles_count_total += d; #else unsigned long previous_cycles_count_total = cycles_count_total; cycles_count_total += d; if (UNLIKELY(cycles_count_total < previous_cycles_count_total)) { extern void (*testing_cyclesOverflow)(void); if (testing_cyclesOverflow) { testing_cyclesOverflow(); } } #endif cycles_checkpoint_count = cpu65_cycle_count; } // ---------------------------------------------------------------------------- bool timing_saveState(StateHelper_s *helper) { bool saved = false; int fd = helper->fd; do { long lVal = 0; lVal = (long)(cpu_scale_factor * 100.); if (!helper->save(fd, (uint8_t *)&lVal, sizeof(lVal))) { 
break; } lVal = (long)(cpu_altscale_factor * 100.); if (!helper->save(fd, (uint8_t *)&lVal, sizeof(lVal))) { break; } uint8_t bVal = alt_speed_enabled ? 1 : 0; if (!helper->save(fd, &bVal, sizeof(bVal))) { break; } saved = true; } while (0); return saved; } bool timing_loadState(StateHelper_s *helper) { bool loaded = false; int fd = helper->fd; do { long lVal = 0; if (!helper->load(fd, (uint8_t *)&lVal, sizeof(lVal))) { break; } cpu_scale_factor = lVal / 100.; if (!helper->load(fd, (uint8_t *)&lVal, sizeof(lVal))) { break; } cpu_altscale_factor = lVal / 100.; uint8_t bVal = 0; if (!helper->load(fd, &bVal, sizeof(bVal))) { break; } alt_speed_enabled = !!bVal; timing_initialize(); loaded = true; } while (0); return loaded; } // ---------------------------------------------------------------------------- static void vm_prefsChanged(const char *domain) { (void)domain; float fVal = 1.0; cpu_scale_factor = prefs_parseFloatValue(PREF_DOMAIN_VM, PREF_CPU_SCALE, &fVal) ? fVal / 100.f : 1.f; if (cpu_scale_factor < CPU_SCALE_SLOWEST) { cpu_scale_factor = CPU_SCALE_SLOWEST; } if (cpu_scale_factor > CPU_SCALE_FASTEST_PIVOT) { cpu_scale_factor = CPU_SCALE_FASTEST; } cpu_altscale_factor = prefs_parseFloatValue(PREF_DOMAIN_VM, PREF_CPU_SCALE_ALT, &fVal) ? fVal / 100.f : 1.f; if (cpu_altscale_factor < CPU_SCALE_SLOWEST) { cpu_altscale_factor = CPU_SCALE_SLOWEST; } if (cpu_altscale_factor > CPU_SCALE_FASTEST_PIVOT) { cpu_altscale_factor = CPU_SCALE_FASTEST; } static float audioLatency = 0.f; float latency = prefs_parseFloatValue(PREF_DOMAIN_AUDIO, PREF_AUDIO_LATENCY, &fVal) ? fVal : 0.25f; #define SMALL_EPSILON (1.f/1024.f) if (fabsf(audioLatency - latency) > SMALL_EPSILON) { audioLatency = latency; audio_setLatency(latency); timing_reinitializeAudio(); } static bool mbEnabled = false; bool bVal = false; bool enabled = prefs_parseBoolValue(PREF_DOMAIN_AUDIO, PREF_MOCKINGBOARD_ENABLED, &bVal) ? 
bVal : true; if (enabled != mbEnabled) { mbEnabled = enabled; MB_SetEnabled(enabled); timing_reinitializeAudio(); } } static __attribute__((constructor)) void _init_vm(void) { prefs_registerListener(PREF_DOMAIN_VM, &vm_prefsChanged); prefs_registerListener(PREF_DOMAIN_AUDIO, &vm_prefsChanged); }