/* RetroArch - A frontend for libretro. * Copyright (C) 2014-2017 - Ali Bouhlel * * RetroArch is free software: you can redistribute it and/or modify it under the terms * of the GNU General Public License as published by the Free Software Found- * ation, either version 3 of the License, or (at your option) any later version. * * RetroArch is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; * without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR * PURPOSE. See the GNU General Public License for more details. * * You should have received a copy of the GNU General Public License along with RetroArch. * If not, see . */ #include #include #include #include <3ds.h> #include #include #include #ifdef HAVE_CONFIG_H #include "../../config.h" #endif #ifdef HAVE_MENU #include "../../menu/menu_driver.h" #endif #ifdef HAVE_GFX_WIDGETS #include "../gfx_widgets.h" #endif #include "../font_driver.h" #include "../../ctr/gpu_old.h" #include "ctr_gu.h" #include "../../configuration.h" #include "../../command.h" #include "../../driver.h" #include "../../retroarch.h" #include "../../verbosity.h" #include "../common/ctr_common.h" #ifndef HAVE_THREADS #include "../../tasks/tasks_internal.h" #endif /* An annoyance... * Have to keep track of bottom screen enable state * externally, otherwise cannot detect current state * when reinitialising... */ bool ctr_bottom_screen_enabled = true; static INLINE void ctr_check_3D_slider(ctr_video_t* ctr, ctr_video_mode_enum video_mode) { float slider_val = *(float*)0x1FF81080; if (slider_val == 0.0f) { ctr->video_mode = CTR_VIDEO_MODE_2D; ctr->enable_3d = false; return; } switch (video_mode) { case CTR_VIDEO_MODE_3D: { s16 offset = slider_val * 10.0f; ctr->video_mode = CTR_VIDEO_MODE_3D; ctr->frame_coords[1] = ctr->frame_coords[0]; ctr->frame_coords[2] = ctr->frame_coords[0]; ctr->frame_coords[1].x0 -= offset; ctr->frame_coords[1].x1 -= offset; ctr->frame_coords[2].x0 += offset; ctr->frame_coords[2].x1 += offset; GSPGPU_FlushDataCache(ctr->frame_coords, 3 * sizeof(ctr_vertex_t)); if (ctr->supports_parallax_disable) ctr_set_parallax_layer(true); ctr->enable_3d = true; } break; case CTR_VIDEO_MODE_2D_400X240: case CTR_VIDEO_MODE_2D_800X240: if (ctr->supports_parallax_disable) { ctr->video_mode = video_mode; ctr_set_parallax_layer(false); ctr->enable_3d = true; } else { ctr->video_mode = CTR_VIDEO_MODE_2D; ctr->enable_3d = false; } break; case CTR_VIDEO_MODE_2D: default: ctr->video_mode = CTR_VIDEO_MODE_2D; ctr->enable_3d = false; break; } } static INLINE void ctr_set_screen_coords(ctr_video_t * ctr) { if (ctr->rotation == 0) { ctr->frame_coords->x0 = ctr->vp.x; ctr->frame_coords->y0 = ctr->vp.y; ctr->frame_coords->x1 = ctr->vp.x + ctr->vp.width; ctr->frame_coords->y1 = ctr->vp.y + ctr->vp.height; } else if (ctr->rotation == 1) /* 90° */ { ctr->frame_coords->x0 = ctr->vp.x; ctr->frame_coords->y0 = ctr->vp.y; ctr->frame_coords->x1 = ctr->vp.x + ctr->vp.width; ctr->frame_coords->y1 = ctr->vp.y + ctr->vp.height; } else if (ctr->rotation == 2) /* 180° */ { ctr->frame_coords->x1 = ctr->vp.x; ctr->frame_coords->y1 = ctr->vp.y; ctr->frame_coords->x0 = ctr->vp.x + ctr->vp.width; ctr->frame_coords->y0 = ctr->vp.y + ctr->vp.height; } else /* 270° */ { ctr->frame_coords->x1 = ctr->vp.x; ctr->frame_coords->y1 = ctr->vp.y; ctr->frame_coords->x0 = ctr->vp.x + ctr->vp.width; ctr->frame_coords->y0 = ctr->vp.y + ctr->vp.height; } } static void ctr_update_viewport( ctr_video_t* ctr, settings_t *settings, int custom_vp_x, int custom_vp_y, unsigned custom_vp_width, unsigned custom_vp_height ) { int x = 0; int y = 0; float width = ctr->vp.full_width; float height = ctr->vp.full_height; float desired_aspect = video_driver_get_aspect_ratio(); bool video_scale_integer = settings->bools.video_scale_integer; unsigned aspect_ratio_idx = settings->uints.video_aspect_ratio_idx; if (ctr->rotation & 0x1) desired_aspect = 1.0 / desired_aspect; if (video_scale_integer) { video_viewport_get_scaled_integer(&ctr->vp, ctr->vp.full_width, ctr->vp.full_height, desired_aspect, ctr->keep_aspect); } else if (ctr->keep_aspect) { #if defined(HAVE_MENU) if (aspect_ratio_idx == ASPECT_RATIO_CUSTOM) { x = custom_vp_x; y = custom_vp_y; width = custom_vp_width; height = custom_vp_height; } else #endif { float delta; float device_aspect = ((float)ctr->vp.full_width) / ctr->vp.full_height; if (fabsf(device_aspect - desired_aspect) < 0.0001f) { /* If the aspect ratios of screen and desired aspect * ratio are sufficiently equal (floating point stuff), * assume they are actually equal. */ } else if (device_aspect > desired_aspect) { delta = (desired_aspect / device_aspect - 1.0f) / 2.0f + 0.5f; x = (int)roundf(width * (0.5f - delta)); width = (unsigned)roundf(2.0f * width * delta); } else { delta = (device_aspect / desired_aspect - 1.0f) / 2.0f + 0.5f; y = (int)roundf(height * (0.5f - delta)); height = (unsigned)roundf(2.0f * height * delta); } } ctr->vp.x = x; ctr->vp.y = y; ctr->vp.width = width; ctr->vp.height = height; } else { ctr->vp.x = ctr->vp.y = 0; ctr->vp.width = width; ctr->vp.height = height; } ctr_set_screen_coords(ctr); ctr->should_resize = false; } static void ctr_lcd_aptHook(APT_HookType hook, void* param) { ctr_video_t *ctr = (ctr_video_t*)param; if (!ctr) return; if (hook == APTHOOK_ONRESTORE) { GPUCMD_SetBufferOffset(0); shaderProgramUse(&ctr->shader); GPU_SetViewport(NULL, VIRT_TO_PHYS(ctr->drawbuffers.top.left), 0, 0, CTR_TOP_FRAMEBUFFER_HEIGHT, CTR_TOP_FRAMEBUFFER_WIDTH); GPU_DepthMap(-1.0f, 0.0f); GPU_SetFaceCulling(GPU_CULL_NONE); GPU_SetStencilTest(false, GPU_ALWAYS, 0x00, 0xFF, 0x00); GPU_SetStencilOp(GPU_STENCIL_KEEP, GPU_STENCIL_KEEP, GPU_STENCIL_KEEP); GPU_SetBlendingColor(0, 0, 0, 0); GPU_SetDepthTestAndWriteMask(false, GPU_ALWAYS, GPU_WRITE_COLOR); GPUCMD_AddMaskedWrite(GPUREG_EARLYDEPTH_TEST1, 0x1, 0); GPUCMD_AddWrite(GPUREG_EARLYDEPTH_TEST2, 0); GPU_SetAlphaBlending(GPU_BLEND_ADD, GPU_BLEND_ADD, GPU_SRC_ALPHA, GPU_ONE_MINUS_SRC_ALPHA, GPU_SRC_ALPHA, GPU_ONE_MINUS_SRC_ALPHA); GPU_SetAlphaTest(false, GPU_ALWAYS, 0x00); GPU_SetTextureEnable(GPU_TEXUNIT0); GPU_SetTexEnv(0, GPU_TEXTURE0, GPU_TEXTURE0, 0, 0, GPU_REPLACE, GPU_REPLACE, 0); GPU_SetTexEnv(1, GPU_PREVIOUS, GPU_PREVIOUS, 0, 0, 0, 0, 0); GPU_SetTexEnv(2, GPU_PREVIOUS, GPU_PREVIOUS, 0, 0, 0, 0, 0); GPU_SetTexEnv(3, GPU_PREVIOUS, GPU_PREVIOUS, 0, 0, 0, 0, 0); GPU_SetTexEnv(4, GPU_PREVIOUS, GPU_PREVIOUS, 0, 0, 0, 0, 0); GPU_SetTexEnv(5, GPU_PREVIOUS, GPU_PREVIOUS, 0, 0, 0, 0, 0); ctrGuSetAttributeBuffers(2, VIRT_TO_PHYS(ctr->menu.frame_coords), CTRGU_ATTRIBFMT(GPU_SHORT, 4) << 0 | CTRGU_ATTRIBFMT(GPU_SHORT, 4) << 4, sizeof(ctr_vertex_t)); GPU_Finalize(); ctrGuFlushAndRun(true); gspWaitForEvent(GSPGPU_EVENT_P3D, false); ctr->p3d_event_pending = false; } if ((hook == APTHOOK_ONSUSPEND) && (ctr->video_mode == CTR_VIDEO_MODE_2D_400X240)) { memcpy(gfxTopRightFramebuffers[ctr->current_buffer_top], gfxTopLeftFramebuffers[ctr->current_buffer_top], 400 * 240 * 3); GSPGPU_FlushDataCache(gfxTopRightFramebuffers[ctr->current_buffer_top], 400 * 240 * 3); } if ((hook == APTHOOK_ONSUSPEND) && ctr->supports_parallax_disable) ctr_set_parallax_layer(*(float*)0x1FF81080 != 0.0); if ((hook == APTHOOK_ONSUSPEND) || (hook == APTHOOK_ONRESTORE) || (hook == APTHOOK_ONWAKEUP)) { Handle lcd_handle; u8 not_2DS; CFGU_GetModelNintendo2DS(¬_2DS); if(not_2DS && srvGetServiceHandle(&lcd_handle, "gsp::Lcd") >= 0) { u32 *cmdbuf = getThreadCommandBuffer(); cmdbuf[0] = ((hook == APTHOOK_ONSUSPEND) || ctr_bottom_screen_enabled)? 0x00110040: 0x00120040; cmdbuf[1] = 2; svcSendSyncRequest(lcd_handle); svcCloseHandle(lcd_handle); } } if (menu_driver_is_alive()) { return; } else if ((hook == APTHOOK_ONSUSPEND) || (hook == APTHOOK_ONSLEEP)) { command_event(CMD_EVENT_AUDIO_STOP, NULL); } else if ((hook == APTHOOK_ONRESTORE) || (hook == APTHOOK_ONWAKEUP)) { command_event(CMD_EVENT_AUDIO_START, NULL); } } static void ctr_vsync_hook(ctr_video_t* ctr) { ctr->vsync_event_pending = false; } #ifndef HAVE_THREADS static bool ctr_tasks_finder(retro_task_t *task,void *userdata) { return task; } task_finder_data_t ctr_tasks_finder_data = {ctr_tasks_finder, NULL}; #endif static void ctr_set_bottom_screen_enable(void* data, bool enabled) { Handle lcd_handle; u8 not_2DS; ctr_video_t *ctr = (ctr_video_t*)data; if (!ctr) return; gfxBottomFramebuffers[0] = enabled ? (u8*)ctrConsole->frameBuffer: (u8*)ctr->empty_framebuffer; CFGU_GetModelNintendo2DS(¬_2DS); if(not_2DS && srvGetServiceHandle(&lcd_handle, "gsp::Lcd") >= 0) { u32 *cmdbuf = getThreadCommandBuffer(); cmdbuf[0] = enabled? 0x00110040: 0x00120040; cmdbuf[1] = 2; svcSendSyncRequest(lcd_handle); svcCloseHandle(lcd_handle); } ctr_bottom_screen_enabled = enabled; } static void* ctr_init(const video_info_t* video, input_driver_t** input, void** input_data) { float refresh_rate; u8 device_model = 0xFF; void* ctrinput = NULL; settings_t *settings = config_get_ptr(); bool lcd_bottom = settings->bools.video_3ds_lcd_bottom; ctr_video_t* ctr = (ctr_video_t*)linearAlloc(sizeof(ctr_video_t)); if (!ctr) return NULL; memset(ctr, 0, sizeof(ctr_video_t)); ctr->vp.x = 0; ctr->vp.y = 0; ctr->vp.width = CTR_TOP_FRAMEBUFFER_WIDTH; ctr->vp.height = CTR_TOP_FRAMEBUFFER_HEIGHT; ctr->vp.full_width = CTR_TOP_FRAMEBUFFER_WIDTH; ctr->vp.full_height = CTR_TOP_FRAMEBUFFER_HEIGHT; video_driver_set_size(ctr->vp.width, ctr->vp.height); ctr->drawbuffers.top.left = vramAlloc(CTR_TOP_FRAMEBUFFER_WIDTH * CTR_TOP_FRAMEBUFFER_HEIGHT * 2 * sizeof(uint32_t)); ctr->drawbuffers.top.right = (void*)((uint32_t*)ctr->drawbuffers.top.left + CTR_TOP_FRAMEBUFFER_WIDTH * CTR_TOP_FRAMEBUFFER_HEIGHT); ctr->display_list_size = 0x4000; ctr->display_list = linearAlloc(ctr->display_list_size * sizeof(uint32_t)); GPU_Reset(NULL, ctr->display_list, ctr->display_list_size); ctr->vertex_cache.size = 0x1000; ctr->vertex_cache.buffer = linearAlloc(ctr->vertex_cache.size * sizeof(ctr_vertex_t)); ctr->vertex_cache.current = ctr->vertex_cache.buffer; ctr->rgb32 = video->rgb32; ctr->texture_width = video->input_scale * RARCH_SCALE_BASE; ctr->texture_height = video->input_scale * RARCH_SCALE_BASE; ctr->texture_linear = linearMemAlign(ctr->texture_width * ctr->texture_height * (ctr->rgb32? 4:2), 128); ctr->texture_swizzled = linearMemAlign(ctr->texture_width * ctr->texture_height * (ctr->rgb32? 4:2), 128); ctr->frame_coords = linearAlloc(3 * sizeof(ctr_vertex_t)); ctr->frame_coords->x0 = 0; ctr->frame_coords->y0 = 0; ctr->frame_coords->x1 = CTR_TOP_FRAMEBUFFER_WIDTH; ctr->frame_coords->y1 = CTR_TOP_FRAMEBUFFER_HEIGHT; ctr->frame_coords->u0 = 0; ctr->frame_coords->v0 = 0; ctr->frame_coords->u1 = CTR_TOP_FRAMEBUFFER_WIDTH; ctr->frame_coords->v1 = CTR_TOP_FRAMEBUFFER_HEIGHT; GSPGPU_FlushDataCache(ctr->frame_coords, sizeof(ctr_vertex_t)); ctr->menu.texture_width = 512; ctr->menu.texture_height = 512; ctr->menu.texture_linear = linearMemAlign(ctr->menu.texture_width * ctr->menu.texture_height * sizeof(uint16_t), 128); ctr->menu.texture_swizzled = linearMemAlign(ctr->menu.texture_width * ctr->menu.texture_height * sizeof(uint16_t), 128); ctr->menu.frame_coords = linearAlloc(sizeof(ctr_vertex_t)); ctr->menu.frame_coords->x0 = 40; ctr->menu.frame_coords->y0 = 0; ctr->menu.frame_coords->x1 = CTR_TOP_FRAMEBUFFER_WIDTH - 40; ctr->menu.frame_coords->y1 = CTR_TOP_FRAMEBUFFER_HEIGHT; ctr->menu.frame_coords->u0 = 0; ctr->menu.frame_coords->v0 = 0; ctr->menu.frame_coords->u1 = CTR_TOP_FRAMEBUFFER_WIDTH - 80; ctr->menu.frame_coords->v1 = CTR_TOP_FRAMEBUFFER_HEIGHT; GSPGPU_FlushDataCache(ctr->menu.frame_coords, sizeof(ctr_vertex_t)); ctr_set_scale_vector(&ctr->scale_vector, CTR_TOP_FRAMEBUFFER_WIDTH, CTR_TOP_FRAMEBUFFER_HEIGHT, ctr->texture_width, ctr->texture_height); ctr_set_scale_vector(&ctr->menu.scale_vector, CTR_TOP_FRAMEBUFFER_WIDTH, CTR_TOP_FRAMEBUFFER_HEIGHT, ctr->menu.texture_width, ctr->menu.texture_height); memset(ctr->texture_linear, 0x00, ctr->texture_width * ctr->texture_height * (ctr->rgb32? 4:2)); #if 0 memset(ctr->menu.texture_swizzled , 0x00, ctr->menu.texture_width * ctr->menu.texture_height * 2); #endif ctr->dvlb = DVLB_ParseFile((u32*)ctr_sprite_shbin, ctr_sprite_shbin_size); ctrGuSetVshGsh(&ctr->shader, ctr->dvlb, 2, 2); shaderProgramUse(&ctr->shader); GPU_SetViewport(NULL, VIRT_TO_PHYS(ctr->drawbuffers.top.left), 0, 0, CTR_TOP_FRAMEBUFFER_HEIGHT, CTR_TOP_FRAMEBUFFER_WIDTH); GPU_DepthMap(-1.0f, 0.0f); GPU_SetFaceCulling(GPU_CULL_NONE); GPU_SetStencilTest(false, GPU_ALWAYS, 0x00, 0xFF, 0x00); GPU_SetStencilOp(GPU_STENCIL_KEEP, GPU_STENCIL_KEEP, GPU_STENCIL_KEEP); GPU_SetBlendingColor(0, 0, 0, 0); #if 0 GPU_SetDepthTestAndWriteMask(true, GPU_GREATER, GPU_WRITE_ALL); #endif GPU_SetDepthTestAndWriteMask(false, GPU_ALWAYS, GPU_WRITE_COLOR); #if 0 GPU_SetDepthTestAndWriteMask(true, GPU_ALWAYS, GPU_WRITE_ALL); #endif GPUCMD_AddMaskedWrite(GPUREG_EARLYDEPTH_TEST1, 0x1, 0); GPUCMD_AddWrite(GPUREG_EARLYDEPTH_TEST2, 0); GPU_SetAlphaBlending(GPU_BLEND_ADD, GPU_BLEND_ADD, GPU_SRC_ALPHA, GPU_ONE_MINUS_SRC_ALPHA, GPU_SRC_ALPHA, GPU_ONE_MINUS_SRC_ALPHA); GPU_SetAlphaTest(false, GPU_ALWAYS, 0x00); GPU_SetTextureEnable(GPU_TEXUNIT0); GPU_SetTexEnv(0, GPU_TEXTURE0, GPU_TEXTURE0, 0, 0, GPU_REPLACE, GPU_REPLACE, 0); GPU_SetTexEnv(1, GPU_PREVIOUS, GPU_PREVIOUS, 0, 0, 0, 0, 0); GPU_SetTexEnv(2, GPU_PREVIOUS, GPU_PREVIOUS, 0, 0, 0, 0, 0); GPU_SetTexEnv(3, GPU_PREVIOUS, GPU_PREVIOUS, 0, 0, 0, 0, 0); GPU_SetTexEnv(4, GPU_PREVIOUS, GPU_PREVIOUS, 0, 0, 0, 0, 0); GPU_SetTexEnv(5, GPU_PREVIOUS, GPU_PREVIOUS, 0, 0, 0, 0, 0); ctrGuSetAttributeBuffers(2, VIRT_TO_PHYS(ctr->menu.frame_coords), CTRGU_ATTRIBFMT(GPU_SHORT, 4) << 0 | CTRGU_ATTRIBFMT(GPU_SHORT, 4) << 4, sizeof(ctr_vertex_t)); GPU_Finalize(); ctrGuFlushAndRun(true); ctr->p3d_event_pending = true; ctr->ppf_event_pending = false; if (input && input_data) { ctrinput = input_driver_init_wrap(&input_ctr, settings->arrays.input_joypad_driver); *input = ctrinput ? &input_ctr : NULL; *input_data = ctrinput; } ctr->keep_aspect = true; ctr->should_resize = true; ctr->smooth = video->smooth; ctr->vsync = video->vsync; ctr->current_buffer_top = 0; /* Only O3DS and O3DSXL support running in 'dual-framebuffer' * mode with the parallax barrier disabled * (i.e. these are the only platforms that can use * CTR_VIDEO_MODE_2D_400X240 and CTR_VIDEO_MODE_2D_800X240) */ CFGU_GetSystemModel(&device_model); /* (0 = O3DS, 1 = O3DSXL, 2 = N3DS, 3 = 2DS, 4 = N3DSXL, 5 = N2DSXL) */ ctr->supports_parallax_disable = (device_model == 0) || (device_model == 1); ctr->empty_framebuffer = linearAlloc(320 * 240 * 2); memset(ctr->empty_framebuffer, 0, 320 * 240 * 2); refresh_rate = (32730.0 * 8192.0) / 4481134.0; driver_ctl(RARCH_DRIVER_CTL_SET_REFRESH_RATE, &refresh_rate); aptHook(&ctr->lcd_aptHook, ctr_lcd_aptHook, ctr); font_driver_init_osd(ctr, video, false, video->is_threaded, FONT_DRIVER_RENDER_CTR); ctr->msg_rendering_enabled = false; ctr->menu_texture_frame_enable = false; ctr->menu_texture_enable = false; /* Set bottom screen enable state, if required */ if (lcd_bottom != ctr_bottom_screen_enabled) ctr_set_bottom_screen_enable(ctr, lcd_bottom); gspSetEventCallback(GSPGPU_EVENT_VBlank0, (ThreadFunc)ctr_vsync_hook, ctr, false); return ctr; } #if 0 #define CTR_INSPECT_MEMORY_USAGE #endif static bool ctr_frame(void* data, const void* frame, unsigned width, unsigned height, uint64_t frame_count, unsigned pitch, const char* msg, video_frame_info_t *video_info) { static uint64_t currentTick,lastTick; touchPosition state_tmp_touch; extern GSPGPU_FramebufferInfo topFramebufferInfo; extern u8* gfxSharedMemory; extern u8 gfxThreadID; uint32_t diff; uint32_t state_tmp = 0; ctr_video_t *ctr = (ctr_video_t*)data; static float fps = 0.0; static int total_frames = 0; static int frames = 0; settings_t *settings = config_get_ptr(); unsigned disp_mode = settings->uints.video_3ds_display_mode; bool statistics_show = video_info->statistics_show; const char *stat_text = video_info->stat_text; float video_refresh_rate = video_info->refresh_rate; struct font_params *osd_params = (struct font_params*) &video_info->osd_stat_params; int custom_vp_x = video_info->custom_vp_x; int custom_vp_y = video_info->custom_vp_y; unsigned custom_vp_width = video_info->custom_vp_width; unsigned custom_vp_height = video_info->custom_vp_height; #ifdef HAVE_MENU bool menu_is_alive = video_info->menu_is_alive; #endif #ifdef HAVE_GFX_WIDGETS bool widgets_active = video_info->widgets_active; #endif if (!width || !height || !settings) { gspWaitForEvent(GSPGPU_EVENT_VBlank0, true); return true; } state_tmp = hidKeysDown(); hidTouchRead(&state_tmp_touch); if((state_tmp & KEY_TOUCH) && (state_tmp_touch.py < 120)) { ctr_set_bottom_screen_enable(ctr, !ctr_bottom_screen_enabled); } if (ctr->p3d_event_pending) { gspWaitForEvent(GSPGPU_EVENT_P3D, false); ctr->p3d_event_pending = false; } if (ctr->ppf_event_pending) { gspWaitForEvent(GSPGPU_EVENT_PPF, false); ctr->ppf_event_pending = false; } #ifndef HAVE_THREADS if (task_queue_find(&ctr_tasks_finder_data)) { #if 0 ctr->vsync_event_pending = true; #endif while (ctr->vsync_event_pending) { task_queue_check(); svcSleepThread(0); } } #endif if (ctr->vsync) { /* If we are running at the display refresh rate, * then all is well - just wait on the *current* VBlank0 * event and carry on. * * If we are running at below the display refresh rate, * then we have problems: frame updates will happen * entirely out of sync with VBlank0 events. To elaborate, * we'll wait for a VBlank0 here, but it will already have * happened partway through the previous frame. So it's: * 'oh good - let's render the current frame', but the next * VBlank0 will occur in less time than it takes to draw the * current frame, resulting in 'overlap' and screen tearing. * * This seems to be a consequence of using the GPU directly. * Other 3DS homebrew typically uses the ctrulib function * gfxSwapBuffers(), which ensures an immediate buffer * swap every time, and no tearing. We can't do this: * instead, we use a variant of the ctrulib function * gfxSwapBuffersGpu(), which seems to send a notification, * and the swap happens when it happens... * * I don't know how to fix this 'properly' (probably needs * some low level rewriting, maybe switching to an implementation * based on citro3d), but I can at least implement a hack/workaround * that allows 50Hz content to be run without tearing. This involves * the following: * * If content frame rate is more than 10% lower than the 3DS * display refresh rate, don't wait on the *current* VBlank0 * event (because it is 'tainted'), but instead wait on the * *next* VBlank0 event (which will ensure we have enough time * to write/flush the display buffers). * * This fixes screen tearing, but it has a significant impact on * performance... * */ bool next_event = false; struct retro_system_av_info *av_info = video_viewport_get_system_av_info(); if (av_info) next_event = av_info->timing.fps < video_refresh_rate * 0.9f; gspWaitForEvent(GSPGPU_EVENT_VBlank0, next_event); } ctr->vsync_event_pending = true; /* Internal counters/statistics * > This is only required if the bottom screen is enabled */ if (ctr_bottom_screen_enabled) { frames++; currentTick = svcGetSystemTick(); diff = currentTick - lastTick; if(diff > CTR_CPU_TICKS_PER_SECOND) { fps = (float)frames * ((float) CTR_CPU_TICKS_PER_SECOND / (float) diff); lastTick = currentTick; frames = 0; } #ifdef CTR_INSPECT_MEMORY_USAGE uint32_t ctr_get_stack_usage(void); void ctr_linear_get_stats(void); extern u32 __linear_heap_size; extern u32 __heap_size; MemInfo mem_info; PageInfo page_info; u32 query_addr = 0x08000000; printf(PRINTFPOS(0,0)); while (query_addr < 0x40000000) { svcQueryMemory(&mem_info, &page_info, query_addr); printf("0x%08X --> 0x%08X (0x%08X) \n", mem_info.base_addr, mem_info.base_addr + mem_info.size, mem_info.size); query_addr = mem_info.base_addr + mem_info.size; if(query_addr == 0x1F000000) query_addr = 0x30000000; } #if 0 static u32* dummy_pointer; if(total_frames == 500) dummy_pointer = malloc(0x2000000); if(total_frames == 1000) free(dummy_pointer); #endif printf("========================================"); printf("0x%08X 0x%08X 0x%08X\n", __heap_size, gpuCmdBufOffset, (__linear_heap_size - linearSpaceFree())); printf("fps: %8.4f frames: %i (%X)\n", fps, total_frames++, (__linear_heap_size - linearSpaceFree())); printf("========================================"); u32 app_memory = *((u32*)0x1FF80040); u64 mem_used; svcGetSystemInfo(&mem_used, 0, 1); printf("total mem : 0x%08X \n", app_memory); printf("used: 0x%08X free: 0x%08X \n", (u32)mem_used, app_memory - (u32)mem_used); static u32 stack_usage = 0; extern u32 __stack_bottom; if(!(total_frames & 0x3F)) stack_usage = ctr_get_stack_usage(); printf("stack total:0x%08X used: 0x%08X\n", 0x10000000 - __stack_bottom, stack_usage); printf("========================================"); ctr_linear_get_stats(); printf("========================================"); #else printf(PRINTFPOS(29,0)"fps: %8.4f frames: %i\r", fps, total_frames++); #endif fflush(stdout); } if (ctr->should_resize) ctr_update_viewport(ctr, settings, custom_vp_x, custom_vp_y, custom_vp_width, custom_vp_height ); ctrGuSetMemoryFill(true, (u32*)ctr->drawbuffers.top.left, 0x00000000, (u32*)ctr->drawbuffers.top.left + 2 * CTR_TOP_FRAMEBUFFER_WIDTH * CTR_TOP_FRAMEBUFFER_HEIGHT, 0x201, NULL, 0x00000000, 0, 0x201); GPUCMD_SetBufferOffset(0); if (width > ctr->texture_width) width = ctr->texture_width; if (height > ctr->texture_height) height = ctr->texture_height; if(frame) { if(((((u32)(frame)) >= 0x14000000 && ((u32)(frame)) < 0x40000000)) /* frame in linear memory */ && !((u32)frame & 0x7F) /* 128-byte aligned */ && !(pitch & 0xF) /* 16-byte aligned */ && (pitch > 0x40)) { /* can copy the buffer directly with the GPU */ #if 0 GSPGPU_FlushDataCache(frame, pitch * height); #endif ctrGuSetCommandList_First(true,(void*)frame, pitch * height,0,0,0,0); ctrGuCopyImage(true, frame, pitch / (ctr->rgb32? 4: 2), height, ctr->rgb32 ? CTRGU_RGBA8: CTRGU_RGB565, false, ctr->texture_swizzled, ctr->texture_width, ctr->rgb32 ? CTRGU_RGBA8: CTRGU_RGB565, true); } else { int i; uint8_t *dst = (uint8_t*)ctr->texture_linear; const uint8_t *src = frame; for (i = 0; i < height; i++) { memcpy(dst, src, width * (ctr->rgb32? 4: 2)); dst += ctr->texture_width * (ctr->rgb32? 4: 2); src += pitch; } GSPGPU_FlushDataCache(ctr->texture_linear, ctr->texture_width * ctr->texture_height * (ctr->rgb32? 4: 2)); ctrGuCopyImage(false, ctr->texture_linear, ctr->texture_width, ctr->texture_height, ctr->rgb32 ? CTRGU_RGBA8: CTRGU_RGB565, false, ctr->texture_swizzled, ctr->texture_width, ctr->rgb32 ? CTRGU_RGBA8: CTRGU_RGB565, true); } ctr->frame_coords->u0 = 0; ctr->frame_coords->v0 = 0; ctr->frame_coords->u1 = width; ctr->frame_coords->v1 = height; GSPGPU_FlushDataCache(ctr->frame_coords, sizeof(ctr_vertex_t)); } GPUCMD_AddWrite(GPUREG_GSH_BOOLUNIFORM, ctr->rotation & 1); ctrGuSetVertexShaderFloatUniform(0, (float*)&ctr->scale_vector, 1); ctrGuSetTexture(GPU_TEXUNIT0, VIRT_TO_PHYS(ctr->texture_swizzled), ctr->texture_width, ctr->texture_height, (ctr->smooth? GPU_TEXTURE_MAG_FILTER(GPU_LINEAR) | GPU_TEXTURE_MIN_FILTER(GPU_LINEAR) : GPU_TEXTURE_MAG_FILTER(GPU_NEAREST) | GPU_TEXTURE_MIN_FILTER(GPU_NEAREST)) | GPU_TEXTURE_WRAP_S(GPU_CLAMP_TO_EDGE) | GPU_TEXTURE_WRAP_T(GPU_CLAMP_TO_EDGE), ctr->rgb32 ? GPU_RGBA8: GPU_RGB565); ctr_check_3D_slider(ctr, (ctr_video_mode_enum)disp_mode); /* ARGB --> RGBA */ if (ctr->rgb32) { GPU_SetTexEnv(0, GPU_TEVSOURCES(GPU_TEXTURE0, GPU_CONSTANT, 0), GPU_CONSTANT, GPU_TEVOPERANDS(GPU_TEVOP_RGB_SRC_G, 0, 0), 0, GPU_MODULATE, GPU_REPLACE, 0xFF0000FF); GPU_SetTexEnv(1, GPU_TEVSOURCES(GPU_TEXTURE0, GPU_CONSTANT, GPU_PREVIOUS), GPU_PREVIOUS, GPU_TEVOPERANDS(GPU_TEVOP_RGB_SRC_B, 0, 0), 0, GPU_MULTIPLY_ADD, GPU_REPLACE, 0x00FF00); GPU_SetTexEnv(2, GPU_TEVSOURCES(GPU_TEXTURE0, GPU_CONSTANT, GPU_PREVIOUS), GPU_PREVIOUS, GPU_TEVOPERANDS(GPU_TEVOP_RGB_SRC_ALPHA, 0, 0), 0, GPU_MULTIPLY_ADD, GPU_REPLACE, 0xFF0000); } GPU_SetViewport(NULL, VIRT_TO_PHYS(ctr->drawbuffers.top.left), 0, 0, CTR_TOP_FRAMEBUFFER_HEIGHT, ctr->video_mode == CTR_VIDEO_MODE_2D_800X240 ? CTR_TOP_FRAMEBUFFER_WIDTH * 2 : CTR_TOP_FRAMEBUFFER_WIDTH); if (ctr->video_mode == CTR_VIDEO_MODE_3D) { if (ctr->menu_texture_enable) { ctrGuSetAttributeBuffersAddress(VIRT_TO_PHYS(&ctr->frame_coords[1])); GPU_DrawArray(GPU_GEOMETRY_PRIM, 0, 1); ctrGuSetAttributeBuffersAddress(VIRT_TO_PHYS(&ctr->frame_coords[2])); } else { ctrGuSetAttributeBuffersAddress(VIRT_TO_PHYS(ctr->frame_coords)); GPU_DrawArray(GPU_GEOMETRY_PRIM, 0, 1); } GPU_SetViewport(NULL, VIRT_TO_PHYS(ctr->drawbuffers.top.right), 0, 0, CTR_TOP_FRAMEBUFFER_HEIGHT, CTR_TOP_FRAMEBUFFER_WIDTH); } else ctrGuSetAttributeBuffersAddress(VIRT_TO_PHYS(ctr->frame_coords)); GPU_DrawArray(GPU_GEOMETRY_PRIM, 0, 1); /* restore */ if (ctr->rgb32) { GPU_SetTexEnv(0, GPU_TEXTURE0, GPU_TEXTURE0, 0, 0, GPU_REPLACE, GPU_REPLACE, 0); GPU_SetTexEnv(1, GPU_PREVIOUS, GPU_PREVIOUS, 0, 0, 0, 0, 0); GPU_SetTexEnv(2, GPU_PREVIOUS, GPU_PREVIOUS, 0, 0, 0, 0, 0); } #ifdef HAVE_MENU if (ctr->menu_texture_enable) { if(ctr->menu_texture_frame_enable) { ctrGuSetTexture(GPU_TEXUNIT0, VIRT_TO_PHYS(ctr->menu.texture_swizzled), ctr->menu.texture_width, ctr->menu.texture_height, GPU_TEXTURE_MAG_FILTER(GPU_LINEAR) | GPU_TEXTURE_MIN_FILTER(GPU_LINEAR) | GPU_TEXTURE_WRAP_S(GPU_CLAMP_TO_EDGE) | GPU_TEXTURE_WRAP_T(GPU_CLAMP_TO_EDGE), GPU_RGBA4); GPUCMD_AddWrite(GPUREG_GSH_BOOLUNIFORM, 0); ctrGuSetVertexShaderFloatUniform(0, (float*)&ctr->menu.scale_vector, 1); ctrGuSetAttributeBuffersAddress(VIRT_TO_PHYS(ctr->menu.frame_coords)); GPU_SetViewport(NULL, VIRT_TO_PHYS(ctr->drawbuffers.top.left), 0, 0, CTR_TOP_FRAMEBUFFER_HEIGHT, ctr->video_mode == CTR_VIDEO_MODE_2D_800X240 ? CTR_TOP_FRAMEBUFFER_WIDTH * 2 : CTR_TOP_FRAMEBUFFER_WIDTH); GPU_DrawArray(GPU_GEOMETRY_PRIM, 0, 1); if (ctr->video_mode == CTR_VIDEO_MODE_3D) { GPU_SetViewport(NULL, VIRT_TO_PHYS(ctr->drawbuffers.top.right), 0, 0, CTR_TOP_FRAMEBUFFER_HEIGHT, CTR_TOP_FRAMEBUFFER_WIDTH); GPU_DrawArray(GPU_GEOMETRY_PRIM, 0, 1); } } ctr->msg_rendering_enabled = true; menu_driver_frame(menu_is_alive, video_info); ctr->msg_rendering_enabled = false; } else if (statistics_show) { if (osd_params) { font_driver_render_msg(ctr, stat_text, (const struct font_params*)osd_params, NULL); } } #endif #ifdef HAVE_GFX_WIDGETS if (widgets_active) gfx_widgets_frame(video_info); #endif if (msg) font_driver_render_msg(ctr, msg, NULL, NULL); GPU_FinishDrawing(); GPU_Finalize(); ctrGuFlushAndRun(true); ctrGuDisplayTransfer(true, ctr->drawbuffers.top.left, 240, ctr->video_mode == CTR_VIDEO_MODE_2D_800X240 ? 800 : 400, CTRGU_RGBA8, gfxTopLeftFramebuffers[ctr->current_buffer_top], 240, CTRGU_RGB8, CTRGU_MULTISAMPLE_NONE); if ((ctr->video_mode == CTR_VIDEO_MODE_2D_400X240) || (ctr->video_mode == CTR_VIDEO_MODE_3D)) ctrGuDisplayTransfer(true, ctr->drawbuffers.top.right, 240, 400, CTRGU_RGBA8, gfxTopRightFramebuffers[ctr->current_buffer_top], 240, CTRGU_RGB8, CTRGU_MULTISAMPLE_NONE); /* Swap buffers : */ #ifdef USE_CTRULIB_2 u32 *buf0, *buf1; u32 stride; buf0 = (u32*)gfxTopLeftFramebuffers[ctr->current_buffer_top]; if(ctr->video_mode == CTR_VIDEO_MODE_2D_800X240) { buf1 = (u32*)(gfxTopLeftFramebuffers[ctr->current_buffer_top] + 240 * 3); stride = 240 * 3 * 2; } else { if (ctr->enable_3d) buf1 = (u32*)gfxTopRightFramebuffers[ctr->current_buffer_top]; else buf1 = buf0; stride = 240 * 3; } u8 bit5 = (ctr->enable_3d != 0); gspPresentBuffer(GFX_TOP, ctr->current_buffer_top, buf0, buf1, stride, (1<<8)|((1^bit5)<<6)|((bit5)<<5)|GSP_BGR8_OES); #else topFramebufferInfo. active_framebuf = ctr->current_buffer_top; topFramebufferInfo. framebuf0_vaddr = (u32*)gfxTopLeftFramebuffers[ctr->current_buffer_top]; if(ctr->video_mode == CTR_VIDEO_MODE_2D_800X240) { topFramebufferInfo. framebuf1_vaddr = (u32*)(gfxTopLeftFramebuffers[ctr->current_buffer_top] + 240 * 3); topFramebufferInfo. framebuf_widthbytesize = 240 * 3 * 2; } else { if (ctr->enable_3d) topFramebufferInfo. framebuf1_vaddr = (u32*)gfxTopRightFramebuffers[ctr->current_buffer_top]; else topFramebufferInfo. framebuf1_vaddr = topFramebufferInfo.framebuf0_vaddr; topFramebufferInfo. framebuf_widthbytesize = 240 * 3; } u8 bit5 = (ctr->enable_3d != 0); topFramebufferInfo.format = (1<<8)|((1^bit5)<<6)|((bit5)<<5)|GSP_BGR8_OES; topFramebufferInfo. framebuf_dispselect = ctr->current_buffer_top; topFramebufferInfo.unk = 0x00000000; u8* framebufferInfoHeader = gfxSharedMemory+0x200+gfxThreadID*0x80; GSPGPU_FramebufferInfo* framebufferInfo = (GSPGPU_FramebufferInfo*)&framebufferInfoHeader[0x4]; framebufferInfoHeader[0x0] ^= 1; framebufferInfo[framebufferInfoHeader[0x0]] = topFramebufferInfo; framebufferInfoHeader[0x1] = 1; #endif ctr->current_buffer_top ^= 1; ctr->p3d_event_pending = true; ctr->ppf_event_pending = true; return true; } static void ctr_set_nonblock_state(void* data, bool toggle, bool a, unsigned b) { ctr_video_t* ctr = (ctr_video_t*)data; if (ctr) ctr->vsync = !toggle; } static bool ctr_alive(void* data) { (void)data; return true; } static bool ctr_focus(void* data) { (void)data; return true; } static bool ctr_suppress_screensaver(void* data, bool enable) { (void)data; (void)enable; return false; } static void ctr_free(void* data) { ctr_video_t* ctr = (ctr_video_t*)data; if (!ctr) return; aptUnhook(&ctr->lcd_aptHook); gspSetEventCallback(GSPGPU_EVENT_VBlank0, NULL, NULL, true); shaderProgramFree(&ctr->shader); DVLB_Free(ctr->dvlb); vramFree(ctr->drawbuffers.top.left); linearFree(ctr->display_list); linearFree(ctr->texture_linear); linearFree(ctr->texture_swizzled); linearFree(ctr->frame_coords); linearFree(ctr->menu.texture_linear); linearFree(ctr->menu.texture_swizzled); linearFree(ctr->menu.frame_coords); linearFree(ctr->empty_framebuffer); linearFree(ctr->vertex_cache.buffer); linearFree(ctr); #if 0 gfxExit(); #endif } static void ctr_set_texture_frame(void* data, const void* frame, bool rgb32, unsigned width, unsigned height, float alpha) { int i; ctr_video_t* ctr = (ctr_video_t*)data; int line_width = width; (void)rgb32; (void)alpha; if(!ctr || !frame) return; if (line_width > ctr->menu.texture_width) line_width = ctr->menu.texture_width; if (height > (unsigned)ctr->menu.texture_height) height = (unsigned)ctr->menu.texture_height; const uint16_t* src = frame; uint16_t* dst = (uint16_t*)ctr->menu.texture_linear; for (i = 0; i < height; i++) { memcpy(dst, src, line_width * sizeof(uint16_t)); dst += ctr->menu.texture_width; src += width; } ctr->menu.frame_coords->x0 = (CTR_TOP_FRAMEBUFFER_WIDTH - width) / 2; ctr->menu.frame_coords->y0 = (CTR_TOP_FRAMEBUFFER_HEIGHT - height) / 2; ctr->menu.frame_coords->x1 = ctr->menu.frame_coords->x0 + width; ctr->menu.frame_coords->y1 = ctr->menu.frame_coords->y0 + height; ctr->menu.frame_coords->u0 = 0; ctr->menu.frame_coords->v0 = 0; ctr->menu.frame_coords->u1 = width; ctr->menu.frame_coords->v1 = height; GSPGPU_FlushDataCache(ctr->menu.frame_coords, sizeof(ctr_vertex_t)); ctr->menu_texture_frame_enable = true; GSPGPU_FlushDataCache(ctr->menu.texture_linear, ctr->menu.texture_width * ctr->menu.texture_height * sizeof(uint16_t)); ctrGuCopyImage(false, ctr->menu.texture_linear, ctr->menu.texture_width, ctr->menu.texture_height, CTRGU_RGBA4444,false, ctr->menu.texture_swizzled, ctr->menu.texture_width, CTRGU_RGBA4444, true); } static void ctr_set_texture_enable(void* data, bool state, bool full_screen) { (void) full_screen; ctr_video_t* ctr = (ctr_video_t*)data; if (ctr) ctr->menu_texture_enable = state; } static void ctr_set_rotation(void* data, unsigned rotation) { ctr_video_t* ctr = (ctr_video_t*)data; if (!ctr) return; ctr->rotation = rotation; ctr->should_resize = true; } static void ctr_set_filtering(void* data, unsigned index, bool smooth, bool ctx_scaling) { ctr_video_t* ctr = (ctr_video_t*)data; if (ctr) ctr->smooth = smooth; } static void ctr_set_aspect_ratio(void* data, unsigned aspect_ratio_idx) { ctr_video_t *ctr = (ctr_video_t*)data; if(!ctr) return; ctr->keep_aspect = true; ctr->should_resize = true; } static void ctr_apply_state_changes(void* data) { ctr_video_t* ctr = (ctr_video_t*)data; if (ctr) ctr->should_resize = true; } static void ctr_viewport_info(void* data, struct video_viewport* vp) { ctr_video_t* ctr = (ctr_video_t*)data; if (ctr) *vp = ctr->vp; } static uintptr_t ctr_load_texture(void *video_data, void *data, bool threaded, enum texture_filter_type filter_type) { void* tmpdata; ctr_texture_t *texture = NULL; ctr_video_t *ctr = (ctr_video_t*)video_data; struct texture_image *image = (struct texture_image*)data; int size = image->width * image->height * sizeof(uint32_t); if ((size * 3) > linearSpaceFree()) return 0; if (!ctr || !image || image->width > 2048 || image->height > 2048) return 0; texture = (ctr_texture_t*) calloc(1, sizeof(ctr_texture_t)); texture->width = next_pow2(image->width); texture->height = next_pow2(image->height); texture->active_width = image->width; texture->active_height = image->height; texture->data = linearAlloc( texture->width * texture->height * sizeof(uint32_t)); texture->type = filter_type; if (!texture->data) { free(texture); return 0; } if ((image->width <= 32) || (image->height <= 32)) { int i, j; uint32_t* src = (uint32_t*)image->pixels; for (j = 0; j < image->height; j++) for (i = 0; i < image->width; i++) { ((uint32_t*)texture->data)[ctrgu_swizzle_coords(i, j, texture->width)] = ((*src >> 8) & 0x00FF00) | ((*src >> 24) & 0xFF) | ((*src << 8) & 0xFF0000) | ((*src << 24) & 0xFF000000); src++; } GSPGPU_FlushDataCache(texture->data, texture->width * texture->height * sizeof(uint32_t)); } else { int i; uint32_t *src = NULL; uint32_t *dst = NULL; tmpdata = linearAlloc(image->width * image->height * sizeof(uint32_t)); if (!tmpdata) { free(texture->data); free(texture); return 0; } src = (uint32_t*)image->pixels; dst = (uint32_t*)tmpdata; for (i = 0; i < image->width * image->height; i++) { *dst = ((*src >> 8) & 0x00FF00) | ((*src >> 24) & 0xFF) | ((*src << 8) & 0xFF0000) | ((*src << 24) & 0xFF000000); dst++; src++; } GSPGPU_FlushDataCache(tmpdata, image->width * image->height * sizeof(uint32_t)); ctrGuCopyImage(true, tmpdata, image->width, image->height, CTRGU_RGBA8, false, texture->data, texture->width, CTRGU_RGBA8, true); #if 0 gspWaitForEvent(GSPGPU_EVENT_PPF, false); ctr->ppf_event_pending = false; #else ctr->ppf_event_pending = true; #endif linearFree(tmpdata); } return (uintptr_t)texture; } static void ctr_unload_texture(void *data, bool threaded, uintptr_t handle) { struct ctr_texture *texture = (struct ctr_texture*)handle; if (!texture) return; if (texture->data) { if (((u32)texture->data & 0xFF000000) == 0x1F000000) vramFree(texture->data); else linearFree(texture->data); } free(texture); } static void ctr_set_osd_msg(void *data, const char *msg, const void *params, void *font) { ctr_video_t* ctr = (ctr_video_t*)data; if (ctr && ctr->msg_rendering_enabled) font_driver_render_msg(data, msg, params, font); } static uint32_t ctr_get_flags(void *data) { uint32_t flags = 0; return flags; } static const video_poke_interface_t ctr_poke_interface = { ctr_get_flags, ctr_load_texture, ctr_unload_texture, NULL, NULL, ctr_set_filtering, NULL, /* get_video_output_size */ NULL, /* get_video_output_prev */ NULL, /* get_video_output_next */ NULL, /* get_current_framebuffer */ NULL, ctr_set_aspect_ratio, ctr_apply_state_changes, ctr_set_texture_frame, ctr_set_texture_enable, font_driver_render_msg, /* ctr_set_osd_msg*/ NULL, /* show_mouse */ NULL, /* grab_mouse_toggle */ NULL, /* get_current_shader */ NULL, /* get_current_software_framebuffer */ NULL /* get_hw_render_interface */ }; static void ctr_get_poke_interface(void* data, const video_poke_interface_t** iface) { (void)data; *iface = &ctr_poke_interface; } #ifdef HAVE_GFX_WIDGETS static bool ctr_gfx_widgets_enabled(void *data) { (void)data; return true; } #endif static bool ctr_set_shader(void* data, enum rarch_shader_type type, const char* path) { (void)data; (void)type; (void)path; return false; } video_driver_t video_ctr = { ctr_init, ctr_frame, ctr_set_nonblock_state, ctr_alive, ctr_focus, ctr_suppress_screensaver, NULL, /* has_windowed */ ctr_set_shader, ctr_free, "ctr", NULL, /* set_viewport */ ctr_set_rotation, ctr_viewport_info, NULL, /* read_viewport */ NULL, /* read_frame_raw */ #ifdef HAVE_OVERLAY NULL, #endif #ifdef HAVE_VIDEO_LAYOUT NULL, #endif ctr_get_poke_interface, NULL, #ifdef HAVE_GFX_WIDGETS ctr_gfx_widgets_enabled #endif };