mirror of
				https://git.eden-emu.dev/eden-emu/eden.git
				synced 2025-10-26 14:53:18 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			122 lines
		
	
	
	
		
			4.5 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			122 lines
		
	
	
	
		
			4.5 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| // SPDX-FileCopyrightText: Copyright 2018 yuzu Emulator Project
 | |
| // SPDX-License-Identifier: GPL-2.0-or-later
 | |
| 
 | |
| #include "common/assert.h"
 | |
| #include "common/logging/log.h"
 | |
| #include "common/microprofile.h"
 | |
| #include "video_core/engines/fermi_2d.h"
 | |
| #include "video_core/engines/sw_blitter/blitter.h"
 | |
| #include "video_core/memory_manager.h"
 | |
| #include "video_core/rasterizer_interface.h"
 | |
| #include "video_core/surface.h"
 | |
| #include "video_core/textures/decoders.h"
 | |
| 
 | |
| MICROPROFILE_DECLARE(GPU_BlitEngine);
 | |
| MICROPROFILE_DEFINE(GPU_BlitEngine, "GPU", "Blit Engine", MP_RGB(224, 224, 128));
 | |
| 
 | |
| using VideoCore::Surface::BytesPerBlock;
 | |
| using VideoCore::Surface::PixelFormatFromRenderTargetFormat;
 | |
| 
 | |
| namespace Tegra::Engines {
 | |
| 
 | |
| using namespace Texture;
 | |
| 
 | |
| Fermi2D::Fermi2D(MemoryManager& memory_manager_) : memory_manager{memory_manager_} {
 | |
|     sw_blitter = std::make_unique<Blitter::SoftwareBlitEngine>(memory_manager);
 | |
|     // Nvidia's OpenGL driver seems to assume these values
 | |
|     regs.src.depth = 1;
 | |
|     regs.dst.depth = 1;
 | |
| 
 | |
|     execution_mask.reset();
 | |
|     execution_mask[FERMI2D_REG_INDEX(pixels_from_memory.src_y0) + 1] = true;
 | |
| }
 | |
| 
 | |
| Fermi2D::~Fermi2D() = default;
 | |
| 
 | |
| void Fermi2D::BindRasterizer(VideoCore::RasterizerInterface* rasterizer_) {
 | |
|     rasterizer = rasterizer_;
 | |
| }
 | |
| 
 | |
| void Fermi2D::CallMethod(u32 method, u32 method_argument, bool is_last_call) {
 | |
|     ASSERT_MSG(method < Regs::NUM_REGS,
 | |
|                "Invalid Fermi2D register, increase the size of the Regs structure");
 | |
|     regs.reg_array[method] = method_argument;
 | |
| 
 | |
|     if (method == FERMI2D_REG_INDEX(pixels_from_memory.src_y0) + 1) {
 | |
|         Blit();
 | |
|     }
 | |
| }
 | |
| 
 | |
| void Fermi2D::CallMultiMethod(u32 method, const u32* base_start, u32 amount, u32 methods_pending) {
 | |
|     for (u32 i = 0; i < amount; ++i) {
 | |
|         CallMethod(method, base_start[i], methods_pending - i <= 1);
 | |
|     }
 | |
| }
 | |
| 
 | |
| void Fermi2D::ConsumeSinkImpl() {
 | |
|     for (auto [method, value] : method_sink) {
 | |
|         regs.reg_array[method] = value;
 | |
|     }
 | |
|     method_sink.clear();
 | |
| }
 | |
| 
 | |
| void Fermi2D::Blit() {
 | |
|     MICROPROFILE_SCOPE(GPU_BlitEngine);
 | |
|     LOG_DEBUG(HW_GPU, "called. source address=0x{:x}, destination address=0x{:x}",
 | |
|               regs.src.Address(), regs.dst.Address());
 | |
| 
 | |
|     UNIMPLEMENTED_IF_MSG(regs.operation != Operation::SrcCopy, "Operation is not copy");
 | |
|     UNIMPLEMENTED_IF_MSG(regs.src.layer != 0, "Source layer is not zero");
 | |
|     UNIMPLEMENTED_IF_MSG(regs.dst.layer != 0, "Destination layer is not zero");
 | |
|     UNIMPLEMENTED_IF_MSG(regs.src.depth != 1, "Source depth is not one");
 | |
|     UNIMPLEMENTED_IF_MSG(regs.clip_enable != 0, "Clipped blit enabled");
 | |
| 
 | |
|     const auto& args = regs.pixels_from_memory;
 | |
|     constexpr s64 null_derivative = 1ULL << 32;
 | |
|     Surface src = regs.src;
 | |
|     const auto bytes_per_pixel = BytesPerBlock(PixelFormatFromRenderTargetFormat(src.format));
 | |
|     const bool delegate_to_gpu = src.width > 512 && src.height > 512 && bytes_per_pixel <= 8 &&
 | |
|                                  src.format != regs.dst.format;
 | |
| 
 | |
|     auto srcX = args.src_x0;
 | |
|     auto srcY = args.src_y0;
 | |
|     if (args.sample_mode.origin == Origin::Corner) {
 | |
|         srcX -= (args.du_dx >> 33) << 32;
 | |
|         srcY -= (args.dv_dy >> 33) << 32;
 | |
|     }
 | |
| 
 | |
|     Config config{
 | |
|         .operation = regs.operation,
 | |
|         .filter = args.sample_mode.filter,
 | |
|         .must_accelerate =
 | |
|             args.du_dx != null_derivative || args.dv_dy != null_derivative || delegate_to_gpu,
 | |
|         .dst_x0 = args.dst_x0,
 | |
|         .dst_y0 = args.dst_y0,
 | |
|         .dst_x1 = args.dst_x0 + args.dst_width,
 | |
|         .dst_y1 = args.dst_y0 + args.dst_height,
 | |
|         .src_x0 = static_cast<s32>(srcX >> 32),
 | |
|         .src_y0 = static_cast<s32>(srcY >> 32),
 | |
|         .src_x1 = static_cast<s32>((srcX + args.du_dx * args.dst_width) >> 32),
 | |
|         .src_y1 = static_cast<s32>((srcY + args.dv_dy * args.dst_height) >> 32),
 | |
|     };
 | |
| 
 | |
|     const auto need_align_to_pitch =
 | |
|         src.linear == Tegra::Engines::Fermi2D::MemoryLayout::Pitch &&
 | |
|         static_cast<s32>(src.width) == config.src_x1 &&
 | |
|         config.src_x1 > static_cast<s32>(src.pitch / bytes_per_pixel) && config.src_x0 > 0;
 | |
|     if (need_align_to_pitch) {
 | |
|         auto address = src.Address() + config.src_x0 * bytes_per_pixel;
 | |
|         src.addr_upper = static_cast<u32>(address >> 32);
 | |
|         src.addr_lower = static_cast<u32>(address);
 | |
|         src.width -= config.src_x0;
 | |
|         config.src_x1 -= config.src_x0;
 | |
|         config.src_x0 = 0;
 | |
|     }
 | |
| 
 | |
|     memory_manager.FlushCaching();
 | |
|     if (!rasterizer->AccelerateSurfaceCopy(src, regs.dst, config)) {
 | |
|         sw_blitter->Blit(src, regs.dst, config);
 | |
|     }
 | |
| }
 | |
| 
 | |
| } // namespace Tegra::Engines
 | 
