| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | // Copyright (C) 2003 Dolphin Project.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | // This program is free software: you can redistribute it and/or modify
 | 
					
						
							|  |  |  | // it under the terms of the GNU General Public License as published by
 | 
					
						
							|  |  |  | // the Free Software Foundation, version 2.0.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | // This program is distributed in the hope that it will be useful,
 | 
					
						
							|  |  |  | // but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
					
						
							|  |  |  | // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
					
						
							|  |  |  | // GNU General Public License 2.0 for more details.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | // A copy of the GPL 2.0 should have been included with the program.
 | 
					
						
							|  |  |  | // If not, see http://www.gnu.org/licenses/
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | // Official SVN repository and contact information can be found at
 | 
					
						
							|  |  |  | // http://code.google.com/p/dolphin-emu/
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #include "OCLTextureDecoder.h"
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #include "OpenCL.h"
 | 
					
						
							|  |  |  | #include "FileUtil.h"
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #include <fcntl.h>
 | 
					
						
							|  |  |  | #include <stdio.h>
 | 
					
						
							|  |  |  | #include <stdlib.h>
 | 
					
						
							|  |  |  | #include <string.h>
 | 
					
						
							|  |  |  | #include <math.h>
 | 
					
						
							|  |  |  | #include <sys/types.h>
 | 
					
						
							|  |  |  | #include <sys/stat.h>
 | 
					
						
							|  |  |  | #include <string>
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | //#define DEBUG_OPENCL
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-22 00:52:17 +00:00
										 |  |  | cl_program g_program; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | struct sDecoderParameter | 
					
						
							| 
									
										
										
										
											2010-06-26 13:12:28 +00:00
										 |  |  | { | 
					
						
							|  |  |  |     const char *name; | 
					
						
							| 
									
										
										
										
											2010-06-22 00:52:17 +00:00
										 |  |  |     cl_kernel kernel; | 
					
						
							|  |  |  |     float sizeOfSrc; | 
					
						
							|  |  |  | 	float sizeOfDst; | 
					
						
							|  |  |  |     int xSkip; | 
					
						
							|  |  |  |     int ySkip; | 
					
						
							|  |  |  | 	PC_TexFormat format; | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | }; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-22 00:52:17 +00:00
										 |  |  | sDecoderParameter g_DecodeParametersNative[] = { | 
					
						
							|  |  |  |     /* GX_TF_I4     */ { "DecodeI4",     NULL, 0.5f, 1, 8, 8, PC_TEX_FMT_I4_AS_I8 }, | 
					
						
							|  |  |  |     /* GX_TF_I8     */ { "DecodeI8",     NULL,    1, 1, 8, 4, PC_TEX_FMT_I8 }, | 
					
						
							|  |  |  |     /* GX_TF_IA4    */ { "DecodeIA4",    NULL,    1, 2, 8, 4, PC_TEX_FMT_IA4_AS_IA8 }, | 
					
						
							|  |  |  |     /* GX_TF_IA8    */ { "DecodeIA8",    NULL,    2, 2, 4, 4, PC_TEX_FMT_IA8 }, | 
					
						
							|  |  |  |     /* GX_TF_RGB565 */ { "DecodeRGB565", NULL,    2, 2, 4, 4, PC_TEX_FMT_RGB565 }, | 
					
						
							|  |  |  |     /* GX_TF_RGB5A3 */ { "DecodeRGB5A3", NULL,    2, 4, 4, 4, PC_TEX_FMT_BGRA32 }, | 
					
						
							|  |  |  |     /* GX_TF_RGBA8  */ { "DecodeRGBA8",  NULL,    4, 4, 4, 4, PC_TEX_FMT_BGRA32 }, | 
					
						
							|  |  |  |     /* 7            */ { NULL }, | 
					
						
							|  |  |  |     /* GX_TF_C4     */ { NULL }, | 
					
						
							|  |  |  |     /* GX_TF_C8     */ { NULL }, | 
					
						
							|  |  |  |     /* GX_TF_C14X2  */ { NULL }, | 
					
						
							|  |  |  |     /* B            */ { NULL }, | 
					
						
							|  |  |  |     /* C            */ { NULL }, | 
					
						
							|  |  |  |     /* D            */ { NULL }, | 
					
						
							|  |  |  |     /* GX_TF_CMPR   */ { "DecodeCMPR",   NULL, 0.5f, 4, 8, 8, PC_TEX_FMT_BGRA32 }, | 
					
						
							|  |  |  | }; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | sDecoderParameter g_DecodeParametersRGBA[] = { | 
					
						
							|  |  |  |     /* GX_TF_I4     */ { "DecodeI4_RGBA",     NULL, 0.5f, 4, 8, 8, PC_TEX_FMT_RGBA32 }, | 
					
						
							|  |  |  |     /* GX_TF_I8     */ { "DecodeI8_RGBA",     NULL,    1, 4, 8, 4, PC_TEX_FMT_RGBA32 }, | 
					
						
							|  |  |  |     /* GX_TF_IA4    */ { "DecodeIA4_RGBA",    NULL,    1, 4, 8, 4, PC_TEX_FMT_RGBA32 }, | 
					
						
							|  |  |  |     /* GX_TF_IA8    */ { "DecodeIA8_RGBA",    NULL,    2, 4, 4, 4, PC_TEX_FMT_RGBA32 }, | 
					
						
							|  |  |  |     /* GX_TF_RGB565 */ { "DecodeRGB565_RGBA", NULL,    2, 4, 4, 4, PC_TEX_FMT_RGBA32 }, | 
					
						
							|  |  |  |     /* GX_TF_RGB5A3 */ { "DecodeRGB5A3_RGBA", NULL,    2, 4, 4, 4, PC_TEX_FMT_RGBA32 }, | 
					
						
							|  |  |  |     /* GX_TF_RGBA8  */ { "DecodeRGBA8_RGBA",  NULL,    4, 4, 4, 4, PC_TEX_FMT_RGBA32 }, | 
					
						
							|  |  |  |     /* 7            */ { NULL }, | 
					
						
							|  |  |  |     /* GX_TF_C4     */ { NULL }, | 
					
						
							|  |  |  |     /* GX_TF_C8     */ { NULL }, | 
					
						
							|  |  |  |     /* GX_TF_C14X2  */ { NULL }, | 
					
						
							|  |  |  |     /* B            */ { NULL }, | 
					
						
							|  |  |  |     /* C            */ { NULL }, | 
					
						
							|  |  |  |     /* D            */ { NULL }, | 
					
						
							|  |  |  |     /* GX_TF_CMPR   */ { "DecodeCMPR_RGBA",   NULL, 0.5f, 4, 8, 8, PC_TEX_FMT_RGBA32 }, | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | }; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | bool g_Inited = false; | 
					
						
							|  |  |  | cl_mem g_clsrc, g_cldst;                    // texture buffer memory objects
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | void TexDecoder_OpenCL_Initialize() { | 
					
						
							|  |  |  | #if defined(HAVE_OPENCL) && HAVE_OPENCL
 | 
					
						
							|  |  |  | 	if(!g_Inited) | 
					
						
							| 
									
										
										
										
											2010-06-19 07:59:53 +00:00
										 |  |  | 	{ | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | 		if(!OpenCL::Initialize()) | 
					
						
							|  |  |  | 			return; | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-19 07:59:53 +00:00
										 |  |  | 		std::string code; | 
					
						
							|  |  |  | 		char filename[1024]; | 
					
						
							|  |  |  | 		sprintf(filename, "%sOpenCL/TextureDecoder.cl", File::GetUserPath(D_USER_IDX)); | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | 		if (!File::ReadFileToString(true, filename, code)) | 
					
						
							|  |  |  | 		{ | 
					
						
							|  |  |  | 			ERROR_LOG(VIDEO, "Failed to load OpenCL code %s - file is missing?", filename); | 
					
						
							| 
									
										
										
										
											2010-06-19 07:59:53 +00:00
										 |  |  | 			return; | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | 		} | 
					
						
							| 
									
										
										
										
											2010-06-26 13:12:28 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | 		g_program = OpenCL::CompileProgram(code.c_str()); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-26 13:12:28 +00:00
										 |  |  | 		for (int i = 0; i <= GX_TF_CMPR; ++i) { | 
					
						
							|  |  |  | 			if (g_DecodeParametersNative[i].name) | 
					
						
							|  |  |  | 				g_DecodeParametersNative[i].kernel = | 
					
						
							|  |  |  | 					OpenCL::CompileKernel(g_program, | 
					
						
							|  |  |  | 					g_DecodeParametersNative[i].name); | 
					
						
							| 
									
										
										
										
											2010-06-22 00:52:17 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-26 13:12:28 +00:00
										 |  |  | 			if (g_DecodeParametersRGBA[i].name) | 
					
						
							|  |  |  | 				g_DecodeParametersRGBA[i].kernel = | 
					
						
							|  |  |  | 					OpenCL::CompileKernel(g_program, | 
					
						
							|  |  |  | 					g_DecodeParametersRGBA[i].name); | 
					
						
							|  |  |  | 		} | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | 		// Allocating maximal Wii texture size in advance, so that we don't have to allocate/deallocate per texture
 | 
					
						
							|  |  |  | #ifndef DEBUG_OPENCL
 | 
					
						
							|  |  |  | 		g_clsrc = clCreateBuffer(OpenCL::GetContext(), CL_MEM_READ_ONLY , 1024 * 1024 * sizeof(u32), NULL, NULL); | 
					
						
							|  |  |  | 		g_cldst = clCreateBuffer(OpenCL::GetContext(), CL_MEM_WRITE_ONLY, 1024 * 1024 * sizeof(u32), NULL, NULL); | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		g_Inited = true; | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | void TexDecoder_OpenCL_Shutdown() { | 
					
						
							|  |  |  | #if defined(HAVE_OPENCL) && HAVE_OPENCL && !defined(DEBUG_OPENCL)
 | 
					
						
							| 
									
										
										
										
											2010-06-26 13:12:28 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | 	clReleaseProgram(g_program); | 
					
						
							| 
									
										
										
										
											2010-06-22 00:52:17 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-26 13:12:28 +00:00
										 |  |  | 	for (int i = 0; i < GX_TF_CMPR; ++i) { | 
					
						
							|  |  |  | 		if (g_DecodeParametersNative[i].kernel) | 
					
						
							|  |  |  | 			clReleaseKernel(g_DecodeParametersNative[i].kernel); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 		if(g_DecodeParametersRGBA[i].kernel) | 
					
						
							|  |  |  | 			clReleaseKernel(g_DecodeParametersRGBA[i].kernel); | 
					
						
							|  |  |  | 	} | 
					
						
							| 
									
										
										
										
											2010-06-22 00:52:17 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | 	if(g_clsrc) | 
					
						
							|  |  |  | 		clReleaseMemObject(g_clsrc); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 	if(g_cldst) | 
					
						
							|  |  |  | 		clReleaseMemObject(g_cldst); | 
					
						
							| 
									
										
										
										
											2010-06-26 13:12:28 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | 	g_Inited = false; | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-22 00:52:17 +00:00
										 |  |  | PC_TexFormat TexDecoder_Decode_OpenCL(u8 *dst, const u8 *src, int width, int height, int texformat, int tlutaddr, int tlutfmt, bool rgba) | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | { | 
					
						
							|  |  |  | #if defined(HAVE_OPENCL) && HAVE_OPENCL
 | 
					
						
							| 
									
										
										
										
											2010-06-19 07:59:53 +00:00
										 |  |  | 	cl_int err; | 
					
						
							| 
									
										
										
										
											2010-06-22 00:52:17 +00:00
										 |  |  |     sDecoderParameter& decoder = rgba ? g_DecodeParametersRGBA[texformat] : g_DecodeParametersNative[texformat]; | 
					
						
							|  |  |  |     if(!decoder.name || !decoder.kernel || decoder.format == PC_TEX_FMT_NONE) | 
					
						
							|  |  |  |         return PC_TEX_FMT_NONE; | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_OPENCL
 | 
					
						
							|  |  |  | 	g_clsrc = clCreateBuffer(OpenCL::GetContext(), CL_MEM_READ_ONLY , 1024 * 1024 * sizeof(u32), NULL, NULL); | 
					
						
							|  |  |  | 	g_cldst = clCreateBuffer(OpenCL::GetContext(), CL_MEM_WRITE_ONLY, 1024 * 1024 * sizeof(u32), NULL, NULL); | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-22 00:52:17 +00:00
										 |  |  | 	clEnqueueWriteBuffer(OpenCL::GetCommandQueue(), g_clsrc, CL_TRUE, 0, (size_t)(width * height * decoder.sizeOfSrc), src, 0, NULL, NULL); | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-22 00:52:17 +00:00
										 |  |  | 	clSetKernelArg(decoder.kernel, 0, sizeof(cl_mem), &g_cldst); | 
					
						
							|  |  |  | 	clSetKernelArg(decoder.kernel, 1, sizeof(cl_mem), &g_clsrc); | 
					
						
							|  |  |  | 	clSetKernelArg(decoder.kernel, 2, sizeof(cl_int), &width); | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-22 00:52:17 +00:00
										 |  |  | 	size_t global[] = { (size_t)(width / decoder.xSkip), (size_t)(height / decoder.ySkip) }; | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | 	// No work-groups for now
 | 
					
						
							|  |  |  | 	/*
 | 
					
						
							|  |  |  | 	size_t local; | 
					
						
							|  |  |  | 	err = clGetKernelWorkGroupInfo(kernelToRun, OpenCL::device_id, CL_KERNEL_WORK_GROUP_SIZE, sizeof(local), &local, NULL); | 
					
						
							|  |  |  | 	if(err) | 
					
						
							|  |  |  | 		PanicAlert("Error obtaining work-group information"); | 
					
						
							|  |  |  | 	*/ | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-22 00:52:17 +00:00
										 |  |  | 	err = clEnqueueNDRangeKernel(OpenCL::GetCommandQueue(), decoder.kernel, 2, NULL, global, NULL, 0, NULL, NULL); | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | 	if(err) | 
					
						
							| 
									
										
										
										
											2010-06-19 07:59:53 +00:00
										 |  |  | 		OpenCL::HandleCLError(err, "Failed to enqueue kernel"); | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | 	clFinish(OpenCL::GetCommandQueue()); | 
					
						
							| 
									
										
										
										
											2010-06-26 13:12:28 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-22 00:52:17 +00:00
										 |  |  | 	clEnqueueReadBuffer(OpenCL::GetCommandQueue(), g_cldst, CL_TRUE, 0, (size_t)(width * height * decoder.sizeOfDst), dst, 0, NULL, NULL); | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | #ifdef DEBUG_OPENCL
 | 
					
						
							|  |  |  | 	clReleaseMemObject(g_clsrc); | 
					
						
							|  |  |  | 	clReleaseMemObject(g_cldst); | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-22 00:52:17 +00:00
										 |  |  | 	return decoder.format; | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | #else
 | 
					
						
							|  |  |  | 	return PC_TEX_FMT_NONE; | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-06-19 07:59:53 +00:00
										 |  |  | 	return PC_TEX_FMT_NONE; | 
					
						
							| 
									
										
										
										
											2010-06-09 01:37:08 +00:00
										 |  |  | } | 
					
						
							|  |  |  | 
 |