Mercurial > hg > graal-compiler
diff src/gpu/hsail/vm/gpu_hsail.cpp @ 12743:f1a55428a8d7
more HSAIL support in the C++ layer for executing HSAIL code on the simulator
Contributed-by: Eric Caspole <eric.caspole@amd.com>
author | Doug Simon <doug.simon@oracle.com> |
---|---|
date | Sun, 10 Nov 2013 13:18:09 +0100 |
parents | |
children | 14db5ffd5ed9 |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/src/gpu/hsail/vm/gpu_hsail.cpp Sun Nov 10 13:18:09 2013 +0100 @@ -0,0 +1,166 @@ +/* + * Copyright (c) 2013, Oracle and/or its affiliates. All rights reserved. + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * This code is free software; you can redistribute it and/or modify it + * under the terms of the GNU General Public License version 2 only, as + * published by the Free Software Foundation. + * + * This code is distributed in the hope that it will be useful, but WITHOUT + * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or + * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License + * version 2 for more details (a copy is included in the LICENSE file that + * accompanied this code). + * + * You should have received a copy of the GNU General Public License version + * 2 along with this work; if not, write to the Free Software Foundation, + * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. + * + * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA + * or visit www.oracle.com if you need additional information or have any + * questions. + * + */ + +#include "precompiled.hpp" +#include "runtime/javaCalls.hpp" +#include "runtime/gpu.hpp" +#include "utilities/globalDefinitions.hpp" +#include "utilities/ostream.hpp" +#include "memory/allocation.hpp" +#include "memory/allocation.inline.hpp" +#include "hsailKernelArguments.hpp" + +void * gpu::Hsail::_device_context; + +gpu::Hsail::okra_ctx_create_func_t gpu::Hsail::_okra_ctx_create; +gpu::Hsail::okra_kernel_create_func_t gpu::Hsail::_okra_kernel_create; +gpu::Hsail::okra_push_object_func_t gpu::Hsail::_okra_push_object; +gpu::Hsail::okra_push_boolean_func_t gpu::Hsail::_okra_push_boolean; +gpu::Hsail::okra_push_byte_func_t gpu::Hsail::_okra_push_byte; +gpu::Hsail::okra_push_double_func_t gpu::Hsail::_okra_push_double; +gpu::Hsail::okra_push_float_func_t gpu::Hsail::_okra_push_float; +gpu::Hsail::okra_push_int_func_t gpu::Hsail::_okra_push_int; +gpu::Hsail::okra_push_long_func_t gpu::Hsail::_okra_push_long; +gpu::Hsail::okra_execute_with_range_func_t gpu::Hsail::_okra_execute_with_range; +gpu::Hsail::okra_clearargs_func_t gpu::Hsail::_okra_clearargs; +gpu::Hsail::okra_register_heap_func_t gpu::Hsail::_okra_register_heap; + + +bool gpu::Hsail::initialize_gpu() { + // All the initialization is done in the okra library so + // nothing to do here. + if (TraceGPUInteraction) { + tty->print_cr("[HSAIL] Simulator: initialize_gpu"); + } + return true; +} + +unsigned int gpu::Hsail::total_cores() { + // This is not important with simulator + return 1; +} + +void gpu::Hsail::register_heap() { + // After the okra functions are set up and the heap is initialized, register the java heap with HSA + guarantee(Universe::heap() != NULL, "heap should be there by now."); + if (TraceGPUInteraction) { + tty->print_cr("[HSAIL] heap=" PTR_FORMAT, Universe::heap()); + tty->print_cr("[HSAIL] base=0x%08x, capacity=%ld", Universe::heap()->base(), Universe::heap()->capacity()); + } + _okra_register_heap(Universe::heap()->base(), Universe::heap()->capacity()); +} + +bool gpu::Hsail::execute_kernel_void_1d(address kernel, int dimX, jobject args, methodHandle& mh) { + objArrayOop argsArray = (objArrayOop) JNIHandles::resolve(args); + + // Reset the kernel arguments + _okra_clearargs(kernel); + + // This object sets up the kernel arguments + HSAILKernelArguments hka(kernel, mh->signature(), argsArray, mh->is_static()); + + // Run the kernel + bool success = _okra_execute_with_range(kernel, dimX); + return success; +} + +void *gpu::Hsail::generate_kernel(unsigned char *code, int code_len, const char *name) { + + gpu::Hsail::register_heap(); + + // The kernel entrypoint is always run for the time being + const char* entryPointName = "&run"; + + _device_context = _okra_ctx_create(); + + // code is not null terminated, must be a better way to do this + unsigned char* nullTerminatedCodeBuffer = (unsigned char*) malloc(code_len + 1); + memcpy(nullTerminatedCodeBuffer, code, code_len); + nullTerminatedCodeBuffer[code_len] = 0; + void* kernel = _okra_kernel_create(_device_context, nullTerminatedCodeBuffer, entryPointName); + free(nullTerminatedCodeBuffer); + return kernel; +} + +#if defined(LINUX) +static const char okra_library_name[] = "libokra_x86_64.so"; +#elif defined (_WINDOWS) +static char const okra_library_name[] = "okra_x86_64.dll"; +#else +static char const okra_library_name[] = ""; +#endif + +#define STD_BUFFER_SIZE 1024 + +bool gpu::Hsail::probe_linkage() { + if (okra_library_name != NULL) { + char *buffer = (char*)malloc(STD_BUFFER_SIZE); + if (TraceGPUInteraction) { + tty->print_cr("[HSAIL] library is %s", okra_library_name); + } + void *handle = os::dll_load(okra_library_name, buffer, STD_BUFFER_SIZE); + free(buffer); + if (handle != NULL) { + + _okra_ctx_create = + CAST_TO_FN_PTR(okra_ctx_create_func_t, os::dll_lookup(handle, "okra_create_context")); + _okra_kernel_create = + CAST_TO_FN_PTR(okra_kernel_create_func_t, os::dll_lookup(handle, "okra_create_kernel")); + _okra_push_object = + CAST_TO_FN_PTR(okra_push_object_func_t, os::dll_lookup(handle, "okra_push_object")); + _okra_push_boolean = + CAST_TO_FN_PTR(okra_push_boolean_func_t, os::dll_lookup(handle, "okra_push_boolean")); + _okra_push_byte = + CAST_TO_FN_PTR(okra_push_byte_func_t, os::dll_lookup(handle, "okra_push_byte")); + _okra_push_double = + CAST_TO_FN_PTR(okra_push_double_func_t, os::dll_lookup(handle, "okra_push_double")); + _okra_push_float = + CAST_TO_FN_PTR(okra_push_float_func_t, os::dll_lookup(handle, "okra_push_float")); + _okra_push_int = + CAST_TO_FN_PTR(okra_push_int_func_t, os::dll_lookup(handle, "okra_push_int")); + _okra_push_long = + CAST_TO_FN_PTR(okra_push_long_func_t, os::dll_lookup(handle, "okra_push_long")); + _okra_execute_with_range = + CAST_TO_FN_PTR(okra_execute_with_range_func_t, os::dll_lookup(handle, "okra_execute_with_range")); + _okra_clearargs = + CAST_TO_FN_PTR(okra_clearargs_func_t, os::dll_lookup(handle, "okra_clearargs")); + _okra_register_heap = + CAST_TO_FN_PTR(okra_register_heap_func_t, os::dll_lookup(handle, "okra_register_heap")); + + if (TraceGPUInteraction) { + tty->print_cr("[HSAIL] Success: library linkage _okra_clearargs=0x%08x", _okra_clearargs); + } + return true; + } else { + // Unable to dlopen okra + tty->print_cr("[HSAIL] library load failed."); + return false; + } + } else { + tty->print_cr("Unsupported HSAIL platform"); + return false; + } + tty->print_cr("Failed to find HSAIL linkage"); + return false; +}