comparison src/gpu/ptx/vm/gpu_ptx.cpp @ 13832:ab370d74a8eb

implemented GC locking for the duration of a PTX kernel call
author Doug Simon <doug.simon@oracle.com>
date Thu, 30 Jan 2014 23:52:34 +0100
parents 49db2c1e3bee
children fe99bfb55626
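
The change takes a GC_locker critical section the first time pin_objects() actually pins something and releases it in the PtxCall destructor, guarded by the new _gc_locked flag so the unlock only happens if the lock was taken. The standalone sketch below illustrates that lock/unlock pairing; the Thread struct and the lock_critical/unlock_critical free functions are stand-ins for JavaThread and GC_locker::lock_critical/unlock_critical (not the real HotSpot API) so the example compiles outside the VM.

// Minimal sketch of the locking pattern used by this change, with stubs in
// place of HotSpot internals so it builds as an ordinary C++ program.
#include <cstdio>

struct Thread {};                          // stand-in for JavaThread
static void lock_critical(Thread*)   { std::printf("[CUDA] Locked GC\n"); }   // stand-in for GC_locker::lock_critical
static void unlock_critical(Thread*) { std::printf("[CUDA] Unlocked GC\n"); } // stand-in for GC_locker::unlock_critical

class PtxCallSketch {
  Thread* _thread;
  bool    _gc_locked;                      // only unlock what we actually locked

 public:
  explicit PtxCallSketch(Thread* thread) : _thread(thread), _gc_locked(false) {}

  void pin_objects(int count) {
    if (count == 0) {
      return;                              // nothing pinned, no need to block GC
    }
    lock_critical(_thread);                // no GC from here until the kernel completes
    _gc_locked = true;
    // ... pin each object argument for the GPU here ...
  }

  ~PtxCallSketch() {
    // ... unpin objects, free the return value, destroy the context ...
    if (_gc_locked) {
      unlock_critical(_thread);            // balances the lock taken in pin_objects()
    }
  }
};

int main() {
  Thread t;
  PtxCallSketch call(&t);
  call.pin_objects(2);                     // locks; the destructor unlocks at end of scope
  return 0;
}

Because the unlock lives in the destructor, every exit path out of the kernel call, including the error paths behind the TRY macro, releases the GC lock exactly once.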
comparing 13831:d6823d127f76 with 13832:ab370d74a8eb

diff -r d6823d127f76 -r ab370d74a8eb src/gpu/ptx/vm/gpu_ptx.cpp
@@ -27,10 +27,11 @@
 #include "runtime/gpu.hpp"
 #include "utilities/globalDefinitions.hpp"
 #include "utilities/ostream.hpp"
 #include "memory/allocation.hpp"
 #include "memory/allocation.inline.hpp"
+#include "memory/gcLocker.inline.hpp"
 #include "runtime/interfaceSupport.hpp"
 #include "graal/graalEnv.hpp"
 #include "graal/graalCompiler.hpp"
 #include "ptxKernelArguments.hpp"
 
@@ -402,10 +403,11 @@
   oop* _pinned;                     // objects that have been pinned with cuMemHostRegister
   int _pinned_length;               // length of _pinned
   gpu::Ptx::CUdeviceptr _ret_value; // pointer to slot in GPU memory holding the return value
   int _ret_type_size;               // size of the return type value
   bool _ret_is_object;              // specifies if the return type is Object
+  bool _gc_locked;
 
   bool check(int status, const char *action) {
     if (status != GRAAL_CUDA_SUCCESS) {
       Thread* THREAD = _thread;
       char* message = NEW_RESOURCE_ARRAY_IN_THREAD(THREAD, char, O_BUFLEN + 1);
@@ -423,11 +425,11 @@
     }
     return true;
   }
 
  public:
-  PtxCall(JavaThread* thread, address buffer, int buffer_size, oop* pinned, int encodedReturnTypeSize) : _thread(thread),
+  PtxCall(JavaThread* thread, address buffer, int buffer_size, oop* pinned, int encodedReturnTypeSize) : _thread(thread), _gc_locked(false),
     _buffer(buffer), _buffer_size(buffer_size), _pinned(pinned), _pinned_length(0), _ret_value(0), _ret_is_object(encodedReturnTypeSize < 0) {
     _ret_type_size = _ret_is_object ? -encodedReturnTypeSize : encodedReturnTypeSize;
   }
 
   bool is_object_return() { return _ret_is_object; }
@@ -443,10 +445,20 @@
 
   void pin_objects(int count, int* objectOffsets) {
     if (count == 0) {
       return;
     }
+    // Once we start pinning objects, no GC must occur
+    // until the kernel has completed. This is a big
+    // hammer for ensuring we can safely pass objects
+    // to the GPU.
+    GC_locker::lock_critical(_thread);
+    _gc_locked = true;
+    if (TraceGPUInteraction) {
+      tty->print_cr("[CUDA] Locked GC");
+    }
+
     for (int i = 0; i < count; i++) {
       int offset = objectOffsets[i];
       oop* argPtr = (oop*) (_buffer + offset);
       oop obj = *argPtr;
       if (obj != NULL) {
@@ -529,10 +541,16 @@
 
   ~PtxCall() {
     unpin_objects();
     free_return_value();
     destroy_context();
+    if (_gc_locked) {
+      GC_locker::unlock_critical(_thread);
+      if (TraceGPUInteraction) {
+        tty->print_cr("[CUDA] Unlocked GC");
+      }
+    }
   }
 };
 
 GPU_VMENTRY(jlong, gpu::Ptx::get_execute_kernel_from_vm_address, (JNIEnv *env, jclass))
   return (jlong) gpu::Ptx::execute_kernel_from_vm;
@@ -547,14 +565,10 @@
     int encodedReturnTypeSize))
   if (kernel == 0L) {
     SharedRuntime::throw_and_post_jvmti_exception(thread, vmSymbols::java_lang_NullPointerException(), NULL);
     return 0L;
   }
-
-#if 0
-  Universe::heap()->collect(GCCause::_jvmti_force_gc);
-#endif
 
   PtxCall call(thread, (address) buffer, bufferSize, (oop*) (address) pinnedObjects, encodedReturnTypeSize);
 
 #define TRY(action) do { \
   action; \