view graal/com.oracle.graal.compiler.ptx.test/src/com/oracle/graal/compiler/ptx/test/PTXTestBase.java @ 13229:325b4e4efb60

added CompilationResultBuilderFactory to support peep-hole instrumentation of methods as their code is emitted
author Doug Simon <doug.simon@oracle.com>
date Tue, 03 Dec 2013 16:33:41 +0100
parents 4568980f7257
children bb35fc7e0d68
line wrap: on
line source

/*
 * Copyright (c) 2013, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 */
package com.oracle.graal.compiler.ptx.test;

import static com.oracle.graal.api.code.CodeUtil.*;

import java.lang.annotation.*;
import java.lang.reflect.*;

import com.oracle.graal.api.code.*;
import com.oracle.graal.api.code.CallingConvention.Type;
import com.oracle.graal.api.meta.*;
import com.oracle.graal.compiler.*;
import com.oracle.graal.compiler.target.*;
import com.oracle.graal.compiler.test.*;
import com.oracle.graal.debug.*;
import com.oracle.graal.hotspot.*;
import com.oracle.graal.hotspot.bridge.*;
import com.oracle.graal.hotspot.meta.*;
import com.oracle.graal.hotspot.ptx.*;
import com.oracle.graal.java.*;
import com.oracle.graal.lir.asm.*;
import com.oracle.graal.lir.ptx.*;
import com.oracle.graal.nodes.*;
import com.oracle.graal.phases.*;
import com.oracle.graal.phases.PhasePlan.PhasePosition;
import com.oracle.graal.phases.tiers.*;
import com.oracle.graal.ptx.*;

public abstract class PTXTestBase extends GraalCompilerTest {

    private StructuredGraph sg;

    public static void printReport(String message) {
        // Use -G:Log=Test to see these messages on the console
        Debug.log(message);
    }

    public PTXTestBase() {
        super(PTX.class);
    }

    private static CompilerToGPU toGPU = HotSpotGraalRuntime.runtime().getCompilerToGPU();

    private static boolean validDevice = toGPU.deviceInit();

    private static final int totalProcessors = (validDevice ? toGPU.availableProcessors() : 0);

    protected CompilationResult compile(String test) {
        if (getBackend() instanceof PTXHotSpotBackend) {
            StructuredGraph graph = parse(test);
            sg = graph;
            Debug.dump(graph, "Graph");
            Backend ptxBackend = getBackend();
            TargetDescription target = ptxBackend.getTarget();
            PhasePlan phasePlan = new PhasePlan();
            GraphBuilderPhase graphBuilderPhase = new GraphBuilderPhase(getMetaAccess(), getForeignCalls(), GraphBuilderConfiguration.getDefault(), OptimisticOptimizations.NONE);
            phasePlan.addPhase(PhasePosition.AFTER_PARSING, graphBuilderPhase);
            phasePlan.addPhase(PhasePosition.AFTER_PARSING, new PTXPhase());
            new PTXPhase().apply(graph);
            CallingConvention cc = getCallingConvention(getCodeCache(), Type.JavaCallee, graph.method(), false);
            /*
             * Use Suites.createDefaultSuites() instead of GraalCompilerTest.suites. The
             * GraalCompilerTest.suites variable contains the Suites for the HotSpotRuntime. This
             * code will not run on hotspot, so it should use the plain Graal default suites,
             * without hotspot specific phases.
             * 
             * Ultimately we might want to have both the kernel and the code natively compiled for
             * GPU fallback to CPU in cases of ECC failure on kernel invocation.
             */
            Suites suites = Suites.createDefaultSuites();
            ExternalCompilationResult result = GraalCompiler.compileGraph(graph, cc, graph.method(), getProviders(), ptxBackend, target, null, phasePlan, OptimisticOptimizations.NONE,
                            new SpeculationLog(), suites, true, new ExternalCompilationResult(), CompilationResultBuilderFactory.Default);

            ResolvedJavaMethod method = graph.method();

            try {
                if ((validDevice) && (result.getTargetCode() != null)) {
                    long kernel = toGPU.generateKernel(result.getTargetCode(), method.getName());
                    result.setEntryPoint(kernel);
                }
            } catch (Throwable th) {
                th.printStackTrace();
            }

            return result;
        } else {
            return null;
        }
    }

    protected StructuredGraph getStructuredGraph() {
        return sg;
    }

    protected Object invoke(CompilationResult result, Object... args) {
        if (result == null) {
            return null;
        }
        try {
            if (((ExternalCompilationResult) result).getEntryPoint() == 0) {
                Debug.dump(result, "[CUDA] *** Null entry point - Not launching kernel");
                return null;
            }

            /* Check if the method compiled is static */
            HotSpotResolvedJavaMethod compiledMethod = (HotSpotResolvedJavaMethod) sg.method();
            boolean isStatic = Modifier.isStatic(compiledMethod.getModifiers());
            Object[] executeArgs = argsWithReceiver((isStatic ? null : this), args);
            HotSpotCodeCacheProvider codeCache = (HotSpotCodeCacheProvider) getCodeCache();
            InstalledCode installedCode = codeCache.addExternalMethod(compiledMethod, result);
            Annotation[][] params = compiledMethod.getParameterAnnotations();

            int dimensionX = 1;
            int dimensionY = 1;
            int dimensionZ = 1;

            for (int p = 0; p < params.length; p++) {
                Annotation[] annos = params[p];
                if (annos != null) {
                    for (int a = 0; a < annos.length; a++) {
                        Annotation aa = annos[a];
                        if (args[p] instanceof int[] && aa.annotationType().equals(ParallelOver.class)) {
                            int[] iarray = (int[]) args[p];
                            ParallelOver threadBlockDimension = (ParallelOver) aa;
                            switch (threadBlockDimension.dimension()) {
                                case X:
                                    dimensionX = iarray.length;
                                    break;
                                case Y:
                                    dimensionY = iarray.length;
                                    break;
                                case Z:
                                    dimensionZ = iarray.length;
                                    break;
                            }
                        }
                    }
                }
            }
            Object r;
            if (dimensionX != 1 || dimensionY != 1 || dimensionZ != 1) {
                /*
                 * for now assert that the warp array block is no larger than the number of physical
                 * gpu cores.
                 */
                assert dimensionX * dimensionY * dimensionZ < totalProcessors;

                r = ((HotSpotNmethod) installedCode).executeParallel(dimensionX, dimensionY, dimensionZ, executeArgs);
            } else {
                r = installedCode.executeVarargs(executeArgs);
            }
            return r;
        } catch (Throwable th) {
            th.printStackTrace();
            return null;
        }
    }
}