truffle: src/share/vm/opto/divnode.cpp comparison

comparison src/share/vm/opto/divnode.cpp @ 570:dca06e7f503d

Merge

author	kvn
date	Tue, 17 Feb 2009 14:30:24 -0800
parents	30663ca5e8f4
children	98cb887364d3

comparison

equal deleted inserted replaced

-:fe3d7c11b4b7
+:dca06e7f503d
 /*
-* Copyright 1997-2008 Sun Microsystems, Inc.  All Rights Reserved.
+* Copyright 1997-2009 Sun Microsystems, Inc.  All Rights Reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 return true;
 }
 //---------------------long_by_long_mulhi--------------------------------------
 // Generate ideal node graph for upper half of a 64 bit x 64 bit multiplication
-static Node *long_by_long_mulhi( PhaseGVN *phase, Node *dividend, jlong magic_const) {
+static Node* long_by_long_mulhi(PhaseGVN* phase, Node* dividend, jlong magic_const) {
 // If the architecture supports a 64x64 mulhi, there is
 // no need to synthesize it in ideal nodes.
 if (Matcher::has_match_rule(Op_MulHiL)) {
-Node *v = phase->longcon(magic_const);
+Node* v = phase->longcon(magic_const);
 return new (phase->C, 3) MulHiLNode(dividend, v);
 }
+// Taken from Hacker's Delight, Fig. 8-2. Multiply high signed.
+// (http://www.hackersdelight.org/HDcode/mulhs.c)
+//
+// int mulhs(int u, int v) {
+//    unsigned u0, v0, w0;
+//    int u1, v1, w1, w2, t;
+//
+//    u0 = u & 0xFFFF;  u1 = u >> 16;
+//    v0 = v & 0xFFFF;  v1 = v >> 16;
+//    w0 = u0*v0;
+//    t  = u1*v0 + (w0 >> 16);
+//    w1 = t & 0xFFFF;
+//    w2 = t >> 16;
+//    w1 = u0*v1 + w1;
+//    return u1*v1 + w2 + (w1 >> 16);
+// }
+//
+// Note: The version above is for 32x32 multiplications, while the
+// following inline comments are adapted to 64x64.
 const int N = 64;
-Node *u_hi = phase->transform(new (phase->C, 3) RShiftLNode(dividend, phase->intcon(N / 2)));
+// u0 = u & 0xFFFFFFFF;  u1 = u >> 32;
-Node *u_lo = phase->transform(new (phase->C, 3) AndLNode(dividend, phase->longcon(0xFFFFFFFF)));
+Node* u0 = phase->transform(new (phase->C, 3) AndLNode(dividend, phase->longcon(0xFFFFFFFF)));
+Node* u1 = phase->transform(new (phase->C, 3) RShiftLNode(dividend, phase->intcon(N / 2)));
-Node *v_hi = phase->longcon(magic_const >> N/2);
-Node *v_lo = phase->longcon(magic_const & 0XFFFFFFFF);
+// v0 = v & 0xFFFFFFFF;  v1 = v >> 32;
+Node* v0 = phase->longcon(magic_const & 0xFFFFFFFF);
-Node *hihi_product = phase->transform(new (phase->C, 3) MulLNode(u_hi, v_hi));
+Node* v1 = phase->longcon(magic_const >> (N / 2));
-Node *hilo_product = phase->transform(new (phase->C, 3) MulLNode(u_hi, v_lo));
-Node *lohi_product = phase->transform(new (phase->C, 3) MulLNode(u_lo, v_hi));
+// w0 = u0*v0;
-Node *lolo_product = phase->transform(new (phase->C, 3) MulLNode(u_lo, v_lo));
+Node* w0 = phase->transform(new (phase->C, 3) MulLNode(u0, v0));
-Node *t1 = phase->transform(new (phase->C, 3) URShiftLNode(lolo_product, phase->intcon(N / 2)));
+// t = u1*v0 + (w0 >> 32);
-Node *t2 = phase->transform(new (phase->C, 3) AddLNode(hilo_product, t1));
+Node* u1v0 = phase->transform(new (phase->C, 3) MulLNode(u1, v0));
+Node* temp = phase->transform(new (phase->C, 3) URShiftLNode(w0, phase->intcon(N / 2)));
-// Construct both t3 and t4 before transforming so t2 doesn't go dead
+Node* t    = phase->transform(new (phase->C, 3) AddLNode(u1v0, temp));
-// prematurely.
-Node *t3 = new (phase->C, 3) RShiftLNode(t2, phase->intcon(N / 2));
+// w1 = t & 0xFFFFFFFF;
-Node *t4 = new (phase->C, 3) AndLNode(t2, phase->longcon(0xFFFFFFFF));
+Node* w1 = new (phase->C, 3) AndLNode(t, phase->longcon(0xFFFFFFFF));
-t3 = phase->transform(t3);
-t4 = phase->transform(t4);
+// w2 = t >> 32;
+Node* w2 = new (phase->C, 3) RShiftLNode(t, phase->intcon(N / 2));
-Node *t5 = phase->transform(new (phase->C, 3) AddLNode(t4, lohi_product));
-Node *t6 = phase->transform(new (phase->C, 3) RShiftLNode(t5, phase->intcon(N / 2)));
+// 6732154: Construct both w1 and w2 before transforming, so t
-Node *t7 = phase->transform(new (phase->C, 3) AddLNode(t3, hihi_product));
+// doesn't go dead prematurely.
+w1 = phase->transform(w1);
-return new (phase->C, 3) AddLNode(t7, t6);
+w2 = phase->transform(w2);
+// w1 = u0*v1 + w1;
+Node* u0v1 = phase->transform(new (phase->C, 3) MulLNode(u0, v1));
+w1         = phase->transform(new (phase->C, 3) AddLNode(u0v1, w1));
+// return u1*v1 + w2 + (w1 >> 32);
+Node* u1v1  = phase->transform(new (phase->C, 3) MulLNode(u1, v1));
+Node* temp1 = phase->transform(new (phase->C, 3) AddLNode(u1v1, w2));
+Node* temp2 = phase->transform(new (phase->C, 3) RShiftLNode(w1, phase->intcon(N / 2)));
+return new (phase->C, 3) AddLNode(temp1, temp2);
 }
 //--------------------------transform_long_divide------------------------------
 // Convert a division by constant divisor into an alternate Ideal graph.
 Node *hook = new (phase->C, 1) Node(1);
 // Expand mod
 if( con >= 0 && con < max_jlong && is_power_of_2_long(con+1) ) {
-uint k = log2_long(con);       // Extract k
+uint k = exact_log2_long(con+1);  // Extract k
 // Basic algorithm by David Detlefs.  See fastmod_long.java for gory details.
 // Used to help a popular random number generator which does a long-mod
 // of 2^31-1 and shows up in SpecJBB and SciMark.
 static int unroll_factor[] = { 999, 999, 61, 30, 20, 15, 12, 10, 8, 7, 6, 6, 5, 5, 4, 4, 4, 3, 3, 3, 3, 3, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1 /*past here we assume 1 forever*/};

Mercurial > hg > truffle

comparison src/share/vm/opto/divnode.cpp @ 570:dca06e7f503d