annotate src/share/vm/opto/divnode.cpp @ 1552:c18cbe5936b8

6941466: Oracle rebranding changes for Hotspot repositories
Summary: Change all the Sun copyrights to Oracle copyright
Reviewed-by: ohair
author trims
date Thu, 27 May 2010 19:08:38 -0700
parents 174ade00803b
children ae065c367d93
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1 /*
1552
c18cbe5936b8 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 1154
diff changeset
2 * Copyright (c) 1997, 2009, Oracle and/or its affiliates. All rights reserved.
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
a61af66fc99e Initial load
duke
parents:
diff changeset
4 *
a61af66fc99e Initial load
duke
parents:
diff changeset
5 * This code is free software; you can redistribute it and/or modify it
a61af66fc99e Initial load
duke
parents:
diff changeset
6 * under the terms of the GNU General Public License version 2 only, as
a61af66fc99e Initial load
duke
parents:
diff changeset
7 * published by the Free Software Foundation.
a61af66fc99e Initial load
duke
parents:
diff changeset
8 *
a61af66fc99e Initial load
duke
parents:
diff changeset
9 * This code is distributed in the hope that it will be useful, but WITHOUT
a61af66fc99e Initial load
duke
parents:
diff changeset
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
a61af66fc99e Initial load
duke
parents:
diff changeset
11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
a61af66fc99e Initial load
duke
parents:
diff changeset
12 * version 2 for more details (a copy is included in the LICENSE file that
a61af66fc99e Initial load
duke
parents:
diff changeset
13 * accompanied this code).
a61af66fc99e Initial load
duke
parents:
diff changeset
14 *
a61af66fc99e Initial load
duke
parents:
diff changeset
15 * You should have received a copy of the GNU General Public License version
a61af66fc99e Initial load
duke
parents:
diff changeset
16 * 2 along with this work; if not, write to the Free Software Foundation,
a61af66fc99e Initial load
duke
parents:
diff changeset
17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
a61af66fc99e Initial load
duke
parents:
diff changeset
18 *
1552
c18cbe5936b8 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 1154
diff changeset
19 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
c18cbe5936b8 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 1154
diff changeset
20 * or visit www.oracle.com if you need additional information or have any
c18cbe5936b8 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 1154
diff changeset
21 * questions.
0
a61af66fc99e Initial load
duke
parents:
diff changeset
22 *
a61af66fc99e Initial load
duke
parents:
diff changeset
23 */
a61af66fc99e Initial load
duke
parents:
diff changeset
24
a61af66fc99e Initial load
duke
parents:
diff changeset
25 // Portions of code courtesy of Clifford Click
a61af66fc99e Initial load
duke
parents:
diff changeset
26
a61af66fc99e Initial load
duke
parents:
diff changeset
27 // Optimization - Graph Style
a61af66fc99e Initial load
duke
parents:
diff changeset
28
a61af66fc99e Initial load
duke
parents:
diff changeset
29 #include "incls/_precompiled.incl"
a61af66fc99e Initial load
duke
parents:
diff changeset
30 #include "incls/_divnode.cpp.incl"
a61af66fc99e Initial load
duke
parents:
diff changeset
31 #include <math.h>
a61af66fc99e Initial load
duke
parents:
diff changeset
32
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
33 //----------------------magic_int_divide_constants-----------------------------
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
34 // Compute magic multiplier and shift constant for converting a 32 bit divide
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
35 // by constant into a multiply/shift/add series. Return false if calculations
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
36 // fail.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
37 //
605
98cb887364d3 6810672: Comment typos
twisti
parents: 568
diff changeset
38 // Borrowed almost verbatim from Hacker's Delight by Henry S. Warren, Jr. with
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
39 // minor type name and parameter changes.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
40 static bool magic_int_divide_constants(jint d, jint &M, jint &s) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
41 int32_t p;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
42 uint32_t ad, anc, delta, q1, r1, q2, r2, t;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
43 const uint32_t two31 = 0x80000000L; // 2**31.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
44
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
45 ad = ABS(d);
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
46 if (d == 0 || d == 1) return false;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
47 t = two31 + ((uint32_t)d >> 31);
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
48 anc = t - 1 - t%ad; // Absolute value of nc.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
49 p = 31; // Init. p.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
50 q1 = two31/anc; // Init. q1 = 2**p/|nc|.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
51 r1 = two31 - q1*anc; // Init. r1 = rem(2**p, |nc|).
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
52 q2 = two31/ad; // Init. q2 = 2**p/|d|.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
53 r2 = two31 - q2*ad; // Init. r2 = rem(2**p, |d|).
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
54 do {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
55 p = p + 1;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
56 q1 = 2*q1; // Update q1 = 2**p/|nc|.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
57 r1 = 2*r1; // Update r1 = rem(2**p, |nc|).
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
58 if (r1 >= anc) { // (Must be an unsigned
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
59 q1 = q1 + 1; // comparison here).
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
60 r1 = r1 - anc;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
61 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
62 q2 = 2*q2; // Update q2 = 2**p/|d|.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
63 r2 = 2*r2; // Update r2 = rem(2**p, |d|).
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
64 if (r2 >= ad) { // (Must be an unsigned
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
65 q2 = q2 + 1; // comparison here).
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
66 r2 = r2 - ad;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
67 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
68 delta = ad - r2;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
69 } while (q1 < delta || (q1 == delta && r1 == 0));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
70
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
71 M = q2 + 1;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
72 if (d < 0) M = -M; // Magic number and
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
73 s = p - 32; // shift amount to return.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
74
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
75 return true;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
76 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
77
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
78 //--------------------------transform_int_divide-------------------------------
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
79 // Convert a division by constant divisor into an alternate Ideal graph.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
80 // Return NULL if no transformation occurs.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
81 static Node *transform_int_divide( PhaseGVN *phase, Node *dividend, jint divisor ) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
82
a61af66fc99e Initial load
duke
parents:
diff changeset
83 // Check for invalid divisors
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
84 assert( divisor != 0 && divisor != min_jint,
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
85 "bad divisor for transforming to long multiply" );
0
a61af66fc99e Initial load
duke
parents:
diff changeset
86
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
87 bool d_pos = divisor >= 0;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
88 jint d = d_pos ? divisor : -divisor;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
89 const int N = 32;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
90
a61af66fc99e Initial load
duke
parents:
diff changeset
91 // Result
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
92 Node *q = NULL;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
93
a61af66fc99e Initial load
duke
parents:
diff changeset
94 if (d == 1) {
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
95 // division by +/- 1
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
96 if (!d_pos) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
97 // Just negate the value
0
a61af66fc99e Initial load
duke
parents:
diff changeset
98 q = new (phase->C, 3) SubINode(phase->intcon(0), dividend);
a61af66fc99e Initial load
duke
parents:
diff changeset
99 }
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
100 } else if ( is_power_of_2(d) ) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
101 // division by +/- a power of 2
0
a61af66fc99e Initial load
duke
parents:
diff changeset
102
a61af66fc99e Initial load
duke
parents:
diff changeset
103 // See if we can simply do a shift without rounding
a61af66fc99e Initial load
duke
parents:
diff changeset
104 bool needs_rounding = true;
a61af66fc99e Initial load
duke
parents:
diff changeset
105 const Type *dt = phase->type(dividend);
a61af66fc99e Initial load
duke
parents:
diff changeset
106 const TypeInt *dti = dt->isa_int();
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
107 if (dti && dti->_lo >= 0) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
108 // we don't need to round a positive dividend
0
a61af66fc99e Initial load
duke
parents:
diff changeset
109 needs_rounding = false;
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
110 } else if( dividend->Opcode() == Op_AndI ) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
111 // An AND mask of sufficient size clears the low bits and
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
112 // I can avoid rounding.
400
cc80376deb0c 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 305
diff changeset
113 const TypeInt *andconi_t = phase->type( dividend->in(2) )->isa_int();
cc80376deb0c 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 305
diff changeset
114 if( andconi_t && andconi_t->is_con() ) {
cc80376deb0c 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 305
diff changeset
115 jint andconi = andconi_t->get_con();
cc80376deb0c 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 305
diff changeset
116 if( andconi < 0 && is_power_of_2(-andconi) && (-andconi) >= d ) {
1154
174ade00803b 6910484: incorrect integer optimization (loosing and op-r in a given example)
kvn
parents: 756
diff changeset
117 if( (-andconi) == d ) // Remove AND if it clears bits which will be shifted
174ade00803b 6910484: incorrect integer optimization (loosing and op-r in a given example)
kvn
parents: 756
diff changeset
118 dividend = dividend->in(1);
400
cc80376deb0c 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 305
diff changeset
119 needs_rounding = false;
cc80376deb0c 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 305
diff changeset
120 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
121 }
a61af66fc99e Initial load
duke
parents:
diff changeset
122 }
a61af66fc99e Initial load
duke
parents:
diff changeset
123
a61af66fc99e Initial load
duke
parents:
diff changeset
124 // Add rounding to the shift to handle the sign bit
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
125 int l = log2_intptr(d-1)+1;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
126 if (needs_rounding) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
127 // Divide-by-power-of-2 can be made into a shift, but you have to do
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
128 // more math for the rounding. You need to add 0 for positive
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
129 // numbers, and "i-1" for negative numbers. Example: i=4, so the
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
130 // shift is by 2. You need to add 3 to negative dividends and 0 to
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
131 // positive ones. So (-7+3)>>2 becomes -1, (-4+3)>>2 becomes -1,
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
132 // (-2+3)>>2 becomes 0, etc.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
133
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
134 // Compute 0 or -1, based on sign bit
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
135 Node *sign = phase->transform(new (phase->C, 3) RShiftINode(dividend, phase->intcon(N - 1)));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
136 // Mask sign bit to the low sign bits
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
137 Node *round = phase->transform(new (phase->C, 3) URShiftINode(sign, phase->intcon(N - l)));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
138 // Round up before shifting
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
139 dividend = phase->transform(new (phase->C, 3) AddINode(dividend, round));
0
a61af66fc99e Initial load
duke
parents:
diff changeset
140 }
a61af66fc99e Initial load
duke
parents:
diff changeset
141
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
142 // Shift for division
0
a61af66fc99e Initial load
duke
parents:
diff changeset
143 q = new (phase->C, 3) RShiftINode(dividend, phase->intcon(l));
a61af66fc99e Initial load
duke
parents:
diff changeset
144
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
145 if (!d_pos) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
146 q = new (phase->C, 3) SubINode(phase->intcon(0), phase->transform(q));
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
147 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
148 } else {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
149 // Attempt the jint constant divide -> multiply transform found in
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
150 // "Division by Invariant Integers using Multiplication"
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
151 // by Granlund and Montgomery
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
152 // See also "Hacker's Delight", chapter 10 by Warren.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
153
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
154 jint magic_const;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
155 jint shift_const;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
156 if (magic_int_divide_constants(d, magic_const, shift_const)) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
157 Node *magic = phase->longcon(magic_const);
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
158 Node *dividend_long = phase->transform(new (phase->C, 2) ConvI2LNode(dividend));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
159
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
160 // Compute the high half of the dividend x magic multiplication
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
161 Node *mul_hi = phase->transform(new (phase->C, 3) MulLNode(dividend_long, magic));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
162
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
163 if (magic_const < 0) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
164 mul_hi = phase->transform(new (phase->C, 3) RShiftLNode(mul_hi, phase->intcon(N)));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
165 mul_hi = phase->transform(new (phase->C, 2) ConvL2INode(mul_hi));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
166
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
167 // The magic multiplier is too large for a 32 bit constant. We've adjusted
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
168 // it down by 2^32, but have to add 1 dividend back in after the multiplication.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
169 // This handles the "overflow" case described by Granlund and Montgomery.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
170 mul_hi = phase->transform(new (phase->C, 3) AddINode(dividend, mul_hi));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
171
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
172 // Shift over the (adjusted) mulhi
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
173 if (shift_const != 0) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
174 mul_hi = phase->transform(new (phase->C, 3) RShiftINode(mul_hi, phase->intcon(shift_const)));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
175 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
176 } else {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
177 // No add is required, we can merge the shifts together.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
178 mul_hi = phase->transform(new (phase->C, 3) RShiftLNode(mul_hi, phase->intcon(N + shift_const)));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
179 mul_hi = phase->transform(new (phase->C, 2) ConvL2INode(mul_hi));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
180 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
181
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
182 // Get a 0 or -1 from the sign of the dividend.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
183 Node *addend0 = mul_hi;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
184 Node *addend1 = phase->transform(new (phase->C, 3) RShiftINode(dividend, phase->intcon(N-1)));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
185
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
186 // If the divisor is negative, swap the order of the input addends;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
187 // this has the effect of negating the quotient.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
188 if (!d_pos) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
189 Node *temp = addend0; addend0 = addend1; addend1 = temp;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
190 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
191
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
192 // Adjust the final quotient by subtracting -1 (adding 1)
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
193 // from the mul_hi.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
194 q = new (phase->C, 3) SubINode(addend0, addend1);
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
195 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
196 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
197
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
198 return q;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
199 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
200
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
201 //---------------------magic_long_divide_constants-----------------------------
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
202 // Compute magic multiplier and shift constant for converting a 64 bit divide
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
203 // by constant into a multiply/shift/add series. Return false if calculations
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
204 // fail.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
205 //
605
98cb887364d3 6810672: Comment typos
twisti
parents: 568
diff changeset
206 // Borrowed almost verbatim from Hacker's Delight by Henry S. Warren, Jr. with
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
207 // minor type name and parameter changes. Adjusted to 64 bit word width.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
208 static bool magic_long_divide_constants(jlong d, jlong &M, jint &s) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
209 int64_t p;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
210 uint64_t ad, anc, delta, q1, r1, q2, r2, t;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
211 const uint64_t two63 = 0x8000000000000000LL; // 2**63.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
212
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
213 ad = ABS(d);
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
214 if (d == 0 || d == 1) return false;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
215 t = two63 + ((uint64_t)d >> 63);
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
216 anc = t - 1 - t%ad; // Absolute value of nc.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
217 p = 63; // Init. p.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
218 q1 = two63/anc; // Init. q1 = 2**p/|nc|.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
219 r1 = two63 - q1*anc; // Init. r1 = rem(2**p, |nc|).
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
220 q2 = two63/ad; // Init. q2 = 2**p/|d|.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
221 r2 = two63 - q2*ad; // Init. r2 = rem(2**p, |d|).
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
222 do {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
223 p = p + 1;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
224 q1 = 2*q1; // Update q1 = 2**p/|nc|.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
225 r1 = 2*r1; // Update r1 = rem(2**p, |nc|).
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
226 if (r1 >= anc) { // (Must be an unsigned
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
227 q1 = q1 + 1; // comparison here).
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
228 r1 = r1 - anc;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
229 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
230 q2 = 2*q2; // Update q2 = 2**p/|d|.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
231 r2 = 2*r2; // Update r2 = rem(2**p, |d|).
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
232 if (r2 >= ad) { // (Must be an unsigned
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
233 q2 = q2 + 1; // comparison here).
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
234 r2 = r2 - ad;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
235 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
236 delta = ad - r2;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
237 } while (q1 < delta || (q1 == delta && r1 == 0));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
238
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
239 M = q2 + 1;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
240 if (d < 0) M = -M; // Magic number and
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
241 s = p - 64; // shift amount to return.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
242
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
243 return true;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
244 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
245
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
246 //---------------------long_by_long_mulhi--------------------------------------
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
247 // Generate ideal node graph for upper half of a 64 bit x 64 bit multiplication
567
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
248 static Node* long_by_long_mulhi(PhaseGVN* phase, Node* dividend, jlong magic_const) {
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
249 // If the architecture supports a 64x64 mulhi, there is
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
250 // no need to synthesize it in ideal nodes.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
251 if (Matcher::has_match_rule(Op_MulHiL)) {
567
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
252 Node* v = phase->longcon(magic_const);
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
253 return new (phase->C, 3) MulHiLNode(dividend, v);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
254 }
a61af66fc99e Initial load
duke
parents:
diff changeset
255
567
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
256 // Taken from Hacker's Delight, Fig. 8-2. Multiply high signed.
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
257 // (http://www.hackersdelight.org/HDcode/mulhs.c)
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
258 //
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
259 // int mulhs(int u, int v) {
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
260 // unsigned u0, v0, w0;
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
261 // int u1, v1, w1, w2, t;
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
262 //
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
263 // u0 = u & 0xFFFF; u1 = u >> 16;
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
264 // v0 = v & 0xFFFF; v1 = v >> 16;
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
265 // w0 = u0*v0;
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
266 // t = u1*v0 + (w0 >> 16);
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
267 // w1 = t & 0xFFFF;
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
268 // w2 = t >> 16;
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
269 // w1 = u0*v1 + w1;
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
270 // return u1*v1 + w2 + (w1 >> 16);
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
271 // }
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
272 //
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
273 // Note: The version above is for 32x32 multiplications, while the
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
274 // following inline comments are adapted to 64x64.
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
275
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
276 const int N = 64;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
277
567
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
278 // u0 = u & 0xFFFFFFFF; u1 = u >> 32;
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
279 Node* u0 = phase->transform(new (phase->C, 3) AndLNode(dividend, phase->longcon(0xFFFFFFFF)));
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
280 Node* u1 = phase->transform(new (phase->C, 3) RShiftLNode(dividend, phase->intcon(N / 2)));
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
281
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
282 // v0 = v & 0xFFFFFFFF; v1 = v >> 32;
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
283 Node* v0 = phase->longcon(magic_const & 0xFFFFFFFF);
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
284 Node* v1 = phase->longcon(magic_const >> (N / 2));
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
285
567
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
286 // w0 = u0*v0;
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
287 Node* w0 = phase->transform(new (phase->C, 3) MulLNode(u0, v0));
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
288
567
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
289 // t = u1*v0 + (w0 >> 32);
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
290 Node* u1v0 = phase->transform(new (phase->C, 3) MulLNode(u1, v0));
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
291 Node* temp = phase->transform(new (phase->C, 3) URShiftLNode(w0, phase->intcon(N / 2)));
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
292 Node* t = phase->transform(new (phase->C, 3) AddLNode(u1v0, temp));
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
293
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
294 // w1 = t & 0xFFFFFFFF;
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
295 Node* w1 = new (phase->C, 3) AndLNode(t, phase->longcon(0xFFFFFFFF));
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
296
567
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
297 // w2 = t >> 32;
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
298 Node* w2 = new (phase->C, 3) RShiftLNode(t, phase->intcon(N / 2));
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
299
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
300 // 6732154: Construct both w1 and w2 before transforming, so t
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
301 // doesn't go dead prematurely.
756
cecd04fc6f93 6837011: SIGSEGV in PhaseIdealLoop in 32bit jvm
twisti
parents: 605
diff changeset
302 // 6837011: We need to transform w2 before w1 because the
cecd04fc6f93 6837011: SIGSEGV in PhaseIdealLoop in 32bit jvm
twisti
parents: 605
diff changeset
303 // transformation of w1 could return t.
cecd04fc6f93 6837011: SIGSEGV in PhaseIdealLoop in 32bit jvm
twisti
parents: 605
diff changeset
304 w2 = phase->transform(w2);
567
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
305 w1 = phase->transform(w1);
294
616a07a75c3c 6732154: REG: Printing an Image using image/gif doc flavor crashes the VM, Solsparc
rasbold
parents: 196
diff changeset
306
567
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
307 // w1 = u0*v1 + w1;
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
308 Node* u0v1 = phase->transform(new (phase->C, 3) MulLNode(u0, v1));
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
309 w1 = phase->transform(new (phase->C, 3) AddLNode(u0v1, w1));
294
616a07a75c3c 6732154: REG: Printing an Image using image/gif doc flavor crashes the VM, Solsparc
rasbold
parents: 196
diff changeset
310
567
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
311 // return u1*v1 + w2 + (w1 >> 32);
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
312 Node* u1v1 = phase->transform(new (phase->C, 3) MulLNode(u1, v1));
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
313 Node* temp1 = phase->transform(new (phase->C, 3) AddLNode(u1v1, w2));
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
314 Node* temp2 = phase->transform(new (phase->C, 3) RShiftLNode(w1, phase->intcon(N / 2)));
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
315
567
bbef4344adb2 6800154: Add comments to long_by_long_mulhi() for better understandability
twisti
parents: 404
diff changeset
316 return new (phase->C, 3) AddLNode(temp1, temp2);
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
317 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
318
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
319
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
320 //--------------------------transform_long_divide------------------------------
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
321 // Convert a division by constant divisor into an alternate Ideal graph.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
322 // Return NULL if no transformation occurs.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
323 static Node *transform_long_divide( PhaseGVN *phase, Node *dividend, jlong divisor ) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
324 // Check for invalid divisors
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
325 assert( divisor != 0L && divisor != min_jlong,
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
326 "bad divisor for transforming to long multiply" );
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
327
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
328 bool d_pos = divisor >= 0;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
329 jlong d = d_pos ? divisor : -divisor;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
330 const int N = 64;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
331
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
332 // Result
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
333 Node *q = NULL;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
334
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
335 if (d == 1) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
336 // division by +/- 1
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
337 if (!d_pos) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
338 // Just negate the value
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
339 q = new (phase->C, 3) SubLNode(phase->longcon(0), dividend);
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
340 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
341 } else if ( is_power_of_2_long(d) ) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
342
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
343 // division by +/- a power of 2
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
344
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
345 // See if we can simply do a shift without rounding
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
346 bool needs_rounding = true;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
347 const Type *dt = phase->type(dividend);
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
348 const TypeLong *dtl = dt->isa_long();
0
a61af66fc99e Initial load
duke
parents:
diff changeset
349
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
350 if (dtl && dtl->_lo > 0) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
351 // we don't need to round a positive dividend
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
352 needs_rounding = false;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
353 } else if( dividend->Opcode() == Op_AndL ) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
354 // An AND mask of sufficient size clears the low bits and
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
355 // I can avoid rounding.
400
cc80376deb0c 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 305
diff changeset
356 const TypeLong *andconl_t = phase->type( dividend->in(2) )->isa_long();
cc80376deb0c 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 305
diff changeset
357 if( andconl_t && andconl_t->is_con() ) {
cc80376deb0c 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 305
diff changeset
358 jlong andconl = andconl_t->get_con();
cc80376deb0c 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 305
diff changeset
359 if( andconl < 0 && is_power_of_2_long(-andconl) && (-andconl) >= d ) {
1154
174ade00803b 6910484: incorrect integer optimization (loosing and op-r in a given example)
kvn
parents: 756
diff changeset
360 if( (-andconl) == d ) // Remove AND if it clears bits which will be shifted
174ade00803b 6910484: incorrect integer optimization (loosing and op-r in a given example)
kvn
parents: 756
diff changeset
361 dividend = dividend->in(1);
400
cc80376deb0c 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 305
diff changeset
362 needs_rounding = false;
cc80376deb0c 6667595: Set probability FAIR for pre-, post- loops and ALWAYS for main loop
kvn
parents: 305
diff changeset
363 }
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
364 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
365 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
366
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
367 // Add rounding to the shift to handle the sign bit
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
368 int l = log2_long(d-1)+1;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
369 if (needs_rounding) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
370 // Divide-by-power-of-2 can be made into a shift, but you have to do
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
371 // more math for the rounding. You need to add 0 for positive
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
372 // numbers, and "i-1" for negative numbers. Example: i=4, so the
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
373 // shift is by 2. You need to add 3 to negative dividends and 0 to
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
374 // positive ones. So (-7+3)>>2 becomes -1, (-4+3)>>2 becomes -1,
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
375 // (-2+3)>>2 becomes 0, etc.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
376
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
377 // Compute 0 or -1, based on sign bit
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
378 Node *sign = phase->transform(new (phase->C, 3) RShiftLNode(dividend, phase->intcon(N - 1)));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
379 // Mask sign bit to the low sign bits
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
380 Node *round = phase->transform(new (phase->C, 3) URShiftLNode(sign, phase->intcon(N - l)));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
381 // Round up before shifting
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
382 dividend = phase->transform(new (phase->C, 3) AddLNode(dividend, round));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
383 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
384
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
385 // Shift for division
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
386 q = new (phase->C, 3) RShiftLNode(dividend, phase->intcon(l));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
387
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
388 if (!d_pos) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
389 q = new (phase->C, 3) SubLNode(phase->longcon(0), phase->transform(q));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
390 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
391 } else {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
392 // Attempt the jlong constant divide -> multiply transform found in
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
393 // "Division by Invariant Integers using Multiplication"
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
394 // by Granlund and Montgomery
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
395 // See also "Hacker's Delight", chapter 10 by Warren.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
396
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
397 jlong magic_const;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
398 jint shift_const;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
399 if (magic_long_divide_constants(d, magic_const, shift_const)) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
400 // Compute the high half of the dividend x magic multiplication
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
401 Node *mul_hi = phase->transform(long_by_long_mulhi(phase, dividend, magic_const));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
402
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
403 // The high half of the 128-bit multiply is computed.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
404 if (magic_const < 0) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
405 // The magic multiplier is too large for a 64 bit constant. We've adjusted
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
406 // it down by 2^64, but have to add 1 dividend back in after the multiplication.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
407 // This handles the "overflow" case described by Granlund and Montgomery.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
408 mul_hi = phase->transform(new (phase->C, 3) AddLNode(dividend, mul_hi));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
409 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
410
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
411 // Shift over the (adjusted) mulhi
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
412 if (shift_const != 0) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
413 mul_hi = phase->transform(new (phase->C, 3) RShiftLNode(mul_hi, phase->intcon(shift_const)));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
414 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
415
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
416 // Get a 0 or -1 from the sign of the dividend.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
417 Node *addend0 = mul_hi;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
418 Node *addend1 = phase->transform(new (phase->C, 3) RShiftLNode(dividend, phase->intcon(N-1)));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
419
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
420 // If the divisor is negative, swap the order of the input addends;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
421 // this has the effect of negating the quotient.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
422 if (!d_pos) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
423 Node *temp = addend0; addend0 = addend1; addend1 = temp;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
424 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
425
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
426 // Adjust the final quotient by subtracting -1 (adding 1)
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
427 // from the mul_hi.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
428 q = new (phase->C, 3) SubLNode(addend0, addend1);
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
429 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
430 }
a61af66fc99e Initial load
duke
parents:
diff changeset
431
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
432 return q;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
433 }
a61af66fc99e Initial load
duke
parents:
diff changeset
434
a61af66fc99e Initial load
duke
parents:
diff changeset
435 //=============================================================================
a61af66fc99e Initial load
duke
parents:
diff changeset
436 //------------------------------Identity---------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
437 // If the divisor is 1, we are an identity on the dividend.
a61af66fc99e Initial load
duke
parents:
diff changeset
438 Node *DivINode::Identity( PhaseTransform *phase ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
439 return (phase->type( in(2) )->higher_equal(TypeInt::ONE)) ? in(1) : this;
a61af66fc99e Initial load
duke
parents:
diff changeset
440 }
a61af66fc99e Initial load
duke
parents:
diff changeset
441
a61af66fc99e Initial load
duke
parents:
diff changeset
442 //------------------------------Idealize---------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
443 // Divides can be changed to multiplies and/or shifts
a61af66fc99e Initial load
duke
parents:
diff changeset
444 Node *DivINode::Ideal(PhaseGVN *phase, bool can_reshape) {
a61af66fc99e Initial load
duke
parents:
diff changeset
445 if (in(0) && remove_dead_region(phase, can_reshape)) return this;
305
ab075d07f1ba 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 294
diff changeset
446 // Don't bother trying to transform a dead node
ab075d07f1ba 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 294
diff changeset
447 if( in(0) && in(0)->is_top() ) return NULL;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
448
a61af66fc99e Initial load
duke
parents:
diff changeset
449 const Type *t = phase->type( in(2) );
a61af66fc99e Initial load
duke
parents:
diff changeset
450 if( t == TypeInt::ONE ) // Identity?
a61af66fc99e Initial load
duke
parents:
diff changeset
451 return NULL; // Skip it
a61af66fc99e Initial load
duke
parents:
diff changeset
452
a61af66fc99e Initial load
duke
parents:
diff changeset
453 const TypeInt *ti = t->isa_int();
a61af66fc99e Initial load
duke
parents:
diff changeset
454 if( !ti ) return NULL;
a61af66fc99e Initial load
duke
parents:
diff changeset
455 if( !ti->is_con() ) return NULL;
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
456 jint i = ti->get_con(); // Get divisor
0
a61af66fc99e Initial load
duke
parents:
diff changeset
457
a61af66fc99e Initial load
duke
parents:
diff changeset
458 if (i == 0) return NULL; // Dividing by zero constant does not idealize
a61af66fc99e Initial load
duke
parents:
diff changeset
459
a61af66fc99e Initial load
duke
parents:
diff changeset
460 set_req(0,NULL); // Dividing by a not-zero constant; no faulting
a61af66fc99e Initial load
duke
parents:
diff changeset
461
a61af66fc99e Initial load
duke
parents:
diff changeset
462 // Dividing by MININT does not optimize as a power-of-2 shift.
a61af66fc99e Initial load
duke
parents:
diff changeset
463 if( i == min_jint ) return NULL;
a61af66fc99e Initial load
duke
parents:
diff changeset
464
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
465 return transform_int_divide( phase, in(1), i );
0
a61af66fc99e Initial load
duke
parents:
diff changeset
466 }
a61af66fc99e Initial load
duke
parents:
diff changeset
467
a61af66fc99e Initial load
duke
parents:
diff changeset
468 //------------------------------Value------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
469 // A DivINode divides its inputs. The third input is a Control input, used to
a61af66fc99e Initial load
duke
parents:
diff changeset
470 // prevent hoisting the divide above an unsafe test.
a61af66fc99e Initial load
duke
parents:
diff changeset
471 const Type *DivINode::Value( PhaseTransform *phase ) const {
a61af66fc99e Initial load
duke
parents:
diff changeset
472 // Either input is TOP ==> the result is TOP
a61af66fc99e Initial load
duke
parents:
diff changeset
473 const Type *t1 = phase->type( in(1) );
a61af66fc99e Initial load
duke
parents:
diff changeset
474 const Type *t2 = phase->type( in(2) );
a61af66fc99e Initial load
duke
parents:
diff changeset
475 if( t1 == Type::TOP ) return Type::TOP;
a61af66fc99e Initial load
duke
parents:
diff changeset
476 if( t2 == Type::TOP ) return Type::TOP;
a61af66fc99e Initial load
duke
parents:
diff changeset
477
a61af66fc99e Initial load
duke
parents:
diff changeset
478 // x/x == 1 since we always generate the dynamic divisor check for 0.
a61af66fc99e Initial load
duke
parents:
diff changeset
479 if( phase->eqv( in(1), in(2) ) )
a61af66fc99e Initial load
duke
parents:
diff changeset
480 return TypeInt::ONE;
a61af66fc99e Initial load
duke
parents:
diff changeset
481
a61af66fc99e Initial load
duke
parents:
diff changeset
482 // Either input is BOTTOM ==> the result is the local BOTTOM
a61af66fc99e Initial load
duke
parents:
diff changeset
483 const Type *bot = bottom_type();
a61af66fc99e Initial load
duke
parents:
diff changeset
484 if( (t1 == bot) || (t2 == bot) ||
a61af66fc99e Initial load
duke
parents:
diff changeset
485 (t1 == Type::BOTTOM) || (t2 == Type::BOTTOM) )
a61af66fc99e Initial load
duke
parents:
diff changeset
486 return bot;
a61af66fc99e Initial load
duke
parents:
diff changeset
487
a61af66fc99e Initial load
duke
parents:
diff changeset
488 // Divide the two numbers. We approximate.
a61af66fc99e Initial load
duke
parents:
diff changeset
489 // If divisor is a constant and not zero
a61af66fc99e Initial load
duke
parents:
diff changeset
490 const TypeInt *i1 = t1->is_int();
a61af66fc99e Initial load
duke
parents:
diff changeset
491 const TypeInt *i2 = t2->is_int();
a61af66fc99e Initial load
duke
parents:
diff changeset
492 int widen = MAX2(i1->_widen, i2->_widen);
a61af66fc99e Initial load
duke
parents:
diff changeset
493
a61af66fc99e Initial load
duke
parents:
diff changeset
494 if( i2->is_con() && i2->get_con() != 0 ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
495 int32 d = i2->get_con(); // Divisor
a61af66fc99e Initial load
duke
parents:
diff changeset
496 jint lo, hi;
a61af66fc99e Initial load
duke
parents:
diff changeset
497 if( d >= 0 ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
498 lo = i1->_lo/d;
a61af66fc99e Initial load
duke
parents:
diff changeset
499 hi = i1->_hi/d;
a61af66fc99e Initial load
duke
parents:
diff changeset
500 } else {
a61af66fc99e Initial load
duke
parents:
diff changeset
501 if( d == -1 && i1->_lo == min_jint ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
502 // 'min_jint/-1' throws arithmetic exception during compilation
a61af66fc99e Initial load
duke
parents:
diff changeset
503 lo = min_jint;
a61af66fc99e Initial load
duke
parents:
diff changeset
504 // do not support holes, 'hi' must go to either min_jint or max_jint:
a61af66fc99e Initial load
duke
parents:
diff changeset
505 // [min_jint, -10]/[-1,-1] ==> [min_jint] UNION [10,max_jint]
a61af66fc99e Initial load
duke
parents:
diff changeset
506 hi = i1->_hi == min_jint ? min_jint : max_jint;
a61af66fc99e Initial load
duke
parents:
diff changeset
507 } else {
a61af66fc99e Initial load
duke
parents:
diff changeset
508 lo = i1->_hi/d;
a61af66fc99e Initial load
duke
parents:
diff changeset
509 hi = i1->_lo/d;
a61af66fc99e Initial load
duke
parents:
diff changeset
510 }
a61af66fc99e Initial load
duke
parents:
diff changeset
511 }
a61af66fc99e Initial load
duke
parents:
diff changeset
512 return TypeInt::make(lo, hi, widen);
a61af66fc99e Initial load
duke
parents:
diff changeset
513 }
a61af66fc99e Initial load
duke
parents:
diff changeset
514
a61af66fc99e Initial load
duke
parents:
diff changeset
515 // If the dividend is a constant
a61af66fc99e Initial load
duke
parents:
diff changeset
516 if( i1->is_con() ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
517 int32 d = i1->get_con();
a61af66fc99e Initial load
duke
parents:
diff changeset
518 if( d < 0 ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
519 if( d == min_jint ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
520 // (-min_jint) == min_jint == (min_jint / -1)
a61af66fc99e Initial load
duke
parents:
diff changeset
521 return TypeInt::make(min_jint, max_jint/2 + 1, widen);
a61af66fc99e Initial load
duke
parents:
diff changeset
522 } else {
a61af66fc99e Initial load
duke
parents:
diff changeset
523 return TypeInt::make(d, -d, widen);
a61af66fc99e Initial load
duke
parents:
diff changeset
524 }
a61af66fc99e Initial load
duke
parents:
diff changeset
525 }
a61af66fc99e Initial load
duke
parents:
diff changeset
526 return TypeInt::make(-d, d, widen);
a61af66fc99e Initial load
duke
parents:
diff changeset
527 }
a61af66fc99e Initial load
duke
parents:
diff changeset
528
a61af66fc99e Initial load
duke
parents:
diff changeset
529 // Otherwise we give up all hope
a61af66fc99e Initial load
duke
parents:
diff changeset
530 return TypeInt::INT;
a61af66fc99e Initial load
duke
parents:
diff changeset
531 }
a61af66fc99e Initial load
duke
parents:
diff changeset
532
a61af66fc99e Initial load
duke
parents:
diff changeset
533
a61af66fc99e Initial load
duke
parents:
diff changeset
534 //=============================================================================
a61af66fc99e Initial load
duke
parents:
diff changeset
535 //------------------------------Identity---------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
536 // If the divisor is 1, we are an identity on the dividend.
a61af66fc99e Initial load
duke
parents:
diff changeset
537 Node *DivLNode::Identity( PhaseTransform *phase ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
538 return (phase->type( in(2) )->higher_equal(TypeLong::ONE)) ? in(1) : this;
a61af66fc99e Initial load
duke
parents:
diff changeset
539 }
a61af66fc99e Initial load
duke
parents:
diff changeset
540
a61af66fc99e Initial load
duke
parents:
diff changeset
541 //------------------------------Idealize---------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
542 // Dividing by a power of 2 is a shift.
a61af66fc99e Initial load
duke
parents:
diff changeset
543 Node *DivLNode::Ideal( PhaseGVN *phase, bool can_reshape) {
a61af66fc99e Initial load
duke
parents:
diff changeset
544 if (in(0) && remove_dead_region(phase, can_reshape)) return this;
305
ab075d07f1ba 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 294
diff changeset
545 // Don't bother trying to transform a dead node
ab075d07f1ba 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 294
diff changeset
546 if( in(0) && in(0)->is_top() ) return NULL;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
547
a61af66fc99e Initial load
duke
parents:
diff changeset
548 const Type *t = phase->type( in(2) );
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
549 if( t == TypeLong::ONE ) // Identity?
0
a61af66fc99e Initial load
duke
parents:
diff changeset
550 return NULL; // Skip it
a61af66fc99e Initial load
duke
parents:
diff changeset
551
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
552 const TypeLong *tl = t->isa_long();
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
553 if( !tl ) return NULL;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
554 if( !tl->is_con() ) return NULL;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
555 jlong l = tl->get_con(); // Get divisor
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
556
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
557 if (l == 0) return NULL; // Dividing by zero constant does not idealize
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
558
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
559 set_req(0,NULL); // Dividing by a not-zero constant; no faulting
0
a61af66fc99e Initial load
duke
parents:
diff changeset
560
a61af66fc99e Initial load
duke
parents:
diff changeset
561 // Dividing by min_jlong does not optimize as a power-of-2 shift.
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
562 if( l == min_jlong ) return NULL;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
563
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
564 return transform_long_divide( phase, in(1), l );
0
a61af66fc99e Initial load
duke
parents:
diff changeset
565 }
a61af66fc99e Initial load
duke
parents:
diff changeset
566
a61af66fc99e Initial load
duke
parents:
diff changeset
567 //------------------------------Value------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
568 // A DivLNode divides its inputs. The third input is a Control input, used to
a61af66fc99e Initial load
duke
parents:
diff changeset
569 // prevent hoisting the divide above an unsafe test.
a61af66fc99e Initial load
duke
parents:
diff changeset
570 const Type *DivLNode::Value( PhaseTransform *phase ) const {
a61af66fc99e Initial load
duke
parents:
diff changeset
571 // Either input is TOP ==> the result is TOP
a61af66fc99e Initial load
duke
parents:
diff changeset
572 const Type *t1 = phase->type( in(1) );
a61af66fc99e Initial load
duke
parents:
diff changeset
573 const Type *t2 = phase->type( in(2) );
a61af66fc99e Initial load
duke
parents:
diff changeset
574 if( t1 == Type::TOP ) return Type::TOP;
a61af66fc99e Initial load
duke
parents:
diff changeset
575 if( t2 == Type::TOP ) return Type::TOP;
a61af66fc99e Initial load
duke
parents:
diff changeset
576
a61af66fc99e Initial load
duke
parents:
diff changeset
577 // x/x == 1 since we always generate the dynamic divisor check for 0.
a61af66fc99e Initial load
duke
parents:
diff changeset
578 if( phase->eqv( in(1), in(2) ) )
a61af66fc99e Initial load
duke
parents:
diff changeset
579 return TypeLong::ONE;
a61af66fc99e Initial load
duke
parents:
diff changeset
580
a61af66fc99e Initial load
duke
parents:
diff changeset
581 // Either input is BOTTOM ==> the result is the local BOTTOM
a61af66fc99e Initial load
duke
parents:
diff changeset
582 const Type *bot = bottom_type();
a61af66fc99e Initial load
duke
parents:
diff changeset
583 if( (t1 == bot) || (t2 == bot) ||
a61af66fc99e Initial load
duke
parents:
diff changeset
584 (t1 == Type::BOTTOM) || (t2 == Type::BOTTOM) )
a61af66fc99e Initial load
duke
parents:
diff changeset
585 return bot;
a61af66fc99e Initial load
duke
parents:
diff changeset
586
a61af66fc99e Initial load
duke
parents:
diff changeset
587 // Divide the two numbers. We approximate.
a61af66fc99e Initial load
duke
parents:
diff changeset
588 // If divisor is a constant and not zero
a61af66fc99e Initial load
duke
parents:
diff changeset
589 const TypeLong *i1 = t1->is_long();
a61af66fc99e Initial load
duke
parents:
diff changeset
590 const TypeLong *i2 = t2->is_long();
a61af66fc99e Initial load
duke
parents:
diff changeset
591 int widen = MAX2(i1->_widen, i2->_widen);
a61af66fc99e Initial load
duke
parents:
diff changeset
592
a61af66fc99e Initial load
duke
parents:
diff changeset
593 if( i2->is_con() && i2->get_con() != 0 ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
594 jlong d = i2->get_con(); // Divisor
a61af66fc99e Initial load
duke
parents:
diff changeset
595 jlong lo, hi;
a61af66fc99e Initial load
duke
parents:
diff changeset
596 if( d >= 0 ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
597 lo = i1->_lo/d;
a61af66fc99e Initial load
duke
parents:
diff changeset
598 hi = i1->_hi/d;
a61af66fc99e Initial load
duke
parents:
diff changeset
599 } else {
a61af66fc99e Initial load
duke
parents:
diff changeset
600 if( d == CONST64(-1) && i1->_lo == min_jlong ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
601 // 'min_jlong/-1' throws arithmetic exception during compilation
a61af66fc99e Initial load
duke
parents:
diff changeset
602 lo = min_jlong;
a61af66fc99e Initial load
duke
parents:
diff changeset
603 // do not support holes, 'hi' must go to either min_jlong or max_jlong:
a61af66fc99e Initial load
duke
parents:
diff changeset
604 // [min_jlong, -10]/[-1,-1] ==> [min_jlong] UNION [10,max_jlong]
a61af66fc99e Initial load
duke
parents:
diff changeset
605 hi = i1->_hi == min_jlong ? min_jlong : max_jlong;
a61af66fc99e Initial load
duke
parents:
diff changeset
606 } else {
a61af66fc99e Initial load
duke
parents:
diff changeset
607 lo = i1->_hi/d;
a61af66fc99e Initial load
duke
parents:
diff changeset
608 hi = i1->_lo/d;
a61af66fc99e Initial load
duke
parents:
diff changeset
609 }
a61af66fc99e Initial load
duke
parents:
diff changeset
610 }
a61af66fc99e Initial load
duke
parents:
diff changeset
611 return TypeLong::make(lo, hi, widen);
a61af66fc99e Initial load
duke
parents:
diff changeset
612 }
a61af66fc99e Initial load
duke
parents:
diff changeset
613
a61af66fc99e Initial load
duke
parents:
diff changeset
614 // If the dividend is a constant
a61af66fc99e Initial load
duke
parents:
diff changeset
615 if( i1->is_con() ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
616 jlong d = i1->get_con();
a61af66fc99e Initial load
duke
parents:
diff changeset
617 if( d < 0 ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
618 if( d == min_jlong ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
619 // (-min_jlong) == min_jlong == (min_jlong / -1)
a61af66fc99e Initial load
duke
parents:
diff changeset
620 return TypeLong::make(min_jlong, max_jlong/2 + 1, widen);
a61af66fc99e Initial load
duke
parents:
diff changeset
621 } else {
a61af66fc99e Initial load
duke
parents:
diff changeset
622 return TypeLong::make(d, -d, widen);
a61af66fc99e Initial load
duke
parents:
diff changeset
623 }
a61af66fc99e Initial load
duke
parents:
diff changeset
624 }
a61af66fc99e Initial load
duke
parents:
diff changeset
625 return TypeLong::make(-d, d, widen);
a61af66fc99e Initial load
duke
parents:
diff changeset
626 }
a61af66fc99e Initial load
duke
parents:
diff changeset
627
a61af66fc99e Initial load
duke
parents:
diff changeset
628 // Otherwise we give up all hope
a61af66fc99e Initial load
duke
parents:
diff changeset
629 return TypeLong::LONG;
a61af66fc99e Initial load
duke
parents:
diff changeset
630 }
a61af66fc99e Initial load
duke
parents:
diff changeset
631
a61af66fc99e Initial load
duke
parents:
diff changeset
632
a61af66fc99e Initial load
duke
parents:
diff changeset
633 //=============================================================================
a61af66fc99e Initial load
duke
parents:
diff changeset
634 //------------------------------Value------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
635 // A DivFNode divides its inputs. The third input is a Control input, used to
a61af66fc99e Initial load
duke
parents:
diff changeset
636 // prevent hoisting the divide above an unsafe test.
a61af66fc99e Initial load
duke
parents:
diff changeset
637 const Type *DivFNode::Value( PhaseTransform *phase ) const {
a61af66fc99e Initial load
duke
parents:
diff changeset
638 // Either input is TOP ==> the result is TOP
a61af66fc99e Initial load
duke
parents:
diff changeset
639 const Type *t1 = phase->type( in(1) );
a61af66fc99e Initial load
duke
parents:
diff changeset
640 const Type *t2 = phase->type( in(2) );
a61af66fc99e Initial load
duke
parents:
diff changeset
641 if( t1 == Type::TOP ) return Type::TOP;
a61af66fc99e Initial load
duke
parents:
diff changeset
642 if( t2 == Type::TOP ) return Type::TOP;
a61af66fc99e Initial load
duke
parents:
diff changeset
643
a61af66fc99e Initial load
duke
parents:
diff changeset
644 // Either input is BOTTOM ==> the result is the local BOTTOM
a61af66fc99e Initial load
duke
parents:
diff changeset
645 const Type *bot = bottom_type();
a61af66fc99e Initial load
duke
parents:
diff changeset
646 if( (t1 == bot) || (t2 == bot) ||
a61af66fc99e Initial load
duke
parents:
diff changeset
647 (t1 == Type::BOTTOM) || (t2 == Type::BOTTOM) )
a61af66fc99e Initial load
duke
parents:
diff changeset
648 return bot;
a61af66fc99e Initial load
duke
parents:
diff changeset
649
a61af66fc99e Initial load
duke
parents:
diff changeset
650 // x/x == 1, we ignore 0/0.
a61af66fc99e Initial load
duke
parents:
diff changeset
651 // Note: if t1 and t2 are zero then result is NaN (JVMS page 213)
131
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
652 // Does not work for variables because of NaN's
0
a61af66fc99e Initial load
duke
parents:
diff changeset
653 if( phase->eqv( in(1), in(2) ) && t1->base() == Type::FloatCon)
a61af66fc99e Initial load
duke
parents:
diff changeset
654 if (!g_isnan(t1->getf()) && g_isfinite(t1->getf()) && t1->getf() != 0.0) // could be negative ZERO or NaN
a61af66fc99e Initial load
duke
parents:
diff changeset
655 return TypeF::ONE;
a61af66fc99e Initial load
duke
parents:
diff changeset
656
a61af66fc99e Initial load
duke
parents:
diff changeset
657 if( t2 == TypeF::ONE )
a61af66fc99e Initial load
duke
parents:
diff changeset
658 return t1;
a61af66fc99e Initial load
duke
parents:
diff changeset
659
a61af66fc99e Initial load
duke
parents:
diff changeset
660 // If both inputs are constants and the divisor is not zero, divide the numbers
a61af66fc99e Initial load
duke
parents:
diff changeset
661 if( t1->base() == Type::FloatCon &&
a61af66fc99e Initial load
duke
parents:
diff changeset
662 t2->base() == Type::FloatCon &&
a61af66fc99e Initial load
duke
parents:
diff changeset
663 t2->getf() != 0.0 ) // could be negative zero
a61af66fc99e Initial load
duke
parents:
diff changeset
664 return TypeF::make( t1->getf()/t2->getf() );
a61af66fc99e Initial load
duke
parents:
diff changeset
665
a61af66fc99e Initial load
duke
parents:
diff changeset
666 // If the dividend is a constant zero
a61af66fc99e Initial load
duke
parents:
diff changeset
667 // Note: if t1 and t2 are zero then result is NaN (JVMS page 213)
a61af66fc99e Initial load
duke
parents:
diff changeset
668 // Test TypeF::ZERO is not sufficient as it could be negative zero
a61af66fc99e Initial load
duke
parents:
diff changeset
669
a61af66fc99e Initial load
duke
parents:
diff changeset
670 if( t1 == TypeF::ZERO && !g_isnan(t2->getf()) && t2->getf() != 0.0 )
a61af66fc99e Initial load
duke
parents:
diff changeset
671 return TypeF::ZERO;
a61af66fc99e Initial load
duke
parents:
diff changeset
672
a61af66fc99e Initial load
duke
parents:
diff changeset
673 // Otherwise we give up all hope
a61af66fc99e Initial load
duke
parents:
diff changeset
674 return Type::FLOAT;
a61af66fc99e Initial load
duke
parents:
diff changeset
675 }
a61af66fc99e Initial load
duke
parents:
diff changeset
676
a61af66fc99e Initial load
duke
parents:
diff changeset
677 //------------------------------Identity---------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
678 // Dividing by self is 1.
a61af66fc99e Initial load
duke
parents:
diff changeset
679 // If the divisor is 1, we are an identity on the dividend.
a61af66fc99e Initial load
duke
parents:
diff changeset
680 Node *DivFNode::Identity( PhaseTransform *phase ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
681 return (phase->type( in(2) ) == TypeF::ONE) ? in(1) : this;
a61af66fc99e Initial load
duke
parents:
diff changeset
682 }
a61af66fc99e Initial load
duke
parents:
diff changeset
683
a61af66fc99e Initial load
duke
parents:
diff changeset
684
a61af66fc99e Initial load
duke
parents:
diff changeset
685 //------------------------------Idealize---------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
686 Node *DivFNode::Ideal(PhaseGVN *phase, bool can_reshape) {
a61af66fc99e Initial load
duke
parents:
diff changeset
687 if (in(0) && remove_dead_region(phase, can_reshape)) return this;
305
ab075d07f1ba 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 294
diff changeset
688 // Don't bother trying to transform a dead node
ab075d07f1ba 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 294
diff changeset
689 if( in(0) && in(0)->is_top() ) return NULL;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
690
a61af66fc99e Initial load
duke
parents:
diff changeset
691 const Type *t2 = phase->type( in(2) );
a61af66fc99e Initial load
duke
parents:
diff changeset
692 if( t2 == TypeF::ONE ) // Identity?
a61af66fc99e Initial load
duke
parents:
diff changeset
693 return NULL; // Skip it
a61af66fc99e Initial load
duke
parents:
diff changeset
694
a61af66fc99e Initial load
duke
parents:
diff changeset
695 const TypeF *tf = t2->isa_float_constant();
a61af66fc99e Initial load
duke
parents:
diff changeset
696 if( !tf ) return NULL;
a61af66fc99e Initial load
duke
parents:
diff changeset
697 if( tf->base() != Type::FloatCon ) return NULL;
a61af66fc99e Initial load
duke
parents:
diff changeset
698
a61af66fc99e Initial load
duke
parents:
diff changeset
699 // Check for out of range values
a61af66fc99e Initial load
duke
parents:
diff changeset
700 if( tf->is_nan() || !tf->is_finite() ) return NULL;
a61af66fc99e Initial load
duke
parents:
diff changeset
701
a61af66fc99e Initial load
duke
parents:
diff changeset
702 // Get the value
a61af66fc99e Initial load
duke
parents:
diff changeset
703 float f = tf->getf();
a61af66fc99e Initial load
duke
parents:
diff changeset
704 int exp;
a61af66fc99e Initial load
duke
parents:
diff changeset
705
a61af66fc99e Initial load
duke
parents:
diff changeset
706 // Only for special case of dividing by a power of 2
a61af66fc99e Initial load
duke
parents:
diff changeset
707 if( frexp((double)f, &exp) != 0.5 ) return NULL;
a61af66fc99e Initial load
duke
parents:
diff changeset
708
a61af66fc99e Initial load
duke
parents:
diff changeset
709 // Limit the range of acceptable exponents
a61af66fc99e Initial load
duke
parents:
diff changeset
710 if( exp < -126 || exp > 126 ) return NULL;
a61af66fc99e Initial load
duke
parents:
diff changeset
711
a61af66fc99e Initial load
duke
parents:
diff changeset
712 // Compute the reciprocal
a61af66fc99e Initial load
duke
parents:
diff changeset
713 float reciprocal = ((float)1.0) / f;
a61af66fc99e Initial load
duke
parents:
diff changeset
714
a61af66fc99e Initial load
duke
parents:
diff changeset
715 assert( frexp((double)reciprocal, &exp) == 0.5, "reciprocal should be power of 2" );
a61af66fc99e Initial load
duke
parents:
diff changeset
716
a61af66fc99e Initial load
duke
parents:
diff changeset
717 // return multiplication by the reciprocal
a61af66fc99e Initial load
duke
parents:
diff changeset
718 return (new (phase->C, 3) MulFNode(in(1), phase->makecon(TypeF::make(reciprocal))));
a61af66fc99e Initial load
duke
parents:
diff changeset
719 }
a61af66fc99e Initial load
duke
parents:
diff changeset
720
a61af66fc99e Initial load
duke
parents:
diff changeset
721 //=============================================================================
a61af66fc99e Initial load
duke
parents:
diff changeset
722 //------------------------------Value------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
723 // A DivDNode divides its inputs. The third input is a Control input, used to
131
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
724 // prevent hoisting the divide above an unsafe test.
0
a61af66fc99e Initial load
duke
parents:
diff changeset
725 const Type *DivDNode::Value( PhaseTransform *phase ) const {
a61af66fc99e Initial load
duke
parents:
diff changeset
726 // Either input is TOP ==> the result is TOP
a61af66fc99e Initial load
duke
parents:
diff changeset
727 const Type *t1 = phase->type( in(1) );
a61af66fc99e Initial load
duke
parents:
diff changeset
728 const Type *t2 = phase->type( in(2) );
a61af66fc99e Initial load
duke
parents:
diff changeset
729 if( t1 == Type::TOP ) return Type::TOP;
a61af66fc99e Initial load
duke
parents:
diff changeset
730 if( t2 == Type::TOP ) return Type::TOP;
a61af66fc99e Initial load
duke
parents:
diff changeset
731
a61af66fc99e Initial load
duke
parents:
diff changeset
732 // Either input is BOTTOM ==> the result is the local BOTTOM
a61af66fc99e Initial load
duke
parents:
diff changeset
733 const Type *bot = bottom_type();
a61af66fc99e Initial load
duke
parents:
diff changeset
734 if( (t1 == bot) || (t2 == bot) ||
a61af66fc99e Initial load
duke
parents:
diff changeset
735 (t1 == Type::BOTTOM) || (t2 == Type::BOTTOM) )
a61af66fc99e Initial load
duke
parents:
diff changeset
736 return bot;
a61af66fc99e Initial load
duke
parents:
diff changeset
737
a61af66fc99e Initial load
duke
parents:
diff changeset
738 // x/x == 1, we ignore 0/0.
a61af66fc99e Initial load
duke
parents:
diff changeset
739 // Note: if t1 and t2 are zero then result is NaN (JVMS page 213)
a61af66fc99e Initial load
duke
parents:
diff changeset
740 // Does not work for variables because of NaN's
a61af66fc99e Initial load
duke
parents:
diff changeset
741 if( phase->eqv( in(1), in(2) ) && t1->base() == Type::DoubleCon)
a61af66fc99e Initial load
duke
parents:
diff changeset
742 if (!g_isnan(t1->getd()) && g_isfinite(t1->getd()) && t1->getd() != 0.0) // could be negative ZERO or NaN
a61af66fc99e Initial load
duke
parents:
diff changeset
743 return TypeD::ONE;
a61af66fc99e Initial load
duke
parents:
diff changeset
744
a61af66fc99e Initial load
duke
parents:
diff changeset
745 if( t2 == TypeD::ONE )
a61af66fc99e Initial load
duke
parents:
diff changeset
746 return t1;
a61af66fc99e Initial load
duke
parents:
diff changeset
747
404
78c058bc5cdc 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 400
diff changeset
748 #if defined(IA32)
78c058bc5cdc 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 400
diff changeset
749 if (!phase->C->method()->is_strict())
78c058bc5cdc 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 400
diff changeset
750 // Can't trust native compilers to properly fold strict double
78c058bc5cdc 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 400
diff changeset
751 // division with round-to-zero on this platform.
78c058bc5cdc 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 400
diff changeset
752 #endif
78c058bc5cdc 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 400
diff changeset
753 {
78c058bc5cdc 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 400
diff changeset
754 // If both inputs are constants and the divisor is not zero, divide the numbers
78c058bc5cdc 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 400
diff changeset
755 if( t1->base() == Type::DoubleCon &&
78c058bc5cdc 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 400
diff changeset
756 t2->base() == Type::DoubleCon &&
78c058bc5cdc 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 400
diff changeset
757 t2->getd() != 0.0 ) // could be negative zero
78c058bc5cdc 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 400
diff changeset
758 return TypeD::make( t1->getd()/t2->getd() );
78c058bc5cdc 6717150: improper constant folding of subnormal strictfp multiplications and divides
rasbold
parents: 400
diff changeset
759 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
760
a61af66fc99e Initial load
duke
parents:
diff changeset
761 // If the dividend is a constant zero
a61af66fc99e Initial load
duke
parents:
diff changeset
762 // Note: if t1 and t2 are zero then result is NaN (JVMS page 213)
a61af66fc99e Initial load
duke
parents:
diff changeset
763 // Test TypeD::ZERO is not sufficient as it could be negative zero
a61af66fc99e Initial load
duke
parents:
diff changeset
764 if( t1 == TypeD::ZERO && !g_isnan(t2->getd()) && t2->getd() != 0.0 )
a61af66fc99e Initial load
duke
parents:
diff changeset
765 return TypeD::ZERO;
a61af66fc99e Initial load
duke
parents:
diff changeset
766
a61af66fc99e Initial load
duke
parents:
diff changeset
767 // Otherwise we give up all hope
a61af66fc99e Initial load
duke
parents:
diff changeset
768 return Type::DOUBLE;
a61af66fc99e Initial load
duke
parents:
diff changeset
769 }
a61af66fc99e Initial load
duke
parents:
diff changeset
770
a61af66fc99e Initial load
duke
parents:
diff changeset
771
a61af66fc99e Initial load
duke
parents:
diff changeset
772 //------------------------------Identity---------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
773 // Dividing by self is 1.
a61af66fc99e Initial load
duke
parents:
diff changeset
774 // If the divisor is 1, we are an identity on the dividend.
a61af66fc99e Initial load
duke
parents:
diff changeset
775 Node *DivDNode::Identity( PhaseTransform *phase ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
776 return (phase->type( in(2) ) == TypeD::ONE) ? in(1) : this;
a61af66fc99e Initial load
duke
parents:
diff changeset
777 }
a61af66fc99e Initial load
duke
parents:
diff changeset
778
a61af66fc99e Initial load
duke
parents:
diff changeset
779 //------------------------------Idealize---------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
780 Node *DivDNode::Ideal(PhaseGVN *phase, bool can_reshape) {
a61af66fc99e Initial load
duke
parents:
diff changeset
781 if (in(0) && remove_dead_region(phase, can_reshape)) return this;
305
ab075d07f1ba 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 294
diff changeset
782 // Don't bother trying to transform a dead node
ab075d07f1ba 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 294
diff changeset
783 if( in(0) && in(0)->is_top() ) return NULL;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
784
a61af66fc99e Initial load
duke
parents:
diff changeset
785 const Type *t2 = phase->type( in(2) );
a61af66fc99e Initial load
duke
parents:
diff changeset
786 if( t2 == TypeD::ONE ) // Identity?
a61af66fc99e Initial load
duke
parents:
diff changeset
787 return NULL; // Skip it
a61af66fc99e Initial load
duke
parents:
diff changeset
788
a61af66fc99e Initial load
duke
parents:
diff changeset
789 const TypeD *td = t2->isa_double_constant();
a61af66fc99e Initial load
duke
parents:
diff changeset
790 if( !td ) return NULL;
a61af66fc99e Initial load
duke
parents:
diff changeset
791 if( td->base() != Type::DoubleCon ) return NULL;
a61af66fc99e Initial load
duke
parents:
diff changeset
792
a61af66fc99e Initial load
duke
parents:
diff changeset
793 // Check for out of range values
a61af66fc99e Initial load
duke
parents:
diff changeset
794 if( td->is_nan() || !td->is_finite() ) return NULL;
a61af66fc99e Initial load
duke
parents:
diff changeset
795
a61af66fc99e Initial load
duke
parents:
diff changeset
796 // Get the value
a61af66fc99e Initial load
duke
parents:
diff changeset
797 double d = td->getd();
a61af66fc99e Initial load
duke
parents:
diff changeset
798 int exp;
a61af66fc99e Initial load
duke
parents:
diff changeset
799
a61af66fc99e Initial load
duke
parents:
diff changeset
800 // Only for special case of dividing by a power of 2
a61af66fc99e Initial load
duke
parents:
diff changeset
801 if( frexp(d, &exp) != 0.5 ) return NULL;
a61af66fc99e Initial load
duke
parents:
diff changeset
802
a61af66fc99e Initial load
duke
parents:
diff changeset
803 // Limit the range of acceptable exponents
a61af66fc99e Initial load
duke
parents:
diff changeset
804 if( exp < -1021 || exp > 1022 ) return NULL;
a61af66fc99e Initial load
duke
parents:
diff changeset
805
a61af66fc99e Initial load
duke
parents:
diff changeset
806 // Compute the reciprocal
a61af66fc99e Initial load
duke
parents:
diff changeset
807 double reciprocal = 1.0 / d;
a61af66fc99e Initial load
duke
parents:
diff changeset
808
a61af66fc99e Initial load
duke
parents:
diff changeset
809 assert( frexp(reciprocal, &exp) == 0.5, "reciprocal should be power of 2" );
a61af66fc99e Initial load
duke
parents:
diff changeset
810
a61af66fc99e Initial load
duke
parents:
diff changeset
811 // return multiplication by the reciprocal
a61af66fc99e Initial load
duke
parents:
diff changeset
812 return (new (phase->C, 3) MulDNode(in(1), phase->makecon(TypeD::make(reciprocal))));
a61af66fc99e Initial load
duke
parents:
diff changeset
813 }
a61af66fc99e Initial load
duke
parents:
diff changeset
814
a61af66fc99e Initial load
duke
parents:
diff changeset
815 //=============================================================================
a61af66fc99e Initial load
duke
parents:
diff changeset
816 //------------------------------Idealize---------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
817 Node *ModINode::Ideal(PhaseGVN *phase, bool can_reshape) {
a61af66fc99e Initial load
duke
parents:
diff changeset
818 // Check for dead control input
305
ab075d07f1ba 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 294
diff changeset
819 if( in(0) && remove_dead_region(phase, can_reshape) ) return this;
ab075d07f1ba 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 294
diff changeset
820 // Don't bother trying to transform a dead node
ab075d07f1ba 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 294
diff changeset
821 if( in(0) && in(0)->is_top() ) return NULL;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
822
a61af66fc99e Initial load
duke
parents:
diff changeset
823 // Get the modulus
a61af66fc99e Initial load
duke
parents:
diff changeset
824 const Type *t = phase->type( in(2) );
a61af66fc99e Initial load
duke
parents:
diff changeset
825 if( t == Type::TOP ) return NULL;
a61af66fc99e Initial load
duke
parents:
diff changeset
826 const TypeInt *ti = t->is_int();
a61af66fc99e Initial load
duke
parents:
diff changeset
827
a61af66fc99e Initial load
duke
parents:
diff changeset
828 // Check for useless control input
a61af66fc99e Initial load
duke
parents:
diff changeset
829 // Check for excluding mod-zero case
a61af66fc99e Initial load
duke
parents:
diff changeset
830 if( in(0) && (ti->_hi < 0 || ti->_lo > 0) ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
831 set_req(0, NULL); // Yank control input
a61af66fc99e Initial load
duke
parents:
diff changeset
832 return this;
a61af66fc99e Initial load
duke
parents:
diff changeset
833 }
a61af66fc99e Initial load
duke
parents:
diff changeset
834
a61af66fc99e Initial load
duke
parents:
diff changeset
835 // See if we are MOD'ing by 2^k or 2^k-1.
a61af66fc99e Initial load
duke
parents:
diff changeset
836 if( !ti->is_con() ) return NULL;
a61af66fc99e Initial load
duke
parents:
diff changeset
837 jint con = ti->get_con();
a61af66fc99e Initial load
duke
parents:
diff changeset
838
a61af66fc99e Initial load
duke
parents:
diff changeset
839 Node *hook = new (phase->C, 1) Node(1);
a61af66fc99e Initial load
duke
parents:
diff changeset
840
a61af66fc99e Initial load
duke
parents:
diff changeset
841 // First, special check for modulo 2^k-1
a61af66fc99e Initial load
duke
parents:
diff changeset
842 if( con >= 0 && con < max_jint && is_power_of_2(con+1) ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
843 uint k = exact_log2(con+1); // Extract k
a61af66fc99e Initial load
duke
parents:
diff changeset
844
a61af66fc99e Initial load
duke
parents:
diff changeset
845 // Basic algorithm by David Detlefs. See fastmod_int.java for gory details.
a61af66fc99e Initial load
duke
parents:
diff changeset
846 static int unroll_factor[] = { 999, 999, 29, 14, 9, 7, 5, 4, 4, 3, 3, 2, 2, 2, 2, 2, 1 /*past here we assume 1 forever*/};
a61af66fc99e Initial load
duke
parents:
diff changeset
847 int trip_count = 1;
a61af66fc99e Initial load
duke
parents:
diff changeset
848 if( k < ARRAY_SIZE(unroll_factor)) trip_count = unroll_factor[k];
a61af66fc99e Initial load
duke
parents:
diff changeset
849
a61af66fc99e Initial load
duke
parents:
diff changeset
850 // If the unroll factor is not too large, and if conditional moves are
a61af66fc99e Initial load
duke
parents:
diff changeset
851 // ok, then use this case
a61af66fc99e Initial load
duke
parents:
diff changeset
852 if( trip_count <= 5 && ConditionalMoveLimit != 0 ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
853 Node *x = in(1); // Value being mod'd
a61af66fc99e Initial load
duke
parents:
diff changeset
854 Node *divisor = in(2); // Also is mask
a61af66fc99e Initial load
duke
parents:
diff changeset
855
a61af66fc99e Initial load
duke
parents:
diff changeset
856 hook->init_req(0, x); // Add a use to x to prevent him from dying
a61af66fc99e Initial load
duke
parents:
diff changeset
857 // Generate code to reduce X rapidly to nearly 2^k-1.
a61af66fc99e Initial load
duke
parents:
diff changeset
858 for( int i = 0; i < trip_count; i++ ) {
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
859 Node *xl = phase->transform( new (phase->C, 3) AndINode(x,divisor) );
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
860 Node *xh = phase->transform( new (phase->C, 3) RShiftINode(x,phase->intcon(k)) ); // Must be signed
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
861 x = phase->transform( new (phase->C, 3) AddINode(xh,xl) );
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
862 hook->set_req(0, x);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
863 }
a61af66fc99e Initial load
duke
parents:
diff changeset
864
a61af66fc99e Initial load
duke
parents:
diff changeset
865 // Generate sign-fixup code. Was original value positive?
a61af66fc99e Initial load
duke
parents:
diff changeset
866 // int hack_res = (i >= 0) ? divisor : 1;
a61af66fc99e Initial load
duke
parents:
diff changeset
867 Node *cmp1 = phase->transform( new (phase->C, 3) CmpINode( in(1), phase->intcon(0) ) );
a61af66fc99e Initial load
duke
parents:
diff changeset
868 Node *bol1 = phase->transform( new (phase->C, 2) BoolNode( cmp1, BoolTest::ge ) );
a61af66fc99e Initial load
duke
parents:
diff changeset
869 Node *cmov1= phase->transform( new (phase->C, 4) CMoveINode(bol1, phase->intcon(1), divisor, TypeInt::POS) );
a61af66fc99e Initial load
duke
parents:
diff changeset
870 // if( x >= hack_res ) x -= divisor;
a61af66fc99e Initial load
duke
parents:
diff changeset
871 Node *sub = phase->transform( new (phase->C, 3) SubINode( x, divisor ) );
a61af66fc99e Initial load
duke
parents:
diff changeset
872 Node *cmp2 = phase->transform( new (phase->C, 3) CmpINode( x, cmov1 ) );
a61af66fc99e Initial load
duke
parents:
diff changeset
873 Node *bol2 = phase->transform( new (phase->C, 2) BoolNode( cmp2, BoolTest::ge ) );
a61af66fc99e Initial load
duke
parents:
diff changeset
874 // Convention is to not transform the return value of an Ideal
a61af66fc99e Initial load
duke
parents:
diff changeset
875 // since Ideal is expected to return a modified 'this' or a new node.
a61af66fc99e Initial load
duke
parents:
diff changeset
876 Node *cmov2= new (phase->C, 4) CMoveINode(bol2, x, sub, TypeInt::INT);
a61af66fc99e Initial load
duke
parents:
diff changeset
877 // cmov2 is now the mod
a61af66fc99e Initial load
duke
parents:
diff changeset
878
a61af66fc99e Initial load
duke
parents:
diff changeset
879 // Now remove the bogus extra edges used to keep things alive
a61af66fc99e Initial load
duke
parents:
diff changeset
880 if (can_reshape) {
a61af66fc99e Initial load
duke
parents:
diff changeset
881 phase->is_IterGVN()->remove_dead_node(hook);
a61af66fc99e Initial load
duke
parents:
diff changeset
882 } else {
a61af66fc99e Initial load
duke
parents:
diff changeset
883 hook->set_req(0, NULL); // Just yank bogus edge during Parse phase
a61af66fc99e Initial load
duke
parents:
diff changeset
884 }
a61af66fc99e Initial load
duke
parents:
diff changeset
885 return cmov2;
a61af66fc99e Initial load
duke
parents:
diff changeset
886 }
a61af66fc99e Initial load
duke
parents:
diff changeset
887 }
a61af66fc99e Initial load
duke
parents:
diff changeset
888
a61af66fc99e Initial load
duke
parents:
diff changeset
889 // Fell thru, the unroll case is not appropriate. Transform the modulo
a61af66fc99e Initial load
duke
parents:
diff changeset
890 // into a long multiply/int multiply/subtract case
a61af66fc99e Initial load
duke
parents:
diff changeset
891
a61af66fc99e Initial load
duke
parents:
diff changeset
892 // Cannot handle mod 0, and min_jint isn't handled by the transform
a61af66fc99e Initial load
duke
parents:
diff changeset
893 if( con == 0 || con == min_jint ) return NULL;
a61af66fc99e Initial load
duke
parents:
diff changeset
894
a61af66fc99e Initial load
duke
parents:
diff changeset
895 // Get the absolute value of the constant; at this point, we can use this
a61af66fc99e Initial load
duke
parents:
diff changeset
896 jint pos_con = (con >= 0) ? con : -con;
a61af66fc99e Initial load
duke
parents:
diff changeset
897
a61af66fc99e Initial load
duke
parents:
diff changeset
898 // integer Mod 1 is always 0
a61af66fc99e Initial load
duke
parents:
diff changeset
899 if( pos_con == 1 ) return new (phase->C, 1) ConINode(TypeInt::ZERO);
a61af66fc99e Initial load
duke
parents:
diff changeset
900
a61af66fc99e Initial load
duke
parents:
diff changeset
901 int log2_con = -1;
a61af66fc99e Initial load
duke
parents:
diff changeset
902
a61af66fc99e Initial load
duke
parents:
diff changeset
903 // If this is a power of two, then maybe we can mask it
a61af66fc99e Initial load
duke
parents:
diff changeset
904 if( is_power_of_2(pos_con) ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
905 log2_con = log2_intptr((intptr_t)pos_con);
a61af66fc99e Initial load
duke
parents:
diff changeset
906
a61af66fc99e Initial load
duke
parents:
diff changeset
907 const Type *dt = phase->type(in(1));
a61af66fc99e Initial load
duke
parents:
diff changeset
908 const TypeInt *dti = dt->isa_int();
a61af66fc99e Initial load
duke
parents:
diff changeset
909
a61af66fc99e Initial load
duke
parents:
diff changeset
910 // See if this can be masked, if the dividend is non-negative
a61af66fc99e Initial load
duke
parents:
diff changeset
911 if( dti && dti->_lo >= 0 )
a61af66fc99e Initial load
duke
parents:
diff changeset
912 return ( new (phase->C, 3) AndINode( in(1), phase->intcon( pos_con-1 ) ) );
a61af66fc99e Initial load
duke
parents:
diff changeset
913 }
a61af66fc99e Initial load
duke
parents:
diff changeset
914
a61af66fc99e Initial load
duke
parents:
diff changeset
915 // Save in(1) so that it cannot be changed or deleted
a61af66fc99e Initial load
duke
parents:
diff changeset
916 hook->init_req(0, in(1));
a61af66fc99e Initial load
duke
parents:
diff changeset
917
a61af66fc99e Initial load
duke
parents:
diff changeset
918 // Divide using the transform from DivI to MulL
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
919 Node *result = transform_int_divide( phase, in(1), pos_con );
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
920 if (result != NULL) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
921 Node *divide = phase->transform(result);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
922
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
923 // Re-multiply, using a shift if this is a power of two
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
924 Node *mult = NULL;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
925
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
926 if( log2_con >= 0 )
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
927 mult = phase->transform( new (phase->C, 3) LShiftINode( divide, phase->intcon( log2_con ) ) );
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
928 else
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
929 mult = phase->transform( new (phase->C, 3) MulINode( divide, phase->intcon( pos_con ) ) );
0
a61af66fc99e Initial load
duke
parents:
diff changeset
930
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
931 // Finally, subtract the multiplied divided value from the original
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
932 result = new (phase->C, 3) SubINode( in(1), mult );
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
933 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
934
a61af66fc99e Initial load
duke
parents:
diff changeset
935 // Now remove the bogus extra edges used to keep things alive
a61af66fc99e Initial load
duke
parents:
diff changeset
936 if (can_reshape) {
a61af66fc99e Initial load
duke
parents:
diff changeset
937 phase->is_IterGVN()->remove_dead_node(hook);
a61af66fc99e Initial load
duke
parents:
diff changeset
938 } else {
a61af66fc99e Initial load
duke
parents:
diff changeset
939 hook->set_req(0, NULL); // Just yank bogus edge during Parse phase
a61af66fc99e Initial load
duke
parents:
diff changeset
940 }
a61af66fc99e Initial load
duke
parents:
diff changeset
941
a61af66fc99e Initial load
duke
parents:
diff changeset
942 // return the value
a61af66fc99e Initial load
duke
parents:
diff changeset
943 return result;
a61af66fc99e Initial load
duke
parents:
diff changeset
944 }
a61af66fc99e Initial load
duke
parents:
diff changeset
945
a61af66fc99e Initial load
duke
parents:
diff changeset
946 //------------------------------Value------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
947 const Type *ModINode::Value( PhaseTransform *phase ) const {
a61af66fc99e Initial load
duke
parents:
diff changeset
948 // Either input is TOP ==> the result is TOP
a61af66fc99e Initial load
duke
parents:
diff changeset
949 const Type *t1 = phase->type( in(1) );
a61af66fc99e Initial load
duke
parents:
diff changeset
950 const Type *t2 = phase->type( in(2) );
a61af66fc99e Initial load
duke
parents:
diff changeset
951 if( t1 == Type::TOP ) return Type::TOP;
a61af66fc99e Initial load
duke
parents:
diff changeset
952 if( t2 == Type::TOP ) return Type::TOP;
a61af66fc99e Initial load
duke
parents:
diff changeset
953
a61af66fc99e Initial load
duke
parents:
diff changeset
954 // We always generate the dynamic check for 0.
a61af66fc99e Initial load
duke
parents:
diff changeset
955 // 0 MOD X is 0
a61af66fc99e Initial load
duke
parents:
diff changeset
956 if( t1 == TypeInt::ZERO ) return TypeInt::ZERO;
a61af66fc99e Initial load
duke
parents:
diff changeset
957 // X MOD X is 0
a61af66fc99e Initial load
duke
parents:
diff changeset
958 if( phase->eqv( in(1), in(2) ) ) return TypeInt::ZERO;
a61af66fc99e Initial load
duke
parents:
diff changeset
959
a61af66fc99e Initial load
duke
parents:
diff changeset
960 // Either input is BOTTOM ==> the result is the local BOTTOM
a61af66fc99e Initial load
duke
parents:
diff changeset
961 const Type *bot = bottom_type();
a61af66fc99e Initial load
duke
parents:
diff changeset
962 if( (t1 == bot) || (t2 == bot) ||
a61af66fc99e Initial load
duke
parents:
diff changeset
963 (t1 == Type::BOTTOM) || (t2 == Type::BOTTOM) )
a61af66fc99e Initial load
duke
parents:
diff changeset
964 return bot;
a61af66fc99e Initial load
duke
parents:
diff changeset
965
a61af66fc99e Initial load
duke
parents:
diff changeset
966 const TypeInt *i1 = t1->is_int();
a61af66fc99e Initial load
duke
parents:
diff changeset
967 const TypeInt *i2 = t2->is_int();
a61af66fc99e Initial load
duke
parents:
diff changeset
968 if( !i1->is_con() || !i2->is_con() ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
969 if( i1->_lo >= 0 && i2->_lo >= 0 )
a61af66fc99e Initial load
duke
parents:
diff changeset
970 return TypeInt::POS;
a61af66fc99e Initial load
duke
parents:
diff changeset
971 // If both numbers are not constants, we know little.
a61af66fc99e Initial load
duke
parents:
diff changeset
972 return TypeInt::INT;
a61af66fc99e Initial load
duke
parents:
diff changeset
973 }
a61af66fc99e Initial load
duke
parents:
diff changeset
974 // Mod by zero? Throw exception at runtime!
a61af66fc99e Initial load
duke
parents:
diff changeset
975 if( !i2->get_con() ) return TypeInt::POS;
a61af66fc99e Initial load
duke
parents:
diff changeset
976
a61af66fc99e Initial load
duke
parents:
diff changeset
977 // We must be modulo'ing 2 int constants.
a61af66fc99e Initial load
duke
parents:
diff changeset
978 // Check for min_jint % '-1', result is defined to be '0'.
a61af66fc99e Initial load
duke
parents:
diff changeset
979 if( i1->get_con() == min_jint && i2->get_con() == -1 )
a61af66fc99e Initial load
duke
parents:
diff changeset
980 return TypeInt::ZERO;
a61af66fc99e Initial load
duke
parents:
diff changeset
981
a61af66fc99e Initial load
duke
parents:
diff changeset
982 return TypeInt::make( i1->get_con() % i2->get_con() );
a61af66fc99e Initial load
duke
parents:
diff changeset
983 }
a61af66fc99e Initial load
duke
parents:
diff changeset
984
a61af66fc99e Initial load
duke
parents:
diff changeset
985
a61af66fc99e Initial load
duke
parents:
diff changeset
986 //=============================================================================
a61af66fc99e Initial load
duke
parents:
diff changeset
987 //------------------------------Idealize---------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
988 Node *ModLNode::Ideal(PhaseGVN *phase, bool can_reshape) {
a61af66fc99e Initial load
duke
parents:
diff changeset
989 // Check for dead control input
305
ab075d07f1ba 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 294
diff changeset
990 if( in(0) && remove_dead_region(phase, can_reshape) ) return this;
ab075d07f1ba 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 294
diff changeset
991 // Don't bother trying to transform a dead node
ab075d07f1ba 6736417: Fastdebug C2 crashes in StoreBNode::Ideal
kvn
parents: 294
diff changeset
992 if( in(0) && in(0)->is_top() ) return NULL;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
993
a61af66fc99e Initial load
duke
parents:
diff changeset
994 // Get the modulus
a61af66fc99e Initial load
duke
parents:
diff changeset
995 const Type *t = phase->type( in(2) );
a61af66fc99e Initial load
duke
parents:
diff changeset
996 if( t == Type::TOP ) return NULL;
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
997 const TypeLong *tl = t->is_long();
0
a61af66fc99e Initial load
duke
parents:
diff changeset
998
a61af66fc99e Initial load
duke
parents:
diff changeset
999 // Check for useless control input
a61af66fc99e Initial load
duke
parents:
diff changeset
1000 // Check for excluding mod-zero case
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1001 if( in(0) && (tl->_hi < 0 || tl->_lo > 0) ) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1002 set_req(0, NULL); // Yank control input
a61af66fc99e Initial load
duke
parents:
diff changeset
1003 return this;
a61af66fc99e Initial load
duke
parents:
diff changeset
1004 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1005
a61af66fc99e Initial load
duke
parents:
diff changeset
1006 // See if we are MOD'ing by 2^k or 2^k-1.
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1007 if( !tl->is_con() ) return NULL;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1008 jlong con = tl->get_con();
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1009
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1010 Node *hook = new (phase->C, 1) Node(1);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1011
a61af66fc99e Initial load
duke
parents:
diff changeset
1012 // Expand mod
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1013 if( con >= 0 && con < max_jlong && is_power_of_2_long(con+1) ) {
568
30663ca5e8f4 6805724: ModLNode::Ideal() generates functionally incorrect graph when divisor is any (2^k-1) constant.
twisti
parents: 567
diff changeset
1014 uint k = exact_log2_long(con+1); // Extract k
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1015
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1016 // Basic algorithm by David Detlefs. See fastmod_long.java for gory details.
a61af66fc99e Initial load
duke
parents:
diff changeset
1017 // Used to help a popular random number generator which does a long-mod
a61af66fc99e Initial load
duke
parents:
diff changeset
1018 // of 2^31-1 and shows up in SpecJBB and SciMark.
a61af66fc99e Initial load
duke
parents:
diff changeset
1019 static int unroll_factor[] = { 999, 999, 61, 30, 20, 15, 12, 10, 8, 7, 6, 6, 5, 5, 4, 4, 4, 3, 3, 3, 3, 3, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1 /*past here we assume 1 forever*/};
a61af66fc99e Initial load
duke
parents:
diff changeset
1020 int trip_count = 1;
a61af66fc99e Initial load
duke
parents:
diff changeset
1021 if( k < ARRAY_SIZE(unroll_factor)) trip_count = unroll_factor[k];
a61af66fc99e Initial load
duke
parents:
diff changeset
1022
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1023 // If the unroll factor is not too large, and if conditional moves are
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1024 // ok, then use this case
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1025 if( trip_count <= 5 && ConditionalMoveLimit != 0 ) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1026 Node *x = in(1); // Value being mod'd
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1027 Node *divisor = in(2); // Also is mask
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1028
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1029 hook->init_req(0, x); // Add a use to x to prevent him from dying
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1030 // Generate code to reduce X rapidly to nearly 2^k-1.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1031 for( int i = 0; i < trip_count; i++ ) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1032 Node *xl = phase->transform( new (phase->C, 3) AndLNode(x,divisor) );
a61af66fc99e Initial load
duke
parents:
diff changeset
1033 Node *xh = phase->transform( new (phase->C, 3) RShiftLNode(x,phase->intcon(k)) ); // Must be signed
a61af66fc99e Initial load
duke
parents:
diff changeset
1034 x = phase->transform( new (phase->C, 3) AddLNode(xh,xl) );
a61af66fc99e Initial load
duke
parents:
diff changeset
1035 hook->set_req(0, x); // Add a use to x to prevent him from dying
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1036 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1037
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1038 // Generate sign-fixup code. Was original value positive?
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1039 // long hack_res = (i >= 0) ? divisor : CONST64(1);
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1040 Node *cmp1 = phase->transform( new (phase->C, 3) CmpLNode( in(1), phase->longcon(0) ) );
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1041 Node *bol1 = phase->transform( new (phase->C, 2) BoolNode( cmp1, BoolTest::ge ) );
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1042 Node *cmov1= phase->transform( new (phase->C, 4) CMoveLNode(bol1, phase->longcon(1), divisor, TypeLong::LONG) );
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1043 // if( x >= hack_res ) x -= divisor;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1044 Node *sub = phase->transform( new (phase->C, 3) SubLNode( x, divisor ) );
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1045 Node *cmp2 = phase->transform( new (phase->C, 3) CmpLNode( x, cmov1 ) );
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1046 Node *bol2 = phase->transform( new (phase->C, 2) BoolNode( cmp2, BoolTest::ge ) );
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1047 // Convention is to not transform the return value of an Ideal
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1048 // since Ideal is expected to return a modified 'this' or a new node.
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1049 Node *cmov2= new (phase->C, 4) CMoveLNode(bol2, x, sub, TypeLong::LONG);
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1050 // cmov2 is now the mod
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1051
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1052 // Now remove the bogus extra edges used to keep things alive
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1053 if (can_reshape) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1054 phase->is_IterGVN()->remove_dead_node(hook);
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1055 } else {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1056 hook->set_req(0, NULL); // Just yank bogus edge during Parse phase
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1057 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1058 return cmov2;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1059 }
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1060 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1061
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1062 // Fell thru, the unroll case is not appropriate. Transform the modulo
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1063 // into a long multiply/int multiply/subtract case
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1064
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1065 // Cannot handle mod 0, and min_jlong isn't handled by the transform
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1066 if( con == 0 || con == min_jlong ) return NULL;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1067
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1068 // Get the absolute value of the constant; at this point, we can use this
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1069 jlong pos_con = (con >= 0) ? con : -con;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1070
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1071 // integer Mod 1 is always 0
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1072 if( pos_con == 1 ) return new (phase->C, 1) ConLNode(TypeLong::ZERO);
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1073
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1074 int log2_con = -1;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1075
605
98cb887364d3 6810672: Comment typos
twisti
parents: 568
diff changeset
1076 // If this is a power of two, then maybe we can mask it
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1077 if( is_power_of_2_long(pos_con) ) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1078 log2_con = log2_long(pos_con);
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1079
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1080 const Type *dt = phase->type(in(1));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1081 const TypeLong *dtl = dt->isa_long();
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1082
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1083 // See if this can be masked, if the dividend is non-negative
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1084 if( dtl && dtl->_lo >= 0 )
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1085 return ( new (phase->C, 3) AndLNode( in(1), phase->longcon( pos_con-1 ) ) );
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1086 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1087
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1088 // Save in(1) so that it cannot be changed or deleted
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1089 hook->init_req(0, in(1));
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1090
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1091 // Divide using the long-division transform (transform_long_divide)
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1092 Node *result = transform_long_divide( phase, in(1), pos_con );
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1093 if (result != NULL) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1094 Node *divide = phase->transform(result);
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1095
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1096 // Re-multiply, using a shift if this is a power of two
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1097 Node *mult = NULL;
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1098
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1099 if( log2_con >= 0 )
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1100 mult = phase->transform( new (phase->C, 3) LShiftLNode( divide, phase->intcon( log2_con ) ) );
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1101 else
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1102 mult = phase->transform( new (phase->C, 3) MulLNode( divide, phase->longcon( pos_con ) ) );
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1103
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1104 // Finally, subtract the multiplied divided value from the original
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1105 result = new (phase->C, 3) SubLNode( in(1), mult );
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1106 }
145
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1107
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1108 // Now remove the bogus extra edges used to keep things alive
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1109 if (can_reshape) {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1110 phase->is_IterGVN()->remove_dead_node(hook);
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1111 } else {
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1112 hook->set_req(0, NULL); // Just yank bogus edge during Parse phase
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1113 }
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1114
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1115 // return the value
f3de1255b035 6603011: RFE: Optimize long division
rasbold
parents: 131
diff changeset
1116 return result;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1117 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1118
a61af66fc99e Initial load
duke
parents:
diff changeset
1119 //------------------------------Value------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
1120 const Type *ModLNode::Value( PhaseTransform *phase ) const {
a61af66fc99e Initial load
duke
parents:
diff changeset
1121 // Either input is TOP ==> the result is TOP
a61af66fc99e Initial load
duke
parents:
diff changeset
1122 const Type *t1 = phase->type( in(1) );
a61af66fc99e Initial load
duke
parents:
diff changeset
1123 const Type *t2 = phase->type( in(2) );
a61af66fc99e Initial load
duke
parents:
diff changeset
1124 if( t1 == Type::TOP ) return Type::TOP;
a61af66fc99e Initial load
duke
parents:
diff changeset
1125 if( t2 == Type::TOP ) return Type::TOP;
a61af66fc99e Initial load
duke
parents:
diff changeset
1126
a61af66fc99e Initial load
duke
parents:
diff changeset
1127 // We always generate the dynamic check for 0.
a61af66fc99e Initial load
duke
parents:
diff changeset
1128 // 0 MOD X is 0
a61af66fc99e Initial load
duke
parents:
diff changeset
1129 if( t1 == TypeLong::ZERO ) return TypeLong::ZERO;
a61af66fc99e Initial load
duke
parents:
diff changeset
1130 // X MOD X is 0
a61af66fc99e Initial load
duke
parents:
diff changeset
1131 if( phase->eqv( in(1), in(2) ) ) return TypeLong::ZERO;
a61af66fc99e Initial load
duke
parents:
diff changeset
1132
a61af66fc99e Initial load
duke
parents:
diff changeset
1133 // Either input is BOTTOM ==> the result is the local BOTTOM
a61af66fc99e Initial load
duke
parents:
diff changeset
1134 const Type *bot = bottom_type();
a61af66fc99e Initial load
duke
parents:
diff changeset
1135 if( (t1 == bot) || (t2 == bot) ||
a61af66fc99e Initial load
duke
parents:
diff changeset
1136 (t1 == Type::BOTTOM) || (t2 == Type::BOTTOM) )
a61af66fc99e Initial load
duke
parents:
diff changeset
1137 return bot;
a61af66fc99e Initial load
duke
parents:
diff changeset
1138
a61af66fc99e Initial load
duke
parents:
diff changeset
1139 const TypeLong *i1 = t1->is_long();
a61af66fc99e Initial load
duke
parents:
diff changeset
1140 const TypeLong *i2 = t2->is_long();
a61af66fc99e Initial load
duke
parents:
diff changeset
1141 if( !i1->is_con() || !i2->is_con() ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
1142 if( i1->_lo >= CONST64(0) && i2->_lo >= CONST64(0) )
a61af66fc99e Initial load
duke
parents:
diff changeset
1143 return TypeLong::POS;
a61af66fc99e Initial load
duke
parents:
diff changeset
1144 // If both numbers are not constants, we know little.
a61af66fc99e Initial load
duke
parents:
diff changeset
1145 return TypeLong::LONG;
a61af66fc99e Initial load
duke
parents:
diff changeset
1146 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1147 // Mod by zero? Throw exception at runtime!
a61af66fc99e Initial load
duke
parents:
diff changeset
1148 if( !i2->get_con() ) return TypeLong::POS;
a61af66fc99e Initial load
duke
parents:
diff changeset
1149
a61af66fc99e Initial load
duke
parents:
diff changeset
1150 // We must be modulo'ing 2 long constants.
a61af66fc99e Initial load
duke
parents:
diff changeset
1151 // Check for min_jlong % '-1', result is defined to be '0'.
a61af66fc99e Initial load
duke
parents:
diff changeset
1152 if( i1->get_con() == min_jlong && i2->get_con() == -1 )
a61af66fc99e Initial load
duke
parents:
diff changeset
1153 return TypeLong::ZERO;
a61af66fc99e Initial load
duke
parents:
diff changeset
1154
a61af66fc99e Initial load
duke
parents:
diff changeset
1155 return TypeLong::make( i1->get_con() % i2->get_con() );
a61af66fc99e Initial load
duke
parents:
diff changeset
1156 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1157
a61af66fc99e Initial load
duke
parents:
diff changeset
1158
a61af66fc99e Initial load
duke
parents:
diff changeset
1159 //=============================================================================
a61af66fc99e Initial load
duke
parents:
diff changeset
1160 //------------------------------Value------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
1161 const Type *ModFNode::Value( PhaseTransform *phase ) const {
a61af66fc99e Initial load
duke
parents:
diff changeset
1162 // Either input is TOP ==> the result is TOP
a61af66fc99e Initial load
duke
parents:
diff changeset
1163 const Type *t1 = phase->type( in(1) );
a61af66fc99e Initial load
duke
parents:
diff changeset
1164 const Type *t2 = phase->type( in(2) );
a61af66fc99e Initial load
duke
parents:
diff changeset
1165 if( t1 == Type::TOP ) return Type::TOP;
a61af66fc99e Initial load
duke
parents:
diff changeset
1166 if( t2 == Type::TOP ) return Type::TOP;
a61af66fc99e Initial load
duke
parents:
diff changeset
1167
a61af66fc99e Initial load
duke
parents:
diff changeset
1168 // Either input is BOTTOM ==> the result is the local BOTTOM
a61af66fc99e Initial load
duke
parents:
diff changeset
1169 const Type *bot = bottom_type();
a61af66fc99e Initial load
duke
parents:
diff changeset
1170 if( (t1 == bot) || (t2 == bot) ||
a61af66fc99e Initial load
duke
parents:
diff changeset
1171 (t1 == Type::BOTTOM) || (t2 == Type::BOTTOM) )
a61af66fc99e Initial load
duke
parents:
diff changeset
1172 return bot;
a61af66fc99e Initial load
duke
parents:
diff changeset
1173
131
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1174 // If either number is not a constant, we know nothing.
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1175 if ((t1->base() != Type::FloatCon) || (t2->base() != Type::FloatCon)) {
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1176 return Type::FLOAT; // note: x%x can be either NaN or 0
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1177 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1178
131
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1179 float f1 = t1->getf();
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1180 float f2 = t2->getf();
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1181 jint x1 = jint_cast(f1); // note: *(int*)&f1, not just (int)f1
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1182 jint x2 = jint_cast(f2);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1183
131
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1184 // If either is a NaN, return an input NaN
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1185 if (g_isnan(f1)) return t1;
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1186 if (g_isnan(f2)) return t2;
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1187
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1188 // If an operand is infinity or the divisor is +/- zero, punt.
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1189 if (!g_isfinite(f1) || !g_isfinite(f2) || x2 == 0 || x2 == min_jint)
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1190 return Type::FLOAT;
a61af66fc99e Initial load
duke
parents:
diff changeset
1191
a61af66fc99e Initial load
duke
parents:
diff changeset
1192 // We must be modulo'ing 2 float constants.
a61af66fc99e Initial load
duke
parents:
diff changeset
1193 // Make sure that the sign of the fmod is equal to the sign of the dividend
131
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1194 jint xr = jint_cast(fmod(f1, f2));
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1195 if ((x1 ^ xr) < 0) {
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1196 xr ^= min_jint;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1197 }
131
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1198
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1199 return TypeF::make(jfloat_cast(xr));
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1200 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1201
a61af66fc99e Initial load
duke
parents:
diff changeset
1202
a61af66fc99e Initial load
duke
parents:
diff changeset
1203 //=============================================================================
a61af66fc99e Initial load
duke
parents:
diff changeset
1204 //------------------------------Value------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
1205 const Type *ModDNode::Value( PhaseTransform *phase ) const {
a61af66fc99e Initial load
duke
parents:
diff changeset
1206 // Either input is TOP ==> the result is TOP
a61af66fc99e Initial load
duke
parents:
diff changeset
1207 const Type *t1 = phase->type( in(1) );
a61af66fc99e Initial load
duke
parents:
diff changeset
1208 const Type *t2 = phase->type( in(2) );
a61af66fc99e Initial load
duke
parents:
diff changeset
1209 if( t1 == Type::TOP ) return Type::TOP;
a61af66fc99e Initial load
duke
parents:
diff changeset
1210 if( t2 == Type::TOP ) return Type::TOP;
a61af66fc99e Initial load
duke
parents:
diff changeset
1211
a61af66fc99e Initial load
duke
parents:
diff changeset
1212 // Either input is BOTTOM ==> the result is the local BOTTOM
a61af66fc99e Initial load
duke
parents:
diff changeset
1213 const Type *bot = bottom_type();
a61af66fc99e Initial load
duke
parents:
diff changeset
1214 if( (t1 == bot) || (t2 == bot) ||
a61af66fc99e Initial load
duke
parents:
diff changeset
1215 (t1 == Type::BOTTOM) || (t2 == Type::BOTTOM) )
a61af66fc99e Initial load
duke
parents:
diff changeset
1216 return bot;
a61af66fc99e Initial load
duke
parents:
diff changeset
1217
131
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1218 // If either number is not a constant, we know nothing.
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1219 if ((t1->base() != Type::DoubleCon) || (t2->base() != Type::DoubleCon)) {
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1220 return Type::DOUBLE; // note: x%x can be either NaN or 0
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1221 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1222
131
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1223 double f1 = t1->getd();
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1224 double f2 = t2->getd();
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1225 jlong x1 = jlong_cast(f1); // note: *(long*)&f1, not just (long)f1
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1226 jlong x2 = jlong_cast(f2);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1227
131
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1228 // If either is a NaN, return an input NaN
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1229 if (g_isnan(f1)) return t1;
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1230 if (g_isnan(f2)) return t2;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1231
131
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1232 // If an operand is infinity or the divisor is +/- zero, punt.
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1233 if (!g_isfinite(f1) || !g_isfinite(f2) || x2 == 0 || x2 == min_jlong)
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1234 return Type::DOUBLE;
a61af66fc99e Initial load
duke
parents:
diff changeset
1235
a61af66fc99e Initial load
duke
parents:
diff changeset
1236 // We must be modulo'ing 2 double constants.
131
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1237 // Make sure that the sign of the fmod is equal to the sign of the dividend
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1238 jlong xr = jlong_cast(fmod(f1, f2));
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1239 if ((x1 ^ xr) < 0) {
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1240 xr ^= min_jlong;
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1241 }
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1242
6e825ad773c6 6695288: runThese tests expr30303 and drem00301m1 fail when compiled code executes without deopt
jrose
parents: 0
diff changeset
1243 return TypeD::make(jdouble_cast(xr));
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1244 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1245
a61af66fc99e Initial load
duke
parents:
diff changeset
1246 //=============================================================================
a61af66fc99e Initial load
duke
parents:
diff changeset
1247
a61af66fc99e Initial load
duke
parents:
diff changeset
1248 DivModNode::DivModNode( Node *c, Node *dividend, Node *divisor ) : MultiNode(3) {
a61af66fc99e Initial load
duke
parents:
diff changeset
1249 init_req(0, c);
a61af66fc99e Initial load
duke
parents:
diff changeset
1250 init_req(1, dividend);
a61af66fc99e Initial load
duke
parents:
diff changeset
1251 init_req(2, divisor);
a61af66fc99e Initial load
duke
parents:
diff changeset
1252 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1253
a61af66fc99e Initial load
duke
parents:
diff changeset
1254 //------------------------------make------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
1255 DivModINode* DivModINode::make(Compile* C, Node* div_or_mod) {
a61af66fc99e Initial load
duke
parents:
diff changeset
1256 Node* n = div_or_mod;
a61af66fc99e Initial load
duke
parents:
diff changeset
1257 assert(n->Opcode() == Op_DivI || n->Opcode() == Op_ModI,
a61af66fc99e Initial load
duke
parents:
diff changeset
1258 "only div or mod input pattern accepted");
a61af66fc99e Initial load
duke
parents:
diff changeset
1259
a61af66fc99e Initial load
duke
parents:
diff changeset
1260 DivModINode* divmod = new (C, 3) DivModINode(n->in(0), n->in(1), n->in(2));
a61af66fc99e Initial load
duke
parents:
diff changeset
1261 Node* dproj = new (C, 1) ProjNode(divmod, DivModNode::div_proj_num);
a61af66fc99e Initial load
duke
parents:
diff changeset
1262 Node* mproj = new (C, 1) ProjNode(divmod, DivModNode::mod_proj_num);
a61af66fc99e Initial load
duke
parents:
diff changeset
1263 return divmod;
a61af66fc99e Initial load
duke
parents:
diff changeset
1264 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1265
a61af66fc99e Initial load
duke
parents:
diff changeset
1266 //------------------------------make------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
1267 DivModLNode* DivModLNode::make(Compile* C, Node* div_or_mod) {
a61af66fc99e Initial load
duke
parents:
diff changeset
1268 Node* n = div_or_mod;
a61af66fc99e Initial load
duke
parents:
diff changeset
1269 assert(n->Opcode() == Op_DivL || n->Opcode() == Op_ModL,
a61af66fc99e Initial load
duke
parents:
diff changeset
1270 "only div or mod input pattern accepted");
a61af66fc99e Initial load
duke
parents:
diff changeset
1271
a61af66fc99e Initial load
duke
parents:
diff changeset
1272 DivModLNode* divmod = new (C, 3) DivModLNode(n->in(0), n->in(1), n->in(2));
a61af66fc99e Initial load
duke
parents:
diff changeset
1273 Node* dproj = new (C, 1) ProjNode(divmod, DivModNode::div_proj_num);
a61af66fc99e Initial load
duke
parents:
diff changeset
1274 Node* mproj = new (C, 1) ProjNode(divmod, DivModNode::mod_proj_num);
a61af66fc99e Initial load
duke
parents:
diff changeset
1275 return divmod;
a61af66fc99e Initial load
duke
parents:
diff changeset
1276 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1277
a61af66fc99e Initial load
duke
parents:
diff changeset
1278 //------------------------------match------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
1279 // return result(s) along with their RegMask info
a61af66fc99e Initial load
duke
parents:
diff changeset
1280 Node *DivModINode::match( const ProjNode *proj, const Matcher *match ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
1281 uint ideal_reg = proj->ideal_reg();
a61af66fc99e Initial load
duke
parents:
diff changeset
1282 RegMask rm;
a61af66fc99e Initial load
duke
parents:
diff changeset
1283 if (proj->_con == div_proj_num) {
a61af66fc99e Initial load
duke
parents:
diff changeset
1284 rm = match->divI_proj_mask();
a61af66fc99e Initial load
duke
parents:
diff changeset
1285 } else {
a61af66fc99e Initial load
duke
parents:
diff changeset
1286 assert(proj->_con == mod_proj_num, "must be div or mod projection");
a61af66fc99e Initial load
duke
parents:
diff changeset
1287 rm = match->modI_proj_mask();
a61af66fc99e Initial load
duke
parents:
diff changeset
1288 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1289 return new (match->C, 1)MachProjNode(this, proj->_con, rm, ideal_reg);
a61af66fc99e Initial load
duke
parents:
diff changeset
1290 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1291
a61af66fc99e Initial load
duke
parents:
diff changeset
1292
a61af66fc99e Initial load
duke
parents:
diff changeset
1293 //------------------------------match------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
1294 // return result(s) along with their RegMask info
a61af66fc99e Initial load
duke
parents:
diff changeset
1295 Node *DivModLNode::match( const ProjNode *proj, const Matcher *match ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
1296 uint ideal_reg = proj->ideal_reg();
a61af66fc99e Initial load
duke
parents:
diff changeset
1297 RegMask rm;
a61af66fc99e Initial load
duke
parents:
diff changeset
1298 if (proj->_con == div_proj_num) {
a61af66fc99e Initial load
duke
parents:
diff changeset
1299 rm = match->divL_proj_mask();
a61af66fc99e Initial load
duke
parents:
diff changeset
1300 } else {
a61af66fc99e Initial load
duke
parents:
diff changeset
1301 assert(proj->_con == mod_proj_num, "must be div or mod projection");
a61af66fc99e Initial load
duke
parents:
diff changeset
1302 rm = match->modL_proj_mask();
a61af66fc99e Initial load
duke
parents:
diff changeset
1303 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1304 return new (match->C, 1)MachProjNode(this, proj->_con, rm, ideal_reg);
a61af66fc99e Initial load
duke
parents:
diff changeset
1305 }