Mercurial > hg > graal-compiler
annotate src/cpu/sparc/vm/vm_version_sparc.cpp @ 3946:0db80d8e77fc jdk8-b06
Added tag jdk8-b05 for changeset dce7d24674f4
author | schien |
---|---|
date | Thu, 15 Sep 2011 18:53:14 -0700 |
parents | 1af104d6cf99 |
children | baf763f388e6 |
rev | line source |
---|---|
0 | 1 /* |
1914
ae065c367d93
6987135: Performance regression on Intel platform with 32-bits edition between 6u13 and 6u14.
kvn
parents:
1730
diff
changeset
|
2 * Copyright (c) 1997, 2010, Oracle and/or its affiliates. All rights reserved. |
0 | 3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. |
4 * | |
5 * This code is free software; you can redistribute it and/or modify it | |
6 * under the terms of the GNU General Public License version 2 only, as | |
7 * published by the Free Software Foundation. | |
8 * | |
9 * This code is distributed in the hope that it will be useful, but WITHOUT | |
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | |
11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License | |
12 * version 2 for more details (a copy is included in the LICENSE file that | |
13 * accompanied this code). | |
14 * | |
15 * You should have received a copy of the GNU General Public License version | |
16 * 2 along with this work; if not, write to the Free Software Foundation, | |
17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. | |
18 * | |
1552
c18cbe5936b8
6941466: Oracle rebranding changes for Hotspot repositories
trims
parents:
1518
diff
changeset
|
19 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA |
c18cbe5936b8
6941466: Oracle rebranding changes for Hotspot repositories
trims
parents:
1518
diff
changeset
|
20 * or visit www.oracle.com if you need additional information or have any |
c18cbe5936b8
6941466: Oracle rebranding changes for Hotspot repositories
trims
parents:
1518
diff
changeset
|
21 * questions. |
0 | 22 * |
23 */ | |
24 | |
1972 | 25 #include "precompiled.hpp" |
26 #include "assembler_sparc.inline.hpp" | |
27 #include "memory/resourceArea.hpp" | |
28 #include "runtime/java.hpp" | |
29 #include "runtime/stubCodeGenerator.hpp" | |
30 #include "vm_version_sparc.hpp" | |
31 #ifdef TARGET_OS_FAMILY_linux | |
32 # include "os_linux.inline.hpp" | |
33 #endif | |
34 #ifdef TARGET_OS_FAMILY_solaris | |
35 # include "os_solaris.inline.hpp" | |
36 #endif | |
0 | 37 |
38 int VM_Version::_features = VM_Version::unknown_m; | |
39 const char* VM_Version::_features_str = ""; | |
40 | |
41 void VM_Version::initialize() { | |
42 _features = determine_features(); | |
43 PrefetchCopyIntervalInBytes = prefetch_copy_interval_in_bytes(); | |
44 PrefetchScanIntervalInBytes = prefetch_scan_interval_in_bytes(); | |
45 PrefetchFieldsAhead = prefetch_fields_ahead(); | |
46 | |
3854 | 47 assert(0 <= AllocatePrefetchInstr && AllocatePrefetchInstr <= 1, "invalid value"); |
48 if( AllocatePrefetchInstr < 0 ) AllocatePrefetchInstr = 0; | |
49 if( AllocatePrefetchInstr > 1 ) AllocatePrefetchInstr = 0; | |
50 | |
0 | 51 // Allocation prefetch settings |
3854 | 52 intx cache_line_size = prefetch_data_size(); |
0 | 53 if( cache_line_size > AllocatePrefetchStepSize ) |
54 AllocatePrefetchStepSize = cache_line_size; | |
3854 | 55 |
56 assert(AllocatePrefetchLines > 0, "invalid value"); | |
57 if( AllocatePrefetchLines < 1 ) // set valid value in product VM | |
58 AllocatePrefetchLines = 3; | |
59 assert(AllocateInstancePrefetchLines > 0, "invalid value"); | |
60 if( AllocateInstancePrefetchLines < 1 ) // set valid value in product VM | |
61 AllocateInstancePrefetchLines = 1; | |
0 | 62 |
63 AllocatePrefetchDistance = allocate_prefetch_distance(); | |
64 AllocatePrefetchStyle = allocate_prefetch_style(); | |
65 | |
3854 | 66 assert((AllocatePrefetchDistance % AllocatePrefetchStepSize) == 0 && |
67 (AllocatePrefetchDistance > 0), "invalid value"); | |
68 if ((AllocatePrefetchDistance % AllocatePrefetchStepSize) != 0 || | |
69 (AllocatePrefetchDistance <= 0)) { | |
70 AllocatePrefetchDistance = AllocatePrefetchStepSize; | |
71 } | |
0 | 72 |
3839 | 73 if (AllocatePrefetchStyle == 3 && !has_blk_init()) { |
74 warning("BIS instructions are not available on this CPU"); | |
75 FLAG_SET_DEFAULT(AllocatePrefetchStyle, 1); | |
76 } | |
77 | |
0 | 78 UseSSE = 0; // Only on x86 and x64 |
79 | |
3854 | 80 _supports_cx8 = has_v9(); |
0 | 81 |
2080 | 82 if (is_niagara()) { |
0 | 83 // Indirect branch is the same cost as direct |
84 if (FLAG_IS_DEFAULT(UseInlineCaches)) { | |
675 | 85 FLAG_SET_DEFAULT(UseInlineCaches, false); |
0 | 86 } |
2080 | 87 // Align loops on a single instruction boundary. |
88 if (FLAG_IS_DEFAULT(OptoLoopAlignment)) { | |
89 FLAG_SET_DEFAULT(OptoLoopAlignment, 4); | |
90 } | |
91 // When using CMS, we cannot use memset() in BOT updates because | |
92 // the sun4v/CMT version in libc_psr uses BIS which exposes | |
93 // "phantom zeros" to concurrent readers. See 6948537. | |
94 if (FLAG_IS_DEFAULT(UseMemSetInBOT) && UseConcMarkSweepGC) { | |
95 FLAG_SET_DEFAULT(UseMemSetInBOT, false); | |
96 } | |
113
ba764ed4b6f2
6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents:
10
diff
changeset
|
97 #ifdef _LP64 |
642
660978a2a31a
6791178: Specialize for zero as the compressed oop vm heap base
kvn
parents:
641
diff
changeset
|
98 // 32-bit oops don't make sense for the 64-bit VM on sparc |
660978a2a31a
6791178: Specialize for zero as the compressed oop vm heap base
kvn
parents:
641
diff
changeset
|
99 // since the 32-bit VM has the same registers and smaller objects. |
660978a2a31a
6791178: Specialize for zero as the compressed oop vm heap base
kvn
parents:
641
diff
changeset
|
100 Universe::set_narrow_oop_shift(LogMinObjAlignmentInBytes); |
113
ba764ed4b6f2
6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents:
10
diff
changeset
|
101 #endif // _LP64 |
0 | 102 #ifdef COMPILER2 |
103 // Indirect branch is the same cost as direct | |
104 if (FLAG_IS_DEFAULT(UseJumpTables)) { | |
675 | 105 FLAG_SET_DEFAULT(UseJumpTables, true); |
0 | 106 } |
107 // Single-issue, so entry and loop tops are | |
108 // aligned on a single instruction boundary | |
109 if (FLAG_IS_DEFAULT(InteriorEntryAlignment)) { | |
675 | 110 FLAG_SET_DEFAULT(InteriorEntryAlignment, 4); |
0 | 111 } |
2080 | 112 if (is_niagara_plus()) { |
3854 | 113 if (has_blk_init() && UseTLAB && |
114 FLAG_IS_DEFAULT(AllocatePrefetchInstr)) { | |
115 // Use BIS instruction for TLAB allocation prefetch. | |
116 FLAG_SET_ERGO(intx, AllocatePrefetchInstr, 1); | |
117 if (FLAG_IS_DEFAULT(AllocatePrefetchStyle)) { | |
118 FLAG_SET_ERGO(intx, AllocatePrefetchStyle, 3); | |
119 } | |
1367
9e321dcfa5b7
6940726: Use BIS instruction for allocation prefetch on Sparc
kvn
parents:
1365
diff
changeset
|
120 if (FLAG_IS_DEFAULT(AllocatePrefetchDistance)) { |
3854 | 121 // Use smaller prefetch distance with BIS |
1367
9e321dcfa5b7
6940726: Use BIS instruction for allocation prefetch on Sparc
kvn
parents:
1365
diff
changeset
|
122 FLAG_SET_DEFAULT(AllocatePrefetchDistance, 64); |
9e321dcfa5b7
6940726: Use BIS instruction for allocation prefetch on Sparc
kvn
parents:
1365
diff
changeset
|
123 } |
9e321dcfa5b7
6940726: Use BIS instruction for allocation prefetch on Sparc
kvn
parents:
1365
diff
changeset
|
124 } |
3854 | 125 if (is_T4()) { |
126 // Double number of prefetched cache lines on T4 | |
127 // since L2 cache line size is smaller (32 bytes). | |
128 if (FLAG_IS_DEFAULT(AllocatePrefetchLines)) { | |
129 FLAG_SET_ERGO(intx, AllocatePrefetchLines, AllocatePrefetchLines*2); | |
130 } | |
131 if (FLAG_IS_DEFAULT(AllocateInstancePrefetchLines)) { | |
132 FLAG_SET_ERGO(intx, AllocateInstancePrefetchLines, AllocateInstancePrefetchLines*2); | |
133 } | |
134 } | |
1367
9e321dcfa5b7
6940726: Use BIS instruction for allocation prefetch on Sparc
kvn
parents:
1365
diff
changeset
|
135 if (AllocatePrefetchStyle != 3 && FLAG_IS_DEFAULT(AllocatePrefetchDistance)) { |
9e321dcfa5b7
6940726: Use BIS instruction for allocation prefetch on Sparc
kvn
parents:
1365
diff
changeset
|
136 // Use different prefetch distance without BIS |
9e321dcfa5b7
6940726: Use BIS instruction for allocation prefetch on Sparc
kvn
parents:
1365
diff
changeset
|
137 FLAG_SET_DEFAULT(AllocatePrefetchDistance, 256); |
9e321dcfa5b7
6940726: Use BIS instruction for allocation prefetch on Sparc
kvn
parents:
1365
diff
changeset
|
138 } |
3854 | 139 if (AllocatePrefetchInstr == 1) { |
140 // Need a space at the end of TLAB for BIS since it | |
141 // will fault when accessing memory outside of heap. | |
142 | |
143 // +1 for rounding up to next cache line, +1 to be safe | |
144 int lines = AllocatePrefetchLines + 2; | |
145 int step_size = AllocatePrefetchStepSize; | |
146 int distance = AllocatePrefetchDistance; | |
147 _reserve_for_allocation_prefetch = (distance + step_size*lines)/(int)HeapWordSize; | |
148 } | |
0 | 149 } |
150 #endif | |
151 } | |
152 | |
643
c771b7f43bbf
6378821: bitCount() should use POPC on SPARC processors and AMD+10h
twisti
parents:
642
diff
changeset
|
153 // Use hardware population count instruction if available. |
c771b7f43bbf
6378821: bitCount() should use POPC on SPARC processors and AMD+10h
twisti
parents:
642
diff
changeset
|
154 if (has_hardware_popc()) { |
c771b7f43bbf
6378821: bitCount() should use POPC on SPARC processors and AMD+10h
twisti
parents:
642
diff
changeset
|
155 if (FLAG_IS_DEFAULT(UsePopCountInstruction)) { |
675 | 156 FLAG_SET_DEFAULT(UsePopCountInstruction, true); |
643
c771b7f43bbf
6378821: bitCount() should use POPC on SPARC processors and AMD+10h
twisti
parents:
642
diff
changeset
|
157 } |
3839 | 158 } else if (UsePopCountInstruction) { |
159 warning("POPC instruction is not available on this CPU"); | |
160 FLAG_SET_DEFAULT(UsePopCountInstruction, false); | |
161 } | |
162 | |
163 // T4 and newer Sparc cpus have new compare and branch instruction. | |
164 if (has_cbcond()) { | |
165 if (FLAG_IS_DEFAULT(UseCBCond)) { | |
166 FLAG_SET_DEFAULT(UseCBCond, true); | |
167 } | |
168 } else if (UseCBCond) { | |
169 warning("CBCOND instruction is not available on this CPU"); | |
170 FLAG_SET_DEFAULT(UseCBCond, false); | |
643
c771b7f43bbf
6378821: bitCount() should use POPC on SPARC processors and AMD+10h
twisti
parents:
642
diff
changeset
|
171 } |
c771b7f43bbf
6378821: bitCount() should use POPC on SPARC processors and AMD+10h
twisti
parents:
642
diff
changeset
|
172 |
1730
f55c4f82ab9d
6978249: spill between cpu and fpu registers when those moves are fast
never
parents:
1579
diff
changeset
|
173 #ifdef COMPILER2 |
3839 | 174 // T4 and newer Sparc cpus have fast RDPC. |
175 if (has_fast_rdpc() && FLAG_IS_DEFAULT(UseRDPCForConstantTableBase)) { | |
176 // FLAG_SET_DEFAULT(UseRDPCForConstantTableBase, true); | |
177 } | |
178 | |
1730
f55c4f82ab9d
6978249: spill between cpu and fpu registers when those moves are fast
never
parents:
1579
diff
changeset
|
179 // Currently not supported anywhere. |
f55c4f82ab9d
6978249: spill between cpu and fpu registers when those moves are fast
never
parents:
1579
diff
changeset
|
180 FLAG_SET_DEFAULT(UseFPUForSpilling, false); |
3851 | 181 |
182 assert((InteriorEntryAlignment % relocInfo::addr_unit()) == 0, "alignment is not a multiple of NOP size"); | |
1730
f55c4f82ab9d
6978249: spill between cpu and fpu registers when those moves are fast
never
parents:
1579
diff
changeset
|
183 #endif |
f55c4f82ab9d
6978249: spill between cpu and fpu registers when those moves are fast
never
parents:
1579
diff
changeset
|
184 |
3851 | 185 assert((CodeEntryAlignment % relocInfo::addr_unit()) == 0, "alignment is not a multiple of NOP size"); |
186 assert((OptoLoopAlignment % relocInfo::addr_unit()) == 0, "alignment is not a multiple of NOP size"); | |
187 | |
0 | 188 char buf[512]; |
3839 | 189 jio_snprintf(buf, sizeof(buf), "%s%s%s%s%s%s%s%s%s%s%s%s%s%s", |
190 (has_v9() ? ", v9" : (has_v8() ? ", v8" : "")), | |
643
c771b7f43bbf
6378821: bitCount() should use POPC on SPARC processors and AMD+10h
twisti
parents:
642
diff
changeset
|
191 (has_hardware_popc() ? ", popc" : ""), |
3839 | 192 (has_vis1() ? ", vis1" : ""), |
193 (has_vis2() ? ", vis2" : ""), | |
194 (has_vis3() ? ", vis3" : ""), | |
195 (has_blk_init() ? ", blk_init" : ""), | |
196 (has_cbcond() ? ", cbcond" : ""), | |
197 (is_ultra3() ? ", ultra3" : ""), | |
198 (is_sun4v() ? ", sun4v" : ""), | |
199 (is_niagara_plus() ? ", niagara_plus" : (is_niagara() ? ", niagara" : "")), | |
200 (is_sparc64() ? ", sparc64" : ""), | |
641
6af0a709d52b
6812587: Use auxv to determine SPARC hardware features on Solaris
twisti
parents:
196
diff
changeset
|
201 (!has_hardware_mul32() ? ", no-mul32" : ""), |
6af0a709d52b
6812587: Use auxv to determine SPARC hardware features on Solaris
twisti
parents:
196
diff
changeset
|
202 (!has_hardware_div32() ? ", no-div32" : ""), |
0 | 203 (!has_hardware_fsmuld() ? ", no-fsmuld" : "")); |
204 | |
205 // buf is started with ", " or is empty | |
206 _features_str = strdup(strlen(buf) > 2 ? buf + 2 : buf); | |
207 | |
3804 | 208 // UseVIS is set to the smallest of what hardware supports and what |
209 // the command line requires. I.e., you cannot set UseVIS to 3 on | |
210 // older UltraSparc which do not support it. | |
211 if (UseVIS > 3) UseVIS=3; | |
212 if (UseVIS < 0) UseVIS=0; | |
213 if (!has_vis3()) // Drop to 2 if no VIS3 support | |
214 UseVIS = MIN2((intx)2,UseVIS); | |
215 if (!has_vis2()) // Drop to 1 if no VIS2 support | |
216 UseVIS = MIN2((intx)1,UseVIS); | |
217 if (!has_vis1()) // Drop to 0 if no VIS1 support | |
218 UseVIS = 0; | |
219 | |
0 | 220 #ifndef PRODUCT |
221 if (PrintMiscellaneous && Verbose) { | |
3854 | 222 tty->print("Allocation"); |
0 | 223 if (AllocatePrefetchStyle <= 0) { |
3854 | 224 tty->print_cr(": no prefetching"); |
0 | 225 } else { |
3854 | 226 tty->print(" prefetching: "); |
227 if (AllocatePrefetchInstr == 0) { | |
228 tty->print("PREFETCH"); | |
229 } else if (AllocatePrefetchInstr == 1) { | |
230 tty->print("BIS"); | |
231 } | |
0 | 232 if (AllocatePrefetchLines > 1) { |
3854 | 233 tty->print_cr(" at distance %d, %d lines of %d bytes", AllocatePrefetchDistance, AllocatePrefetchLines, AllocatePrefetchStepSize); |
0 | 234 } else { |
3854 | 235 tty->print_cr(" at distance %d, one line of %d bytes", AllocatePrefetchDistance, AllocatePrefetchStepSize); |
0 | 236 } |
237 } | |
238 if (PrefetchCopyIntervalInBytes > 0) { | |
239 tty->print_cr("PrefetchCopyIntervalInBytes %d", PrefetchCopyIntervalInBytes); | |
240 } | |
241 if (PrefetchScanIntervalInBytes > 0) { | |
242 tty->print_cr("PrefetchScanIntervalInBytes %d", PrefetchScanIntervalInBytes); | |
243 } | |
244 if (PrefetchFieldsAhead > 0) { | |
245 tty->print_cr("PrefetchFieldsAhead %d", PrefetchFieldsAhead); | |
246 } | |
247 } | |
248 #endif // PRODUCT | |
249 } | |
250 | |
251 void VM_Version::print_features() { | |
252 tty->print_cr("Version:%s", cpu_features()); | |
253 } | |
254 | |
255 int VM_Version::determine_features() { | |
256 if (UseV8InstrsOnly) { | |
257 NOT_PRODUCT(if (PrintMiscellaneous && Verbose) tty->print_cr("Version is Forced-V8");) | |
258 return generic_v8_m; | |
259 } | |
260 | |
261 int features = platform_features(unknown_m); // platform_features() is os_arch specific | |
262 | |
263 if (features == unknown_m) { | |
264 features = generic_v9_m; | |
265 warning("Cannot recognize SPARC version. Default to V9"); | |
266 } | |
267 | |
2080 | 268 assert(is_T_family(features) == is_niagara(features), "Niagara should be T series"); |
269 if (UseNiagaraInstrs) { // Force code generation for Niagara | |
270 if (is_T_family(features)) { | |
0 | 271 // Happy to accomodate... |
272 } else { | |
273 NOT_PRODUCT(if (PrintMiscellaneous && Verbose) tty->print_cr("Version is Forced-Niagara");) | |
2080 | 274 features |= T_family_m; |
0 | 275 } |
276 } else { | |
2080 | 277 if (is_T_family(features) && !FLAG_IS_DEFAULT(UseNiagaraInstrs)) { |
0 | 278 NOT_PRODUCT(if (PrintMiscellaneous && Verbose) tty->print_cr("Version is Forced-Not-Niagara");) |
2080 | 279 features &= ~(T_family_m | T1_model_m); |
0 | 280 } else { |
281 // Happy to accomodate... | |
282 } | |
283 } | |
284 | |
285 return features; | |
286 } | |
287 | |
288 static int saved_features = 0; | |
289 | |
290 void VM_Version::allow_all() { | |
291 saved_features = _features; | |
292 _features = all_features_m; | |
293 } | |
294 | |
295 void VM_Version::revert() { | |
296 _features = saved_features; | |
297 } | |
10
28372612af5e
6362677: Change parallel GC collector default number of parallel GC threads.
jmasa
parents:
0
diff
changeset
|
298 |
28372612af5e
6362677: Change parallel GC collector default number of parallel GC threads.
jmasa
parents:
0
diff
changeset
|
299 unsigned int VM_Version::calc_parallel_worker_threads() { |
28372612af5e
6362677: Change parallel GC collector default number of parallel GC threads.
jmasa
parents:
0
diff
changeset
|
300 unsigned int result; |
2080 | 301 if (is_niagara_plus()) { |
10
28372612af5e
6362677: Change parallel GC collector default number of parallel GC threads.
jmasa
parents:
0
diff
changeset
|
302 result = nof_parallel_worker_threads(5, 16, 8); |
28372612af5e
6362677: Change parallel GC collector default number of parallel GC threads.
jmasa
parents:
0
diff
changeset
|
303 } else { |
28372612af5e
6362677: Change parallel GC collector default number of parallel GC threads.
jmasa
parents:
0
diff
changeset
|
304 result = nof_parallel_worker_threads(5, 8, 8); |
28372612af5e
6362677: Change parallel GC collector default number of parallel GC threads.
jmasa
parents:
0
diff
changeset
|
305 } |
28372612af5e
6362677: Change parallel GC collector default number of parallel GC threads.
jmasa
parents:
0
diff
changeset
|
306 return result; |
28372612af5e
6362677: Change parallel GC collector default number of parallel GC threads.
jmasa
parents:
0
diff
changeset
|
307 } |