annotate src/cpu/sparc/vm/stubGenerator_sparc.cpp @ 21125:41f048caa3dd

Predefine value outside of COMPILERGRAAL
author Stefan Anzinger <stefan.anzinger@oracle.com>
date Mon, 27 Apr 2015 18:36:16 +0200
parents 7848fc12602b
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1 /*
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
2 * Copyright (c) 1997, 2014, Oracle and/or its affiliates. All rights reserved.
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
a61af66fc99e Initial load
duke
parents:
diff changeset
4 *
a61af66fc99e Initial load
duke
parents:
diff changeset
5 * This code is free software; you can redistribute it and/or modify it
a61af66fc99e Initial load
duke
parents:
diff changeset
6 * under the terms of the GNU General Public License version 2 only, as
a61af66fc99e Initial load
duke
parents:
diff changeset
7 * published by the Free Software Foundation.
a61af66fc99e Initial load
duke
parents:
diff changeset
8 *
a61af66fc99e Initial load
duke
parents:
diff changeset
9 * This code is distributed in the hope that it will be useful, but WITHOUT
a61af66fc99e Initial load
duke
parents:
diff changeset
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
a61af66fc99e Initial load
duke
parents:
diff changeset
11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
a61af66fc99e Initial load
duke
parents:
diff changeset
12 * version 2 for more details (a copy is included in the LICENSE file that
a61af66fc99e Initial load
duke
parents:
diff changeset
13 * accompanied this code).
a61af66fc99e Initial load
duke
parents:
diff changeset
14 *
a61af66fc99e Initial load
duke
parents:
diff changeset
15 * You should have received a copy of the GNU General Public License version
a61af66fc99e Initial load
duke
parents:
diff changeset
16 * 2 along with this work; if not, write to the Free Software Foundation,
a61af66fc99e Initial load
duke
parents:
diff changeset
17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
a61af66fc99e Initial load
duke
parents:
diff changeset
18 *
1552
c18cbe5936b8 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 1506
diff changeset
19 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
c18cbe5936b8 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 1506
diff changeset
20 * or visit www.oracle.com if you need additional information or have any
c18cbe5936b8 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 1506
diff changeset
21 * questions.
0
a61af66fc99e Initial load
duke
parents:
diff changeset
22 *
a61af66fc99e Initial load
duke
parents:
diff changeset
23 */
a61af66fc99e Initial load
duke
parents:
diff changeset
24
1972
f95d63e2154a 6989984: Use standard include model for Hospot
stefank
parents: 1844
diff changeset
25 #include "precompiled.hpp"
7204
f0c2369fda5a 8003250: SPARC: move MacroAssembler into separate file
twisti
parents: 6831
diff changeset
26 #include "asm/macroAssembler.inline.hpp"
1972
f95d63e2154a 6989984: Use standard include model for Hospot
stefank
parents: 1844
diff changeset
27 #include "interpreter/interpreter.hpp"
f95d63e2154a 6989984: Use standard include model for Hospot
stefank
parents: 1844
diff changeset
28 #include "nativeInst_sparc.hpp"
f95d63e2154a 6989984: Use standard include model for Hospot
stefank
parents: 1844
diff changeset
29 #include "oops/instanceOop.hpp"
6725
da91efe96a93 6964458: Reimplement class meta-data storage to use native memory
coleenp
parents: 6266
diff changeset
30 #include "oops/method.hpp"
1972
f95d63e2154a 6989984: Use standard include model for Hospot
stefank
parents: 1844
diff changeset
31 #include "oops/objArrayKlass.hpp"
f95d63e2154a 6989984: Use standard include model for Hospot
stefank
parents: 1844
diff changeset
32 #include "oops/oop.inline.hpp"
f95d63e2154a 6989984: Use standard include model for Hospot
stefank
parents: 1844
diff changeset
33 #include "prims/methodHandles.hpp"
f95d63e2154a 6989984: Use standard include model for Hospot
stefank
parents: 1844
diff changeset
34 #include "runtime/frame.inline.hpp"
f95d63e2154a 6989984: Use standard include model for Hospot
stefank
parents: 1844
diff changeset
35 #include "runtime/handles.inline.hpp"
f95d63e2154a 6989984: Use standard include model for Hospot
stefank
parents: 1844
diff changeset
36 #include "runtime/sharedRuntime.hpp"
f95d63e2154a 6989984: Use standard include model for Hospot
stefank
parents: 1844
diff changeset
37 #include "runtime/stubCodeGenerator.hpp"
f95d63e2154a 6989984: Use standard include model for Hospot
stefank
parents: 1844
diff changeset
38 #include "runtime/stubRoutines.hpp"
7180
f34d701e952e 8003935: Simplify the needed includes for using Thread::current()
stefank
parents: 6831
diff changeset
39 #include "runtime/thread.inline.hpp"
1972
f95d63e2154a 6989984: Use standard include model for Hospot
stefank
parents: 1844
diff changeset
40 #include "utilities/top.hpp"
f95d63e2154a 6989984: Use standard include model for Hospot
stefank
parents: 1844
diff changeset
41 #ifdef COMPILER2
f95d63e2154a 6989984: Use standard include model for Hospot
stefank
parents: 1844
diff changeset
42 #include "opto/runtime.hpp"
f95d63e2154a 6989984: Use standard include model for Hospot
stefank
parents: 1844
diff changeset
43 #endif
0
a61af66fc99e Initial load
duke
parents:
diff changeset
44
a61af66fc99e Initial load
duke
parents:
diff changeset
45 // Declaration and definition of StubGenerator (no .hpp file).
a61af66fc99e Initial load
duke
parents:
diff changeset
46 // For a more detailed description of the stub routine structure
a61af66fc99e Initial load
duke
parents:
diff changeset
47 // see the comment in stubRoutines.hpp.
a61af66fc99e Initial load
duke
parents:
diff changeset
48
a61af66fc99e Initial load
duke
parents:
diff changeset
49 #define __ _masm->
a61af66fc99e Initial load
duke
parents:
diff changeset
50
a61af66fc99e Initial load
duke
parents:
diff changeset
51 #ifdef PRODUCT
a61af66fc99e Initial load
duke
parents:
diff changeset
52 #define BLOCK_COMMENT(str) /* nothing */
a61af66fc99e Initial load
duke
parents:
diff changeset
53 #else
a61af66fc99e Initial load
duke
parents:
diff changeset
54 #define BLOCK_COMMENT(str) __ block_comment(str)
a61af66fc99e Initial load
duke
parents:
diff changeset
55 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
56
a61af66fc99e Initial load
duke
parents:
diff changeset
57 #define BIND(label) bind(label); BLOCK_COMMENT(#label ":")
a61af66fc99e Initial load
duke
parents:
diff changeset
58
a61af66fc99e Initial load
duke
parents:
diff changeset
59 // Note: The register L7 is used as L7_thread_cache, and may not be used
a61af66fc99e Initial load
duke
parents:
diff changeset
60 // any other way within this module.
a61af66fc99e Initial load
duke
parents:
diff changeset
61
a61af66fc99e Initial load
duke
parents:
diff changeset
62
a61af66fc99e Initial load
duke
parents:
diff changeset
63 static const Register& Lstub_temp = L2;
a61af66fc99e Initial load
duke
parents:
diff changeset
64
a61af66fc99e Initial load
duke
parents:
diff changeset
65 // -------------------------------------------------------------------------------------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
66 // Stub Code definitions
a61af66fc99e Initial load
duke
parents:
diff changeset
67
a61af66fc99e Initial load
duke
parents:
diff changeset
68 static address handle_unsafe_access() {
a61af66fc99e Initial load
duke
parents:
diff changeset
69 JavaThread* thread = JavaThread::current();
a61af66fc99e Initial load
duke
parents:
diff changeset
70 address pc = thread->saved_exception_pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
71 address npc = thread->saved_exception_npc();
a61af66fc99e Initial load
duke
parents:
diff changeset
72 // pc is the instruction which we must emulate
a61af66fc99e Initial load
duke
parents:
diff changeset
73 // doing a no-op is fine: return garbage from the load
a61af66fc99e Initial load
duke
parents:
diff changeset
74
a61af66fc99e Initial load
duke
parents:
diff changeset
75 // request an async exception
a61af66fc99e Initial load
duke
parents:
diff changeset
76 thread->set_pending_unsafe_access_error();
a61af66fc99e Initial load
duke
parents:
diff changeset
77
a61af66fc99e Initial load
duke
parents:
diff changeset
78 // return address of next instruction to execute
a61af66fc99e Initial load
duke
parents:
diff changeset
79 return npc;
a61af66fc99e Initial load
duke
parents:
diff changeset
80 }
a61af66fc99e Initial load
duke
parents:
diff changeset
81
a61af66fc99e Initial load
duke
parents:
diff changeset
82 class StubGenerator: public StubCodeGenerator {
a61af66fc99e Initial load
duke
parents:
diff changeset
83 private:
a61af66fc99e Initial load
duke
parents:
diff changeset
84
a61af66fc99e Initial load
duke
parents:
diff changeset
85 #ifdef PRODUCT
17939
0fb5b60ab4a2 8022070: Compilation error in stubGenerator_sparc.cpp with some compilers
mikael
parents: 17910
diff changeset
86 #define inc_counter_np(a,b,c)
0
a61af66fc99e Initial load
duke
parents:
diff changeset
87 #else
a61af66fc99e Initial load
duke
parents:
diff changeset
88 #define inc_counter_np(counter, t1, t2) \
a61af66fc99e Initial load
duke
parents:
diff changeset
89 BLOCK_COMMENT("inc_counter " #counter); \
727
6b2273dd6fa9 6822110: Add AddressLiteral class on SPARC
twisti
parents: 671
diff changeset
90 __ inc_counter(&counter, t1, t2);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
91 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
92
a61af66fc99e Initial load
duke
parents:
diff changeset
93 //----------------------------------------------------------------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
94 // Call stubs are used to call Java from C
a61af66fc99e Initial load
duke
parents:
diff changeset
95
a61af66fc99e Initial load
duke
parents:
diff changeset
96 address generate_call_stub(address& return_pc) {
a61af66fc99e Initial load
duke
parents:
diff changeset
97 StubCodeMark mark(this, "StubRoutines", "call_stub");
a61af66fc99e Initial load
duke
parents:
diff changeset
98 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
99
a61af66fc99e Initial load
duke
parents:
diff changeset
100 // Incoming arguments:
a61af66fc99e Initial load
duke
parents:
diff changeset
101 //
a61af66fc99e Initial load
duke
parents:
diff changeset
102 // o0 : call wrapper address
a61af66fc99e Initial load
duke
parents:
diff changeset
103 // o1 : result (address)
a61af66fc99e Initial load
duke
parents:
diff changeset
104 // o2 : result type
a61af66fc99e Initial load
duke
parents:
diff changeset
105 // o3 : method
a61af66fc99e Initial load
duke
parents:
diff changeset
106 // o4 : (interpreter) entry point
a61af66fc99e Initial load
duke
parents:
diff changeset
107 // o5 : parameters (address)
a61af66fc99e Initial load
duke
parents:
diff changeset
108 // [sp + 0x5c]: parameter size (in words)
a61af66fc99e Initial load
duke
parents:
diff changeset
109 // [sp + 0x60]: thread
a61af66fc99e Initial load
duke
parents:
diff changeset
110 //
a61af66fc99e Initial load
duke
parents:
diff changeset
111 // +---------------+ <--- sp + 0
a61af66fc99e Initial load
duke
parents:
diff changeset
112 // | |
a61af66fc99e Initial load
duke
parents:
diff changeset
113 // . reg save area .
a61af66fc99e Initial load
duke
parents:
diff changeset
114 // | |
a61af66fc99e Initial load
duke
parents:
diff changeset
115 // +---------------+ <--- sp + 0x40
a61af66fc99e Initial load
duke
parents:
diff changeset
116 // | |
a61af66fc99e Initial load
duke
parents:
diff changeset
117 // . extra 7 slots .
a61af66fc99e Initial load
duke
parents:
diff changeset
118 // | |
a61af66fc99e Initial load
duke
parents:
diff changeset
119 // +---------------+ <--- sp + 0x5c
a61af66fc99e Initial load
duke
parents:
diff changeset
120 // | param. size |
a61af66fc99e Initial load
duke
parents:
diff changeset
121 // +---------------+ <--- sp + 0x60
a61af66fc99e Initial load
duke
parents:
diff changeset
122 // | thread |
a61af66fc99e Initial load
duke
parents:
diff changeset
123 // +---------------+
a61af66fc99e Initial load
duke
parents:
diff changeset
124 // | |
a61af66fc99e Initial load
duke
parents:
diff changeset
125
a61af66fc99e Initial load
duke
parents:
diff changeset
126 // note: if the link argument position changes, adjust
a61af66fc99e Initial load
duke
parents:
diff changeset
127 // the code in frame::entry_frame_call_wrapper()
a61af66fc99e Initial load
duke
parents:
diff changeset
128
a61af66fc99e Initial load
duke
parents:
diff changeset
129 const Argument link = Argument(0, false); // used only for GC
a61af66fc99e Initial load
duke
parents:
diff changeset
130 const Argument result = Argument(1, false);
a61af66fc99e Initial load
duke
parents:
diff changeset
131 const Argument result_type = Argument(2, false);
a61af66fc99e Initial load
duke
parents:
diff changeset
132 const Argument method = Argument(3, false);
a61af66fc99e Initial load
duke
parents:
diff changeset
133 const Argument entry_point = Argument(4, false);
a61af66fc99e Initial load
duke
parents:
diff changeset
134 const Argument parameters = Argument(5, false);
a61af66fc99e Initial load
duke
parents:
diff changeset
135 const Argument parameter_size = Argument(6, false);
a61af66fc99e Initial load
duke
parents:
diff changeset
136 const Argument thread = Argument(7, false);
a61af66fc99e Initial load
duke
parents:
diff changeset
137
a61af66fc99e Initial load
duke
parents:
diff changeset
138 // setup thread register
a61af66fc99e Initial load
duke
parents:
diff changeset
139 __ ld_ptr(thread.as_address(), G2_thread);
113
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
140 __ reinit_heapbase();
0
a61af66fc99e Initial load
duke
parents:
diff changeset
141
a61af66fc99e Initial load
duke
parents:
diff changeset
142 #ifdef ASSERT
a61af66fc99e Initial load
duke
parents:
diff changeset
143 // make sure we have no pending exceptions
a61af66fc99e Initial load
duke
parents:
diff changeset
144 { const Register t = G3_scratch;
a61af66fc99e Initial load
duke
parents:
diff changeset
145 Label L;
a61af66fc99e Initial load
duke
parents:
diff changeset
146 __ ld_ptr(G2_thread, in_bytes(Thread::pending_exception_offset()), t);
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
147 __ br_null_short(t, Assembler::pt, L);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
148 __ stop("StubRoutines::call_stub: entered with pending exception");
a61af66fc99e Initial load
duke
parents:
diff changeset
149 __ bind(L);
a61af66fc99e Initial load
duke
parents:
diff changeset
150 }
a61af66fc99e Initial load
duke
parents:
diff changeset
151 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
152
a61af66fc99e Initial load
duke
parents:
diff changeset
153 // create activation frame & allocate space for parameters
a61af66fc99e Initial load
duke
parents:
diff changeset
154 { const Register t = G3_scratch;
a61af66fc99e Initial load
duke
parents:
diff changeset
155 __ ld_ptr(parameter_size.as_address(), t); // get parameter size (in words)
a61af66fc99e Initial load
duke
parents:
diff changeset
156 __ add(t, frame::memory_parameter_word_sp_offset, t); // add space for save area (in words)
a61af66fc99e Initial load
duke
parents:
diff changeset
157 __ round_to(t, WordsPerLong); // make sure it is multiple of 2 (in words)
1506
2338d41fbd81 6943304: remove tagged stack interpreter
twisti
parents: 1503
diff changeset
158 __ sll(t, Interpreter::logStackElementSize, t); // compute number of bytes
0
a61af66fc99e Initial load
duke
parents:
diff changeset
159 __ neg(t); // negate so it can be used with save
a61af66fc99e Initial load
duke
parents:
diff changeset
160 __ save(SP, t, SP); // setup new frame
a61af66fc99e Initial load
duke
parents:
diff changeset
161 }
a61af66fc99e Initial load
duke
parents:
diff changeset
162
a61af66fc99e Initial load
duke
parents:
diff changeset
163 // +---------------+ <--- sp + 0
a61af66fc99e Initial load
duke
parents:
diff changeset
164 // | |
a61af66fc99e Initial load
duke
parents:
diff changeset
165 // . reg save area .
a61af66fc99e Initial load
duke
parents:
diff changeset
166 // | |
a61af66fc99e Initial load
duke
parents:
diff changeset
167 // +---------------+ <--- sp + 0x40
a61af66fc99e Initial load
duke
parents:
diff changeset
168 // | |
a61af66fc99e Initial load
duke
parents:
diff changeset
169 // . extra 7 slots .
a61af66fc99e Initial load
duke
parents:
diff changeset
170 // | |
a61af66fc99e Initial load
duke
parents:
diff changeset
171 // +---------------+ <--- sp + 0x5c
a61af66fc99e Initial load
duke
parents:
diff changeset
172 // | empty slot | (only if parameter size is even)
a61af66fc99e Initial load
duke
parents:
diff changeset
173 // +---------------+
a61af66fc99e Initial load
duke
parents:
diff changeset
174 // | |
a61af66fc99e Initial load
duke
parents:
diff changeset
175 // . parameters .
a61af66fc99e Initial load
duke
parents:
diff changeset
176 // | |
a61af66fc99e Initial load
duke
parents:
diff changeset
177 // +---------------+ <--- fp + 0
a61af66fc99e Initial load
duke
parents:
diff changeset
178 // | |
a61af66fc99e Initial load
duke
parents:
diff changeset
179 // . reg save area .
a61af66fc99e Initial load
duke
parents:
diff changeset
180 // | |
a61af66fc99e Initial load
duke
parents:
diff changeset
181 // +---------------+ <--- fp + 0x40
a61af66fc99e Initial load
duke
parents:
diff changeset
182 // | |
a61af66fc99e Initial load
duke
parents:
diff changeset
183 // . extra 7 slots .
a61af66fc99e Initial load
duke
parents:
diff changeset
184 // | |
a61af66fc99e Initial load
duke
parents:
diff changeset
185 // +---------------+ <--- fp + 0x5c
a61af66fc99e Initial load
duke
parents:
diff changeset
186 // | param. size |
a61af66fc99e Initial load
duke
parents:
diff changeset
187 // +---------------+ <--- fp + 0x60
a61af66fc99e Initial load
duke
parents:
diff changeset
188 // | thread |
a61af66fc99e Initial load
duke
parents:
diff changeset
189 // +---------------+
a61af66fc99e Initial load
duke
parents:
diff changeset
190 // | |
a61af66fc99e Initial load
duke
parents:
diff changeset
191
a61af66fc99e Initial load
duke
parents:
diff changeset
192 // pass parameters if any
a61af66fc99e Initial load
duke
parents:
diff changeset
193 BLOCK_COMMENT("pass parameters if any");
a61af66fc99e Initial load
duke
parents:
diff changeset
194 { const Register src = parameters.as_in().as_register();
a61af66fc99e Initial load
duke
parents:
diff changeset
195 const Register dst = Lentry_args;
a61af66fc99e Initial load
duke
parents:
diff changeset
196 const Register tmp = G3_scratch;
a61af66fc99e Initial load
duke
parents:
diff changeset
197 const Register cnt = G4_scratch;
a61af66fc99e Initial load
duke
parents:
diff changeset
198
a61af66fc99e Initial load
duke
parents:
diff changeset
199 // test if any parameters & setup of Lentry_args
a61af66fc99e Initial load
duke
parents:
diff changeset
200 Label exit;
a61af66fc99e Initial load
duke
parents:
diff changeset
201 __ ld_ptr(parameter_size.as_in().as_address(), cnt); // parameter counter
a61af66fc99e Initial load
duke
parents:
diff changeset
202 __ add( FP, STACK_BIAS, dst );
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
203 __ cmp_zero_and_br(Assembler::zero, cnt, exit);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
204 __ delayed()->sub(dst, BytesPerWord, dst); // setup Lentry_args
a61af66fc99e Initial load
duke
parents:
diff changeset
205
a61af66fc99e Initial load
duke
parents:
diff changeset
206 // copy parameters if any
a61af66fc99e Initial load
duke
parents:
diff changeset
207 Label loop;
a61af66fc99e Initial load
duke
parents:
diff changeset
208 __ BIND(loop);
a61af66fc99e Initial load
duke
parents:
diff changeset
209 // Store parameter value
a61af66fc99e Initial load
duke
parents:
diff changeset
210 __ ld_ptr(src, 0, tmp);
a61af66fc99e Initial load
duke
parents:
diff changeset
211 __ add(src, BytesPerWord, src);
1506
2338d41fbd81 6943304: remove tagged stack interpreter
twisti
parents: 1503
diff changeset
212 __ st_ptr(tmp, dst, 0);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
213 __ deccc(cnt);
a61af66fc99e Initial load
duke
parents:
diff changeset
214 __ br(Assembler::greater, false, Assembler::pt, loop);
1506
2338d41fbd81 6943304: remove tagged stack interpreter
twisti
parents: 1503
diff changeset
215 __ delayed()->sub(dst, Interpreter::stackElementSize, dst);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
216
a61af66fc99e Initial load
duke
parents:
diff changeset
217 // done
a61af66fc99e Initial load
duke
parents:
diff changeset
218 __ BIND(exit);
a61af66fc99e Initial load
duke
parents:
diff changeset
219 }
a61af66fc99e Initial load
duke
parents:
diff changeset
220
a61af66fc99e Initial load
duke
parents:
diff changeset
221 // setup parameters, method & call Java function
a61af66fc99e Initial load
duke
parents:
diff changeset
222 #ifdef ASSERT
a61af66fc99e Initial load
duke
parents:
diff changeset
223 // layout_activation_impl checks it's notion of saved SP against
a61af66fc99e Initial load
duke
parents:
diff changeset
224 // this register, so if this changes update it as well.
a61af66fc99e Initial load
duke
parents:
diff changeset
225 const Register saved_SP = Lscratch;
a61af66fc99e Initial load
duke
parents:
diff changeset
226 __ mov(SP, saved_SP); // keep track of SP before call
a61af66fc99e Initial load
duke
parents:
diff changeset
227 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
228
a61af66fc99e Initial load
duke
parents:
diff changeset
229 // setup parameters
a61af66fc99e Initial load
duke
parents:
diff changeset
230 const Register t = G3_scratch;
a61af66fc99e Initial load
duke
parents:
diff changeset
231 __ ld_ptr(parameter_size.as_in().as_address(), t); // get parameter size (in words)
1506
2338d41fbd81 6943304: remove tagged stack interpreter
twisti
parents: 1503
diff changeset
232 __ sll(t, Interpreter::logStackElementSize, t); // compute number of bytes
0
a61af66fc99e Initial load
duke
parents:
diff changeset
233 __ sub(FP, t, Gargs); // setup parameter pointer
a61af66fc99e Initial load
duke
parents:
diff changeset
234 #ifdef _LP64
a61af66fc99e Initial load
duke
parents:
diff changeset
235 __ add( Gargs, STACK_BIAS, Gargs ); // Account for LP64 stack bias
a61af66fc99e Initial load
duke
parents:
diff changeset
236 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
237 __ mov(SP, O5_savedSP);
a61af66fc99e Initial load
duke
parents:
diff changeset
238
a61af66fc99e Initial load
duke
parents:
diff changeset
239
a61af66fc99e Initial load
duke
parents:
diff changeset
240 // do the call
a61af66fc99e Initial load
duke
parents:
diff changeset
241 //
a61af66fc99e Initial load
duke
parents:
diff changeset
242 // the following register must be setup:
a61af66fc99e Initial load
duke
parents:
diff changeset
243 //
a61af66fc99e Initial load
duke
parents:
diff changeset
244 // G2_thread
a61af66fc99e Initial load
duke
parents:
diff changeset
245 // G5_method
a61af66fc99e Initial load
duke
parents:
diff changeset
246 // Gargs
a61af66fc99e Initial load
duke
parents:
diff changeset
247 BLOCK_COMMENT("call Java function");
a61af66fc99e Initial load
duke
parents:
diff changeset
248 __ jmpl(entry_point.as_in().as_register(), G0, O7);
a61af66fc99e Initial load
duke
parents:
diff changeset
249 __ delayed()->mov(method.as_in().as_register(), G5_method); // setup method
a61af66fc99e Initial load
duke
parents:
diff changeset
250
a61af66fc99e Initial load
duke
parents:
diff changeset
251 BLOCK_COMMENT("call_stub_return_address:");
a61af66fc99e Initial load
duke
parents:
diff changeset
252 return_pc = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
253
a61af66fc99e Initial load
duke
parents:
diff changeset
254 // The callee, if it wasn't interpreted, can return with SP changed so
a61af66fc99e Initial load
duke
parents:
diff changeset
255 // we can no longer assert of change of SP.
a61af66fc99e Initial load
duke
parents:
diff changeset
256
a61af66fc99e Initial load
duke
parents:
diff changeset
257 // store result depending on type
a61af66fc99e Initial load
duke
parents:
diff changeset
258 // (everything that is not T_OBJECT, T_LONG, T_FLOAT, or T_DOUBLE
a61af66fc99e Initial load
duke
parents:
diff changeset
259 // is treated as T_INT)
a61af66fc99e Initial load
duke
parents:
diff changeset
260 { const Register addr = result .as_in().as_register();
a61af66fc99e Initial load
duke
parents:
diff changeset
261 const Register type = result_type.as_in().as_register();
a61af66fc99e Initial load
duke
parents:
diff changeset
262 Label is_long, is_float, is_double, is_object, exit;
a61af66fc99e Initial load
duke
parents:
diff changeset
263 __ cmp(type, T_OBJECT); __ br(Assembler::equal, false, Assembler::pn, is_object);
a61af66fc99e Initial load
duke
parents:
diff changeset
264 __ delayed()->cmp(type, T_FLOAT); __ br(Assembler::equal, false, Assembler::pn, is_float);
a61af66fc99e Initial load
duke
parents:
diff changeset
265 __ delayed()->cmp(type, T_DOUBLE); __ br(Assembler::equal, false, Assembler::pn, is_double);
a61af66fc99e Initial load
duke
parents:
diff changeset
266 __ delayed()->cmp(type, T_LONG); __ br(Assembler::equal, false, Assembler::pn, is_long);
a61af66fc99e Initial load
duke
parents:
diff changeset
267 __ delayed()->nop();
a61af66fc99e Initial load
duke
parents:
diff changeset
268
a61af66fc99e Initial load
duke
parents:
diff changeset
269 // store int result
a61af66fc99e Initial load
duke
parents:
diff changeset
270 __ st(O0, addr, G0);
a61af66fc99e Initial load
duke
parents:
diff changeset
271
a61af66fc99e Initial load
duke
parents:
diff changeset
272 __ BIND(exit);
a61af66fc99e Initial load
duke
parents:
diff changeset
273 __ ret();
a61af66fc99e Initial load
duke
parents:
diff changeset
274 __ delayed()->restore();
a61af66fc99e Initial load
duke
parents:
diff changeset
275
a61af66fc99e Initial load
duke
parents:
diff changeset
276 __ BIND(is_object);
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
277 __ ba(exit);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
278 __ delayed()->st_ptr(O0, addr, G0);
a61af66fc99e Initial load
duke
parents:
diff changeset
279
a61af66fc99e Initial load
duke
parents:
diff changeset
280 __ BIND(is_float);
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
281 __ ba(exit);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
282 __ delayed()->stf(FloatRegisterImpl::S, F0, addr, G0);
a61af66fc99e Initial load
duke
parents:
diff changeset
283
a61af66fc99e Initial load
duke
parents:
diff changeset
284 __ BIND(is_double);
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
285 __ ba(exit);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
286 __ delayed()->stf(FloatRegisterImpl::D, F0, addr, G0);
a61af66fc99e Initial load
duke
parents:
diff changeset
287
a61af66fc99e Initial load
duke
parents:
diff changeset
288 __ BIND(is_long);
a61af66fc99e Initial load
duke
parents:
diff changeset
289 #ifdef _LP64
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
290 __ ba(exit);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
291 __ delayed()->st_long(O0, addr, G0); // store entire long
a61af66fc99e Initial load
duke
parents:
diff changeset
292 #else
a61af66fc99e Initial load
duke
parents:
diff changeset
293 #if defined(COMPILER2)
a61af66fc99e Initial load
duke
parents:
diff changeset
294 // All return values are where we want them, except for Longs. C2 returns
a61af66fc99e Initial load
duke
parents:
diff changeset
295 // longs in G1 in the 32-bit build whereas the interpreter wants them in O0/O1.
a61af66fc99e Initial load
duke
parents:
diff changeset
296 // Since the interpreter will return longs in G1 and O0/O1 in the 32bit
a61af66fc99e Initial load
duke
parents:
diff changeset
297 // build we simply always use G1.
a61af66fc99e Initial load
duke
parents:
diff changeset
298 // Note: I tried to make c2 return longs in O0/O1 and G1 so we wouldn't have to
a61af66fc99e Initial load
duke
parents:
diff changeset
299 // do this here. Unfortunately if we did a rethrow we'd see an machepilog node
a61af66fc99e Initial load
duke
parents:
diff changeset
300 // first which would move g1 -> O0/O1 and destroy the exception we were throwing.
a61af66fc99e Initial load
duke
parents:
diff changeset
301
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
302 __ ba(exit);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
303 __ delayed()->stx(G1, addr, G0); // store entire long
a61af66fc99e Initial load
duke
parents:
diff changeset
304 #else
a61af66fc99e Initial load
duke
parents:
diff changeset
305 __ st(O1, addr, BytesPerInt);
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
306 __ ba(exit);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
307 __ delayed()->st(O0, addr, G0);
a61af66fc99e Initial load
duke
parents:
diff changeset
308 #endif /* COMPILER2 */
a61af66fc99e Initial load
duke
parents:
diff changeset
309 #endif /* _LP64 */
a61af66fc99e Initial load
duke
parents:
diff changeset
310 }
a61af66fc99e Initial load
duke
parents:
diff changeset
311 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
312 }
a61af66fc99e Initial load
duke
parents:
diff changeset
313
a61af66fc99e Initial load
duke
parents:
diff changeset
314
a61af66fc99e Initial load
duke
parents:
diff changeset
315 //----------------------------------------------------------------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
316 // Return point for a Java call if there's an exception thrown in Java code.
a61af66fc99e Initial load
duke
parents:
diff changeset
317 // The exception is caught and transformed into a pending exception stored in
a61af66fc99e Initial load
duke
parents:
diff changeset
318 // JavaThread that can be tested from within the VM.
a61af66fc99e Initial load
duke
parents:
diff changeset
319 //
a61af66fc99e Initial load
duke
parents:
diff changeset
320 // Oexception: exception oop
a61af66fc99e Initial load
duke
parents:
diff changeset
321
a61af66fc99e Initial load
duke
parents:
diff changeset
322 address generate_catch_exception() {
a61af66fc99e Initial load
duke
parents:
diff changeset
323 StubCodeMark mark(this, "StubRoutines", "catch_exception");
a61af66fc99e Initial load
duke
parents:
diff changeset
324
a61af66fc99e Initial load
duke
parents:
diff changeset
325 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
326 // verify that thread corresponds
a61af66fc99e Initial load
duke
parents:
diff changeset
327 __ verify_thread();
a61af66fc99e Initial load
duke
parents:
diff changeset
328
a61af66fc99e Initial load
duke
parents:
diff changeset
329 const Register& temp_reg = Gtemp;
727
6b2273dd6fa9 6822110: Add AddressLiteral class on SPARC
twisti
parents: 671
diff changeset
330 Address pending_exception_addr (G2_thread, Thread::pending_exception_offset());
6b2273dd6fa9 6822110: Add AddressLiteral class on SPARC
twisti
parents: 671
diff changeset
331 Address exception_file_offset_addr(G2_thread, Thread::exception_file_offset ());
6b2273dd6fa9 6822110: Add AddressLiteral class on SPARC
twisti
parents: 671
diff changeset
332 Address exception_line_offset_addr(G2_thread, Thread::exception_line_offset ());
0
a61af66fc99e Initial load
duke
parents:
diff changeset
333
a61af66fc99e Initial load
duke
parents:
diff changeset
334 // set pending exception
a61af66fc99e Initial load
duke
parents:
diff changeset
335 __ verify_oop(Oexception);
a61af66fc99e Initial load
duke
parents:
diff changeset
336 __ st_ptr(Oexception, pending_exception_addr);
a61af66fc99e Initial load
duke
parents:
diff changeset
337 __ set((intptr_t)__FILE__, temp_reg);
a61af66fc99e Initial load
duke
parents:
diff changeset
338 __ st_ptr(temp_reg, exception_file_offset_addr);
a61af66fc99e Initial load
duke
parents:
diff changeset
339 __ set((intptr_t)__LINE__, temp_reg);
a61af66fc99e Initial load
duke
parents:
diff changeset
340 __ st(temp_reg, exception_line_offset_addr);
a61af66fc99e Initial load
duke
parents:
diff changeset
341
a61af66fc99e Initial load
duke
parents:
diff changeset
342 // complete return to VM
a61af66fc99e Initial load
duke
parents:
diff changeset
343 assert(StubRoutines::_call_stub_return_address != NULL, "must have been generated before");
a61af66fc99e Initial load
duke
parents:
diff changeset
344
727
6b2273dd6fa9 6822110: Add AddressLiteral class on SPARC
twisti
parents: 671
diff changeset
345 AddressLiteral stub_ret(StubRoutines::_call_stub_return_address);
6b2273dd6fa9 6822110: Add AddressLiteral class on SPARC
twisti
parents: 671
diff changeset
346 __ jump_to(stub_ret, temp_reg);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
347 __ delayed()->nop();
a61af66fc99e Initial load
duke
parents:
diff changeset
348
a61af66fc99e Initial load
duke
parents:
diff changeset
349 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
350 }
a61af66fc99e Initial load
duke
parents:
diff changeset
351
a61af66fc99e Initial load
duke
parents:
diff changeset
352
a61af66fc99e Initial load
duke
parents:
diff changeset
353 //----------------------------------------------------------------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
354 // Continuation point for runtime calls returning with a pending exception
a61af66fc99e Initial load
duke
parents:
diff changeset
355 // The pending exception check happened in the runtime or native call stub
a61af66fc99e Initial load
duke
parents:
diff changeset
356 // The pending exception in Thread is converted into a Java-level exception
a61af66fc99e Initial load
duke
parents:
diff changeset
357 //
a61af66fc99e Initial load
duke
parents:
diff changeset
358 // Contract with Java-level exception handler: O0 = exception
a61af66fc99e Initial load
duke
parents:
diff changeset
359 // O1 = throwing pc
a61af66fc99e Initial load
duke
parents:
diff changeset
360
a61af66fc99e Initial load
duke
parents:
diff changeset
361 address generate_forward_exception() {
a61af66fc99e Initial load
duke
parents:
diff changeset
362 StubCodeMark mark(this, "StubRoutines", "forward_exception");
a61af66fc99e Initial load
duke
parents:
diff changeset
363 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
364
a61af66fc99e Initial load
duke
parents:
diff changeset
365 // Upon entry, O7 has the return address returning into Java
a61af66fc99e Initial load
duke
parents:
diff changeset
366 // (interpreted or compiled) code; i.e. the return address
a61af66fc99e Initial load
duke
parents:
diff changeset
367 // becomes the throwing pc.
a61af66fc99e Initial load
duke
parents:
diff changeset
368
a61af66fc99e Initial load
duke
parents:
diff changeset
369 const Register& handler_reg = Gtemp;
a61af66fc99e Initial load
duke
parents:
diff changeset
370
727
6b2273dd6fa9 6822110: Add AddressLiteral class on SPARC
twisti
parents: 671
diff changeset
371 Address exception_addr(G2_thread, Thread::pending_exception_offset());
0
a61af66fc99e Initial load
duke
parents:
diff changeset
372
a61af66fc99e Initial load
duke
parents:
diff changeset
373 #ifdef ASSERT
a61af66fc99e Initial load
duke
parents:
diff changeset
374 // make sure that this code is only executed if there is a pending exception
a61af66fc99e Initial load
duke
parents:
diff changeset
375 { Label L;
a61af66fc99e Initial load
duke
parents:
diff changeset
376 __ ld_ptr(exception_addr, Gtemp);
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
377 __ br_notnull_short(Gtemp, Assembler::pt, L);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
378 __ stop("StubRoutines::forward exception: no pending exception (1)");
a61af66fc99e Initial load
duke
parents:
diff changeset
379 __ bind(L);
a61af66fc99e Initial load
duke
parents:
diff changeset
380 }
a61af66fc99e Initial load
duke
parents:
diff changeset
381 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
382
a61af66fc99e Initial load
duke
parents:
diff changeset
383 // compute exception handler into handler_reg
a61af66fc99e Initial load
duke
parents:
diff changeset
384 __ get_thread();
a61af66fc99e Initial load
duke
parents:
diff changeset
385 __ ld_ptr(exception_addr, Oexception);
a61af66fc99e Initial load
duke
parents:
diff changeset
386 __ verify_oop(Oexception);
a61af66fc99e Initial load
duke
parents:
diff changeset
387 __ save_frame(0); // compensates for compiler weakness
a61af66fc99e Initial load
duke
parents:
diff changeset
388 __ add(O7->after_save(), frame::pc_return_offset, Lscratch); // save the issuing PC
a61af66fc99e Initial load
duke
parents:
diff changeset
389 BLOCK_COMMENT("call exception_handler_for_return_address");
1295
3cf667df43ef 6919934: JSR 292 needs to support x86 C1
twisti
parents: 1174
diff changeset
390 __ call_VM_leaf(L7_thread_cache, CAST_FROM_FN_PTR(address, SharedRuntime::exception_handler_for_return_address), G2_thread, Lscratch);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
391 __ mov(O0, handler_reg);
a61af66fc99e Initial load
duke
parents:
diff changeset
392 __ restore(); // compensates for compiler weakness
a61af66fc99e Initial load
duke
parents:
diff changeset
393
a61af66fc99e Initial load
duke
parents:
diff changeset
394 __ ld_ptr(exception_addr, Oexception);
a61af66fc99e Initial load
duke
parents:
diff changeset
395 __ add(O7, frame::pc_return_offset, Oissuing_pc); // save the issuing PC
a61af66fc99e Initial load
duke
parents:
diff changeset
396
a61af66fc99e Initial load
duke
parents:
diff changeset
397 #ifdef ASSERT
a61af66fc99e Initial load
duke
parents:
diff changeset
398 // make sure exception is set
a61af66fc99e Initial load
duke
parents:
diff changeset
399 { Label L;
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
400 __ br_notnull_short(Oexception, Assembler::pt, L);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
401 __ stop("StubRoutines::forward exception: no pending exception (2)");
a61af66fc99e Initial load
duke
parents:
diff changeset
402 __ bind(L);
a61af66fc99e Initial load
duke
parents:
diff changeset
403 }
a61af66fc99e Initial load
duke
parents:
diff changeset
404 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
405 // jump to exception handler
a61af66fc99e Initial load
duke
parents:
diff changeset
406 __ jmp(handler_reg, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
407 // clear pending exception
a61af66fc99e Initial load
duke
parents:
diff changeset
408 __ delayed()->st_ptr(G0, exception_addr);
a61af66fc99e Initial load
duke
parents:
diff changeset
409
a61af66fc99e Initial load
duke
parents:
diff changeset
410 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
411 }
a61af66fc99e Initial load
duke
parents:
diff changeset
412
11127
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
413 // Safefetch stubs.
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
414 void generate_safefetch(const char* name, int size, address* entry,
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
415 address* fault_pc, address* continuation_pc) {
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
416 // safefetch signatures:
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
417 // int SafeFetch32(int* adr, int errValue);
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
418 // intptr_t SafeFetchN (intptr_t* adr, intptr_t errValue);
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
419 //
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
420 // arguments:
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
421 // o0 = adr
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
422 // o1 = errValue
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
423 //
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
424 // result:
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
425 // o0 = *adr or errValue
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
426
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
427 StubCodeMark mark(this, "StubRoutines", name);
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
428
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
429 // Entry point, pc or function descriptor.
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
430 __ align(CodeEntryAlignment);
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
431 *entry = __ pc();
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
432
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
433 __ mov(O0, G1); // g1 = o0
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
434 __ mov(O1, O0); // o0 = o1
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
435 // Load *adr into c_rarg1, may fault.
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
436 *fault_pc = __ pc();
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
437 switch (size) {
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
438 case 4:
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
439 // int32_t
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
440 __ ldsw(G1, 0, O0); // o0 = [g1]
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
441 break;
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
442 case 8:
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
443 // int64_t
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
444 __ ldx(G1, 0, O0); // o0 = [g1]
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
445 break;
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
446 default:
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
447 ShouldNotReachHere();
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
448 }
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
449
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
450 // return errValue or *adr
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
451 *continuation_pc = __ pc();
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
452 // By convention with the trap handler we ensure there is a non-CTI
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
453 // instruction in the trap shadow.
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
454 __ nop();
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
455 __ retl();
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
456 __ delayed()->nop();
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
457 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
458
a61af66fc99e Initial load
duke
parents:
diff changeset
459 //------------------------------------------------------------------------------------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
460 // Continuation point for throwing of implicit exceptions that are not handled in
a61af66fc99e Initial load
duke
parents:
diff changeset
461 // the current activation. Fabricates an exception oop and initiates normal
a61af66fc99e Initial load
duke
parents:
diff changeset
462 // exception dispatching in this frame. Only callee-saved registers are preserved
a61af66fc99e Initial load
duke
parents:
diff changeset
463 // (through the normal register window / RegisterMap handling).
a61af66fc99e Initial load
duke
parents:
diff changeset
464 // If the compiler needs all registers to be preserved between the fault
a61af66fc99e Initial load
duke
parents:
diff changeset
465 // point and the exception handler then it must assume responsibility for that in
a61af66fc99e Initial load
duke
parents:
diff changeset
466 // AbstractCompiler::continuation_for_implicit_null_exception or
a61af66fc99e Initial load
duke
parents:
diff changeset
467 // continuation_for_implicit_division_by_zero_exception. All other implicit
a61af66fc99e Initial load
duke
parents:
diff changeset
468 // exceptions (e.g., NullPointerException or AbstractMethodError on entry) are
a61af66fc99e Initial load
duke
parents:
diff changeset
469 // either at call sites or otherwise assume that stack unwinding will be initiated,
a61af66fc99e Initial load
duke
parents:
diff changeset
470 // so caller saved registers were assumed volatile in the compiler.
a61af66fc99e Initial load
duke
parents:
diff changeset
471
a61af66fc99e Initial load
duke
parents:
diff changeset
472 // Note that we generate only this stub into a RuntimeStub, because it needs to be
a61af66fc99e Initial load
duke
parents:
diff changeset
473 // properly traversed and ignored during GC, so we change the meaning of the "__"
a61af66fc99e Initial load
duke
parents:
diff changeset
474 // macro within this method.
a61af66fc99e Initial load
duke
parents:
diff changeset
475 #undef __
a61af66fc99e Initial load
duke
parents:
diff changeset
476 #define __ masm->
a61af66fc99e Initial load
duke
parents:
diff changeset
477
3937
c565834fb592 7088020: SEGV in JNIHandleBlock::release_block
never
parents: 3903
diff changeset
478 address generate_throw_exception(const char* name, address runtime_entry,
3451
38fa55e5e792 7055355: JSR 292: crash while throwing WrongMethodTypeException
never
parents: 2324
diff changeset
479 Register arg1 = noreg, Register arg2 = noreg) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
480 #ifdef ASSERT
a61af66fc99e Initial load
duke
parents:
diff changeset
481 int insts_size = VerifyThread ? 1 * K : 600;
a61af66fc99e Initial load
duke
parents:
diff changeset
482 #else
a61af66fc99e Initial load
duke
parents:
diff changeset
483 int insts_size = VerifyThread ? 1 * K : 256;
a61af66fc99e Initial load
duke
parents:
diff changeset
484 #endif /* ASSERT */
a61af66fc99e Initial load
duke
parents:
diff changeset
485 int locs_size = 32;
a61af66fc99e Initial load
duke
parents:
diff changeset
486
a61af66fc99e Initial load
duke
parents:
diff changeset
487 CodeBuffer code(name, insts_size, locs_size);
a61af66fc99e Initial load
duke
parents:
diff changeset
488 MacroAssembler* masm = new MacroAssembler(&code);
a61af66fc99e Initial load
duke
parents:
diff changeset
489
a61af66fc99e Initial load
duke
parents:
diff changeset
490 __ verify_thread();
a61af66fc99e Initial load
duke
parents:
diff changeset
491
a61af66fc99e Initial load
duke
parents:
diff changeset
492 // This is an inlined and slightly modified version of call_VM
a61af66fc99e Initial load
duke
parents:
diff changeset
493 // which has the ability to fetch the return PC out of thread-local storage
a61af66fc99e Initial load
duke
parents:
diff changeset
494 __ assert_not_delayed();
a61af66fc99e Initial load
duke
parents:
diff changeset
495
a61af66fc99e Initial load
duke
parents:
diff changeset
496 // Note that we always push a frame because on the SPARC
a61af66fc99e Initial load
duke
parents:
diff changeset
497 // architecture, for all of our implicit exception kinds at call
a61af66fc99e Initial load
duke
parents:
diff changeset
498 // sites, the implicit exception is taken before the callee frame
a61af66fc99e Initial load
duke
parents:
diff changeset
499 // is pushed.
a61af66fc99e Initial load
duke
parents:
diff changeset
500 __ save_frame(0);
a61af66fc99e Initial load
duke
parents:
diff changeset
501
a61af66fc99e Initial load
duke
parents:
diff changeset
502 int frame_complete = __ offset();
a61af66fc99e Initial load
duke
parents:
diff changeset
503
a61af66fc99e Initial load
duke
parents:
diff changeset
504 // Note that we always have a runtime stub frame on the top of stack by this point
a61af66fc99e Initial load
duke
parents:
diff changeset
505 Register last_java_sp = SP;
a61af66fc99e Initial load
duke
parents:
diff changeset
506 // 64-bit last_java_sp is biased!
a61af66fc99e Initial load
duke
parents:
diff changeset
507 __ set_last_Java_frame(last_java_sp, G0);
a61af66fc99e Initial load
duke
parents:
diff changeset
508 if (VerifyThread) __ mov(G2_thread, O0); // about to be smashed; pass early
a61af66fc99e Initial load
duke
parents:
diff changeset
509 __ save_thread(noreg);
3451
38fa55e5e792 7055355: JSR 292: crash while throwing WrongMethodTypeException
never
parents: 2324
diff changeset
510 if (arg1 != noreg) {
38fa55e5e792 7055355: JSR 292: crash while throwing WrongMethodTypeException
never
parents: 2324
diff changeset
511 assert(arg2 != O1, "clobbered");
38fa55e5e792 7055355: JSR 292: crash while throwing WrongMethodTypeException
never
parents: 2324
diff changeset
512 __ mov(arg1, O1);
38fa55e5e792 7055355: JSR 292: crash while throwing WrongMethodTypeException
never
parents: 2324
diff changeset
513 }
38fa55e5e792 7055355: JSR 292: crash while throwing WrongMethodTypeException
never
parents: 2324
diff changeset
514 if (arg2 != noreg) {
38fa55e5e792 7055355: JSR 292: crash while throwing WrongMethodTypeException
never
parents: 2324
diff changeset
515 __ mov(arg2, O2);
38fa55e5e792 7055355: JSR 292: crash while throwing WrongMethodTypeException
never
parents: 2324
diff changeset
516 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
517 // do the call
a61af66fc99e Initial load
duke
parents:
diff changeset
518 BLOCK_COMMENT("call runtime_entry");
a61af66fc99e Initial load
duke
parents:
diff changeset
519 __ call(runtime_entry, relocInfo::runtime_call_type);
a61af66fc99e Initial load
duke
parents:
diff changeset
520 if (!VerifyThread)
a61af66fc99e Initial load
duke
parents:
diff changeset
521 __ delayed()->mov(G2_thread, O0); // pass thread as first argument
a61af66fc99e Initial load
duke
parents:
diff changeset
522 else
a61af66fc99e Initial load
duke
parents:
diff changeset
523 __ delayed()->nop(); // (thread already passed)
a61af66fc99e Initial load
duke
parents:
diff changeset
524 __ restore_thread(noreg);
a61af66fc99e Initial load
duke
parents:
diff changeset
525 __ reset_last_Java_frame();
a61af66fc99e Initial load
duke
parents:
diff changeset
526
a61af66fc99e Initial load
duke
parents:
diff changeset
527 // check for pending exceptions. use Gtemp as scratch register.
a61af66fc99e Initial load
duke
parents:
diff changeset
528 #ifdef ASSERT
a61af66fc99e Initial load
duke
parents:
diff changeset
529 Label L;
a61af66fc99e Initial load
duke
parents:
diff changeset
530
727
6b2273dd6fa9 6822110: Add AddressLiteral class on SPARC
twisti
parents: 671
diff changeset
531 Address exception_addr(G2_thread, Thread::pending_exception_offset());
0
a61af66fc99e Initial load
duke
parents:
diff changeset
532 Register scratch_reg = Gtemp;
a61af66fc99e Initial load
duke
parents:
diff changeset
533 __ ld_ptr(exception_addr, scratch_reg);
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
534 __ br_notnull_short(scratch_reg, Assembler::pt, L);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
535 __ should_not_reach_here();
a61af66fc99e Initial load
duke
parents:
diff changeset
536 __ bind(L);
a61af66fc99e Initial load
duke
parents:
diff changeset
537 #endif // ASSERT
a61af66fc99e Initial load
duke
parents:
diff changeset
538 BLOCK_COMMENT("call forward_exception_entry");
a61af66fc99e Initial load
duke
parents:
diff changeset
539 __ call(StubRoutines::forward_exception_entry(), relocInfo::runtime_call_type);
a61af66fc99e Initial load
duke
parents:
diff changeset
540 // we use O7 linkage so that forward_exception_entry has the issuing PC
a61af66fc99e Initial load
duke
parents:
diff changeset
541 __ delayed()->restore();
a61af66fc99e Initial load
duke
parents:
diff changeset
542
a61af66fc99e Initial load
duke
parents:
diff changeset
543 RuntimeStub* stub = RuntimeStub::new_runtime_stub(name, &code, frame_complete, masm->total_frame_size_in_bytes(0), NULL, false);
a61af66fc99e Initial load
duke
parents:
diff changeset
544 return stub->entry_point();
a61af66fc99e Initial load
duke
parents:
diff changeset
545 }
a61af66fc99e Initial load
duke
parents:
diff changeset
546
a61af66fc99e Initial load
duke
parents:
diff changeset
547 #undef __
a61af66fc99e Initial load
duke
parents:
diff changeset
548 #define __ _masm->
a61af66fc99e Initial load
duke
parents:
diff changeset
549
a61af66fc99e Initial load
duke
parents:
diff changeset
550
a61af66fc99e Initial load
duke
parents:
diff changeset
551 // Generate a routine that sets all the registers so we
a61af66fc99e Initial load
duke
parents:
diff changeset
552 // can tell if the stop routine prints them correctly.
a61af66fc99e Initial load
duke
parents:
diff changeset
553 address generate_test_stop() {
a61af66fc99e Initial load
duke
parents:
diff changeset
554 StubCodeMark mark(this, "StubRoutines", "test_stop");
a61af66fc99e Initial load
duke
parents:
diff changeset
555 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
556
a61af66fc99e Initial load
duke
parents:
diff changeset
557 int i;
a61af66fc99e Initial load
duke
parents:
diff changeset
558
a61af66fc99e Initial load
duke
parents:
diff changeset
559 __ save_frame(0);
a61af66fc99e Initial load
duke
parents:
diff changeset
560
a61af66fc99e Initial load
duke
parents:
diff changeset
561 static jfloat zero = 0.0, one = 1.0;
a61af66fc99e Initial load
duke
parents:
diff changeset
562
a61af66fc99e Initial load
duke
parents:
diff changeset
563 // put addr in L0, then load through L0 to F0
a61af66fc99e Initial load
duke
parents:
diff changeset
564 __ set((intptr_t)&zero, L0); __ ldf( FloatRegisterImpl::S, L0, 0, F0);
a61af66fc99e Initial load
duke
parents:
diff changeset
565 __ set((intptr_t)&one, L0); __ ldf( FloatRegisterImpl::S, L0, 0, F1); // 1.0 to F1
a61af66fc99e Initial load
duke
parents:
diff changeset
566
a61af66fc99e Initial load
duke
parents:
diff changeset
567 // use add to put 2..18 in F2..F18
a61af66fc99e Initial load
duke
parents:
diff changeset
568 for ( i = 2; i <= 18; ++i ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
569 __ fadd( FloatRegisterImpl::S, F1, as_FloatRegister(i-1), as_FloatRegister(i));
a61af66fc99e Initial load
duke
parents:
diff changeset
570 }
a61af66fc99e Initial load
duke
parents:
diff changeset
571
a61af66fc99e Initial load
duke
parents:
diff changeset
572 // Now put double 2 in F16, double 18 in F18
a61af66fc99e Initial load
duke
parents:
diff changeset
573 __ ftof( FloatRegisterImpl::S, FloatRegisterImpl::D, F2, F16 );
a61af66fc99e Initial load
duke
parents:
diff changeset
574 __ ftof( FloatRegisterImpl::S, FloatRegisterImpl::D, F18, F18 );
a61af66fc99e Initial load
duke
parents:
diff changeset
575
a61af66fc99e Initial load
duke
parents:
diff changeset
576 // use add to put 20..32 in F20..F32
a61af66fc99e Initial load
duke
parents:
diff changeset
577 for (i = 20; i < 32; i += 2) {
a61af66fc99e Initial load
duke
parents:
diff changeset
578 __ fadd( FloatRegisterImpl::D, F16, as_FloatRegister(i-2), as_FloatRegister(i));
a61af66fc99e Initial load
duke
parents:
diff changeset
579 }
a61af66fc99e Initial load
duke
parents:
diff changeset
580
a61af66fc99e Initial load
duke
parents:
diff changeset
581 // put 0..7 in i's, 8..15 in l's, 16..23 in o's, 24..31 in g's
a61af66fc99e Initial load
duke
parents:
diff changeset
582 for ( i = 0; i < 8; ++i ) {
a61af66fc99e Initial load
duke
parents:
diff changeset
583 if (i < 6) {
a61af66fc99e Initial load
duke
parents:
diff changeset
584 __ set( i, as_iRegister(i));
a61af66fc99e Initial load
duke
parents:
diff changeset
585 __ set(16 + i, as_oRegister(i));
a61af66fc99e Initial load
duke
parents:
diff changeset
586 __ set(24 + i, as_gRegister(i));
a61af66fc99e Initial load
duke
parents:
diff changeset
587 }
a61af66fc99e Initial load
duke
parents:
diff changeset
588 __ set( 8 + i, as_lRegister(i));
a61af66fc99e Initial load
duke
parents:
diff changeset
589 }
a61af66fc99e Initial load
duke
parents:
diff changeset
590
a61af66fc99e Initial load
duke
parents:
diff changeset
591 __ stop("testing stop");
a61af66fc99e Initial load
duke
parents:
diff changeset
592
a61af66fc99e Initial load
duke
parents:
diff changeset
593
a61af66fc99e Initial load
duke
parents:
diff changeset
594 __ ret();
a61af66fc99e Initial load
duke
parents:
diff changeset
595 __ delayed()->restore();
a61af66fc99e Initial load
duke
parents:
diff changeset
596
a61af66fc99e Initial load
duke
parents:
diff changeset
597 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
598 }
a61af66fc99e Initial load
duke
parents:
diff changeset
599
a61af66fc99e Initial load
duke
parents:
diff changeset
600
a61af66fc99e Initial load
duke
parents:
diff changeset
601 address generate_stop_subroutine() {
a61af66fc99e Initial load
duke
parents:
diff changeset
602 StubCodeMark mark(this, "StubRoutines", "stop_subroutine");
a61af66fc99e Initial load
duke
parents:
diff changeset
603 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
604
a61af66fc99e Initial load
duke
parents:
diff changeset
605 __ stop_subroutine();
a61af66fc99e Initial load
duke
parents:
diff changeset
606
a61af66fc99e Initial load
duke
parents:
diff changeset
607 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
608 }
a61af66fc99e Initial load
duke
parents:
diff changeset
609
a61af66fc99e Initial load
duke
parents:
diff changeset
610 address generate_flush_callers_register_windows() {
a61af66fc99e Initial load
duke
parents:
diff changeset
611 StubCodeMark mark(this, "StubRoutines", "flush_callers_register_windows");
a61af66fc99e Initial load
duke
parents:
diff changeset
612 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
613
10997
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
614 __ flushw();
0
a61af66fc99e Initial load
duke
parents:
diff changeset
615 __ retl(false);
a61af66fc99e Initial load
duke
parents:
diff changeset
616 __ delayed()->add( FP, STACK_BIAS, O0 );
a61af66fc99e Initial load
duke
parents:
diff changeset
617 // The returned value must be a stack pointer whose register save area
a61af66fc99e Initial load
duke
parents:
diff changeset
618 // is flushed, and will stay flushed while the caller executes.
a61af66fc99e Initial load
duke
parents:
diff changeset
619
a61af66fc99e Initial load
duke
parents:
diff changeset
620 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
621 }
a61af66fc99e Initial load
duke
parents:
diff changeset
622
a61af66fc99e Initial load
duke
parents:
diff changeset
623 // Support for jint Atomic::xchg(jint exchange_value, volatile jint* dest).
a61af66fc99e Initial load
duke
parents:
diff changeset
624 //
10997
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
625 // Arguments:
0
a61af66fc99e Initial load
duke
parents:
diff changeset
626 //
a61af66fc99e Initial load
duke
parents:
diff changeset
627 // exchange_value: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
628 // dest: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
629 //
a61af66fc99e Initial load
duke
parents:
diff changeset
630 // Results:
a61af66fc99e Initial load
duke
parents:
diff changeset
631 //
a61af66fc99e Initial load
duke
parents:
diff changeset
632 // O0: the value previously stored in dest
a61af66fc99e Initial load
duke
parents:
diff changeset
633 //
a61af66fc99e Initial load
duke
parents:
diff changeset
634 address generate_atomic_xchg() {
a61af66fc99e Initial load
duke
parents:
diff changeset
635 StubCodeMark mark(this, "StubRoutines", "atomic_xchg");
a61af66fc99e Initial load
duke
parents:
diff changeset
636 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
637
a61af66fc99e Initial load
duke
parents:
diff changeset
638 if (UseCASForSwap) {
a61af66fc99e Initial load
duke
parents:
diff changeset
639 // Use CAS instead of swap, just in case the MP hardware
a61af66fc99e Initial load
duke
parents:
diff changeset
640 // prefers to work with just one kind of synch. instruction.
a61af66fc99e Initial load
duke
parents:
diff changeset
641 Label retry;
a61af66fc99e Initial load
duke
parents:
diff changeset
642 __ BIND(retry);
a61af66fc99e Initial load
duke
parents:
diff changeset
643 __ mov(O0, O3); // scratch copy of exchange value
a61af66fc99e Initial load
duke
parents:
diff changeset
644 __ ld(O1, 0, O2); // observe the previous value
a61af66fc99e Initial load
duke
parents:
diff changeset
645 // try to replace O2 with O3
10997
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
646 __ cas(O1, O2, O3);
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
647 __ cmp_and_br_short(O2, O3, Assembler::notEqual, Assembler::pn, retry);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
648
a61af66fc99e Initial load
duke
parents:
diff changeset
649 __ retl(false);
a61af66fc99e Initial load
duke
parents:
diff changeset
650 __ delayed()->mov(O2, O0); // report previous value to caller
a61af66fc99e Initial load
duke
parents:
diff changeset
651 } else {
10997
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
652 __ retl(false);
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
653 __ delayed()->swap(O1, 0, O0);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
654 }
a61af66fc99e Initial load
duke
parents:
diff changeset
655
a61af66fc99e Initial load
duke
parents:
diff changeset
656 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
657 }
a61af66fc99e Initial load
duke
parents:
diff changeset
658
a61af66fc99e Initial load
duke
parents:
diff changeset
659
a61af66fc99e Initial load
duke
parents:
diff changeset
660 // Support for jint Atomic::cmpxchg(jint exchange_value, volatile jint* dest, jint compare_value)
a61af66fc99e Initial load
duke
parents:
diff changeset
661 //
10997
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
662 // Arguments:
0
a61af66fc99e Initial load
duke
parents:
diff changeset
663 //
a61af66fc99e Initial load
duke
parents:
diff changeset
664 // exchange_value: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
665 // dest: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
666 // compare_value: O2
a61af66fc99e Initial load
duke
parents:
diff changeset
667 //
a61af66fc99e Initial load
duke
parents:
diff changeset
668 // Results:
a61af66fc99e Initial load
duke
parents:
diff changeset
669 //
a61af66fc99e Initial load
duke
parents:
diff changeset
670 // O0: the value previously stored in dest
a61af66fc99e Initial load
duke
parents:
diff changeset
671 //
a61af66fc99e Initial load
duke
parents:
diff changeset
672 address generate_atomic_cmpxchg() {
a61af66fc99e Initial load
duke
parents:
diff changeset
673 StubCodeMark mark(this, "StubRoutines", "atomic_cmpxchg");
a61af66fc99e Initial load
duke
parents:
diff changeset
674 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
675
a61af66fc99e Initial load
duke
parents:
diff changeset
676 // cmpxchg(dest, compare_value, exchange_value)
10997
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
677 __ cas(O1, O2, O0);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
678 __ retl(false);
a61af66fc99e Initial load
duke
parents:
diff changeset
679 __ delayed()->nop();
a61af66fc99e Initial load
duke
parents:
diff changeset
680
a61af66fc99e Initial load
duke
parents:
diff changeset
681 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
682 }
a61af66fc99e Initial load
duke
parents:
diff changeset
683
a61af66fc99e Initial load
duke
parents:
diff changeset
684 // Support for jlong Atomic::cmpxchg(jlong exchange_value, volatile jlong *dest, jlong compare_value)
a61af66fc99e Initial load
duke
parents:
diff changeset
685 //
10997
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
686 // Arguments:
0
a61af66fc99e Initial load
duke
parents:
diff changeset
687 //
a61af66fc99e Initial load
duke
parents:
diff changeset
688 // exchange_value: O1:O0
a61af66fc99e Initial load
duke
parents:
diff changeset
689 // dest: O2
a61af66fc99e Initial load
duke
parents:
diff changeset
690 // compare_value: O4:O3
a61af66fc99e Initial load
duke
parents:
diff changeset
691 //
a61af66fc99e Initial load
duke
parents:
diff changeset
692 // Results:
a61af66fc99e Initial load
duke
parents:
diff changeset
693 //
a61af66fc99e Initial load
duke
parents:
diff changeset
694 // O1:O0: the value previously stored in dest
a61af66fc99e Initial load
duke
parents:
diff changeset
695 //
a61af66fc99e Initial load
duke
parents:
diff changeset
696 // Overwrites: G1,G2,G3
a61af66fc99e Initial load
duke
parents:
diff changeset
697 //
a61af66fc99e Initial load
duke
parents:
diff changeset
698 address generate_atomic_cmpxchg_long() {
a61af66fc99e Initial load
duke
parents:
diff changeset
699 StubCodeMark mark(this, "StubRoutines", "atomic_cmpxchg_long");
a61af66fc99e Initial load
duke
parents:
diff changeset
700 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
701
a61af66fc99e Initial load
duke
parents:
diff changeset
702 __ sllx(O0, 32, O0);
a61af66fc99e Initial load
duke
parents:
diff changeset
703 __ srl(O1, 0, O1);
a61af66fc99e Initial load
duke
parents:
diff changeset
704 __ or3(O0,O1,O0); // O0 holds 64-bit value from compare_value
a61af66fc99e Initial load
duke
parents:
diff changeset
705 __ sllx(O3, 32, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
706 __ srl(O4, 0, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
707 __ or3(O3,O4,O3); // O3 holds 64-bit value from exchange_value
a61af66fc99e Initial load
duke
parents:
diff changeset
708 __ casx(O2, O3, O0);
a61af66fc99e Initial load
duke
parents:
diff changeset
709 __ srl(O0, 0, O1); // unpacked return value in O1:O0
a61af66fc99e Initial load
duke
parents:
diff changeset
710 __ retl(false);
a61af66fc99e Initial load
duke
parents:
diff changeset
711 __ delayed()->srlx(O0, 32, O0);
a61af66fc99e Initial load
duke
parents:
diff changeset
712
a61af66fc99e Initial load
duke
parents:
diff changeset
713 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
714 }
a61af66fc99e Initial load
duke
parents:
diff changeset
715
a61af66fc99e Initial load
duke
parents:
diff changeset
716
a61af66fc99e Initial load
duke
parents:
diff changeset
717 // Support for jint Atomic::add(jint add_value, volatile jint* dest).
a61af66fc99e Initial load
duke
parents:
diff changeset
718 //
10997
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
719 // Arguments:
0
a61af66fc99e Initial load
duke
parents:
diff changeset
720 //
a61af66fc99e Initial load
duke
parents:
diff changeset
721 // add_value: O0 (e.g., +1 or -1)
a61af66fc99e Initial load
duke
parents:
diff changeset
722 // dest: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
723 //
a61af66fc99e Initial load
duke
parents:
diff changeset
724 // Results:
a61af66fc99e Initial load
duke
parents:
diff changeset
725 //
a61af66fc99e Initial load
duke
parents:
diff changeset
726 // O0: the new value stored in dest
a61af66fc99e Initial load
duke
parents:
diff changeset
727 //
10997
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
728 // Overwrites: O3
0
a61af66fc99e Initial load
duke
parents:
diff changeset
729 //
a61af66fc99e Initial load
duke
parents:
diff changeset
730 address generate_atomic_add() {
a61af66fc99e Initial load
duke
parents:
diff changeset
731 StubCodeMark mark(this, "StubRoutines", "atomic_add");
a61af66fc99e Initial load
duke
parents:
diff changeset
732 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
733 __ BIND(_atomic_add_stub);
a61af66fc99e Initial load
duke
parents:
diff changeset
734
10997
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
735 Label(retry);
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
736 __ BIND(retry);
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
737
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
738 __ lduw(O1, 0, O2);
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
739 __ add(O0, O2, O3);
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
740 __ cas(O1, O2, O3);
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
741 __ cmp_and_br_short(O2, O3, Assembler::notEqual, Assembler::pn, retry);
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
742 __ retl(false);
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
743 __ delayed()->add(O0, O2, O0); // note that cas made O2==O3
0
a61af66fc99e Initial load
duke
parents:
diff changeset
744
a61af66fc99e Initial load
duke
parents:
diff changeset
745 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
746 }
a61af66fc99e Initial load
duke
parents:
diff changeset
747 Label _atomic_add_stub; // called from other stubs
a61af66fc99e Initial load
duke
parents:
diff changeset
748
a61af66fc99e Initial load
duke
parents:
diff changeset
749
a61af66fc99e Initial load
duke
parents:
diff changeset
750 //------------------------------------------------------------------------------------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
751 // The following routine generates a subroutine to throw an asynchronous
a61af66fc99e Initial load
duke
parents:
diff changeset
752 // UnknownError when an unsafe access gets a fault that could not be
a61af66fc99e Initial load
duke
parents:
diff changeset
753 // reasonably prevented by the programmer. (Example: SIGBUS/OBJERR.)
a61af66fc99e Initial load
duke
parents:
diff changeset
754 //
a61af66fc99e Initial load
duke
parents:
diff changeset
755 // Arguments :
a61af66fc99e Initial load
duke
parents:
diff changeset
756 //
a61af66fc99e Initial load
duke
parents:
diff changeset
757 // trapping PC: O7
a61af66fc99e Initial load
duke
parents:
diff changeset
758 //
a61af66fc99e Initial load
duke
parents:
diff changeset
759 // Results:
a61af66fc99e Initial load
duke
parents:
diff changeset
760 // posts an asynchronous exception, skips the trapping instruction
a61af66fc99e Initial load
duke
parents:
diff changeset
761 //
a61af66fc99e Initial load
duke
parents:
diff changeset
762
a61af66fc99e Initial load
duke
parents:
diff changeset
763 address generate_handler_for_unsafe_access() {
a61af66fc99e Initial load
duke
parents:
diff changeset
764 StubCodeMark mark(this, "StubRoutines", "handler_for_unsafe_access");
a61af66fc99e Initial load
duke
parents:
diff changeset
765 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
766
a61af66fc99e Initial load
duke
parents:
diff changeset
767 const int preserve_register_words = (64 * 2);
727
6b2273dd6fa9 6822110: Add AddressLiteral class on SPARC
twisti
parents: 671
diff changeset
768 Address preserve_addr(FP, (-preserve_register_words * wordSize) + STACK_BIAS);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
769
a61af66fc99e Initial load
duke
parents:
diff changeset
770 Register Lthread = L7_thread_cache;
a61af66fc99e Initial load
duke
parents:
diff changeset
771 int i;
a61af66fc99e Initial load
duke
parents:
diff changeset
772
a61af66fc99e Initial load
duke
parents:
diff changeset
773 __ save_frame(0);
a61af66fc99e Initial load
duke
parents:
diff changeset
774 __ mov(G1, L1);
a61af66fc99e Initial load
duke
parents:
diff changeset
775 __ mov(G2, L2);
a61af66fc99e Initial load
duke
parents:
diff changeset
776 __ mov(G3, L3);
a61af66fc99e Initial load
duke
parents:
diff changeset
777 __ mov(G4, L4);
a61af66fc99e Initial load
duke
parents:
diff changeset
778 __ mov(G5, L5);
10997
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
779 for (i = 0; i < 64; i += 2) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
780 __ stf(FloatRegisterImpl::D, as_FloatRegister(i), preserve_addr, i * wordSize);
a61af66fc99e Initial load
duke
parents:
diff changeset
781 }
a61af66fc99e Initial load
duke
parents:
diff changeset
782
a61af66fc99e Initial load
duke
parents:
diff changeset
783 address entry_point = CAST_FROM_FN_PTR(address, handle_unsafe_access);
a61af66fc99e Initial load
duke
parents:
diff changeset
784 BLOCK_COMMENT("call handle_unsafe_access");
a61af66fc99e Initial load
duke
parents:
diff changeset
785 __ call(entry_point, relocInfo::runtime_call_type);
a61af66fc99e Initial load
duke
parents:
diff changeset
786 __ delayed()->nop();
a61af66fc99e Initial load
duke
parents:
diff changeset
787
a61af66fc99e Initial load
duke
parents:
diff changeset
788 __ mov(L1, G1);
a61af66fc99e Initial load
duke
parents:
diff changeset
789 __ mov(L2, G2);
a61af66fc99e Initial load
duke
parents:
diff changeset
790 __ mov(L3, G3);
a61af66fc99e Initial load
duke
parents:
diff changeset
791 __ mov(L4, G4);
a61af66fc99e Initial load
duke
parents:
diff changeset
792 __ mov(L5, G5);
10997
46c544b8fbfc 8008407: remove SPARC V8 support
morris
parents: 7206
diff changeset
793 for (i = 0; i < 64; i += 2) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
794 __ ldf(FloatRegisterImpl::D, preserve_addr, as_FloatRegister(i), i * wordSize);
a61af66fc99e Initial load
duke
parents:
diff changeset
795 }
a61af66fc99e Initial load
duke
parents:
diff changeset
796
a61af66fc99e Initial load
duke
parents:
diff changeset
797 __ verify_thread();
a61af66fc99e Initial load
duke
parents:
diff changeset
798
a61af66fc99e Initial load
duke
parents:
diff changeset
799 __ jmp(O0, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
800 __ delayed()->restore();
a61af66fc99e Initial load
duke
parents:
diff changeset
801
a61af66fc99e Initial load
duke
parents:
diff changeset
802 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
803 }
a61af66fc99e Initial load
duke
parents:
diff changeset
804
a61af66fc99e Initial load
duke
parents:
diff changeset
805
a61af66fc99e Initial load
duke
parents:
diff changeset
806 // Support for uint StubRoutine::Sparc::partial_subtype_check( Klass sub, Klass super );
a61af66fc99e Initial load
duke
parents:
diff changeset
807 // Arguments :
a61af66fc99e Initial load
duke
parents:
diff changeset
808 //
a61af66fc99e Initial load
duke
parents:
diff changeset
809 // ret : O0, returned
a61af66fc99e Initial load
duke
parents:
diff changeset
810 // icc/xcc: set as O0 (depending on wordSize)
a61af66fc99e Initial load
duke
parents:
diff changeset
811 // sub : O1, argument, not changed
a61af66fc99e Initial load
duke
parents:
diff changeset
812 // super: O2, argument, not changed
a61af66fc99e Initial load
duke
parents:
diff changeset
813 // raddr: O7, blown by call
a61af66fc99e Initial load
duke
parents:
diff changeset
814 address generate_partial_subtype_check() {
113
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
815 __ align(CodeEntryAlignment);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
816 StubCodeMark mark(this, "StubRoutines", "partial_subtype_check");
a61af66fc99e Initial load
duke
parents:
diff changeset
817 address start = __ pc();
644
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
818 Label miss;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
819
a61af66fc99e Initial load
duke
parents:
diff changeset
820 #if defined(COMPILER2) && !defined(_LP64)
a61af66fc99e Initial load
duke
parents:
diff changeset
821 // Do not use a 'save' because it blows the 64-bit O registers.
113
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
822 __ add(SP,-4*wordSize,SP); // Make space for 4 temps (stack must be 2 words aligned)
0
a61af66fc99e Initial load
duke
parents:
diff changeset
823 __ st_ptr(L0,SP,(frame::register_save_words+0)*wordSize);
a61af66fc99e Initial load
duke
parents:
diff changeset
824 __ st_ptr(L1,SP,(frame::register_save_words+1)*wordSize);
a61af66fc99e Initial load
duke
parents:
diff changeset
825 __ st_ptr(L2,SP,(frame::register_save_words+2)*wordSize);
a61af66fc99e Initial load
duke
parents:
diff changeset
826 __ st_ptr(L3,SP,(frame::register_save_words+3)*wordSize);
a61af66fc99e Initial load
duke
parents:
diff changeset
827 Register Rret = O0;
a61af66fc99e Initial load
duke
parents:
diff changeset
828 Register Rsub = O1;
a61af66fc99e Initial load
duke
parents:
diff changeset
829 Register Rsuper = O2;
a61af66fc99e Initial load
duke
parents:
diff changeset
830 #else
a61af66fc99e Initial load
duke
parents:
diff changeset
831 __ save_frame(0);
a61af66fc99e Initial load
duke
parents:
diff changeset
832 Register Rret = I0;
a61af66fc99e Initial load
duke
parents:
diff changeset
833 Register Rsub = I1;
a61af66fc99e Initial load
duke
parents:
diff changeset
834 Register Rsuper = I2;
a61af66fc99e Initial load
duke
parents:
diff changeset
835 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
836
a61af66fc99e Initial load
duke
parents:
diff changeset
837 Register L0_ary_len = L0;
a61af66fc99e Initial load
duke
parents:
diff changeset
838 Register L1_ary_ptr = L1;
a61af66fc99e Initial load
duke
parents:
diff changeset
839 Register L2_super = L2;
a61af66fc99e Initial load
duke
parents:
diff changeset
840 Register L3_index = L3;
a61af66fc99e Initial load
duke
parents:
diff changeset
841
644
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
842 __ check_klass_subtype_slow_path(Rsub, Rsuper,
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
843 L0, L1, L2, L3,
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
844 NULL, &miss);
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
845
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
846 // Match falls through here.
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
847 __ addcc(G0,0,Rret); // set Z flags, Z result
0
a61af66fc99e Initial load
duke
parents:
diff changeset
848
a61af66fc99e Initial load
duke
parents:
diff changeset
849 #if defined(COMPILER2) && !defined(_LP64)
a61af66fc99e Initial load
duke
parents:
diff changeset
850 __ ld_ptr(SP,(frame::register_save_words+0)*wordSize,L0);
a61af66fc99e Initial load
duke
parents:
diff changeset
851 __ ld_ptr(SP,(frame::register_save_words+1)*wordSize,L1);
a61af66fc99e Initial load
duke
parents:
diff changeset
852 __ ld_ptr(SP,(frame::register_save_words+2)*wordSize,L2);
a61af66fc99e Initial load
duke
parents:
diff changeset
853 __ ld_ptr(SP,(frame::register_save_words+3)*wordSize,L3);
a61af66fc99e Initial load
duke
parents:
diff changeset
854 __ retl(); // Result in Rret is zero; flags set to Z
a61af66fc99e Initial load
duke
parents:
diff changeset
855 __ delayed()->add(SP,4*wordSize,SP);
a61af66fc99e Initial load
duke
parents:
diff changeset
856 #else
a61af66fc99e Initial load
duke
parents:
diff changeset
857 __ ret(); // Result in Rret is zero; flags set to Z
a61af66fc99e Initial load
duke
parents:
diff changeset
858 __ delayed()->restore();
a61af66fc99e Initial load
duke
parents:
diff changeset
859 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
860
a61af66fc99e Initial load
duke
parents:
diff changeset
861 __ BIND(miss);
a61af66fc99e Initial load
duke
parents:
diff changeset
862 __ addcc(G0,1,Rret); // set NZ flags, NZ result
a61af66fc99e Initial load
duke
parents:
diff changeset
863
a61af66fc99e Initial load
duke
parents:
diff changeset
864 #if defined(COMPILER2) && !defined(_LP64)
a61af66fc99e Initial load
duke
parents:
diff changeset
865 __ ld_ptr(SP,(frame::register_save_words+0)*wordSize,L0);
a61af66fc99e Initial load
duke
parents:
diff changeset
866 __ ld_ptr(SP,(frame::register_save_words+1)*wordSize,L1);
a61af66fc99e Initial load
duke
parents:
diff changeset
867 __ ld_ptr(SP,(frame::register_save_words+2)*wordSize,L2);
a61af66fc99e Initial load
duke
parents:
diff changeset
868 __ ld_ptr(SP,(frame::register_save_words+3)*wordSize,L3);
a61af66fc99e Initial load
duke
parents:
diff changeset
869 __ retl(); // Result in Rret is != 0; flags set to NZ
a61af66fc99e Initial load
duke
parents:
diff changeset
870 __ delayed()->add(SP,4*wordSize,SP);
a61af66fc99e Initial load
duke
parents:
diff changeset
871 #else
a61af66fc99e Initial load
duke
parents:
diff changeset
872 __ ret(); // Result in Rret is != 0; flags set to NZ
a61af66fc99e Initial load
duke
parents:
diff changeset
873 __ delayed()->restore();
a61af66fc99e Initial load
duke
parents:
diff changeset
874 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
875
a61af66fc99e Initial load
duke
parents:
diff changeset
876 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
877 }
a61af66fc99e Initial load
duke
parents:
diff changeset
878
a61af66fc99e Initial load
duke
parents:
diff changeset
879
a61af66fc99e Initial load
duke
parents:
diff changeset
880 // Called from MacroAssembler::verify_oop
a61af66fc99e Initial load
duke
parents:
diff changeset
881 //
a61af66fc99e Initial load
duke
parents:
diff changeset
882 address generate_verify_oop_subroutine() {
a61af66fc99e Initial load
duke
parents:
diff changeset
883 StubCodeMark mark(this, "StubRoutines", "verify_oop_stub");
a61af66fc99e Initial load
duke
parents:
diff changeset
884
a61af66fc99e Initial load
duke
parents:
diff changeset
885 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
886
a61af66fc99e Initial load
duke
parents:
diff changeset
887 __ verify_oop_subroutine();
a61af66fc99e Initial load
duke
parents:
diff changeset
888
a61af66fc99e Initial load
duke
parents:
diff changeset
889 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
890 }
a61af66fc99e Initial load
duke
parents:
diff changeset
891
a61af66fc99e Initial load
duke
parents:
diff changeset
892
a61af66fc99e Initial load
duke
parents:
diff changeset
893 //
a61af66fc99e Initial load
duke
parents:
diff changeset
894 // Verify that a register contains clean 32-bits positive value
a61af66fc99e Initial load
duke
parents:
diff changeset
895 // (high 32-bits are 0) so it could be used in 64-bits shifts (sllx, srax).
a61af66fc99e Initial load
duke
parents:
diff changeset
896 //
a61af66fc99e Initial load
duke
parents:
diff changeset
897 // Input:
a61af66fc99e Initial load
duke
parents:
diff changeset
898 // Rint - 32-bits value
a61af66fc99e Initial load
duke
parents:
diff changeset
899 // Rtmp - scratch
a61af66fc99e Initial load
duke
parents:
diff changeset
900 //
a61af66fc99e Initial load
duke
parents:
diff changeset
901 void assert_clean_int(Register Rint, Register Rtmp) {
a61af66fc99e Initial load
duke
parents:
diff changeset
902 #if defined(ASSERT) && defined(_LP64)
a61af66fc99e Initial load
duke
parents:
diff changeset
903 __ signx(Rint, Rtmp);
a61af66fc99e Initial load
duke
parents:
diff changeset
904 __ cmp(Rint, Rtmp);
a61af66fc99e Initial load
duke
parents:
diff changeset
905 __ breakpoint_trap(Assembler::notEqual, Assembler::xcc);
a61af66fc99e Initial load
duke
parents:
diff changeset
906 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
907 }
a61af66fc99e Initial load
duke
parents:
diff changeset
908
a61af66fc99e Initial load
duke
parents:
diff changeset
909 //
a61af66fc99e Initial load
duke
parents:
diff changeset
910 // Generate overlap test for array copy stubs
a61af66fc99e Initial load
duke
parents:
diff changeset
911 //
a61af66fc99e Initial load
duke
parents:
diff changeset
912 // Input:
a61af66fc99e Initial load
duke
parents:
diff changeset
913 // O0 - array1
a61af66fc99e Initial load
duke
parents:
diff changeset
914 // O1 - array2
a61af66fc99e Initial load
duke
parents:
diff changeset
915 // O2 - element count
a61af66fc99e Initial load
duke
parents:
diff changeset
916 //
a61af66fc99e Initial load
duke
parents:
diff changeset
917 // Kills temps: O3, O4
a61af66fc99e Initial load
duke
parents:
diff changeset
918 //
a61af66fc99e Initial load
duke
parents:
diff changeset
919 void array_overlap_test(address no_overlap_target, int log2_elem_size) {
a61af66fc99e Initial load
duke
parents:
diff changeset
920 assert(no_overlap_target != NULL, "must be generated");
a61af66fc99e Initial load
duke
parents:
diff changeset
921 array_overlap_test(no_overlap_target, NULL, log2_elem_size);
a61af66fc99e Initial load
duke
parents:
diff changeset
922 }
a61af66fc99e Initial load
duke
parents:
diff changeset
923 void array_overlap_test(Label& L_no_overlap, int log2_elem_size) {
a61af66fc99e Initial load
duke
parents:
diff changeset
924 array_overlap_test(NULL, &L_no_overlap, log2_elem_size);
a61af66fc99e Initial load
duke
parents:
diff changeset
925 }
a61af66fc99e Initial load
duke
parents:
diff changeset
926 void array_overlap_test(address no_overlap_target, Label* NOLp, int log2_elem_size) {
a61af66fc99e Initial load
duke
parents:
diff changeset
927 const Register from = O0;
a61af66fc99e Initial load
duke
parents:
diff changeset
928 const Register to = O1;
a61af66fc99e Initial load
duke
parents:
diff changeset
929 const Register count = O2;
a61af66fc99e Initial load
duke
parents:
diff changeset
930 const Register to_from = O3; // to - from
a61af66fc99e Initial load
duke
parents:
diff changeset
931 const Register byte_count = O4; // count << log2_elem_size
a61af66fc99e Initial load
duke
parents:
diff changeset
932
a61af66fc99e Initial load
duke
parents:
diff changeset
933 __ subcc(to, from, to_from);
a61af66fc99e Initial load
duke
parents:
diff changeset
934 __ sll_ptr(count, log2_elem_size, byte_count);
a61af66fc99e Initial load
duke
parents:
diff changeset
935 if (NOLp == NULL)
a61af66fc99e Initial load
duke
parents:
diff changeset
936 __ brx(Assembler::lessEqualUnsigned, false, Assembler::pt, no_overlap_target);
a61af66fc99e Initial load
duke
parents:
diff changeset
937 else
a61af66fc99e Initial load
duke
parents:
diff changeset
938 __ brx(Assembler::lessEqualUnsigned, false, Assembler::pt, (*NOLp));
a61af66fc99e Initial load
duke
parents:
diff changeset
939 __ delayed()->cmp(to_from, byte_count);
a61af66fc99e Initial load
duke
parents:
diff changeset
940 if (NOLp == NULL)
1655
e7ec8cd4dd8a 6962569: assembler_sparc.cpp:1969: assert(false) failed: error
tonyp
parents: 1579
diff changeset
941 __ brx(Assembler::greaterEqualUnsigned, false, Assembler::pt, no_overlap_target);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
942 else
1655
e7ec8cd4dd8a 6962569: assembler_sparc.cpp:1969: assert(false) failed: error
tonyp
parents: 1579
diff changeset
943 __ brx(Assembler::greaterEqualUnsigned, false, Assembler::pt, (*NOLp));
0
a61af66fc99e Initial load
duke
parents:
diff changeset
944 __ delayed()->nop();
a61af66fc99e Initial load
duke
parents:
diff changeset
945 }
a61af66fc99e Initial load
duke
parents:
diff changeset
946
a61af66fc99e Initial load
duke
parents:
diff changeset
947 //
a61af66fc99e Initial load
duke
parents:
diff changeset
948 // Generate pre-write barrier for array.
a61af66fc99e Initial load
duke
parents:
diff changeset
949 //
a61af66fc99e Initial load
duke
parents:
diff changeset
950 // Input:
a61af66fc99e Initial load
duke
parents:
diff changeset
951 // addr - register containing starting address
a61af66fc99e Initial load
duke
parents:
diff changeset
952 // count - register containing element count
a61af66fc99e Initial load
duke
parents:
diff changeset
953 // tmp - scratch register
a61af66fc99e Initial load
duke
parents:
diff changeset
954 //
a61af66fc99e Initial load
duke
parents:
diff changeset
955 // The input registers are overwritten.
a61af66fc99e Initial load
duke
parents:
diff changeset
956 //
2324
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
957 void gen_write_ref_array_pre_barrier(Register addr, Register count, bool dest_uninitialized) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
958 BarrierSet* bs = Universe::heap()->barrier_set();
2324
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
959 switch (bs->kind()) {
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
960 case BarrierSet::G1SATBCT:
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
961 case BarrierSet::G1SATBCTLogging:
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
962 // With G1, don't generate the call if we statically know that the target in uninitialized
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
963 if (!dest_uninitialized) {
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
964 __ save_frame(0);
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
965 // Save the necessary global regs... will be used after.
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
966 if (addr->is_global()) {
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
967 __ mov(addr, L0);
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
968 }
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
969 if (count->is_global()) {
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
970 __ mov(count, L1);
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
971 }
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
972 __ mov(addr->after_save(), O0);
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
973 // Get the count into O1
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
974 __ call(CAST_FROM_FN_PTR(address, BarrierSet::static_write_ref_array_pre));
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
975 __ delayed()->mov(count->after_save(), O1);
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
976 if (addr->is_global()) {
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
977 __ mov(L0, addr);
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
978 }
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
979 if (count->is_global()) {
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
980 __ mov(L1, count);
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
981 }
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
982 __ restore();
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
983 }
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
984 break;
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
985 case BarrierSet::CardTableModRef:
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
986 case BarrierSet::CardTableExtension:
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
987 case BarrierSet::ModRef:
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
988 break;
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
989 default:
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
990 ShouldNotReachHere();
0
a61af66fc99e Initial load
duke
parents:
diff changeset
991 }
a61af66fc99e Initial load
duke
parents:
diff changeset
992 }
a61af66fc99e Initial load
duke
parents:
diff changeset
993 //
a61af66fc99e Initial load
duke
parents:
diff changeset
994 // Generate post-write barrier for array.
a61af66fc99e Initial load
duke
parents:
diff changeset
995 //
a61af66fc99e Initial load
duke
parents:
diff changeset
996 // Input:
a61af66fc99e Initial load
duke
parents:
diff changeset
997 // addr - register containing starting address
a61af66fc99e Initial load
duke
parents:
diff changeset
998 // count - register containing element count
a61af66fc99e Initial load
duke
parents:
diff changeset
999 // tmp - scratch register
a61af66fc99e Initial load
duke
parents:
diff changeset
1000 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1001 // The input registers are overwritten.
a61af66fc99e Initial load
duke
parents:
diff changeset
1002 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1003 void gen_write_ref_array_post_barrier(Register addr, Register count,
2324
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
1004 Register tmp) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1005 BarrierSet* bs = Universe::heap()->barrier_set();
a61af66fc99e Initial load
duke
parents:
diff changeset
1006
a61af66fc99e Initial load
duke
parents:
diff changeset
1007 switch (bs->kind()) {
a61af66fc99e Initial load
duke
parents:
diff changeset
1008 case BarrierSet::G1SATBCT:
a61af66fc99e Initial load
duke
parents:
diff changeset
1009 case BarrierSet::G1SATBCTLogging:
a61af66fc99e Initial load
duke
parents:
diff changeset
1010 {
a61af66fc99e Initial load
duke
parents:
diff changeset
1011 // Get some new fresh output registers.
a61af66fc99e Initial load
duke
parents:
diff changeset
1012 __ save_frame(0);
342
37f87013dfd8 6711316: Open source the Garbage-First garbage collector
ysr
parents: 113
diff changeset
1013 __ mov(addr->after_save(), O0);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1014 __ call(CAST_FROM_FN_PTR(address, BarrierSet::static_write_ref_array_post));
342
37f87013dfd8 6711316: Open source the Garbage-First garbage collector
ysr
parents: 113
diff changeset
1015 __ delayed()->mov(count->after_save(), O1);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1016 __ restore();
a61af66fc99e Initial load
duke
parents:
diff changeset
1017 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1018 break;
a61af66fc99e Initial load
duke
parents:
diff changeset
1019 case BarrierSet::CardTableModRef:
a61af66fc99e Initial load
duke
parents:
diff changeset
1020 case BarrierSet::CardTableExtension:
a61af66fc99e Initial load
duke
parents:
diff changeset
1021 {
a61af66fc99e Initial load
duke
parents:
diff changeset
1022 CardTableModRefBS* ct = (CardTableModRefBS*)bs;
a61af66fc99e Initial load
duke
parents:
diff changeset
1023 assert(sizeof(*ct->byte_map_base) == sizeof(jbyte), "adjust this code");
a61af66fc99e Initial load
duke
parents:
diff changeset
1024 assert_different_registers(addr, count, tmp);
a61af66fc99e Initial load
duke
parents:
diff changeset
1025
a61af66fc99e Initial load
duke
parents:
diff changeset
1026 Label L_loop;
a61af66fc99e Initial load
duke
parents:
diff changeset
1027
113
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
1028 __ sll_ptr(count, LogBytesPerHeapOop, count);
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
1029 __ sub(count, BytesPerHeapOop, count);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1030 __ add(count, addr, count);
a61af66fc99e Initial load
duke
parents:
diff changeset
1031 // Use two shifts to clear out those low order two bits! (Cannot opt. into 1.)
a61af66fc99e Initial load
duke
parents:
diff changeset
1032 __ srl_ptr(addr, CardTableModRefBS::card_shift, addr);
a61af66fc99e Initial load
duke
parents:
diff changeset
1033 __ srl_ptr(count, CardTableModRefBS::card_shift, count);
a61af66fc99e Initial load
duke
parents:
diff changeset
1034 __ sub(count, addr, count);
727
6b2273dd6fa9 6822110: Add AddressLiteral class on SPARC
twisti
parents: 671
diff changeset
1035 AddressLiteral rs(ct->byte_map_base);
6b2273dd6fa9 6822110: Add AddressLiteral class on SPARC
twisti
parents: 671
diff changeset
1036 __ set(rs, tmp);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1037 __ BIND(L_loop);
727
6b2273dd6fa9 6822110: Add AddressLiteral class on SPARC
twisti
parents: 671
diff changeset
1038 __ stb(G0, tmp, addr);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1039 __ subcc(count, 1, count);
a61af66fc99e Initial load
duke
parents:
diff changeset
1040 __ brx(Assembler::greaterEqual, false, Assembler::pt, L_loop);
a61af66fc99e Initial load
duke
parents:
diff changeset
1041 __ delayed()->add(addr, 1, addr);
727
6b2273dd6fa9 6822110: Add AddressLiteral class on SPARC
twisti
parents: 671
diff changeset
1042 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1043 break;
a61af66fc99e Initial load
duke
parents:
diff changeset
1044 case BarrierSet::ModRef:
a61af66fc99e Initial load
duke
parents:
diff changeset
1045 break;
727
6b2273dd6fa9 6822110: Add AddressLiteral class on SPARC
twisti
parents: 671
diff changeset
1046 default:
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1047 ShouldNotReachHere();
a61af66fc99e Initial load
duke
parents:
diff changeset
1048 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1049 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1050
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1051 //
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1052 // Generate main code for disjoint arraycopy
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1053 //
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1054 typedef void (StubGenerator::*CopyLoopFunc)(Register from, Register to, Register count, int count_dec,
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1055 Label& L_loop, bool use_prefetch, bool use_bis);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1056
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1057 void disjoint_copy_core(Register from, Register to, Register count, int log2_elem_size,
17939
0fb5b60ab4a2 8022070: Compilation error in stubGenerator_sparc.cpp with some compilers
mikael
parents: 17910
diff changeset
1058 int iter_size, StubGenerator::CopyLoopFunc copy_loop_func) {
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1059 Label L_copy;
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1060
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1061 assert(log2_elem_size <= 3, "the following code should be changed");
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1062 int count_dec = 16>>log2_elem_size;
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1063
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1064 int prefetch_dist = MAX2(ArraycopySrcPrefetchDistance, ArraycopyDstPrefetchDistance);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1065 assert(prefetch_dist < 4096, "invalid value");
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1066 prefetch_dist = (prefetch_dist + (iter_size-1)) & (-iter_size); // round up to one iteration copy size
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1067 int prefetch_count = (prefetch_dist >> log2_elem_size); // elements count
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1068
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1069 if (UseBlockCopy) {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1070 Label L_block_copy, L_block_copy_prefetch, L_skip_block_copy;
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1071
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1072 // 64 bytes tail + bytes copied in one loop iteration
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1073 int tail_size = 64 + iter_size;
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1074 int block_copy_count = (MAX2(tail_size, (int)BlockCopyLowLimit)) >> log2_elem_size;
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1075 // Use BIS copy only for big arrays since it requires membar.
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1076 __ set(block_copy_count, O4);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1077 __ cmp_and_br_short(count, O4, Assembler::lessUnsigned, Assembler::pt, L_skip_block_copy);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1078 // This code is for disjoint source and destination:
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1079 // to <= from || to >= from+count
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1080 // but BIS will stomp over 'from' if (to > from-tail_size && to <= from)
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1081 __ sub(from, to, O4);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1082 __ srax(O4, 4, O4); // divide by 16 since following short branch have only 5 bits for imm.
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1083 __ cmp_and_br_short(O4, (tail_size>>4), Assembler::lessEqualUnsigned, Assembler::pn, L_skip_block_copy);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1084
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1085 __ wrasi(G0, Assembler::ASI_ST_BLKINIT_PRIMARY);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1086 // BIS should not be used to copy tail (64 bytes+iter_size)
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1087 // to avoid zeroing of following values.
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1088 __ sub(count, (tail_size>>log2_elem_size), count); // count is still positive >= 0
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1089
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1090 if (prefetch_count > 0) { // rounded up to one iteration count
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1091 // Do prefetching only if copy size is bigger
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1092 // than prefetch distance.
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1093 __ set(prefetch_count, O4);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1094 __ cmp_and_brx_short(count, O4, Assembler::less, Assembler::pt, L_block_copy);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1095 __ sub(count, prefetch_count, count);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1096
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1097 (this->*copy_loop_func)(from, to, count, count_dec, L_block_copy_prefetch, true, true);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1098 __ add(count, prefetch_count, count); // restore count
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1099
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1100 } // prefetch_count > 0
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1101
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1102 (this->*copy_loop_func)(from, to, count, count_dec, L_block_copy, false, true);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1103 __ add(count, (tail_size>>log2_elem_size), count); // restore count
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1104
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1105 __ wrasi(G0, Assembler::ASI_PRIMARY_NOFAULT);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1106 // BIS needs membar.
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1107 __ membar(Assembler::StoreLoad);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1108 // Copy tail
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1109 __ ba_short(L_copy);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1110
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1111 __ BIND(L_skip_block_copy);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1112 } // UseBlockCopy
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1113
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1114 if (prefetch_count > 0) { // rounded up to one iteration count
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1115 // Do prefetching only if copy size is bigger
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1116 // than prefetch distance.
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1117 __ set(prefetch_count, O4);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1118 __ cmp_and_brx_short(count, O4, Assembler::lessUnsigned, Assembler::pt, L_copy);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1119 __ sub(count, prefetch_count, count);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1120
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1121 Label L_copy_prefetch;
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1122 (this->*copy_loop_func)(from, to, count, count_dec, L_copy_prefetch, true, false);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1123 __ add(count, prefetch_count, count); // restore count
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1124
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1125 } // prefetch_count > 0
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1126
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1127 (this->*copy_loop_func)(from, to, count, count_dec, L_copy, false, false);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1128 }
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1129
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1130
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1131
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1132 //
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1133 // Helper methods for copy_16_bytes_forward_with_shift()
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1134 //
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1135 void copy_16_bytes_shift_loop(Register from, Register to, Register count, int count_dec,
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1136 Label& L_loop, bool use_prefetch, bool use_bis) {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1137
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1138 const Register left_shift = G1; // left shift bit counter
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1139 const Register right_shift = G5; // right shift bit counter
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1140
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1141 __ align(OptoLoopAlignment);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1142 __ BIND(L_loop);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1143 if (use_prefetch) {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1144 if (ArraycopySrcPrefetchDistance > 0) {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1145 __ prefetch(from, ArraycopySrcPrefetchDistance, Assembler::severalReads);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1146 }
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1147 if (ArraycopyDstPrefetchDistance > 0) {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1148 __ prefetch(to, ArraycopyDstPrefetchDistance, Assembler::severalWritesAndPossiblyReads);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1149 }
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1150 }
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1151 __ ldx(from, 0, O4);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1152 __ ldx(from, 8, G4);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1153 __ inc(to, 16);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1154 __ inc(from, 16);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1155 __ deccc(count, count_dec); // Can we do next iteration after this one?
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1156 __ srlx(O4, right_shift, G3);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1157 __ bset(G3, O3);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1158 __ sllx(O4, left_shift, O4);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1159 __ srlx(G4, right_shift, G3);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1160 __ bset(G3, O4);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1161 if (use_bis) {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1162 __ stxa(O3, to, -16);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1163 __ stxa(O4, to, -8);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1164 } else {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1165 __ stx(O3, to, -16);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1166 __ stx(O4, to, -8);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1167 }
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1168 __ brx(Assembler::greaterEqual, false, Assembler::pt, L_loop);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1169 __ delayed()->sllx(G4, left_shift, O3);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1170 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1171
a61af66fc99e Initial load
duke
parents:
diff changeset
1172 // Copy big chunks forward with shift
a61af66fc99e Initial load
duke
parents:
diff changeset
1173 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1174 // Inputs:
a61af66fc99e Initial load
duke
parents:
diff changeset
1175 // from - source arrays
a61af66fc99e Initial load
duke
parents:
diff changeset
1176 // to - destination array aligned to 8-bytes
a61af66fc99e Initial load
duke
parents:
diff changeset
1177 // count - elements count to copy >= the count equivalent to 16 bytes
a61af66fc99e Initial load
duke
parents:
diff changeset
1178 // count_dec - elements count's decrement equivalent to 16 bytes
a61af66fc99e Initial load
duke
parents:
diff changeset
1179 // L_copy_bytes - copy exit label
a61af66fc99e Initial load
duke
parents:
diff changeset
1180 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1181 void copy_16_bytes_forward_with_shift(Register from, Register to,
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1182 Register count, int log2_elem_size, Label& L_copy_bytes) {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1183 Label L_aligned_copy, L_copy_last_bytes;
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1184 assert(log2_elem_size <= 3, "the following code should be changed");
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1185 int count_dec = 16>>log2_elem_size;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1186
a61af66fc99e Initial load
duke
parents:
diff changeset
1187 // if both arrays have the same alignment mod 8, do 8 bytes aligned copy
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1188 __ andcc(from, 7, G1); // misaligned bytes
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1189 __ br(Assembler::zero, false, Assembler::pt, L_aligned_copy);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1190 __ delayed()->nop();
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1191
a61af66fc99e Initial load
duke
parents:
diff changeset
1192 const Register left_shift = G1; // left shift bit counter
a61af66fc99e Initial load
duke
parents:
diff changeset
1193 const Register right_shift = G5; // right shift bit counter
a61af66fc99e Initial load
duke
parents:
diff changeset
1194
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1195 __ sll(G1, LogBitsPerByte, left_shift);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1196 __ mov(64, right_shift);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1197 __ sub(right_shift, left_shift, right_shift);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1198
a61af66fc99e Initial load
duke
parents:
diff changeset
1199 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1200 // Load 2 aligned 8-bytes chunks and use one from previous iteration
a61af66fc99e Initial load
duke
parents:
diff changeset
1201 // to form 2 aligned 8-bytes chunks to store.
a61af66fc99e Initial load
duke
parents:
diff changeset
1202 //
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1203 __ dec(count, count_dec); // Pre-decrement 'count'
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1204 __ andn(from, 7, from); // Align address
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1205 __ ldx(from, 0, O3);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1206 __ inc(from, 8);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1207 __ sllx(O3, left_shift, O3);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1208
17939
0fb5b60ab4a2 8022070: Compilation error in stubGenerator_sparc.cpp with some compilers
mikael
parents: 17910
diff changeset
1209 disjoint_copy_core(from, to, count, log2_elem_size, 16, &StubGenerator::copy_16_bytes_shift_loop);
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1210
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1211 __ inccc(count, count_dec>>1 ); // + 8 bytes
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1212 __ brx(Assembler::negative, true, Assembler::pn, L_copy_last_bytes);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1213 __ delayed()->inc(count, count_dec>>1); // restore 'count'
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1214
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1215 // copy 8 bytes, part of them already loaded in O3
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1216 __ ldx(from, 0, O4);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1217 __ inc(to, 8);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1218 __ inc(from, 8);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1219 __ srlx(O4, right_shift, G3);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1220 __ bset(O3, G3);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1221 __ stx(G3, to, -8);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1222
a61af66fc99e Initial load
duke
parents:
diff changeset
1223 __ BIND(L_copy_last_bytes);
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1224 __ srl(right_shift, LogBitsPerByte, right_shift); // misaligned bytes
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1225 __ br(Assembler::always, false, Assembler::pt, L_copy_bytes);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1226 __ delayed()->sub(from, right_shift, from); // restore address
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1227
a61af66fc99e Initial load
duke
parents:
diff changeset
1228 __ BIND(L_aligned_copy);
a61af66fc99e Initial load
duke
parents:
diff changeset
1229 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1230
a61af66fc99e Initial load
duke
parents:
diff changeset
1231 // Copy big chunks backward with shift
a61af66fc99e Initial load
duke
parents:
diff changeset
1232 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1233 // Inputs:
a61af66fc99e Initial load
duke
parents:
diff changeset
1234 // end_from - source arrays end address
a61af66fc99e Initial load
duke
parents:
diff changeset
1235 // end_to - destination array end address aligned to 8-bytes
a61af66fc99e Initial load
duke
parents:
diff changeset
1236 // count - elements count to copy >= the count equivalent to 16 bytes
a61af66fc99e Initial load
duke
parents:
diff changeset
1237 // count_dec - elements count's decrement equivalent to 16 bytes
a61af66fc99e Initial load
duke
parents:
diff changeset
1238 // L_aligned_copy - aligned copy exit label
a61af66fc99e Initial load
duke
parents:
diff changeset
1239 // L_copy_bytes - copy exit label
a61af66fc99e Initial load
duke
parents:
diff changeset
1240 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1241 void copy_16_bytes_backward_with_shift(Register end_from, Register end_to,
a61af66fc99e Initial load
duke
parents:
diff changeset
1242 Register count, int count_dec,
a61af66fc99e Initial load
duke
parents:
diff changeset
1243 Label& L_aligned_copy, Label& L_copy_bytes) {
a61af66fc99e Initial load
duke
parents:
diff changeset
1244 Label L_loop, L_copy_last_bytes;
a61af66fc99e Initial load
duke
parents:
diff changeset
1245
a61af66fc99e Initial load
duke
parents:
diff changeset
1246 // if both arrays have the same alignment mod 8, do 8 bytes aligned copy
a61af66fc99e Initial load
duke
parents:
diff changeset
1247 __ andcc(end_from, 7, G1); // misaligned bytes
a61af66fc99e Initial load
duke
parents:
diff changeset
1248 __ br(Assembler::zero, false, Assembler::pt, L_aligned_copy);
a61af66fc99e Initial load
duke
parents:
diff changeset
1249 __ delayed()->deccc(count, count_dec); // Pre-decrement 'count'
a61af66fc99e Initial load
duke
parents:
diff changeset
1250
a61af66fc99e Initial load
duke
parents:
diff changeset
1251 const Register left_shift = G1; // left shift bit counter
a61af66fc99e Initial load
duke
parents:
diff changeset
1252 const Register right_shift = G5; // right shift bit counter
a61af66fc99e Initial load
duke
parents:
diff changeset
1253
a61af66fc99e Initial load
duke
parents:
diff changeset
1254 __ sll(G1, LogBitsPerByte, left_shift);
a61af66fc99e Initial load
duke
parents:
diff changeset
1255 __ mov(64, right_shift);
a61af66fc99e Initial load
duke
parents:
diff changeset
1256 __ sub(right_shift, left_shift, right_shift);
a61af66fc99e Initial load
duke
parents:
diff changeset
1257
a61af66fc99e Initial load
duke
parents:
diff changeset
1258 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1259 // Load 2 aligned 8-bytes chunks and use one from previous iteration
a61af66fc99e Initial load
duke
parents:
diff changeset
1260 // to form 2 aligned 8-bytes chunks to store.
a61af66fc99e Initial load
duke
parents:
diff changeset
1261 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1262 __ andn(end_from, 7, end_from); // Align address
a61af66fc99e Initial load
duke
parents:
diff changeset
1263 __ ldx(end_from, 0, O3);
1365
6476042f815c 6940701: Don't align loops in stubs for Niagara sparc
kvn
parents: 1364
diff changeset
1264 __ align(OptoLoopAlignment);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1265 __ BIND(L_loop);
a61af66fc99e Initial load
duke
parents:
diff changeset
1266 __ ldx(end_from, -8, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1267 __ deccc(count, count_dec); // Can we do next iteration after this one?
a61af66fc99e Initial load
duke
parents:
diff changeset
1268 __ ldx(end_from, -16, G4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1269 __ dec(end_to, 16);
a61af66fc99e Initial load
duke
parents:
diff changeset
1270 __ dec(end_from, 16);
a61af66fc99e Initial load
duke
parents:
diff changeset
1271 __ srlx(O3, right_shift, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1272 __ sllx(O4, left_shift, G3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1273 __ bset(G3, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1274 __ stx(O3, end_to, 8);
a61af66fc99e Initial load
duke
parents:
diff changeset
1275 __ srlx(O4, right_shift, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1276 __ sllx(G4, left_shift, G3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1277 __ bset(G3, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1278 __ stx(O4, end_to, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
1279 __ brx(Assembler::greaterEqual, false, Assembler::pt, L_loop);
a61af66fc99e Initial load
duke
parents:
diff changeset
1280 __ delayed()->mov(G4, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1281
a61af66fc99e Initial load
duke
parents:
diff changeset
1282 __ inccc(count, count_dec>>1 ); // + 8 bytes
a61af66fc99e Initial load
duke
parents:
diff changeset
1283 __ brx(Assembler::negative, true, Assembler::pn, L_copy_last_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
1284 __ delayed()->inc(count, count_dec>>1); // restore 'count'
a61af66fc99e Initial load
duke
parents:
diff changeset
1285
a61af66fc99e Initial load
duke
parents:
diff changeset
1286 // copy 8 bytes, part of them already loaded in O3
a61af66fc99e Initial load
duke
parents:
diff changeset
1287 __ ldx(end_from, -8, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1288 __ dec(end_to, 8);
a61af66fc99e Initial load
duke
parents:
diff changeset
1289 __ dec(end_from, 8);
a61af66fc99e Initial load
duke
parents:
diff changeset
1290 __ srlx(O3, right_shift, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1291 __ sllx(O4, left_shift, G3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1292 __ bset(O3, G3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1293 __ stx(G3, end_to, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
1294
a61af66fc99e Initial load
duke
parents:
diff changeset
1295 __ BIND(L_copy_last_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
1296 __ srl(left_shift, LogBitsPerByte, left_shift); // misaligned bytes
a61af66fc99e Initial load
duke
parents:
diff changeset
1297 __ br(Assembler::always, false, Assembler::pt, L_copy_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
1298 __ delayed()->add(end_from, left_shift, end_from); // restore address
a61af66fc99e Initial load
duke
parents:
diff changeset
1299 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1300
a61af66fc99e Initial load
duke
parents:
diff changeset
1301 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1302 // Generate stub for disjoint byte copy. If "aligned" is true, the
a61af66fc99e Initial load
duke
parents:
diff changeset
1303 // "from" and "to" addresses are assumed to be heapword aligned.
a61af66fc99e Initial load
duke
parents:
diff changeset
1304 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1305 // Arguments for generated stub:
a61af66fc99e Initial load
duke
parents:
diff changeset
1306 // from: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
1307 // to: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
1308 // count: O2 treated as signed
a61af66fc99e Initial load
duke
parents:
diff changeset
1309 //
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1310 address generate_disjoint_byte_copy(bool aligned, address *entry, const char *name) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1311 __ align(CodeEntryAlignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
1312 StubCodeMark mark(this, "StubRoutines", name);
a61af66fc99e Initial load
duke
parents:
diff changeset
1313 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
1314
a61af66fc99e Initial load
duke
parents:
diff changeset
1315 Label L_skip_alignment, L_align;
a61af66fc99e Initial load
duke
parents:
diff changeset
1316 Label L_copy_byte, L_copy_byte_loop, L_exit;
a61af66fc99e Initial load
duke
parents:
diff changeset
1317
a61af66fc99e Initial load
duke
parents:
diff changeset
1318 const Register from = O0; // source array address
a61af66fc99e Initial load
duke
parents:
diff changeset
1319 const Register to = O1; // destination array address
a61af66fc99e Initial load
duke
parents:
diff changeset
1320 const Register count = O2; // elements count
a61af66fc99e Initial load
duke
parents:
diff changeset
1321 const Register offset = O5; // offset from start of arrays
a61af66fc99e Initial load
duke
parents:
diff changeset
1322 // O3, O4, G3, G4 are used as temp registers
a61af66fc99e Initial load
duke
parents:
diff changeset
1323
a61af66fc99e Initial load
duke
parents:
diff changeset
1324 assert_clean_int(count, O3); // Make sure 'count' is clean int.
a61af66fc99e Initial load
duke
parents:
diff changeset
1325
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1326 if (entry != NULL) {
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1327 *entry = __ pc();
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1328 // caller can pass a 64-bit byte count here (from Unsafe.copyMemory)
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1329 BLOCK_COMMENT("Entry:");
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1330 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1331
a61af66fc99e Initial load
duke
parents:
diff changeset
1332 // for short arrays, just do single element copy
a61af66fc99e Initial load
duke
parents:
diff changeset
1333 __ cmp(count, 23); // 16 + 7
a61af66fc99e Initial load
duke
parents:
diff changeset
1334 __ brx(Assembler::less, false, Assembler::pn, L_copy_byte);
a61af66fc99e Initial load
duke
parents:
diff changeset
1335 __ delayed()->mov(G0, offset);
a61af66fc99e Initial load
duke
parents:
diff changeset
1336
a61af66fc99e Initial load
duke
parents:
diff changeset
1337 if (aligned) {
a61af66fc99e Initial load
duke
parents:
diff changeset
1338 // 'aligned' == true when it is known statically during compilation
a61af66fc99e Initial load
duke
parents:
diff changeset
1339 // of this arraycopy call site that both 'from' and 'to' addresses
a61af66fc99e Initial load
duke
parents:
diff changeset
1340 // are HeapWordSize aligned (see LibraryCallKit::basictype2arraycopy()).
a61af66fc99e Initial load
duke
parents:
diff changeset
1341 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1342 // Aligned arrays have 4 bytes alignment in 32-bits VM
a61af66fc99e Initial load
duke
parents:
diff changeset
1343 // and 8 bytes - in 64-bits VM. So we do it only for 32-bits VM
a61af66fc99e Initial load
duke
parents:
diff changeset
1344 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1345 #ifndef _LP64
a61af66fc99e Initial load
duke
parents:
diff changeset
1346 // copy a 4-bytes word if necessary to align 'to' to 8 bytes
a61af66fc99e Initial load
duke
parents:
diff changeset
1347 __ andcc(to, 7, G0);
a61af66fc99e Initial load
duke
parents:
diff changeset
1348 __ br(Assembler::zero, false, Assembler::pn, L_skip_alignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
1349 __ delayed()->ld(from, 0, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1350 __ inc(from, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1351 __ inc(to, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1352 __ dec(count, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1353 __ st(O3, to, -4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1354 __ BIND(L_skip_alignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
1355 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
1356 } else {
a61af66fc99e Initial load
duke
parents:
diff changeset
1357 // copy bytes to align 'to' on 8 byte boundary
a61af66fc99e Initial load
duke
parents:
diff changeset
1358 __ andcc(to, 7, G1); // misaligned bytes
a61af66fc99e Initial load
duke
parents:
diff changeset
1359 __ br(Assembler::zero, false, Assembler::pt, L_skip_alignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
1360 __ delayed()->neg(G1);
a61af66fc99e Initial load
duke
parents:
diff changeset
1361 __ inc(G1, 8); // bytes need to copy to next 8-bytes alignment
a61af66fc99e Initial load
duke
parents:
diff changeset
1362 __ sub(count, G1, count);
a61af66fc99e Initial load
duke
parents:
diff changeset
1363 __ BIND(L_align);
a61af66fc99e Initial load
duke
parents:
diff changeset
1364 __ ldub(from, 0, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1365 __ deccc(G1);
a61af66fc99e Initial load
duke
parents:
diff changeset
1366 __ inc(from);
a61af66fc99e Initial load
duke
parents:
diff changeset
1367 __ stb(O3, to, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
1368 __ br(Assembler::notZero, false, Assembler::pt, L_align);
a61af66fc99e Initial load
duke
parents:
diff changeset
1369 __ delayed()->inc(to);
a61af66fc99e Initial load
duke
parents:
diff changeset
1370 __ BIND(L_skip_alignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
1371 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1372 #ifdef _LP64
a61af66fc99e Initial load
duke
parents:
diff changeset
1373 if (!aligned)
a61af66fc99e Initial load
duke
parents:
diff changeset
1374 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
1375 {
a61af66fc99e Initial load
duke
parents:
diff changeset
1376 // Copy with shift 16 bytes per iteration if arrays do not have
a61af66fc99e Initial load
duke
parents:
diff changeset
1377 // the same alignment mod 8, otherwise fall through to the next
a61af66fc99e Initial load
duke
parents:
diff changeset
1378 // code for aligned copy.
a61af66fc99e Initial load
duke
parents:
diff changeset
1379 // The compare above (count >= 23) guarantes 'count' >= 16 bytes.
a61af66fc99e Initial load
duke
parents:
diff changeset
1380 // Also jump over aligned copy after the copy with shift completed.
a61af66fc99e Initial load
duke
parents:
diff changeset
1381
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1382 copy_16_bytes_forward_with_shift(from, to, count, 0, L_copy_byte);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1383 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1384
a61af66fc99e Initial load
duke
parents:
diff changeset
1385 // Both array are 8 bytes aligned, copy 16 bytes at a time
a61af66fc99e Initial load
duke
parents:
diff changeset
1386 __ and3(count, 7, G4); // Save count
a61af66fc99e Initial load
duke
parents:
diff changeset
1387 __ srl(count, 3, count);
a61af66fc99e Initial load
duke
parents:
diff changeset
1388 generate_disjoint_long_copy_core(aligned);
a61af66fc99e Initial load
duke
parents:
diff changeset
1389 __ mov(G4, count); // Restore count
a61af66fc99e Initial load
duke
parents:
diff changeset
1390
a61af66fc99e Initial load
duke
parents:
diff changeset
1391 // copy tailing bytes
a61af66fc99e Initial load
duke
parents:
diff changeset
1392 __ BIND(L_copy_byte);
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
1393 __ cmp_and_br_short(count, 0, Assembler::equal, Assembler::pt, L_exit);
1365
6476042f815c 6940701: Don't align loops in stubs for Niagara sparc
kvn
parents: 1364
diff changeset
1394 __ align(OptoLoopAlignment);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1395 __ BIND(L_copy_byte_loop);
a61af66fc99e Initial load
duke
parents:
diff changeset
1396 __ ldub(from, offset, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1397 __ deccc(count);
a61af66fc99e Initial load
duke
parents:
diff changeset
1398 __ stb(O3, to, offset);
a61af66fc99e Initial load
duke
parents:
diff changeset
1399 __ brx(Assembler::notZero, false, Assembler::pt, L_copy_byte_loop);
a61af66fc99e Initial load
duke
parents:
diff changeset
1400 __ delayed()->inc(offset);
a61af66fc99e Initial load
duke
parents:
diff changeset
1401
a61af66fc99e Initial load
duke
parents:
diff changeset
1402 __ BIND(L_exit);
a61af66fc99e Initial load
duke
parents:
diff changeset
1403 // O3, O4 are used as temp registers
a61af66fc99e Initial load
duke
parents:
diff changeset
1404 inc_counter_np(SharedRuntime::_jbyte_array_copy_ctr, O3, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1405 __ retl();
a61af66fc99e Initial load
duke
parents:
diff changeset
1406 __ delayed()->mov(G0, O0); // return 0
a61af66fc99e Initial load
duke
parents:
diff changeset
1407 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
1408 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1409
a61af66fc99e Initial load
duke
parents:
diff changeset
1410 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1411 // Generate stub for conjoint byte copy. If "aligned" is true, the
a61af66fc99e Initial load
duke
parents:
diff changeset
1412 // "from" and "to" addresses are assumed to be heapword aligned.
a61af66fc99e Initial load
duke
parents:
diff changeset
1413 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1414 // Arguments for generated stub:
a61af66fc99e Initial load
duke
parents:
diff changeset
1415 // from: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
1416 // to: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
1417 // count: O2 treated as signed
a61af66fc99e Initial load
duke
parents:
diff changeset
1418 //
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1419 address generate_conjoint_byte_copy(bool aligned, address nooverlap_target,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1420 address *entry, const char *name) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1421 // Do reverse copy.
a61af66fc99e Initial load
duke
parents:
diff changeset
1422
a61af66fc99e Initial load
duke
parents:
diff changeset
1423 __ align(CodeEntryAlignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
1424 StubCodeMark mark(this, "StubRoutines", name);
a61af66fc99e Initial load
duke
parents:
diff changeset
1425 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
1426
a61af66fc99e Initial load
duke
parents:
diff changeset
1427 Label L_skip_alignment, L_align, L_aligned_copy;
a61af66fc99e Initial load
duke
parents:
diff changeset
1428 Label L_copy_byte, L_copy_byte_loop, L_exit;
a61af66fc99e Initial load
duke
parents:
diff changeset
1429
a61af66fc99e Initial load
duke
parents:
diff changeset
1430 const Register from = O0; // source array address
a61af66fc99e Initial load
duke
parents:
diff changeset
1431 const Register to = O1; // destination array address
a61af66fc99e Initial load
duke
parents:
diff changeset
1432 const Register count = O2; // elements count
a61af66fc99e Initial load
duke
parents:
diff changeset
1433 const Register end_from = from; // source array end address
a61af66fc99e Initial load
duke
parents:
diff changeset
1434 const Register end_to = to; // destination array end address
a61af66fc99e Initial load
duke
parents:
diff changeset
1435
a61af66fc99e Initial load
duke
parents:
diff changeset
1436 assert_clean_int(count, O3); // Make sure 'count' is clean int.
a61af66fc99e Initial load
duke
parents:
diff changeset
1437
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1438 if (entry != NULL) {
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1439 *entry = __ pc();
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1440 // caller can pass a 64-bit byte count here (from Unsafe.copyMemory)
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1441 BLOCK_COMMENT("Entry:");
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1442 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1443
a61af66fc99e Initial load
duke
parents:
diff changeset
1444 array_overlap_test(nooverlap_target, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
1445
a61af66fc99e Initial load
duke
parents:
diff changeset
1446 __ add(to, count, end_to); // offset after last copied element
a61af66fc99e Initial load
duke
parents:
diff changeset
1447
a61af66fc99e Initial load
duke
parents:
diff changeset
1448 // for short arrays, just do single element copy
a61af66fc99e Initial load
duke
parents:
diff changeset
1449 __ cmp(count, 23); // 16 + 7
a61af66fc99e Initial load
duke
parents:
diff changeset
1450 __ brx(Assembler::less, false, Assembler::pn, L_copy_byte);
a61af66fc99e Initial load
duke
parents:
diff changeset
1451 __ delayed()->add(from, count, end_from);
a61af66fc99e Initial load
duke
parents:
diff changeset
1452
a61af66fc99e Initial load
duke
parents:
diff changeset
1453 {
a61af66fc99e Initial load
duke
parents:
diff changeset
1454 // Align end of arrays since they could be not aligned even
a61af66fc99e Initial load
duke
parents:
diff changeset
1455 // when arrays itself are aligned.
a61af66fc99e Initial load
duke
parents:
diff changeset
1456
a61af66fc99e Initial load
duke
parents:
diff changeset
1457 // copy bytes to align 'end_to' on 8 byte boundary
a61af66fc99e Initial load
duke
parents:
diff changeset
1458 __ andcc(end_to, 7, G1); // misaligned bytes
a61af66fc99e Initial load
duke
parents:
diff changeset
1459 __ br(Assembler::zero, false, Assembler::pt, L_skip_alignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
1460 __ delayed()->nop();
a61af66fc99e Initial load
duke
parents:
diff changeset
1461 __ sub(count, G1, count);
a61af66fc99e Initial load
duke
parents:
diff changeset
1462 __ BIND(L_align);
a61af66fc99e Initial load
duke
parents:
diff changeset
1463 __ dec(end_from);
a61af66fc99e Initial load
duke
parents:
diff changeset
1464 __ dec(end_to);
a61af66fc99e Initial load
duke
parents:
diff changeset
1465 __ ldub(end_from, 0, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1466 __ deccc(G1);
a61af66fc99e Initial load
duke
parents:
diff changeset
1467 __ brx(Assembler::notZero, false, Assembler::pt, L_align);
a61af66fc99e Initial load
duke
parents:
diff changeset
1468 __ delayed()->stb(O3, end_to, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
1469 __ BIND(L_skip_alignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
1470 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1471 #ifdef _LP64
a61af66fc99e Initial load
duke
parents:
diff changeset
1472 if (aligned) {
a61af66fc99e Initial load
duke
parents:
diff changeset
1473 // Both arrays are aligned to 8-bytes in 64-bits VM.
a61af66fc99e Initial load
duke
parents:
diff changeset
1474 // The 'count' is decremented in copy_16_bytes_backward_with_shift()
a61af66fc99e Initial load
duke
parents:
diff changeset
1475 // in unaligned case.
a61af66fc99e Initial load
duke
parents:
diff changeset
1476 __ dec(count, 16);
a61af66fc99e Initial load
duke
parents:
diff changeset
1477 } else
a61af66fc99e Initial load
duke
parents:
diff changeset
1478 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
1479 {
a61af66fc99e Initial load
duke
parents:
diff changeset
1480 // Copy with shift 16 bytes per iteration if arrays do not have
a61af66fc99e Initial load
duke
parents:
diff changeset
1481 // the same alignment mod 8, otherwise jump to the next
a61af66fc99e Initial load
duke
parents:
diff changeset
1482 // code for aligned copy (and substracting 16 from 'count' before jump).
a61af66fc99e Initial load
duke
parents:
diff changeset
1483 // The compare above (count >= 11) guarantes 'count' >= 16 bytes.
a61af66fc99e Initial load
duke
parents:
diff changeset
1484 // Also jump over aligned copy after the copy with shift completed.
a61af66fc99e Initial load
duke
parents:
diff changeset
1485
a61af66fc99e Initial load
duke
parents:
diff changeset
1486 copy_16_bytes_backward_with_shift(end_from, end_to, count, 16,
a61af66fc99e Initial load
duke
parents:
diff changeset
1487 L_aligned_copy, L_copy_byte);
a61af66fc99e Initial load
duke
parents:
diff changeset
1488 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1489 // copy 4 elements (16 bytes) at a time
1365
6476042f815c 6940701: Don't align loops in stubs for Niagara sparc
kvn
parents: 1364
diff changeset
1490 __ align(OptoLoopAlignment);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1491 __ BIND(L_aligned_copy);
a61af66fc99e Initial load
duke
parents:
diff changeset
1492 __ dec(end_from, 16);
a61af66fc99e Initial load
duke
parents:
diff changeset
1493 __ ldx(end_from, 8, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1494 __ ldx(end_from, 0, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1495 __ dec(end_to, 16);
a61af66fc99e Initial load
duke
parents:
diff changeset
1496 __ deccc(count, 16);
a61af66fc99e Initial load
duke
parents:
diff changeset
1497 __ stx(O3, end_to, 8);
a61af66fc99e Initial load
duke
parents:
diff changeset
1498 __ brx(Assembler::greaterEqual, false, Assembler::pt, L_aligned_copy);
a61af66fc99e Initial load
duke
parents:
diff changeset
1499 __ delayed()->stx(O4, end_to, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
1500 __ inc(count, 16);
a61af66fc99e Initial load
duke
parents:
diff changeset
1501
a61af66fc99e Initial load
duke
parents:
diff changeset
1502 // copy 1 element (2 bytes) at a time
a61af66fc99e Initial load
duke
parents:
diff changeset
1503 __ BIND(L_copy_byte);
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
1504 __ cmp_and_br_short(count, 0, Assembler::equal, Assembler::pt, L_exit);
1365
6476042f815c 6940701: Don't align loops in stubs for Niagara sparc
kvn
parents: 1364
diff changeset
1505 __ align(OptoLoopAlignment);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1506 __ BIND(L_copy_byte_loop);
a61af66fc99e Initial load
duke
parents:
diff changeset
1507 __ dec(end_from);
a61af66fc99e Initial load
duke
parents:
diff changeset
1508 __ dec(end_to);
a61af66fc99e Initial load
duke
parents:
diff changeset
1509 __ ldub(end_from, 0, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1510 __ deccc(count);
a61af66fc99e Initial load
duke
parents:
diff changeset
1511 __ brx(Assembler::greater, false, Assembler::pt, L_copy_byte_loop);
a61af66fc99e Initial load
duke
parents:
diff changeset
1512 __ delayed()->stb(O4, end_to, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
1513
a61af66fc99e Initial load
duke
parents:
diff changeset
1514 __ BIND(L_exit);
a61af66fc99e Initial load
duke
parents:
diff changeset
1515 // O3, O4 are used as temp registers
a61af66fc99e Initial load
duke
parents:
diff changeset
1516 inc_counter_np(SharedRuntime::_jbyte_array_copy_ctr, O3, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1517 __ retl();
a61af66fc99e Initial load
duke
parents:
diff changeset
1518 __ delayed()->mov(G0, O0); // return 0
a61af66fc99e Initial load
duke
parents:
diff changeset
1519 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
1520 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1521
a61af66fc99e Initial load
duke
parents:
diff changeset
1522 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1523 // Generate stub for disjoint short copy. If "aligned" is true, the
a61af66fc99e Initial load
duke
parents:
diff changeset
1524 // "from" and "to" addresses are assumed to be heapword aligned.
a61af66fc99e Initial load
duke
parents:
diff changeset
1525 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1526 // Arguments for generated stub:
a61af66fc99e Initial load
duke
parents:
diff changeset
1527 // from: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
1528 // to: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
1529 // count: O2 treated as signed
a61af66fc99e Initial load
duke
parents:
diff changeset
1530 //
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1531 address generate_disjoint_short_copy(bool aligned, address *entry, const char * name) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1532 __ align(CodeEntryAlignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
1533 StubCodeMark mark(this, "StubRoutines", name);
a61af66fc99e Initial load
duke
parents:
diff changeset
1534 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
1535
a61af66fc99e Initial load
duke
parents:
diff changeset
1536 Label L_skip_alignment, L_skip_alignment2;
a61af66fc99e Initial load
duke
parents:
diff changeset
1537 Label L_copy_2_bytes, L_copy_2_bytes_loop, L_exit;
a61af66fc99e Initial load
duke
parents:
diff changeset
1538
a61af66fc99e Initial load
duke
parents:
diff changeset
1539 const Register from = O0; // source array address
a61af66fc99e Initial load
duke
parents:
diff changeset
1540 const Register to = O1; // destination array address
a61af66fc99e Initial load
duke
parents:
diff changeset
1541 const Register count = O2; // elements count
a61af66fc99e Initial load
duke
parents:
diff changeset
1542 const Register offset = O5; // offset from start of arrays
a61af66fc99e Initial load
duke
parents:
diff changeset
1543 // O3, O4, G3, G4 are used as temp registers
a61af66fc99e Initial load
duke
parents:
diff changeset
1544
a61af66fc99e Initial load
duke
parents:
diff changeset
1545 assert_clean_int(count, O3); // Make sure 'count' is clean int.
a61af66fc99e Initial load
duke
parents:
diff changeset
1546
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1547 if (entry != NULL) {
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1548 *entry = __ pc();
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1549 // caller can pass a 64-bit byte count here (from Unsafe.copyMemory)
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1550 BLOCK_COMMENT("Entry:");
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1551 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1552
a61af66fc99e Initial load
duke
parents:
diff changeset
1553 // for short arrays, just do single element copy
a61af66fc99e Initial load
duke
parents:
diff changeset
1554 __ cmp(count, 11); // 8 + 3 (22 bytes)
a61af66fc99e Initial load
duke
parents:
diff changeset
1555 __ brx(Assembler::less, false, Assembler::pn, L_copy_2_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
1556 __ delayed()->mov(G0, offset);
a61af66fc99e Initial load
duke
parents:
diff changeset
1557
a61af66fc99e Initial load
duke
parents:
diff changeset
1558 if (aligned) {
a61af66fc99e Initial load
duke
parents:
diff changeset
1559 // 'aligned' == true when it is known statically during compilation
a61af66fc99e Initial load
duke
parents:
diff changeset
1560 // of this arraycopy call site that both 'from' and 'to' addresses
a61af66fc99e Initial load
duke
parents:
diff changeset
1561 // are HeapWordSize aligned (see LibraryCallKit::basictype2arraycopy()).
a61af66fc99e Initial load
duke
parents:
diff changeset
1562 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1563 // Aligned arrays have 4 bytes alignment in 32-bits VM
a61af66fc99e Initial load
duke
parents:
diff changeset
1564 // and 8 bytes - in 64-bits VM.
a61af66fc99e Initial load
duke
parents:
diff changeset
1565 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1566 #ifndef _LP64
a61af66fc99e Initial load
duke
parents:
diff changeset
1567 // copy a 2-elements word if necessary to align 'to' to 8 bytes
a61af66fc99e Initial load
duke
parents:
diff changeset
1568 __ andcc(to, 7, G0);
a61af66fc99e Initial load
duke
parents:
diff changeset
1569 __ br(Assembler::zero, false, Assembler::pt, L_skip_alignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
1570 __ delayed()->ld(from, 0, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1571 __ inc(from, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1572 __ inc(to, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1573 __ dec(count, 2);
a61af66fc99e Initial load
duke
parents:
diff changeset
1574 __ st(O3, to, -4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1575 __ BIND(L_skip_alignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
1576 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
1577 } else {
a61af66fc99e Initial load
duke
parents:
diff changeset
1578 // copy 1 element if necessary to align 'to' on an 4 bytes
a61af66fc99e Initial load
duke
parents:
diff changeset
1579 __ andcc(to, 3, G0);
a61af66fc99e Initial load
duke
parents:
diff changeset
1580 __ br(Assembler::zero, false, Assembler::pt, L_skip_alignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
1581 __ delayed()->lduh(from, 0, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1582 __ inc(from, 2);
a61af66fc99e Initial load
duke
parents:
diff changeset
1583 __ inc(to, 2);
a61af66fc99e Initial load
duke
parents:
diff changeset
1584 __ dec(count);
a61af66fc99e Initial load
duke
parents:
diff changeset
1585 __ sth(O3, to, -2);
a61af66fc99e Initial load
duke
parents:
diff changeset
1586 __ BIND(L_skip_alignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
1587
a61af66fc99e Initial load
duke
parents:
diff changeset
1588 // copy 2 elements to align 'to' on an 8 byte boundary
a61af66fc99e Initial load
duke
parents:
diff changeset
1589 __ andcc(to, 7, G0);
a61af66fc99e Initial load
duke
parents:
diff changeset
1590 __ br(Assembler::zero, false, Assembler::pn, L_skip_alignment2);
a61af66fc99e Initial load
duke
parents:
diff changeset
1591 __ delayed()->lduh(from, 0, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1592 __ dec(count, 2);
a61af66fc99e Initial load
duke
parents:
diff changeset
1593 __ lduh(from, 2, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1594 __ inc(from, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1595 __ inc(to, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1596 __ sth(O3, to, -4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1597 __ sth(O4, to, -2);
a61af66fc99e Initial load
duke
parents:
diff changeset
1598 __ BIND(L_skip_alignment2);
a61af66fc99e Initial load
duke
parents:
diff changeset
1599 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1600 #ifdef _LP64
a61af66fc99e Initial load
duke
parents:
diff changeset
1601 if (!aligned)
a61af66fc99e Initial load
duke
parents:
diff changeset
1602 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
1603 {
a61af66fc99e Initial load
duke
parents:
diff changeset
1604 // Copy with shift 16 bytes per iteration if arrays do not have
a61af66fc99e Initial load
duke
parents:
diff changeset
1605 // the same alignment mod 8, otherwise fall through to the next
a61af66fc99e Initial load
duke
parents:
diff changeset
1606 // code for aligned copy.
a61af66fc99e Initial load
duke
parents:
diff changeset
1607 // The compare above (count >= 11) guarantes 'count' >= 16 bytes.
a61af66fc99e Initial load
duke
parents:
diff changeset
1608 // Also jump over aligned copy after the copy with shift completed.
a61af66fc99e Initial load
duke
parents:
diff changeset
1609
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1610 copy_16_bytes_forward_with_shift(from, to, count, 1, L_copy_2_bytes);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1611 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1612
a61af66fc99e Initial load
duke
parents:
diff changeset
1613 // Both array are 8 bytes aligned, copy 16 bytes at a time
a61af66fc99e Initial load
duke
parents:
diff changeset
1614 __ and3(count, 3, G4); // Save
a61af66fc99e Initial load
duke
parents:
diff changeset
1615 __ srl(count, 2, count);
a61af66fc99e Initial load
duke
parents:
diff changeset
1616 generate_disjoint_long_copy_core(aligned);
a61af66fc99e Initial load
duke
parents:
diff changeset
1617 __ mov(G4, count); // restore
a61af66fc99e Initial load
duke
parents:
diff changeset
1618
a61af66fc99e Initial load
duke
parents:
diff changeset
1619 // copy 1 element at a time
a61af66fc99e Initial load
duke
parents:
diff changeset
1620 __ BIND(L_copy_2_bytes);
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
1621 __ cmp_and_br_short(count, 0, Assembler::equal, Assembler::pt, L_exit);
1365
6476042f815c 6940701: Don't align loops in stubs for Niagara sparc
kvn
parents: 1364
diff changeset
1622 __ align(OptoLoopAlignment);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1623 __ BIND(L_copy_2_bytes_loop);
a61af66fc99e Initial load
duke
parents:
diff changeset
1624 __ lduh(from, offset, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1625 __ deccc(count);
a61af66fc99e Initial load
duke
parents:
diff changeset
1626 __ sth(O3, to, offset);
a61af66fc99e Initial load
duke
parents:
diff changeset
1627 __ brx(Assembler::notZero, false, Assembler::pt, L_copy_2_bytes_loop);
a61af66fc99e Initial load
duke
parents:
diff changeset
1628 __ delayed()->inc(offset, 2);
a61af66fc99e Initial load
duke
parents:
diff changeset
1629
a61af66fc99e Initial load
duke
parents:
diff changeset
1630 __ BIND(L_exit);
a61af66fc99e Initial load
duke
parents:
diff changeset
1631 // O3, O4 are used as temp registers
a61af66fc99e Initial load
duke
parents:
diff changeset
1632 inc_counter_np(SharedRuntime::_jshort_array_copy_ctr, O3, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1633 __ retl();
a61af66fc99e Initial load
duke
parents:
diff changeset
1634 __ delayed()->mov(G0, O0); // return 0
a61af66fc99e Initial load
duke
parents:
diff changeset
1635 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
1636 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1637
a61af66fc99e Initial load
duke
parents:
diff changeset
1638 //
1763
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1639 // Generate stub for disjoint short fill. If "aligned" is true, the
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1640 // "to" address is assumed to be heapword aligned.
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1641 //
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1642 // Arguments for generated stub:
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1643 // to: O0
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1644 // value: O1
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1645 // count: O2 treated as signed
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1646 //
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1647 address generate_fill(BasicType t, bool aligned, const char* name) {
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1648 __ align(CodeEntryAlignment);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1649 StubCodeMark mark(this, "StubRoutines", name);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1650 address start = __ pc();
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1651
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1652 const Register to = O0; // source array address
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1653 const Register value = O1; // fill value
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1654 const Register count = O2; // elements count
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1655 // O3 is used as a temp register
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1656
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1657 assert_clean_int(count, O3); // Make sure 'count' is clean int.
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1658
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1659 Label L_exit, L_skip_align1, L_skip_align2, L_fill_byte;
1794
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1660 Label L_fill_2_bytes, L_fill_elements, L_fill_32_bytes;
1763
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1661
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1662 int shift = -1;
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1663 switch (t) {
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1664 case T_BYTE:
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1665 shift = 2;
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1666 break;
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1667 case T_SHORT:
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1668 shift = 1;
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1669 break;
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1670 case T_INT:
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1671 shift = 0;
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1672 break;
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1673 default: ShouldNotReachHere();
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1674 }
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1675
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1676 BLOCK_COMMENT("Entry:");
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1677
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1678 if (t == T_BYTE) {
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1679 // Zero extend value
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1680 __ and3(value, 0xff, value);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1681 __ sllx(value, 8, O3);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1682 __ or3(value, O3, value);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1683 }
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1684 if (t == T_SHORT) {
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1685 // Zero extend value
1794
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1686 __ sllx(value, 48, value);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1687 __ srlx(value, 48, value);
1763
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1688 }
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1689 if (t == T_BYTE || t == T_SHORT) {
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1690 __ sllx(value, 16, O3);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1691 __ or3(value, O3, value);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1692 }
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1693
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1694 __ cmp(count, 2<<shift); // Short arrays (< 8 bytes) fill by element
1794
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1695 __ brx(Assembler::lessUnsigned, false, Assembler::pn, L_fill_elements); // use unsigned cmp
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1696 __ delayed()->andcc(count, 1, G0);
1763
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1697
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1698 if (!aligned && (t == T_BYTE || t == T_SHORT)) {
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1699 // align source address at 4 bytes address boundary
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1700 if (t == T_BYTE) {
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1701 // One byte misalignment happens only for byte arrays
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1702 __ andcc(to, 1, G0);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1703 __ br(Assembler::zero, false, Assembler::pt, L_skip_align1);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1704 __ delayed()->nop();
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1705 __ stb(value, to, 0);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1706 __ inc(to, 1);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1707 __ dec(count, 1);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1708 __ BIND(L_skip_align1);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1709 }
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1710 // Two bytes misalignment happens only for byte and short (char) arrays
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1711 __ andcc(to, 2, G0);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1712 __ br(Assembler::zero, false, Assembler::pt, L_skip_align2);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1713 __ delayed()->nop();
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1714 __ sth(value, to, 0);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1715 __ inc(to, 2);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1716 __ dec(count, 1 << (shift - 1));
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1717 __ BIND(L_skip_align2);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1718 }
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1719 #ifdef _LP64
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1720 if (!aligned) {
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1721 #endif
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1722 // align to 8 bytes, we know we are 4 byte aligned to start
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1723 __ andcc(to, 7, G0);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1724 __ br(Assembler::zero, false, Assembler::pt, L_fill_32_bytes);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1725 __ delayed()->nop();
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1726 __ stw(value, to, 0);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1727 __ inc(to, 4);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1728 __ dec(count, 1 << shift);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1729 __ BIND(L_fill_32_bytes);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1730 #ifdef _LP64
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1731 }
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1732 #endif
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1733
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1734 if (t == T_INT) {
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1735 // Zero extend value
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1736 __ srl(value, 0, value);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1737 }
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1738 if (t == T_BYTE || t == T_SHORT || t == T_INT) {
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1739 __ sllx(value, 32, O3);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1740 __ or3(value, O3, value);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1741 }
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1742
1782
f353275af40e 6981773: incorrect fill value with OptimizeFill
never
parents: 1763
diff changeset
1743 Label L_check_fill_8_bytes;
f353275af40e 6981773: incorrect fill value with OptimizeFill
never
parents: 1763
diff changeset
1744 // Fill 32-byte chunks
f353275af40e 6981773: incorrect fill value with OptimizeFill
never
parents: 1763
diff changeset
1745 __ subcc(count, 8 << shift, count);
f353275af40e 6981773: incorrect fill value with OptimizeFill
never
parents: 1763
diff changeset
1746 __ brx(Assembler::less, false, Assembler::pt, L_check_fill_8_bytes);
f353275af40e 6981773: incorrect fill value with OptimizeFill
never
parents: 1763
diff changeset
1747 __ delayed()->nop();
f353275af40e 6981773: incorrect fill value with OptimizeFill
never
parents: 1763
diff changeset
1748
1794
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1749 Label L_fill_32_bytes_loop, L_fill_4_bytes;
1763
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1750 __ align(16);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1751 __ BIND(L_fill_32_bytes_loop);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1752
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1753 __ stx(value, to, 0);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1754 __ stx(value, to, 8);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1755 __ stx(value, to, 16);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1756 __ stx(value, to, 24);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1757
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1758 __ subcc(count, 8 << shift, count);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1759 __ brx(Assembler::greaterEqual, false, Assembler::pt, L_fill_32_bytes_loop);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1760 __ delayed()->add(to, 32, to);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1761
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1762 __ BIND(L_check_fill_8_bytes);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1763 __ addcc(count, 8 << shift, count);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1764 __ brx(Assembler::zero, false, Assembler::pn, L_exit);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1765 __ delayed()->subcc(count, 1 << (shift + 1), count);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1766 __ brx(Assembler::less, false, Assembler::pn, L_fill_4_bytes);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1767 __ delayed()->andcc(count, 1<<shift, G0);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1768
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1769 //
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1770 // length is too short, just fill 8 bytes at a time
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1771 //
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1772 Label L_fill_8_bytes_loop;
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1773 __ BIND(L_fill_8_bytes_loop);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1774 __ stx(value, to, 0);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1775 __ subcc(count, 1 << (shift + 1), count);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1776 __ brx(Assembler::greaterEqual, false, Assembler::pn, L_fill_8_bytes_loop);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1777 __ delayed()->add(to, 8, to);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1778
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1779 // fill trailing 4 bytes
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1780 __ andcc(count, 1<<shift, G0); // in delay slot of branches
1794
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1781 if (t == T_INT) {
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1782 __ BIND(L_fill_elements);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1783 }
1763
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1784 __ BIND(L_fill_4_bytes);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1785 __ brx(Assembler::zero, false, Assembler::pt, L_fill_2_bytes);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1786 if (t == T_BYTE || t == T_SHORT) {
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1787 __ delayed()->andcc(count, 1<<(shift-1), G0);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1788 } else {
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1789 __ delayed()->nop();
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1790 }
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1791 __ stw(value, to, 0);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1792 if (t == T_BYTE || t == T_SHORT) {
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1793 __ inc(to, 4);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1794 // fill trailing 2 bytes
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1795 __ andcc(count, 1<<(shift-1), G0); // in delay slot of branches
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1796 __ BIND(L_fill_2_bytes);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1797 __ brx(Assembler::zero, false, Assembler::pt, L_fill_byte);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1798 __ delayed()->andcc(count, 1, count);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1799 __ sth(value, to, 0);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1800 if (t == T_BYTE) {
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1801 __ inc(to, 2);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1802 // fill trailing byte
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1803 __ andcc(count, 1, count); // in delay slot of branches
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1804 __ BIND(L_fill_byte);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1805 __ brx(Assembler::zero, false, Assembler::pt, L_exit);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1806 __ delayed()->nop();
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1807 __ stb(value, to, 0);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1808 } else {
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1809 __ BIND(L_fill_byte);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1810 }
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1811 } else {
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1812 __ BIND(L_fill_2_bytes);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1813 }
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1814 __ BIND(L_exit);
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1815 __ retl();
1794
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1816 __ delayed()->nop();
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1817
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1818 // Handle copies less than 8 bytes. Int is handled elsewhere.
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1819 if (t == T_BYTE) {
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1820 __ BIND(L_fill_elements);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1821 Label L_fill_2, L_fill_4;
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1822 // in delay slot __ andcc(count, 1, G0);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1823 __ brx(Assembler::zero, false, Assembler::pt, L_fill_2);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1824 __ delayed()->andcc(count, 2, G0);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1825 __ stb(value, to, 0);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1826 __ inc(to, 1);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1827 __ BIND(L_fill_2);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1828 __ brx(Assembler::zero, false, Assembler::pt, L_fill_4);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1829 __ delayed()->andcc(count, 4, G0);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1830 __ stb(value, to, 0);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1831 __ stb(value, to, 1);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1832 __ inc(to, 2);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1833 __ BIND(L_fill_4);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1834 __ brx(Assembler::zero, false, Assembler::pt, L_exit);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1835 __ delayed()->nop();
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1836 __ stb(value, to, 0);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1837 __ stb(value, to, 1);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1838 __ stb(value, to, 2);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1839 __ retl();
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1840 __ delayed()->stb(value, to, 3);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1841 }
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1842
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1843 if (t == T_SHORT) {
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1844 Label L_fill_2;
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1845 __ BIND(L_fill_elements);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1846 // in delay slot __ andcc(count, 1, G0);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1847 __ brx(Assembler::zero, false, Assembler::pt, L_fill_2);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1848 __ delayed()->andcc(count, 2, G0);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1849 __ sth(value, to, 0);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1850 __ inc(to, 2);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1851 __ BIND(L_fill_2);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1852 __ brx(Assembler::zero, false, Assembler::pt, L_exit);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1853 __ delayed()->nop();
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1854 __ sth(value, to, 0);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1855 __ retl();
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1856 __ delayed()->sth(value, to, 2);
065dd1ca3ab6 6982370: SIGBUS in jbyte_fill
never
parents: 1782
diff changeset
1857 }
1763
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1858 return start;
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1859 }
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1860
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
1861 //
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1862 // Generate stub for conjoint short copy. If "aligned" is true, the
a61af66fc99e Initial load
duke
parents:
diff changeset
1863 // "from" and "to" addresses are assumed to be heapword aligned.
a61af66fc99e Initial load
duke
parents:
diff changeset
1864 //
a61af66fc99e Initial load
duke
parents:
diff changeset
1865 // Arguments for generated stub:
a61af66fc99e Initial load
duke
parents:
diff changeset
1866 // from: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
1867 // to: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
1868 // count: O2 treated as signed
a61af66fc99e Initial load
duke
parents:
diff changeset
1869 //
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1870 address generate_conjoint_short_copy(bool aligned, address nooverlap_target,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1871 address *entry, const char *name) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1872 // Do reverse copy.
a61af66fc99e Initial load
duke
parents:
diff changeset
1873
a61af66fc99e Initial load
duke
parents:
diff changeset
1874 __ align(CodeEntryAlignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
1875 StubCodeMark mark(this, "StubRoutines", name);
a61af66fc99e Initial load
duke
parents:
diff changeset
1876 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
1877
a61af66fc99e Initial load
duke
parents:
diff changeset
1878 Label L_skip_alignment, L_skip_alignment2, L_aligned_copy;
a61af66fc99e Initial load
duke
parents:
diff changeset
1879 Label L_copy_2_bytes, L_copy_2_bytes_loop, L_exit;
a61af66fc99e Initial load
duke
parents:
diff changeset
1880
a61af66fc99e Initial load
duke
parents:
diff changeset
1881 const Register from = O0; // source array address
a61af66fc99e Initial load
duke
parents:
diff changeset
1882 const Register to = O1; // destination array address
a61af66fc99e Initial load
duke
parents:
diff changeset
1883 const Register count = O2; // elements count
a61af66fc99e Initial load
duke
parents:
diff changeset
1884 const Register end_from = from; // source array end address
a61af66fc99e Initial load
duke
parents:
diff changeset
1885 const Register end_to = to; // destination array end address
a61af66fc99e Initial load
duke
parents:
diff changeset
1886
a61af66fc99e Initial load
duke
parents:
diff changeset
1887 const Register byte_count = O3; // bytes count to copy
a61af66fc99e Initial load
duke
parents:
diff changeset
1888
a61af66fc99e Initial load
duke
parents:
diff changeset
1889 assert_clean_int(count, O3); // Make sure 'count' is clean int.
a61af66fc99e Initial load
duke
parents:
diff changeset
1890
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1891 if (entry != NULL) {
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1892 *entry = __ pc();
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1893 // caller can pass a 64-bit byte count here (from Unsafe.copyMemory)
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1894 BLOCK_COMMENT("Entry:");
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
1895 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1896
a61af66fc99e Initial load
duke
parents:
diff changeset
1897 array_overlap_test(nooverlap_target, 1);
a61af66fc99e Initial load
duke
parents:
diff changeset
1898
a61af66fc99e Initial load
duke
parents:
diff changeset
1899 __ sllx(count, LogBytesPerShort, byte_count);
a61af66fc99e Initial load
duke
parents:
diff changeset
1900 __ add(to, byte_count, end_to); // offset after last copied element
a61af66fc99e Initial load
duke
parents:
diff changeset
1901
a61af66fc99e Initial load
duke
parents:
diff changeset
1902 // for short arrays, just do single element copy
a61af66fc99e Initial load
duke
parents:
diff changeset
1903 __ cmp(count, 11); // 8 + 3 (22 bytes)
a61af66fc99e Initial load
duke
parents:
diff changeset
1904 __ brx(Assembler::less, false, Assembler::pn, L_copy_2_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
1905 __ delayed()->add(from, byte_count, end_from);
a61af66fc99e Initial load
duke
parents:
diff changeset
1906
a61af66fc99e Initial load
duke
parents:
diff changeset
1907 {
a61af66fc99e Initial load
duke
parents:
diff changeset
1908 // Align end of arrays since they could be not aligned even
a61af66fc99e Initial load
duke
parents:
diff changeset
1909 // when arrays itself are aligned.
a61af66fc99e Initial load
duke
parents:
diff changeset
1910
a61af66fc99e Initial load
duke
parents:
diff changeset
1911 // copy 1 element if necessary to align 'end_to' on an 4 bytes
a61af66fc99e Initial load
duke
parents:
diff changeset
1912 __ andcc(end_to, 3, G0);
a61af66fc99e Initial load
duke
parents:
diff changeset
1913 __ br(Assembler::zero, false, Assembler::pt, L_skip_alignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
1914 __ delayed()->lduh(end_from, -2, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1915 __ dec(end_from, 2);
a61af66fc99e Initial load
duke
parents:
diff changeset
1916 __ dec(end_to, 2);
a61af66fc99e Initial load
duke
parents:
diff changeset
1917 __ dec(count);
a61af66fc99e Initial load
duke
parents:
diff changeset
1918 __ sth(O3, end_to, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
1919 __ BIND(L_skip_alignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
1920
a61af66fc99e Initial load
duke
parents:
diff changeset
1921 // copy 2 elements to align 'end_to' on an 8 byte boundary
a61af66fc99e Initial load
duke
parents:
diff changeset
1922 __ andcc(end_to, 7, G0);
a61af66fc99e Initial load
duke
parents:
diff changeset
1923 __ br(Assembler::zero, false, Assembler::pn, L_skip_alignment2);
a61af66fc99e Initial load
duke
parents:
diff changeset
1924 __ delayed()->lduh(end_from, -2, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1925 __ dec(count, 2);
a61af66fc99e Initial load
duke
parents:
diff changeset
1926 __ lduh(end_from, -4, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1927 __ dec(end_from, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1928 __ dec(end_to, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1929 __ sth(O3, end_to, 2);
a61af66fc99e Initial load
duke
parents:
diff changeset
1930 __ sth(O4, end_to, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
1931 __ BIND(L_skip_alignment2);
a61af66fc99e Initial load
duke
parents:
diff changeset
1932 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1933 #ifdef _LP64
a61af66fc99e Initial load
duke
parents:
diff changeset
1934 if (aligned) {
a61af66fc99e Initial load
duke
parents:
diff changeset
1935 // Both arrays are aligned to 8-bytes in 64-bits VM.
a61af66fc99e Initial load
duke
parents:
diff changeset
1936 // The 'count' is decremented in copy_16_bytes_backward_with_shift()
a61af66fc99e Initial load
duke
parents:
diff changeset
1937 // in unaligned case.
a61af66fc99e Initial load
duke
parents:
diff changeset
1938 __ dec(count, 8);
a61af66fc99e Initial load
duke
parents:
diff changeset
1939 } else
a61af66fc99e Initial load
duke
parents:
diff changeset
1940 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
1941 {
a61af66fc99e Initial load
duke
parents:
diff changeset
1942 // Copy with shift 16 bytes per iteration if arrays do not have
a61af66fc99e Initial load
duke
parents:
diff changeset
1943 // the same alignment mod 8, otherwise jump to the next
a61af66fc99e Initial load
duke
parents:
diff changeset
1944 // code for aligned copy (and substracting 8 from 'count' before jump).
a61af66fc99e Initial load
duke
parents:
diff changeset
1945 // The compare above (count >= 11) guarantes 'count' >= 16 bytes.
a61af66fc99e Initial load
duke
parents:
diff changeset
1946 // Also jump over aligned copy after the copy with shift completed.
a61af66fc99e Initial load
duke
parents:
diff changeset
1947
a61af66fc99e Initial load
duke
parents:
diff changeset
1948 copy_16_bytes_backward_with_shift(end_from, end_to, count, 8,
a61af66fc99e Initial load
duke
parents:
diff changeset
1949 L_aligned_copy, L_copy_2_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
1950 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1951 // copy 4 elements (16 bytes) at a time
1365
6476042f815c 6940701: Don't align loops in stubs for Niagara sparc
kvn
parents: 1364
diff changeset
1952 __ align(OptoLoopAlignment);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1953 __ BIND(L_aligned_copy);
a61af66fc99e Initial load
duke
parents:
diff changeset
1954 __ dec(end_from, 16);
a61af66fc99e Initial load
duke
parents:
diff changeset
1955 __ ldx(end_from, 8, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
1956 __ ldx(end_from, 0, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1957 __ dec(end_to, 16);
a61af66fc99e Initial load
duke
parents:
diff changeset
1958 __ deccc(count, 8);
a61af66fc99e Initial load
duke
parents:
diff changeset
1959 __ stx(O3, end_to, 8);
a61af66fc99e Initial load
duke
parents:
diff changeset
1960 __ brx(Assembler::greaterEqual, false, Assembler::pt, L_aligned_copy);
a61af66fc99e Initial load
duke
parents:
diff changeset
1961 __ delayed()->stx(O4, end_to, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
1962 __ inc(count, 8);
a61af66fc99e Initial load
duke
parents:
diff changeset
1963
a61af66fc99e Initial load
duke
parents:
diff changeset
1964 // copy 1 element (2 bytes) at a time
a61af66fc99e Initial load
duke
parents:
diff changeset
1965 __ BIND(L_copy_2_bytes);
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
1966 __ cmp_and_br_short(count, 0, Assembler::equal, Assembler::pt, L_exit);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
1967 __ BIND(L_copy_2_bytes_loop);
a61af66fc99e Initial load
duke
parents:
diff changeset
1968 __ dec(end_from, 2);
a61af66fc99e Initial load
duke
parents:
diff changeset
1969 __ dec(end_to, 2);
a61af66fc99e Initial load
duke
parents:
diff changeset
1970 __ lduh(end_from, 0, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1971 __ deccc(count);
a61af66fc99e Initial load
duke
parents:
diff changeset
1972 __ brx(Assembler::greater, false, Assembler::pt, L_copy_2_bytes_loop);
a61af66fc99e Initial load
duke
parents:
diff changeset
1973 __ delayed()->sth(O4, end_to, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
1974
a61af66fc99e Initial load
duke
parents:
diff changeset
1975 __ BIND(L_exit);
a61af66fc99e Initial load
duke
parents:
diff changeset
1976 // O3, O4 are used as temp registers
a61af66fc99e Initial load
duke
parents:
diff changeset
1977 inc_counter_np(SharedRuntime::_jshort_array_copy_ctr, O3, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
1978 __ retl();
a61af66fc99e Initial load
duke
parents:
diff changeset
1979 __ delayed()->mov(G0, O0); // return 0
a61af66fc99e Initial load
duke
parents:
diff changeset
1980 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
1981 }
a61af66fc99e Initial load
duke
parents:
diff changeset
1982
a61af66fc99e Initial load
duke
parents:
diff changeset
1983 //
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1984 // Helper methods for generate_disjoint_int_copy_core()
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1985 //
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1986 void copy_16_bytes_loop(Register from, Register to, Register count, int count_dec,
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1987 Label& L_loop, bool use_prefetch, bool use_bis) {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1988
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1989 __ align(OptoLoopAlignment);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1990 __ BIND(L_loop);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1991 if (use_prefetch) {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1992 if (ArraycopySrcPrefetchDistance > 0) {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1993 __ prefetch(from, ArraycopySrcPrefetchDistance, Assembler::severalReads);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1994 }
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1995 if (ArraycopyDstPrefetchDistance > 0) {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1996 __ prefetch(to, ArraycopyDstPrefetchDistance, Assembler::severalWritesAndPossiblyReads);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1997 }
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1998 }
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
1999 __ ldx(from, 4, O4);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2000 __ ldx(from, 12, G4);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2001 __ inc(to, 16);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2002 __ inc(from, 16);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2003 __ deccc(count, 4); // Can we do next iteration after this one?
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2004
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2005 __ srlx(O4, 32, G3);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2006 __ bset(G3, O3);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2007 __ sllx(O4, 32, O4);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2008 __ srlx(G4, 32, G3);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2009 __ bset(G3, O4);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2010 if (use_bis) {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2011 __ stxa(O3, to, -16);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2012 __ stxa(O4, to, -8);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2013 } else {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2014 __ stx(O3, to, -16);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2015 __ stx(O4, to, -8);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2016 }
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2017 __ brx(Assembler::greaterEqual, false, Assembler::pt, L_loop);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2018 __ delayed()->sllx(G4, 32, O3);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2019
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2020 }
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2021
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2022 //
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2023 // Generate core code for disjoint int copy (and oop copy on 32-bit).
a61af66fc99e Initial load
duke
parents:
diff changeset
2024 // If "aligned" is true, the "from" and "to" addresses are assumed
a61af66fc99e Initial load
duke
parents:
diff changeset
2025 // to be heapword aligned.
a61af66fc99e Initial load
duke
parents:
diff changeset
2026 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2027 // Arguments:
a61af66fc99e Initial load
duke
parents:
diff changeset
2028 // from: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
2029 // to: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
2030 // count: O2 treated as signed
a61af66fc99e Initial load
duke
parents:
diff changeset
2031 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2032 void generate_disjoint_int_copy_core(bool aligned) {
a61af66fc99e Initial load
duke
parents:
diff changeset
2033
a61af66fc99e Initial load
duke
parents:
diff changeset
2034 Label L_skip_alignment, L_aligned_copy;
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2035 Label L_copy_4_bytes, L_copy_4_bytes_loop, L_exit;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2036
a61af66fc99e Initial load
duke
parents:
diff changeset
2037 const Register from = O0; // source array address
a61af66fc99e Initial load
duke
parents:
diff changeset
2038 const Register to = O1; // destination array address
a61af66fc99e Initial load
duke
parents:
diff changeset
2039 const Register count = O2; // elements count
a61af66fc99e Initial load
duke
parents:
diff changeset
2040 const Register offset = O5; // offset from start of arrays
a61af66fc99e Initial load
duke
parents:
diff changeset
2041 // O3, O4, G3, G4 are used as temp registers
a61af66fc99e Initial load
duke
parents:
diff changeset
2042
a61af66fc99e Initial load
duke
parents:
diff changeset
2043 // 'aligned' == true when it is known statically during compilation
a61af66fc99e Initial load
duke
parents:
diff changeset
2044 // of this arraycopy call site that both 'from' and 'to' addresses
a61af66fc99e Initial load
duke
parents:
diff changeset
2045 // are HeapWordSize aligned (see LibraryCallKit::basictype2arraycopy()).
a61af66fc99e Initial load
duke
parents:
diff changeset
2046 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2047 // Aligned arrays have 4 bytes alignment in 32-bits VM
a61af66fc99e Initial load
duke
parents:
diff changeset
2048 // and 8 bytes - in 64-bits VM.
a61af66fc99e Initial load
duke
parents:
diff changeset
2049 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2050 #ifdef _LP64
a61af66fc99e Initial load
duke
parents:
diff changeset
2051 if (!aligned)
a61af66fc99e Initial load
duke
parents:
diff changeset
2052 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
2053 {
a61af66fc99e Initial load
duke
parents:
diff changeset
2054 // The next check could be put under 'ifndef' since the code in
a61af66fc99e Initial load
duke
parents:
diff changeset
2055 // generate_disjoint_long_copy_core() has own checks and set 'offset'.
a61af66fc99e Initial load
duke
parents:
diff changeset
2056
a61af66fc99e Initial load
duke
parents:
diff changeset
2057 // for short arrays, just do single element copy
a61af66fc99e Initial load
duke
parents:
diff changeset
2058 __ cmp(count, 5); // 4 + 1 (20 bytes)
a61af66fc99e Initial load
duke
parents:
diff changeset
2059 __ brx(Assembler::lessEqual, false, Assembler::pn, L_copy_4_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
2060 __ delayed()->mov(G0, offset);
a61af66fc99e Initial load
duke
parents:
diff changeset
2061
a61af66fc99e Initial load
duke
parents:
diff changeset
2062 // copy 1 element to align 'to' on an 8 byte boundary
a61af66fc99e Initial load
duke
parents:
diff changeset
2063 __ andcc(to, 7, G0);
a61af66fc99e Initial load
duke
parents:
diff changeset
2064 __ br(Assembler::zero, false, Assembler::pt, L_skip_alignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
2065 __ delayed()->ld(from, 0, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2066 __ inc(from, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2067 __ inc(to, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2068 __ dec(count);
a61af66fc99e Initial load
duke
parents:
diff changeset
2069 __ st(O3, to, -4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2070 __ BIND(L_skip_alignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
2071
a61af66fc99e Initial load
duke
parents:
diff changeset
2072 // if arrays have same alignment mod 8, do 4 elements copy
a61af66fc99e Initial load
duke
parents:
diff changeset
2073 __ andcc(from, 7, G0);
a61af66fc99e Initial load
duke
parents:
diff changeset
2074 __ br(Assembler::zero, false, Assembler::pt, L_aligned_copy);
a61af66fc99e Initial load
duke
parents:
diff changeset
2075 __ delayed()->ld(from, 0, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2076
a61af66fc99e Initial load
duke
parents:
diff changeset
2077 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2078 // Load 2 aligned 8-bytes chunks and use one from previous iteration
a61af66fc99e Initial load
duke
parents:
diff changeset
2079 // to form 2 aligned 8-bytes chunks to store.
a61af66fc99e Initial load
duke
parents:
diff changeset
2080 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2081 // copy_16_bytes_forward_with_shift() is not used here since this
a61af66fc99e Initial load
duke
parents:
diff changeset
2082 // code is more optimal.
a61af66fc99e Initial load
duke
parents:
diff changeset
2083
a61af66fc99e Initial load
duke
parents:
diff changeset
2084 // copy with shift 4 elements (16 bytes) at a time
a61af66fc99e Initial load
duke
parents:
diff changeset
2085 __ dec(count, 4); // The cmp at the beginning guaranty count >= 4
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2086 __ sllx(O3, 32, O3);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2087
17939
0fb5b60ab4a2 8022070: Compilation error in stubGenerator_sparc.cpp with some compilers
mikael
parents: 17910
diff changeset
2088 disjoint_copy_core(from, to, count, 2, 16, &StubGenerator::copy_16_bytes_loop);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2089
a61af66fc99e Initial load
duke
parents:
diff changeset
2090 __ br(Assembler::always, false, Assembler::pt, L_copy_4_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
2091 __ delayed()->inc(count, 4); // restore 'count'
a61af66fc99e Initial load
duke
parents:
diff changeset
2092
a61af66fc99e Initial load
duke
parents:
diff changeset
2093 __ BIND(L_aligned_copy);
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2094 } // !aligned
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2095
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2096 // copy 4 elements (16 bytes) at a time
a61af66fc99e Initial load
duke
parents:
diff changeset
2097 __ and3(count, 1, G4); // Save
a61af66fc99e Initial load
duke
parents:
diff changeset
2098 __ srl(count, 1, count);
a61af66fc99e Initial load
duke
parents:
diff changeset
2099 generate_disjoint_long_copy_core(aligned);
a61af66fc99e Initial load
duke
parents:
diff changeset
2100 __ mov(G4, count); // Restore
a61af66fc99e Initial load
duke
parents:
diff changeset
2101
a61af66fc99e Initial load
duke
parents:
diff changeset
2102 // copy 1 element at a time
a61af66fc99e Initial load
duke
parents:
diff changeset
2103 __ BIND(L_copy_4_bytes);
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
2104 __ cmp_and_br_short(count, 0, Assembler::equal, Assembler::pt, L_exit);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2105 __ BIND(L_copy_4_bytes_loop);
a61af66fc99e Initial load
duke
parents:
diff changeset
2106 __ ld(from, offset, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2107 __ deccc(count);
a61af66fc99e Initial load
duke
parents:
diff changeset
2108 __ st(O3, to, offset);
a61af66fc99e Initial load
duke
parents:
diff changeset
2109 __ brx(Assembler::notZero, false, Assembler::pt, L_copy_4_bytes_loop);
a61af66fc99e Initial load
duke
parents:
diff changeset
2110 __ delayed()->inc(offset, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2111 __ BIND(L_exit);
a61af66fc99e Initial load
duke
parents:
diff changeset
2112 }
a61af66fc99e Initial load
duke
parents:
diff changeset
2113
a61af66fc99e Initial load
duke
parents:
diff changeset
2114 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2115 // Generate stub for disjoint int copy. If "aligned" is true, the
a61af66fc99e Initial load
duke
parents:
diff changeset
2116 // "from" and "to" addresses are assumed to be heapword aligned.
a61af66fc99e Initial load
duke
parents:
diff changeset
2117 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2118 // Arguments for generated stub:
a61af66fc99e Initial load
duke
parents:
diff changeset
2119 // from: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
2120 // to: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
2121 // count: O2 treated as signed
a61af66fc99e Initial load
duke
parents:
diff changeset
2122 //
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2123 address generate_disjoint_int_copy(bool aligned, address *entry, const char *name) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2124 __ align(CodeEntryAlignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
2125 StubCodeMark mark(this, "StubRoutines", name);
a61af66fc99e Initial load
duke
parents:
diff changeset
2126 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
2127
a61af66fc99e Initial load
duke
parents:
diff changeset
2128 const Register count = O2;
a61af66fc99e Initial load
duke
parents:
diff changeset
2129 assert_clean_int(count, O3); // Make sure 'count' is clean int.
a61af66fc99e Initial load
duke
parents:
diff changeset
2130
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2131 if (entry != NULL) {
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2132 *entry = __ pc();
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2133 // caller can pass a 64-bit byte count here (from Unsafe.copyMemory)
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2134 BLOCK_COMMENT("Entry:");
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2135 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2136
a61af66fc99e Initial load
duke
parents:
diff changeset
2137 generate_disjoint_int_copy_core(aligned);
a61af66fc99e Initial load
duke
parents:
diff changeset
2138
a61af66fc99e Initial load
duke
parents:
diff changeset
2139 // O3, O4 are used as temp registers
a61af66fc99e Initial load
duke
parents:
diff changeset
2140 inc_counter_np(SharedRuntime::_jint_array_copy_ctr, O3, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2141 __ retl();
a61af66fc99e Initial load
duke
parents:
diff changeset
2142 __ delayed()->mov(G0, O0); // return 0
a61af66fc99e Initial load
duke
parents:
diff changeset
2143 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
2144 }
a61af66fc99e Initial load
duke
parents:
diff changeset
2145
a61af66fc99e Initial load
duke
parents:
diff changeset
2146 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2147 // Generate core code for conjoint int copy (and oop copy on 32-bit).
a61af66fc99e Initial load
duke
parents:
diff changeset
2148 // If "aligned" is true, the "from" and "to" addresses are assumed
a61af66fc99e Initial load
duke
parents:
diff changeset
2149 // to be heapword aligned.
a61af66fc99e Initial load
duke
parents:
diff changeset
2150 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2151 // Arguments:
a61af66fc99e Initial load
duke
parents:
diff changeset
2152 // from: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
2153 // to: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
2154 // count: O2 treated as signed
a61af66fc99e Initial load
duke
parents:
diff changeset
2155 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2156 void generate_conjoint_int_copy_core(bool aligned) {
a61af66fc99e Initial load
duke
parents:
diff changeset
2157 // Do reverse copy.
a61af66fc99e Initial load
duke
parents:
diff changeset
2158
a61af66fc99e Initial load
duke
parents:
diff changeset
2159 Label L_skip_alignment, L_aligned_copy;
a61af66fc99e Initial load
duke
parents:
diff changeset
2160 Label L_copy_16_bytes, L_copy_4_bytes, L_copy_4_bytes_loop, L_exit;
a61af66fc99e Initial load
duke
parents:
diff changeset
2161
a61af66fc99e Initial load
duke
parents:
diff changeset
2162 const Register from = O0; // source array address
a61af66fc99e Initial load
duke
parents:
diff changeset
2163 const Register to = O1; // destination array address
a61af66fc99e Initial load
duke
parents:
diff changeset
2164 const Register count = O2; // elements count
a61af66fc99e Initial load
duke
parents:
diff changeset
2165 const Register end_from = from; // source array end address
a61af66fc99e Initial load
duke
parents:
diff changeset
2166 const Register end_to = to; // destination array end address
a61af66fc99e Initial load
duke
parents:
diff changeset
2167 // O3, O4, O5, G3 are used as temp registers
a61af66fc99e Initial load
duke
parents:
diff changeset
2168
a61af66fc99e Initial load
duke
parents:
diff changeset
2169 const Register byte_count = O3; // bytes count to copy
a61af66fc99e Initial load
duke
parents:
diff changeset
2170
a61af66fc99e Initial load
duke
parents:
diff changeset
2171 __ sllx(count, LogBytesPerInt, byte_count);
a61af66fc99e Initial load
duke
parents:
diff changeset
2172 __ add(to, byte_count, end_to); // offset after last copied element
a61af66fc99e Initial load
duke
parents:
diff changeset
2173
a61af66fc99e Initial load
duke
parents:
diff changeset
2174 __ cmp(count, 5); // for short arrays, just do single element copy
a61af66fc99e Initial load
duke
parents:
diff changeset
2175 __ brx(Assembler::lessEqual, false, Assembler::pn, L_copy_4_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
2176 __ delayed()->add(from, byte_count, end_from);
a61af66fc99e Initial load
duke
parents:
diff changeset
2177
a61af66fc99e Initial load
duke
parents:
diff changeset
2178 // copy 1 element to align 'to' on an 8 byte boundary
a61af66fc99e Initial load
duke
parents:
diff changeset
2179 __ andcc(end_to, 7, G0);
a61af66fc99e Initial load
duke
parents:
diff changeset
2180 __ br(Assembler::zero, false, Assembler::pt, L_skip_alignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
2181 __ delayed()->nop();
a61af66fc99e Initial load
duke
parents:
diff changeset
2182 __ dec(count);
a61af66fc99e Initial load
duke
parents:
diff changeset
2183 __ dec(end_from, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2184 __ dec(end_to, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2185 __ ld(end_from, 0, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2186 __ st(O4, end_to, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
2187 __ BIND(L_skip_alignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
2188
a61af66fc99e Initial load
duke
parents:
diff changeset
2189 // Check if 'end_from' and 'end_to' has the same alignment.
a61af66fc99e Initial load
duke
parents:
diff changeset
2190 __ andcc(end_from, 7, G0);
a61af66fc99e Initial load
duke
parents:
diff changeset
2191 __ br(Assembler::zero, false, Assembler::pt, L_aligned_copy);
a61af66fc99e Initial load
duke
parents:
diff changeset
2192 __ delayed()->dec(count, 4); // The cmp at the start guaranty cnt >= 4
a61af66fc99e Initial load
duke
parents:
diff changeset
2193
a61af66fc99e Initial load
duke
parents:
diff changeset
2194 // copy with shift 4 elements (16 bytes) at a time
a61af66fc99e Initial load
duke
parents:
diff changeset
2195 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2196 // Load 2 aligned 8-bytes chunks and use one from previous iteration
a61af66fc99e Initial load
duke
parents:
diff changeset
2197 // to form 2 aligned 8-bytes chunks to store.
a61af66fc99e Initial load
duke
parents:
diff changeset
2198 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2199 __ ldx(end_from, -4, O3);
1365
6476042f815c 6940701: Don't align loops in stubs for Niagara sparc
kvn
parents: 1364
diff changeset
2200 __ align(OptoLoopAlignment);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2201 __ BIND(L_copy_16_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
2202 __ ldx(end_from, -12, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2203 __ deccc(count, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2204 __ ldx(end_from, -20, O5);
a61af66fc99e Initial load
duke
parents:
diff changeset
2205 __ dec(end_to, 16);
a61af66fc99e Initial load
duke
parents:
diff changeset
2206 __ dec(end_from, 16);
a61af66fc99e Initial load
duke
parents:
diff changeset
2207 __ srlx(O3, 32, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2208 __ sllx(O4, 32, G3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2209 __ bset(G3, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2210 __ stx(O3, end_to, 8);
a61af66fc99e Initial load
duke
parents:
diff changeset
2211 __ srlx(O4, 32, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2212 __ sllx(O5, 32, G3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2213 __ bset(O4, G3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2214 __ stx(G3, end_to, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
2215 __ brx(Assembler::greaterEqual, false, Assembler::pt, L_copy_16_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
2216 __ delayed()->mov(O5, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2217
a61af66fc99e Initial load
duke
parents:
diff changeset
2218 __ br(Assembler::always, false, Assembler::pt, L_copy_4_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
2219 __ delayed()->inc(count, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2220
a61af66fc99e Initial load
duke
parents:
diff changeset
2221 // copy 4 elements (16 bytes) at a time
1365
6476042f815c 6940701: Don't align loops in stubs for Niagara sparc
kvn
parents: 1364
diff changeset
2222 __ align(OptoLoopAlignment);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2223 __ BIND(L_aligned_copy);
a61af66fc99e Initial load
duke
parents:
diff changeset
2224 __ dec(end_from, 16);
a61af66fc99e Initial load
duke
parents:
diff changeset
2225 __ ldx(end_from, 8, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2226 __ ldx(end_from, 0, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2227 __ dec(end_to, 16);
a61af66fc99e Initial load
duke
parents:
diff changeset
2228 __ deccc(count, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2229 __ stx(O3, end_to, 8);
a61af66fc99e Initial load
duke
parents:
diff changeset
2230 __ brx(Assembler::greaterEqual, false, Assembler::pt, L_aligned_copy);
a61af66fc99e Initial load
duke
parents:
diff changeset
2231 __ delayed()->stx(O4, end_to, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
2232 __ inc(count, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2233
a61af66fc99e Initial load
duke
parents:
diff changeset
2234 // copy 1 element (4 bytes) at a time
a61af66fc99e Initial load
duke
parents:
diff changeset
2235 __ BIND(L_copy_4_bytes);
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
2236 __ cmp_and_br_short(count, 0, Assembler::equal, Assembler::pt, L_exit);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2237 __ BIND(L_copy_4_bytes_loop);
a61af66fc99e Initial load
duke
parents:
diff changeset
2238 __ dec(end_from, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2239 __ dec(end_to, 4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2240 __ ld(end_from, 0, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2241 __ deccc(count);
a61af66fc99e Initial load
duke
parents:
diff changeset
2242 __ brx(Assembler::greater, false, Assembler::pt, L_copy_4_bytes_loop);
a61af66fc99e Initial load
duke
parents:
diff changeset
2243 __ delayed()->st(O4, end_to, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
2244 __ BIND(L_exit);
a61af66fc99e Initial load
duke
parents:
diff changeset
2245 }
a61af66fc99e Initial load
duke
parents:
diff changeset
2246
a61af66fc99e Initial load
duke
parents:
diff changeset
2247 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2248 // Generate stub for conjoint int copy. If "aligned" is true, the
a61af66fc99e Initial load
duke
parents:
diff changeset
2249 // "from" and "to" addresses are assumed to be heapword aligned.
a61af66fc99e Initial load
duke
parents:
diff changeset
2250 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2251 // Arguments for generated stub:
a61af66fc99e Initial load
duke
parents:
diff changeset
2252 // from: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
2253 // to: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
2254 // count: O2 treated as signed
a61af66fc99e Initial load
duke
parents:
diff changeset
2255 //
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2256 address generate_conjoint_int_copy(bool aligned, address nooverlap_target,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2257 address *entry, const char *name) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2258 __ align(CodeEntryAlignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
2259 StubCodeMark mark(this, "StubRoutines", name);
a61af66fc99e Initial load
duke
parents:
diff changeset
2260 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
2261
a61af66fc99e Initial load
duke
parents:
diff changeset
2262 assert_clean_int(O2, O3); // Make sure 'count' is clean int.
a61af66fc99e Initial load
duke
parents:
diff changeset
2263
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2264 if (entry != NULL) {
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2265 *entry = __ pc();
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2266 // caller can pass a 64-bit byte count here (from Unsafe.copyMemory)
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2267 BLOCK_COMMENT("Entry:");
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2268 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2269
a61af66fc99e Initial load
duke
parents:
diff changeset
2270 array_overlap_test(nooverlap_target, 2);
a61af66fc99e Initial load
duke
parents:
diff changeset
2271
a61af66fc99e Initial load
duke
parents:
diff changeset
2272 generate_conjoint_int_copy_core(aligned);
a61af66fc99e Initial load
duke
parents:
diff changeset
2273
a61af66fc99e Initial load
duke
parents:
diff changeset
2274 // O3, O4 are used as temp registers
a61af66fc99e Initial load
duke
parents:
diff changeset
2275 inc_counter_np(SharedRuntime::_jint_array_copy_ctr, O3, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2276 __ retl();
a61af66fc99e Initial load
duke
parents:
diff changeset
2277 __ delayed()->mov(G0, O0); // return 0
a61af66fc99e Initial load
duke
parents:
diff changeset
2278 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
2279 }
a61af66fc99e Initial load
duke
parents:
diff changeset
2280
a61af66fc99e Initial load
duke
parents:
diff changeset
2281 //
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2282 // Helper methods for generate_disjoint_long_copy_core()
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2283 //
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2284 void copy_64_bytes_loop(Register from, Register to, Register count, int count_dec,
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2285 Label& L_loop, bool use_prefetch, bool use_bis) {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2286 __ align(OptoLoopAlignment);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2287 __ BIND(L_loop);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2288 for (int off = 0; off < 64; off += 16) {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2289 if (use_prefetch && (off & 31) == 0) {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2290 if (ArraycopySrcPrefetchDistance > 0) {
3961
a92cdbac8b9e 7081933: Use zeroing elimination optimization for large array
kvn
parents: 3937
diff changeset
2291 __ prefetch(from, ArraycopySrcPrefetchDistance+off, Assembler::severalReads);
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2292 }
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2293 if (ArraycopyDstPrefetchDistance > 0) {
3961
a92cdbac8b9e 7081933: Use zeroing elimination optimization for large array
kvn
parents: 3937
diff changeset
2294 __ prefetch(to, ArraycopyDstPrefetchDistance+off, Assembler::severalWritesAndPossiblyReads);
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2295 }
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2296 }
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2297 __ ldx(from, off+0, O4);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2298 __ ldx(from, off+8, O5);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2299 if (use_bis) {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2300 __ stxa(O4, to, off+0);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2301 __ stxa(O5, to, off+8);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2302 } else {
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2303 __ stx(O4, to, off+0);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2304 __ stx(O5, to, off+8);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2305 }
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2306 }
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2307 __ deccc(count, 8);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2308 __ inc(from, 64);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2309 __ brx(Assembler::greaterEqual, false, Assembler::pt, L_loop);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2310 __ delayed()->inc(to, 64);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2311 }
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2312
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2313 //
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2314 // Generate core code for disjoint long copy (and oop copy on 64-bit).
a61af66fc99e Initial load
duke
parents:
diff changeset
2315 // "aligned" is ignored, because we must make the stronger
a61af66fc99e Initial load
duke
parents:
diff changeset
2316 // assumption that both addresses are always 64-bit aligned.
a61af66fc99e Initial load
duke
parents:
diff changeset
2317 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2318 // Arguments:
a61af66fc99e Initial load
duke
parents:
diff changeset
2319 // from: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
2320 // to: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
2321 // count: O2 treated as signed
a61af66fc99e Initial load
duke
parents:
diff changeset
2322 //
1364
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2323 // count -= 2;
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2324 // if ( count >= 0 ) { // >= 2 elements
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2325 // if ( count > 6) { // >= 8 elements
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2326 // count -= 6; // original count - 8
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2327 // do {
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2328 // copy_8_elements;
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2329 // count -= 8;
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2330 // } while ( count >= 0 );
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2331 // count += 6;
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2332 // }
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2333 // if ( count >= 0 ) { // >= 2 elements
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2334 // do {
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2335 // copy_2_elements;
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2336 // } while ( (count=count-2) >= 0 );
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2337 // }
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2338 // }
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2339 // count += 2;
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2340 // if ( count != 0 ) { // 1 element left
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2341 // copy_1_element;
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2342 // }
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2343 //
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2344 void generate_disjoint_long_copy_core(bool aligned) {
a61af66fc99e Initial load
duke
parents:
diff changeset
2345 Label L_copy_8_bytes, L_copy_16_bytes, L_exit;
a61af66fc99e Initial load
duke
parents:
diff changeset
2346 const Register from = O0; // source array address
a61af66fc99e Initial load
duke
parents:
diff changeset
2347 const Register to = O1; // destination array address
a61af66fc99e Initial load
duke
parents:
diff changeset
2348 const Register count = O2; // elements count
a61af66fc99e Initial load
duke
parents:
diff changeset
2349 const Register offset0 = O4; // element offset
a61af66fc99e Initial load
duke
parents:
diff changeset
2350 const Register offset8 = O5; // next element offset
a61af66fc99e Initial load
duke
parents:
diff changeset
2351
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2352 __ deccc(count, 2);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2353 __ mov(G0, offset0); // offset from start of arrays (0)
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2354 __ brx(Assembler::negative, false, Assembler::pn, L_copy_8_bytes );
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2355 __ delayed()->add(offset0, 8, offset8);
1364
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2356
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2357 // Copy by 64 bytes chunks
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2358
1364
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2359 const Register from64 = O3; // source address
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2360 const Register to64 = G3; // destination address
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2361 __ subcc(count, 6, O3);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2362 __ brx(Assembler::negative, false, Assembler::pt, L_copy_16_bytes );
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2363 __ delayed()->mov(to, to64);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2364 // Now we can use O4(offset0), O5(offset8) as temps
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2365 __ mov(O3, count);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2366 // count >= 0 (original count - 8)
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2367 __ mov(from, from64);
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2368
17939
0fb5b60ab4a2 8022070: Compilation error in stubGenerator_sparc.cpp with some compilers
mikael
parents: 17910
diff changeset
2369 disjoint_copy_core(from64, to64, count, 3, 64, &StubGenerator::copy_64_bytes_loop);
1364
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2370
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2371 // Restore O4(offset0), O5(offset8)
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2372 __ sub(from64, from, offset0);
3903
2f9b79ddb05c 7039731: arraycopy could use prefetch on SPARC
kvn
parents: 3892
diff changeset
2373 __ inccc(count, 6); // restore count
1364
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2374 __ brx(Assembler::negative, false, Assembler::pn, L_copy_8_bytes );
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2375 __ delayed()->add(offset0, 8, offset8);
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2376
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2377 // Copy by 16 bytes chunks
1365
6476042f815c 6940701: Don't align loops in stubs for Niagara sparc
kvn
parents: 1364
diff changeset
2378 __ align(OptoLoopAlignment);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2379 __ BIND(L_copy_16_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
2380 __ ldx(from, offset0, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2381 __ ldx(from, offset8, G3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2382 __ deccc(count, 2);
a61af66fc99e Initial load
duke
parents:
diff changeset
2383 __ stx(O3, to, offset0);
a61af66fc99e Initial load
duke
parents:
diff changeset
2384 __ inc(offset0, 16);
a61af66fc99e Initial load
duke
parents:
diff changeset
2385 __ stx(G3, to, offset8);
a61af66fc99e Initial load
duke
parents:
diff changeset
2386 __ brx(Assembler::greaterEqual, false, Assembler::pt, L_copy_16_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
2387 __ delayed()->inc(offset8, 16);
a61af66fc99e Initial load
duke
parents:
diff changeset
2388
1364
0dc88ad3244e 6940677: Use 64 bytes chunk copy for arraycopy on Sparc
kvn
parents: 1295
diff changeset
2389 // Copy last 8 bytes
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2390 __ BIND(L_copy_8_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
2391 __ inccc(count, 2);
a61af66fc99e Initial load
duke
parents:
diff changeset
2392 __ brx(Assembler::zero, true, Assembler::pn, L_exit );
a61af66fc99e Initial load
duke
parents:
diff changeset
2393 __ delayed()->mov(offset0, offset8); // Set O5 used by other stubs
a61af66fc99e Initial load
duke
parents:
diff changeset
2394 __ ldx(from, offset0, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2395 __ stx(O3, to, offset0);
a61af66fc99e Initial load
duke
parents:
diff changeset
2396 __ BIND(L_exit);
a61af66fc99e Initial load
duke
parents:
diff changeset
2397 }
a61af66fc99e Initial load
duke
parents:
diff changeset
2398
a61af66fc99e Initial load
duke
parents:
diff changeset
2399 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2400 // Generate stub for disjoint long copy.
a61af66fc99e Initial load
duke
parents:
diff changeset
2401 // "aligned" is ignored, because we must make the stronger
a61af66fc99e Initial load
duke
parents:
diff changeset
2402 // assumption that both addresses are always 64-bit aligned.
a61af66fc99e Initial load
duke
parents:
diff changeset
2403 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2404 // Arguments for generated stub:
a61af66fc99e Initial load
duke
parents:
diff changeset
2405 // from: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
2406 // to: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
2407 // count: O2 treated as signed
a61af66fc99e Initial load
duke
parents:
diff changeset
2408 //
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2409 address generate_disjoint_long_copy(bool aligned, address *entry, const char *name) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2410 __ align(CodeEntryAlignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
2411 StubCodeMark mark(this, "StubRoutines", name);
a61af66fc99e Initial load
duke
parents:
diff changeset
2412 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
2413
a61af66fc99e Initial load
duke
parents:
diff changeset
2414 assert_clean_int(O2, O3); // Make sure 'count' is clean int.
a61af66fc99e Initial load
duke
parents:
diff changeset
2415
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2416 if (entry != NULL) {
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2417 *entry = __ pc();
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2418 // caller can pass a 64-bit byte count here (from Unsafe.copyMemory)
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2419 BLOCK_COMMENT("Entry:");
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2420 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2421
a61af66fc99e Initial load
duke
parents:
diff changeset
2422 generate_disjoint_long_copy_core(aligned);
a61af66fc99e Initial load
duke
parents:
diff changeset
2423
a61af66fc99e Initial load
duke
parents:
diff changeset
2424 // O3, O4 are used as temp registers
a61af66fc99e Initial load
duke
parents:
diff changeset
2425 inc_counter_np(SharedRuntime::_jlong_array_copy_ctr, O3, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2426 __ retl();
a61af66fc99e Initial load
duke
parents:
diff changeset
2427 __ delayed()->mov(G0, O0); // return 0
a61af66fc99e Initial load
duke
parents:
diff changeset
2428 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
2429 }
a61af66fc99e Initial load
duke
parents:
diff changeset
2430
a61af66fc99e Initial load
duke
parents:
diff changeset
2431 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2432 // Generate core code for conjoint long copy (and oop copy on 64-bit).
a61af66fc99e Initial load
duke
parents:
diff changeset
2433 // "aligned" is ignored, because we must make the stronger
a61af66fc99e Initial load
duke
parents:
diff changeset
2434 // assumption that both addresses are always 64-bit aligned.
a61af66fc99e Initial load
duke
parents:
diff changeset
2435 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2436 // Arguments:
a61af66fc99e Initial load
duke
parents:
diff changeset
2437 // from: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
2438 // to: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
2439 // count: O2 treated as signed
a61af66fc99e Initial load
duke
parents:
diff changeset
2440 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2441 void generate_conjoint_long_copy_core(bool aligned) {
a61af66fc99e Initial load
duke
parents:
diff changeset
2442 // Do reverse copy.
a61af66fc99e Initial load
duke
parents:
diff changeset
2443 Label L_copy_8_bytes, L_copy_16_bytes, L_exit;
a61af66fc99e Initial load
duke
parents:
diff changeset
2444 const Register from = O0; // source array address
a61af66fc99e Initial load
duke
parents:
diff changeset
2445 const Register to = O1; // destination array address
a61af66fc99e Initial load
duke
parents:
diff changeset
2446 const Register count = O2; // elements count
a61af66fc99e Initial load
duke
parents:
diff changeset
2447 const Register offset8 = O4; // element offset
a61af66fc99e Initial load
duke
parents:
diff changeset
2448 const Register offset0 = O5; // previous element offset
a61af66fc99e Initial load
duke
parents:
diff changeset
2449
a61af66fc99e Initial load
duke
parents:
diff changeset
2450 __ subcc(count, 1, count);
a61af66fc99e Initial load
duke
parents:
diff changeset
2451 __ brx(Assembler::lessEqual, false, Assembler::pn, L_copy_8_bytes );
a61af66fc99e Initial load
duke
parents:
diff changeset
2452 __ delayed()->sllx(count, LogBytesPerLong, offset8);
a61af66fc99e Initial load
duke
parents:
diff changeset
2453 __ sub(offset8, 8, offset0);
1365
6476042f815c 6940701: Don't align loops in stubs for Niagara sparc
kvn
parents: 1364
diff changeset
2454 __ align(OptoLoopAlignment);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2455 __ BIND(L_copy_16_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
2456 __ ldx(from, offset8, O2);
a61af66fc99e Initial load
duke
parents:
diff changeset
2457 __ ldx(from, offset0, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2458 __ stx(O2, to, offset8);
a61af66fc99e Initial load
duke
parents:
diff changeset
2459 __ deccc(offset8, 16); // use offset8 as counter
a61af66fc99e Initial load
duke
parents:
diff changeset
2460 __ stx(O3, to, offset0);
a61af66fc99e Initial load
duke
parents:
diff changeset
2461 __ brx(Assembler::greater, false, Assembler::pt, L_copy_16_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
2462 __ delayed()->dec(offset0, 16);
a61af66fc99e Initial load
duke
parents:
diff changeset
2463
a61af66fc99e Initial load
duke
parents:
diff changeset
2464 __ BIND(L_copy_8_bytes);
a61af66fc99e Initial load
duke
parents:
diff changeset
2465 __ brx(Assembler::negative, false, Assembler::pn, L_exit );
a61af66fc99e Initial load
duke
parents:
diff changeset
2466 __ delayed()->nop();
a61af66fc99e Initial load
duke
parents:
diff changeset
2467 __ ldx(from, 0, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2468 __ stx(O3, to, 0);
a61af66fc99e Initial load
duke
parents:
diff changeset
2469 __ BIND(L_exit);
a61af66fc99e Initial load
duke
parents:
diff changeset
2470 }
a61af66fc99e Initial load
duke
parents:
diff changeset
2471
a61af66fc99e Initial load
duke
parents:
diff changeset
2472 // Generate stub for conjoint long copy.
a61af66fc99e Initial load
duke
parents:
diff changeset
2473 // "aligned" is ignored, because we must make the stronger
a61af66fc99e Initial load
duke
parents:
diff changeset
2474 // assumption that both addresses are always 64-bit aligned.
a61af66fc99e Initial load
duke
parents:
diff changeset
2475 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2476 // Arguments for generated stub:
a61af66fc99e Initial load
duke
parents:
diff changeset
2477 // from: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
2478 // to: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
2479 // count: O2 treated as signed
a61af66fc99e Initial load
duke
parents:
diff changeset
2480 //
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2481 address generate_conjoint_long_copy(bool aligned, address nooverlap_target,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2482 address *entry, const char *name) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2483 __ align(CodeEntryAlignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
2484 StubCodeMark mark(this, "StubRoutines", name);
a61af66fc99e Initial load
duke
parents:
diff changeset
2485 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
2486
2324
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
2487 assert(aligned, "Should always be aligned");
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2488
a61af66fc99e Initial load
duke
parents:
diff changeset
2489 assert_clean_int(O2, O3); // Make sure 'count' is clean int.
a61af66fc99e Initial load
duke
parents:
diff changeset
2490
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2491 if (entry != NULL) {
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2492 *entry = __ pc();
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2493 // caller can pass a 64-bit byte count here (from Unsafe.copyMemory)
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2494 BLOCK_COMMENT("Entry:");
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2495 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2496
a61af66fc99e Initial load
duke
parents:
diff changeset
2497 array_overlap_test(nooverlap_target, 3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2498
a61af66fc99e Initial load
duke
parents:
diff changeset
2499 generate_conjoint_long_copy_core(aligned);
a61af66fc99e Initial load
duke
parents:
diff changeset
2500
a61af66fc99e Initial load
duke
parents:
diff changeset
2501 // O3, O4 are used as temp registers
a61af66fc99e Initial load
duke
parents:
diff changeset
2502 inc_counter_np(SharedRuntime::_jlong_array_copy_ctr, O3, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2503 __ retl();
a61af66fc99e Initial load
duke
parents:
diff changeset
2504 __ delayed()->mov(G0, O0); // return 0
a61af66fc99e Initial load
duke
parents:
diff changeset
2505 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
2506 }
a61af66fc99e Initial load
duke
parents:
diff changeset
2507
a61af66fc99e Initial load
duke
parents:
diff changeset
2508 // Generate stub for disjoint oop copy. If "aligned" is true, the
a61af66fc99e Initial load
duke
parents:
diff changeset
2509 // "from" and "to" addresses are assumed to be heapword aligned.
a61af66fc99e Initial load
duke
parents:
diff changeset
2510 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2511 // Arguments for generated stub:
a61af66fc99e Initial load
duke
parents:
diff changeset
2512 // from: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
2513 // to: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
2514 // count: O2 treated as signed
a61af66fc99e Initial load
duke
parents:
diff changeset
2515 //
2324
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
2516 address generate_disjoint_oop_copy(bool aligned, address *entry, const char *name,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
2517 bool dest_uninitialized = false) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2518
a61af66fc99e Initial load
duke
parents:
diff changeset
2519 const Register from = O0; // source array address
a61af66fc99e Initial load
duke
parents:
diff changeset
2520 const Register to = O1; // destination array address
a61af66fc99e Initial load
duke
parents:
diff changeset
2521 const Register count = O2; // elements count
a61af66fc99e Initial load
duke
parents:
diff changeset
2522
a61af66fc99e Initial load
duke
parents:
diff changeset
2523 __ align(CodeEntryAlignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
2524 StubCodeMark mark(this, "StubRoutines", name);
a61af66fc99e Initial load
duke
parents:
diff changeset
2525 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
2526
a61af66fc99e Initial load
duke
parents:
diff changeset
2527 assert_clean_int(count, O3); // Make sure 'count' is clean int.
a61af66fc99e Initial load
duke
parents:
diff changeset
2528
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2529 if (entry != NULL) {
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2530 *entry = __ pc();
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2531 // caller can pass a 64-bit byte count here
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2532 BLOCK_COMMENT("Entry:");
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2533 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2534
a61af66fc99e Initial load
duke
parents:
diff changeset
2535 // save arguments for barrier generation
a61af66fc99e Initial load
duke
parents:
diff changeset
2536 __ mov(to, G1);
a61af66fc99e Initial load
duke
parents:
diff changeset
2537 __ mov(count, G5);
2324
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
2538 gen_write_ref_array_pre_barrier(G1, G5, dest_uninitialized);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2539 #ifdef _LP64
113
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2540 assert_clean_int(count, O3); // Make sure 'count' is clean int.
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2541 if (UseCompressedOops) {
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2542 generate_disjoint_int_copy_core(aligned);
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2543 } else {
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2544 generate_disjoint_long_copy_core(aligned);
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2545 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2546 #else
a61af66fc99e Initial load
duke
parents:
diff changeset
2547 generate_disjoint_int_copy_core(aligned);
a61af66fc99e Initial load
duke
parents:
diff changeset
2548 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
2549 // O0 is used as temp register
a61af66fc99e Initial load
duke
parents:
diff changeset
2550 gen_write_ref_array_post_barrier(G1, G5, O0);
a61af66fc99e Initial load
duke
parents:
diff changeset
2551
a61af66fc99e Initial load
duke
parents:
diff changeset
2552 // O3, O4 are used as temp registers
a61af66fc99e Initial load
duke
parents:
diff changeset
2553 inc_counter_np(SharedRuntime::_oop_array_copy_ctr, O3, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2554 __ retl();
a61af66fc99e Initial load
duke
parents:
diff changeset
2555 __ delayed()->mov(G0, O0); // return 0
a61af66fc99e Initial load
duke
parents:
diff changeset
2556 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
2557 }
a61af66fc99e Initial load
duke
parents:
diff changeset
2558
a61af66fc99e Initial load
duke
parents:
diff changeset
2559 // Generate stub for conjoint oop copy. If "aligned" is true, the
a61af66fc99e Initial load
duke
parents:
diff changeset
2560 // "from" and "to" addresses are assumed to be heapword aligned.
a61af66fc99e Initial load
duke
parents:
diff changeset
2561 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2562 // Arguments for generated stub:
a61af66fc99e Initial load
duke
parents:
diff changeset
2563 // from: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
2564 // to: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
2565 // count: O2 treated as signed
a61af66fc99e Initial load
duke
parents:
diff changeset
2566 //
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2567 address generate_conjoint_oop_copy(bool aligned, address nooverlap_target,
2324
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
2568 address *entry, const char *name,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
2569 bool dest_uninitialized = false) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2570
a61af66fc99e Initial load
duke
parents:
diff changeset
2571 const Register from = O0; // source array address
a61af66fc99e Initial load
duke
parents:
diff changeset
2572 const Register to = O1; // destination array address
a61af66fc99e Initial load
duke
parents:
diff changeset
2573 const Register count = O2; // elements count
a61af66fc99e Initial load
duke
parents:
diff changeset
2574
a61af66fc99e Initial load
duke
parents:
diff changeset
2575 __ align(CodeEntryAlignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
2576 StubCodeMark mark(this, "StubRoutines", name);
a61af66fc99e Initial load
duke
parents:
diff changeset
2577 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
2578
a61af66fc99e Initial load
duke
parents:
diff changeset
2579 assert_clean_int(count, O3); // Make sure 'count' is clean int.
a61af66fc99e Initial load
duke
parents:
diff changeset
2580
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2581 if (entry != NULL) {
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2582 *entry = __ pc();
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2583 // caller can pass a 64-bit byte count here
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2584 BLOCK_COMMENT("Entry:");
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2585 }
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2586
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2587 array_overlap_test(nooverlap_target, LogBytesPerHeapOop);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2588
a61af66fc99e Initial load
duke
parents:
diff changeset
2589 // save arguments for barrier generation
a61af66fc99e Initial load
duke
parents:
diff changeset
2590 __ mov(to, G1);
a61af66fc99e Initial load
duke
parents:
diff changeset
2591 __ mov(count, G5);
2324
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
2592 gen_write_ref_array_pre_barrier(G1, G5, dest_uninitialized);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2593
a61af66fc99e Initial load
duke
parents:
diff changeset
2594 #ifdef _LP64
113
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2595 if (UseCompressedOops) {
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2596 generate_conjoint_int_copy_core(aligned);
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2597 } else {
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2598 generate_conjoint_long_copy_core(aligned);
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2599 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2600 #else
a61af66fc99e Initial load
duke
parents:
diff changeset
2601 generate_conjoint_int_copy_core(aligned);
a61af66fc99e Initial load
duke
parents:
diff changeset
2602 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
2603
a61af66fc99e Initial load
duke
parents:
diff changeset
2604 // O0 is used as temp register
a61af66fc99e Initial load
duke
parents:
diff changeset
2605 gen_write_ref_array_post_barrier(G1, G5, O0);
a61af66fc99e Initial load
duke
parents:
diff changeset
2606
a61af66fc99e Initial load
duke
parents:
diff changeset
2607 // O3, O4 are used as temp registers
a61af66fc99e Initial load
duke
parents:
diff changeset
2608 inc_counter_np(SharedRuntime::_oop_array_copy_ctr, O3, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2609 __ retl();
a61af66fc99e Initial load
duke
parents:
diff changeset
2610 __ delayed()->mov(G0, O0); // return 0
a61af66fc99e Initial load
duke
parents:
diff changeset
2611 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
2612 }
a61af66fc99e Initial load
duke
parents:
diff changeset
2613
a61af66fc99e Initial load
duke
parents:
diff changeset
2614
a61af66fc99e Initial load
duke
parents:
diff changeset
2615 // Helper for generating a dynamic type check.
a61af66fc99e Initial load
duke
parents:
diff changeset
2616 // Smashes only the given temp registers.
a61af66fc99e Initial load
duke
parents:
diff changeset
2617 void generate_type_check(Register sub_klass,
a61af66fc99e Initial load
duke
parents:
diff changeset
2618 Register super_check_offset,
a61af66fc99e Initial load
duke
parents:
diff changeset
2619 Register super_klass,
a61af66fc99e Initial load
duke
parents:
diff changeset
2620 Register temp,
644
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2621 Label& L_success) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2622 assert_different_registers(sub_klass, super_check_offset, super_klass, temp);
a61af66fc99e Initial load
duke
parents:
diff changeset
2623
a61af66fc99e Initial load
duke
parents:
diff changeset
2624 BLOCK_COMMENT("type_check:");
a61af66fc99e Initial load
duke
parents:
diff changeset
2625
644
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2626 Label L_miss, L_pop_to_miss;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2627
a61af66fc99e Initial load
duke
parents:
diff changeset
2628 assert_clean_int(super_check_offset, temp);
a61af66fc99e Initial load
duke
parents:
diff changeset
2629
644
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2630 __ check_klass_subtype_fast_path(sub_klass, super_klass, temp, noreg,
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2631 &L_success, &L_miss, NULL,
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2632 super_check_offset);
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2633
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2634 BLOCK_COMMENT("type_check_slow_path:");
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2635 __ save_frame(0);
644
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2636 __ check_klass_subtype_slow_path(sub_klass->after_save(),
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2637 super_klass->after_save(),
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2638 L0, L1, L2, L4,
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2639 NULL, &L_pop_to_miss);
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
2640 __ ba(L_success);
644
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2641 __ delayed()->restore();
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2642
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2643 __ bind(L_pop_to_miss);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2644 __ restore();
a61af66fc99e Initial load
duke
parents:
diff changeset
2645
a61af66fc99e Initial load
duke
parents:
diff changeset
2646 // Fall through on failure!
a61af66fc99e Initial load
duke
parents:
diff changeset
2647 __ BIND(L_miss);
a61af66fc99e Initial load
duke
parents:
diff changeset
2648 }
a61af66fc99e Initial load
duke
parents:
diff changeset
2649
a61af66fc99e Initial load
duke
parents:
diff changeset
2650
a61af66fc99e Initial load
duke
parents:
diff changeset
2651 // Generate stub for checked oop copy.
a61af66fc99e Initial load
duke
parents:
diff changeset
2652 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2653 // Arguments for generated stub:
a61af66fc99e Initial load
duke
parents:
diff changeset
2654 // from: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
2655 // to: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
2656 // count: O2 treated as signed
a61af66fc99e Initial load
duke
parents:
diff changeset
2657 // ckoff: O3 (super_check_offset)
a61af66fc99e Initial load
duke
parents:
diff changeset
2658 // ckval: O4 (super_klass)
a61af66fc99e Initial load
duke
parents:
diff changeset
2659 // ret: O0 zero for success; (-1^K) where K is partial transfer count
a61af66fc99e Initial load
duke
parents:
diff changeset
2660 //
2324
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
2661 address generate_checkcast_copy(const char *name, address *entry, bool dest_uninitialized = false) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2662
a61af66fc99e Initial load
duke
parents:
diff changeset
2663 const Register O0_from = O0; // source array address
a61af66fc99e Initial load
duke
parents:
diff changeset
2664 const Register O1_to = O1; // destination array address
a61af66fc99e Initial load
duke
parents:
diff changeset
2665 const Register O2_count = O2; // elements count
a61af66fc99e Initial load
duke
parents:
diff changeset
2666 const Register O3_ckoff = O3; // super_check_offset
a61af66fc99e Initial load
duke
parents:
diff changeset
2667 const Register O4_ckval = O4; // super_klass
a61af66fc99e Initial load
duke
parents:
diff changeset
2668
a61af66fc99e Initial load
duke
parents:
diff changeset
2669 const Register O5_offset = O5; // loop var, with stride wordSize
a61af66fc99e Initial load
duke
parents:
diff changeset
2670 const Register G1_remain = G1; // loop var, with stride -1
a61af66fc99e Initial load
duke
parents:
diff changeset
2671 const Register G3_oop = G3; // actual oop copied
a61af66fc99e Initial load
duke
parents:
diff changeset
2672 const Register G4_klass = G4; // oop._klass
a61af66fc99e Initial load
duke
parents:
diff changeset
2673 const Register G5_super = G5; // oop._klass._primary_supers[ckval]
a61af66fc99e Initial load
duke
parents:
diff changeset
2674
a61af66fc99e Initial load
duke
parents:
diff changeset
2675 __ align(CodeEntryAlignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
2676 StubCodeMark mark(this, "StubRoutines", name);
a61af66fc99e Initial load
duke
parents:
diff changeset
2677 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
2678
a61af66fc99e Initial load
duke
parents:
diff changeset
2679 #ifdef ASSERT
644
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2680 // We sometimes save a frame (see generate_type_check below).
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2681 // If this will cause trouble, let's fail now instead of later.
a61af66fc99e Initial load
duke
parents:
diff changeset
2682 __ save_frame(0);
a61af66fc99e Initial load
duke
parents:
diff changeset
2683 __ restore();
a61af66fc99e Initial load
duke
parents:
diff changeset
2684 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
2685
1844
75588558f1bf 6980792: Crash "exception happened outside interpreter, nmethods and vtable stubs (1)"
never
parents: 1794
diff changeset
2686 assert_clean_int(O2_count, G1); // Make sure 'count' is clean int.
75588558f1bf 6980792: Crash "exception happened outside interpreter, nmethods and vtable stubs (1)"
never
parents: 1794
diff changeset
2687
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2688 #ifdef ASSERT
a61af66fc99e Initial load
duke
parents:
diff changeset
2689 // caller guarantees that the arrays really are different
a61af66fc99e Initial load
duke
parents:
diff changeset
2690 // otherwise, we would have to make conjoint checks
a61af66fc99e Initial load
duke
parents:
diff changeset
2691 { Label L;
a61af66fc99e Initial load
duke
parents:
diff changeset
2692 __ mov(O3, G1); // spill: overlap test smashes O3
a61af66fc99e Initial load
duke
parents:
diff changeset
2693 __ mov(O4, G4); // spill: overlap test smashes O4
113
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2694 array_overlap_test(L, LogBytesPerHeapOop);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2695 __ stop("checkcast_copy within a single array");
a61af66fc99e Initial load
duke
parents:
diff changeset
2696 __ bind(L);
a61af66fc99e Initial load
duke
parents:
diff changeset
2697 __ mov(G1, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2698 __ mov(G4, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2699 }
a61af66fc99e Initial load
duke
parents:
diff changeset
2700 #endif //ASSERT
a61af66fc99e Initial load
duke
parents:
diff changeset
2701
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2702 if (entry != NULL) {
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2703 *entry = __ pc();
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2704 // caller can pass a 64-bit byte count here (from generic stub)
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2705 BLOCK_COMMENT("Entry:");
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2706 }
2324
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
2707 gen_write_ref_array_pre_barrier(O1_to, O2_count, dest_uninitialized);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2708
a61af66fc99e Initial load
duke
parents:
diff changeset
2709 Label load_element, store_element, do_card_marks, fail, done;
a61af66fc99e Initial load
duke
parents:
diff changeset
2710 __ addcc(O2_count, 0, G1_remain); // initialize loop index, and test it
a61af66fc99e Initial load
duke
parents:
diff changeset
2711 __ brx(Assembler::notZero, false, Assembler::pt, load_element);
a61af66fc99e Initial load
duke
parents:
diff changeset
2712 __ delayed()->mov(G0, O5_offset); // offset from start of arrays
a61af66fc99e Initial load
duke
parents:
diff changeset
2713
a61af66fc99e Initial load
duke
parents:
diff changeset
2714 // Empty array: Nothing to do.
a61af66fc99e Initial load
duke
parents:
diff changeset
2715 inc_counter_np(SharedRuntime::_checkcast_array_copy_ctr, O3, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2716 __ retl();
a61af66fc99e Initial load
duke
parents:
diff changeset
2717 __ delayed()->set(0, O0); // return 0 on (trivial) success
a61af66fc99e Initial load
duke
parents:
diff changeset
2718
a61af66fc99e Initial load
duke
parents:
diff changeset
2719 // ======== begin loop ========
a61af66fc99e Initial load
duke
parents:
diff changeset
2720 // (Loop is rotated; its entry is load_element.)
a61af66fc99e Initial load
duke
parents:
diff changeset
2721 // Loop variables:
a61af66fc99e Initial load
duke
parents:
diff changeset
2722 // (O5 = 0; ; O5 += wordSize) --- offset from src, dest arrays
a61af66fc99e Initial load
duke
parents:
diff changeset
2723 // (O2 = len; O2 != 0; O2--) --- number of oops *remaining*
a61af66fc99e Initial load
duke
parents:
diff changeset
2724 // G3, G4, G5 --- current oop, oop.klass, oop.klass.super
1365
6476042f815c 6940701: Don't align loops in stubs for Niagara sparc
kvn
parents: 1364
diff changeset
2725 __ align(OptoLoopAlignment);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2726
644
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2727 __ BIND(store_element);
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2728 __ deccc(G1_remain); // decrement the count
113
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2729 __ store_heap_oop(G3_oop, O1_to, O5_offset); // store the oop
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2730 __ inc(O5_offset, heapOopSize); // step to next offset
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2731 __ brx(Assembler::zero, true, Assembler::pt, do_card_marks);
a61af66fc99e Initial load
duke
parents:
diff changeset
2732 __ delayed()->set(0, O0); // return -1 on success
a61af66fc99e Initial load
duke
parents:
diff changeset
2733
a61af66fc99e Initial load
duke
parents:
diff changeset
2734 // ======== loop entry is here ========
644
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2735 __ BIND(load_element);
113
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2736 __ load_heap_oop(O0_from, O5_offset, G3_oop); // load the oop
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
2737 __ br_null_short(G3_oop, Assembler::pt, store_element);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2738
113
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2739 __ load_klass(G3_oop, G4_klass); // query the object klass
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2740
a61af66fc99e Initial load
duke
parents:
diff changeset
2741 generate_type_check(G4_klass, O3_ckoff, O4_ckval, G5_super,
a61af66fc99e Initial load
duke
parents:
diff changeset
2742 // branch to this on success:
644
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2743 store_element);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2744 // ======== end loop ========
a61af66fc99e Initial load
duke
parents:
diff changeset
2745
a61af66fc99e Initial load
duke
parents:
diff changeset
2746 // It was a real error; we must depend on the caller to finish the job.
a61af66fc99e Initial load
duke
parents:
diff changeset
2747 // Register G1 has number of *remaining* oops, O2 number of *total* oops.
a61af66fc99e Initial load
duke
parents:
diff changeset
2748 // Emit GC store barriers for the oops we have copied (O2 minus G1),
a61af66fc99e Initial load
duke
parents:
diff changeset
2749 // and report their number to the caller.
644
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2750 __ BIND(fail);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2751 __ subcc(O2_count, G1_remain, O2_count);
a61af66fc99e Initial load
duke
parents:
diff changeset
2752 __ brx(Assembler::zero, false, Assembler::pt, done);
a61af66fc99e Initial load
duke
parents:
diff changeset
2753 __ delayed()->not1(O2_count, O0); // report (-1^K) to caller
a61af66fc99e Initial load
duke
parents:
diff changeset
2754
644
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2755 __ BIND(do_card_marks);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2756 gen_write_ref_array_post_barrier(O1_to, O2_count, O3); // store check on O1[0..O2]
a61af66fc99e Initial load
duke
parents:
diff changeset
2757
644
c517646eef23 6813212: factor duplicated assembly code for general subclass check (for 6655638)
jrose
parents: 642
diff changeset
2758 __ BIND(done);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2759 inc_counter_np(SharedRuntime::_checkcast_array_copy_ctr, O3, O4);
a61af66fc99e Initial load
duke
parents:
diff changeset
2760 __ retl();
a61af66fc99e Initial load
duke
parents:
diff changeset
2761 __ delayed()->nop(); // return value in 00
a61af66fc99e Initial load
duke
parents:
diff changeset
2762
a61af66fc99e Initial load
duke
parents:
diff changeset
2763 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
2764 }
a61af66fc99e Initial load
duke
parents:
diff changeset
2765
a61af66fc99e Initial load
duke
parents:
diff changeset
2766
a61af66fc99e Initial load
duke
parents:
diff changeset
2767 // Generate 'unsafe' array copy stub
a61af66fc99e Initial load
duke
parents:
diff changeset
2768 // Though just as safe as the other stubs, it takes an unscaled
a61af66fc99e Initial load
duke
parents:
diff changeset
2769 // size_t argument instead of an element count.
a61af66fc99e Initial load
duke
parents:
diff changeset
2770 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2771 // Arguments for generated stub:
a61af66fc99e Initial load
duke
parents:
diff changeset
2772 // from: O0
a61af66fc99e Initial load
duke
parents:
diff changeset
2773 // to: O1
a61af66fc99e Initial load
duke
parents:
diff changeset
2774 // count: O2 byte count, treated as ssize_t, can be zero
a61af66fc99e Initial load
duke
parents:
diff changeset
2775 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2776 // Examines the alignment of the operands and dispatches
a61af66fc99e Initial load
duke
parents:
diff changeset
2777 // to a long, int, short, or byte copy loop.
a61af66fc99e Initial load
duke
parents:
diff changeset
2778 //
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2779 address generate_unsafe_copy(const char* name,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2780 address byte_copy_entry,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2781 address short_copy_entry,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2782 address int_copy_entry,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2783 address long_copy_entry) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2784
a61af66fc99e Initial load
duke
parents:
diff changeset
2785 const Register O0_from = O0; // source array address
a61af66fc99e Initial load
duke
parents:
diff changeset
2786 const Register O1_to = O1; // destination array address
a61af66fc99e Initial load
duke
parents:
diff changeset
2787 const Register O2_count = O2; // elements count
a61af66fc99e Initial load
duke
parents:
diff changeset
2788
a61af66fc99e Initial load
duke
parents:
diff changeset
2789 const Register G1_bits = G1; // test copy of low bits
a61af66fc99e Initial load
duke
parents:
diff changeset
2790
a61af66fc99e Initial load
duke
parents:
diff changeset
2791 __ align(CodeEntryAlignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
2792 StubCodeMark mark(this, "StubRoutines", name);
a61af66fc99e Initial load
duke
parents:
diff changeset
2793 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
2794
a61af66fc99e Initial load
duke
parents:
diff changeset
2795 // bump this on entry, not on exit:
a61af66fc99e Initial load
duke
parents:
diff changeset
2796 inc_counter_np(SharedRuntime::_unsafe_array_copy_ctr, G1, G3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2797
a61af66fc99e Initial load
duke
parents:
diff changeset
2798 __ or3(O0_from, O1_to, G1_bits);
a61af66fc99e Initial load
duke
parents:
diff changeset
2799 __ or3(O2_count, G1_bits, G1_bits);
a61af66fc99e Initial load
duke
parents:
diff changeset
2800
a61af66fc99e Initial load
duke
parents:
diff changeset
2801 __ btst(BytesPerLong-1, G1_bits);
a61af66fc99e Initial load
duke
parents:
diff changeset
2802 __ br(Assembler::zero, true, Assembler::pt,
a61af66fc99e Initial load
duke
parents:
diff changeset
2803 long_copy_entry, relocInfo::runtime_call_type);
a61af66fc99e Initial load
duke
parents:
diff changeset
2804 // scale the count on the way out:
a61af66fc99e Initial load
duke
parents:
diff changeset
2805 __ delayed()->srax(O2_count, LogBytesPerLong, O2_count);
a61af66fc99e Initial load
duke
parents:
diff changeset
2806
a61af66fc99e Initial load
duke
parents:
diff changeset
2807 __ btst(BytesPerInt-1, G1_bits);
a61af66fc99e Initial load
duke
parents:
diff changeset
2808 __ br(Assembler::zero, true, Assembler::pt,
a61af66fc99e Initial load
duke
parents:
diff changeset
2809 int_copy_entry, relocInfo::runtime_call_type);
a61af66fc99e Initial load
duke
parents:
diff changeset
2810 // scale the count on the way out:
a61af66fc99e Initial load
duke
parents:
diff changeset
2811 __ delayed()->srax(O2_count, LogBytesPerInt, O2_count);
a61af66fc99e Initial load
duke
parents:
diff changeset
2812
a61af66fc99e Initial load
duke
parents:
diff changeset
2813 __ btst(BytesPerShort-1, G1_bits);
a61af66fc99e Initial load
duke
parents:
diff changeset
2814 __ br(Assembler::zero, true, Assembler::pt,
a61af66fc99e Initial load
duke
parents:
diff changeset
2815 short_copy_entry, relocInfo::runtime_call_type);
a61af66fc99e Initial load
duke
parents:
diff changeset
2816 // scale the count on the way out:
a61af66fc99e Initial load
duke
parents:
diff changeset
2817 __ delayed()->srax(O2_count, LogBytesPerShort, O2_count);
a61af66fc99e Initial load
duke
parents:
diff changeset
2818
a61af66fc99e Initial load
duke
parents:
diff changeset
2819 __ br(Assembler::always, false, Assembler::pt,
a61af66fc99e Initial load
duke
parents:
diff changeset
2820 byte_copy_entry, relocInfo::runtime_call_type);
a61af66fc99e Initial load
duke
parents:
diff changeset
2821 __ delayed()->nop();
a61af66fc99e Initial load
duke
parents:
diff changeset
2822
a61af66fc99e Initial load
duke
parents:
diff changeset
2823 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
2824 }
a61af66fc99e Initial load
duke
parents:
diff changeset
2825
a61af66fc99e Initial load
duke
parents:
diff changeset
2826
a61af66fc99e Initial load
duke
parents:
diff changeset
2827 // Perform range checks on the proposed arraycopy.
a61af66fc99e Initial load
duke
parents:
diff changeset
2828 // Kills the two temps, but nothing else.
a61af66fc99e Initial load
duke
parents:
diff changeset
2829 // Also, clean the sign bits of src_pos and dst_pos.
a61af66fc99e Initial load
duke
parents:
diff changeset
2830 void arraycopy_range_checks(Register src, // source array oop (O0)
a61af66fc99e Initial load
duke
parents:
diff changeset
2831 Register src_pos, // source position (O1)
a61af66fc99e Initial load
duke
parents:
diff changeset
2832 Register dst, // destination array oo (O2)
a61af66fc99e Initial load
duke
parents:
diff changeset
2833 Register dst_pos, // destination position (O3)
a61af66fc99e Initial load
duke
parents:
diff changeset
2834 Register length, // length of copy (O4)
a61af66fc99e Initial load
duke
parents:
diff changeset
2835 Register temp1, Register temp2,
a61af66fc99e Initial load
duke
parents:
diff changeset
2836 Label& L_failed) {
a61af66fc99e Initial load
duke
parents:
diff changeset
2837 BLOCK_COMMENT("arraycopy_range_checks:");
a61af66fc99e Initial load
duke
parents:
diff changeset
2838
a61af66fc99e Initial load
duke
parents:
diff changeset
2839 // if (src_pos + length > arrayOop(src)->length() ) FAIL;
a61af66fc99e Initial load
duke
parents:
diff changeset
2840
a61af66fc99e Initial load
duke
parents:
diff changeset
2841 const Register array_length = temp1; // scratch
a61af66fc99e Initial load
duke
parents:
diff changeset
2842 const Register end_pos = temp2; // scratch
a61af66fc99e Initial load
duke
parents:
diff changeset
2843
a61af66fc99e Initial load
duke
parents:
diff changeset
2844 // Note: This next instruction may be in the delay slot of a branch:
a61af66fc99e Initial load
duke
parents:
diff changeset
2845 __ add(length, src_pos, end_pos); // src_pos + length
a61af66fc99e Initial load
duke
parents:
diff changeset
2846 __ lduw(src, arrayOopDesc::length_offset_in_bytes(), array_length);
a61af66fc99e Initial load
duke
parents:
diff changeset
2847 __ cmp(end_pos, array_length);
a61af66fc99e Initial load
duke
parents:
diff changeset
2848 __ br(Assembler::greater, false, Assembler::pn, L_failed);
a61af66fc99e Initial load
duke
parents:
diff changeset
2849
a61af66fc99e Initial load
duke
parents:
diff changeset
2850 // if (dst_pos + length > arrayOop(dst)->length() ) FAIL;
a61af66fc99e Initial load
duke
parents:
diff changeset
2851 __ delayed()->add(length, dst_pos, end_pos); // dst_pos + length
a61af66fc99e Initial load
duke
parents:
diff changeset
2852 __ lduw(dst, arrayOopDesc::length_offset_in_bytes(), array_length);
a61af66fc99e Initial load
duke
parents:
diff changeset
2853 __ cmp(end_pos, array_length);
a61af66fc99e Initial load
duke
parents:
diff changeset
2854 __ br(Assembler::greater, false, Assembler::pn, L_failed);
a61af66fc99e Initial load
duke
parents:
diff changeset
2855
a61af66fc99e Initial load
duke
parents:
diff changeset
2856 // Have to clean up high 32-bits of 'src_pos' and 'dst_pos'.
a61af66fc99e Initial load
duke
parents:
diff changeset
2857 // Move with sign extension can be used since they are positive.
a61af66fc99e Initial load
duke
parents:
diff changeset
2858 __ delayed()->signx(src_pos, src_pos);
a61af66fc99e Initial load
duke
parents:
diff changeset
2859 __ signx(dst_pos, dst_pos);
a61af66fc99e Initial load
duke
parents:
diff changeset
2860
a61af66fc99e Initial load
duke
parents:
diff changeset
2861 BLOCK_COMMENT("arraycopy_range_checks done");
a61af66fc99e Initial load
duke
parents:
diff changeset
2862 }
a61af66fc99e Initial load
duke
parents:
diff changeset
2863
a61af66fc99e Initial load
duke
parents:
diff changeset
2864
a61af66fc99e Initial load
duke
parents:
diff changeset
2865 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2866 // Generate generic array copy stubs
a61af66fc99e Initial load
duke
parents:
diff changeset
2867 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2868 // Input:
a61af66fc99e Initial load
duke
parents:
diff changeset
2869 // O0 - src oop
a61af66fc99e Initial load
duke
parents:
diff changeset
2870 // O1 - src_pos
a61af66fc99e Initial load
duke
parents:
diff changeset
2871 // O2 - dst oop
a61af66fc99e Initial load
duke
parents:
diff changeset
2872 // O3 - dst_pos
a61af66fc99e Initial load
duke
parents:
diff changeset
2873 // O4 - element count
a61af66fc99e Initial load
duke
parents:
diff changeset
2874 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2875 // Output:
a61af66fc99e Initial load
duke
parents:
diff changeset
2876 // O0 == 0 - success
a61af66fc99e Initial load
duke
parents:
diff changeset
2877 // O0 == -1 - need to call System.arraycopy
a61af66fc99e Initial load
duke
parents:
diff changeset
2878 //
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2879 address generate_generic_copy(const char *name,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2880 address entry_jbyte_arraycopy,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2881 address entry_jshort_arraycopy,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2882 address entry_jint_arraycopy,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2883 address entry_oop_arraycopy,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2884 address entry_jlong_arraycopy,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
2885 address entry_checkcast_arraycopy) {
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2886 Label L_failed, L_objArray;
a61af66fc99e Initial load
duke
parents:
diff changeset
2887
a61af66fc99e Initial load
duke
parents:
diff changeset
2888 // Input registers
a61af66fc99e Initial load
duke
parents:
diff changeset
2889 const Register src = O0; // source array oop
a61af66fc99e Initial load
duke
parents:
diff changeset
2890 const Register src_pos = O1; // source position
a61af66fc99e Initial load
duke
parents:
diff changeset
2891 const Register dst = O2; // destination array oop
a61af66fc99e Initial load
duke
parents:
diff changeset
2892 const Register dst_pos = O3; // destination position
a61af66fc99e Initial load
duke
parents:
diff changeset
2893 const Register length = O4; // elements count
a61af66fc99e Initial load
duke
parents:
diff changeset
2894
a61af66fc99e Initial load
duke
parents:
diff changeset
2895 // registers used as temp
a61af66fc99e Initial load
duke
parents:
diff changeset
2896 const Register G3_src_klass = G3; // source array klass
a61af66fc99e Initial load
duke
parents:
diff changeset
2897 const Register G4_dst_klass = G4; // destination array klass
a61af66fc99e Initial load
duke
parents:
diff changeset
2898 const Register G5_lh = G5; // layout handler
a61af66fc99e Initial load
duke
parents:
diff changeset
2899 const Register O5_temp = O5;
a61af66fc99e Initial load
duke
parents:
diff changeset
2900
a61af66fc99e Initial load
duke
parents:
diff changeset
2901 __ align(CodeEntryAlignment);
a61af66fc99e Initial load
duke
parents:
diff changeset
2902 StubCodeMark mark(this, "StubRoutines", name);
a61af66fc99e Initial load
duke
parents:
diff changeset
2903 address start = __ pc();
a61af66fc99e Initial load
duke
parents:
diff changeset
2904
a61af66fc99e Initial load
duke
parents:
diff changeset
2905 // bump this on entry, not on exit:
a61af66fc99e Initial load
duke
parents:
diff changeset
2906 inc_counter_np(SharedRuntime::_generic_array_copy_ctr, G1, G3);
a61af66fc99e Initial load
duke
parents:
diff changeset
2907
a61af66fc99e Initial load
duke
parents:
diff changeset
2908 // In principle, the int arguments could be dirty.
a61af66fc99e Initial load
duke
parents:
diff changeset
2909 //assert_clean_int(src_pos, G1);
a61af66fc99e Initial load
duke
parents:
diff changeset
2910 //assert_clean_int(dst_pos, G1);
a61af66fc99e Initial load
duke
parents:
diff changeset
2911 //assert_clean_int(length, G1);
a61af66fc99e Initial load
duke
parents:
diff changeset
2912
a61af66fc99e Initial load
duke
parents:
diff changeset
2913 //-----------------------------------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
2914 // Assembler stubs will be used for this call to arraycopy
a61af66fc99e Initial load
duke
parents:
diff changeset
2915 // if the following conditions are met:
a61af66fc99e Initial load
duke
parents:
diff changeset
2916 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2917 // (1) src and dst must not be null.
a61af66fc99e Initial load
duke
parents:
diff changeset
2918 // (2) src_pos must not be negative.
a61af66fc99e Initial load
duke
parents:
diff changeset
2919 // (3) dst_pos must not be negative.
a61af66fc99e Initial load
duke
parents:
diff changeset
2920 // (4) length must not be negative.
a61af66fc99e Initial load
duke
parents:
diff changeset
2921 // (5) src klass and dst klass should be the same and not NULL.
a61af66fc99e Initial load
duke
parents:
diff changeset
2922 // (6) src and dst should be arrays.
a61af66fc99e Initial load
duke
parents:
diff changeset
2923 // (7) src_pos + length must not exceed length of src.
a61af66fc99e Initial load
duke
parents:
diff changeset
2924 // (8) dst_pos + length must not exceed length of dst.
a61af66fc99e Initial load
duke
parents:
diff changeset
2925 BLOCK_COMMENT("arraycopy initial argument checks");
a61af66fc99e Initial load
duke
parents:
diff changeset
2926
a61af66fc99e Initial load
duke
parents:
diff changeset
2927 // if (src == NULL) return -1;
a61af66fc99e Initial load
duke
parents:
diff changeset
2928 __ br_null(src, false, Assembler::pn, L_failed);
a61af66fc99e Initial load
duke
parents:
diff changeset
2929
a61af66fc99e Initial load
duke
parents:
diff changeset
2930 // if (src_pos < 0) return -1;
a61af66fc99e Initial load
duke
parents:
diff changeset
2931 __ delayed()->tst(src_pos);
a61af66fc99e Initial load
duke
parents:
diff changeset
2932 __ br(Assembler::negative, false, Assembler::pn, L_failed);
a61af66fc99e Initial load
duke
parents:
diff changeset
2933 __ delayed()->nop();
a61af66fc99e Initial load
duke
parents:
diff changeset
2934
a61af66fc99e Initial load
duke
parents:
diff changeset
2935 // if (dst == NULL) return -1;
a61af66fc99e Initial load
duke
parents:
diff changeset
2936 __ br_null(dst, false, Assembler::pn, L_failed);
a61af66fc99e Initial load
duke
parents:
diff changeset
2937
a61af66fc99e Initial load
duke
parents:
diff changeset
2938 // if (dst_pos < 0) return -1;
a61af66fc99e Initial load
duke
parents:
diff changeset
2939 __ delayed()->tst(dst_pos);
a61af66fc99e Initial load
duke
parents:
diff changeset
2940 __ br(Assembler::negative, false, Assembler::pn, L_failed);
a61af66fc99e Initial load
duke
parents:
diff changeset
2941
a61af66fc99e Initial load
duke
parents:
diff changeset
2942 // if (length < 0) return -1;
a61af66fc99e Initial load
duke
parents:
diff changeset
2943 __ delayed()->tst(length);
a61af66fc99e Initial load
duke
parents:
diff changeset
2944 __ br(Assembler::negative, false, Assembler::pn, L_failed);
a61af66fc99e Initial load
duke
parents:
diff changeset
2945
a61af66fc99e Initial load
duke
parents:
diff changeset
2946 BLOCK_COMMENT("arraycopy argument klass checks");
a61af66fc99e Initial load
duke
parents:
diff changeset
2947 // get src->klass()
12226
7944aba7ba41 8015107: NPG: Use consistent naming for metaspace concepts
ehelin
parents: 11127
diff changeset
2948 if (UseCompressedClassPointers) {
113
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2949 __ delayed()->nop(); // ??? not good
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2950 __ load_klass(src, G3_src_klass);
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2951 } else {
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2952 __ delayed()->ld_ptr(src, oopDesc::klass_offset_in_bytes(), G3_src_klass);
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2953 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2954
a61af66fc99e Initial load
duke
parents:
diff changeset
2955 #ifdef ASSERT
a61af66fc99e Initial load
duke
parents:
diff changeset
2956 // assert(src->klass() != NULL);
a61af66fc99e Initial load
duke
parents:
diff changeset
2957 BLOCK_COMMENT("assert klasses not null");
a61af66fc99e Initial load
duke
parents:
diff changeset
2958 { Label L_a, L_b;
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
2959 __ br_notnull_short(G3_src_klass, Assembler::pt, L_b); // it is broken if klass is NULL
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2960 __ bind(L_a);
a61af66fc99e Initial load
duke
parents:
diff changeset
2961 __ stop("broken null klass");
a61af66fc99e Initial load
duke
parents:
diff changeset
2962 __ bind(L_b);
113
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2963 __ load_klass(dst, G4_dst_klass);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2964 __ br_null(G4_dst_klass, false, Assembler::pn, L_a); // this would be broken also
a61af66fc99e Initial load
duke
parents:
diff changeset
2965 __ delayed()->mov(G0, G4_dst_klass); // scribble the temp
a61af66fc99e Initial load
duke
parents:
diff changeset
2966 BLOCK_COMMENT("assert done");
a61af66fc99e Initial load
duke
parents:
diff changeset
2967 }
a61af66fc99e Initial load
duke
parents:
diff changeset
2968 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
2969
a61af66fc99e Initial load
duke
parents:
diff changeset
2970 // Load layout helper
a61af66fc99e Initial load
duke
parents:
diff changeset
2971 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2972 // |array_tag| | header_size | element_type | |log2_element_size|
a61af66fc99e Initial load
duke
parents:
diff changeset
2973 // 32 30 24 16 8 2 0
a61af66fc99e Initial load
duke
parents:
diff changeset
2974 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2975 // array_tag: typeArray = 0x3, objArray = 0x2, non-array = 0x0
a61af66fc99e Initial load
duke
parents:
diff changeset
2976 //
a61af66fc99e Initial load
duke
parents:
diff changeset
2977
4762
069ab3f976d3 7118863: Move sizeof(klassOopDesc) into the *Klass::*_offset_in_bytes() functions
stefank
parents: 3961
diff changeset
2978 int lh_offset = in_bytes(Klass::layout_helper_offset());
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2979
a61af66fc99e Initial load
duke
parents:
diff changeset
2980 // Load 32-bits signed value. Use br() instruction with it to check icc.
a61af66fc99e Initial load
duke
parents:
diff changeset
2981 __ lduw(G3_src_klass, lh_offset, G5_lh);
a61af66fc99e Initial load
duke
parents:
diff changeset
2982
12226
7944aba7ba41 8015107: NPG: Use consistent naming for metaspace concepts
ehelin
parents: 11127
diff changeset
2983 if (UseCompressedClassPointers) {
113
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2984 __ load_klass(dst, G4_dst_klass);
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2985 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2986 // Handle objArrays completely differently...
a61af66fc99e Initial load
duke
parents:
diff changeset
2987 juint objArray_lh = Klass::array_layout_helper(T_OBJECT);
a61af66fc99e Initial load
duke
parents:
diff changeset
2988 __ set(objArray_lh, O5_temp);
a61af66fc99e Initial load
duke
parents:
diff changeset
2989 __ cmp(G5_lh, O5_temp);
a61af66fc99e Initial load
duke
parents:
diff changeset
2990 __ br(Assembler::equal, false, Assembler::pt, L_objArray);
12226
7944aba7ba41 8015107: NPG: Use consistent naming for metaspace concepts
ehelin
parents: 11127
diff changeset
2991 if (UseCompressedClassPointers) {
113
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2992 __ delayed()->nop();
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2993 } else {
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2994 __ delayed()->ld_ptr(dst, oopDesc::klass_offset_in_bytes(), G4_dst_klass);
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
2995 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2996
a61af66fc99e Initial load
duke
parents:
diff changeset
2997 // if (src->klass() != dst->klass()) return -1;
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
2998 __ cmp_and_brx_short(G3_src_klass, G4_dst_klass, Assembler::notEqual, Assembler::pn, L_failed);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
2999
a61af66fc99e Initial load
duke
parents:
diff changeset
3000 // if (!src->is_Array()) return -1;
a61af66fc99e Initial load
duke
parents:
diff changeset
3001 __ cmp(G5_lh, Klass::_lh_neutral_value); // < 0
a61af66fc99e Initial load
duke
parents:
diff changeset
3002 __ br(Assembler::greaterEqual, false, Assembler::pn, L_failed);
a61af66fc99e Initial load
duke
parents:
diff changeset
3003
a61af66fc99e Initial load
duke
parents:
diff changeset
3004 // At this point, it is known to be a typeArray (array_tag 0x3).
a61af66fc99e Initial load
duke
parents:
diff changeset
3005 #ifdef ASSERT
a61af66fc99e Initial load
duke
parents:
diff changeset
3006 __ delayed()->nop();
a61af66fc99e Initial load
duke
parents:
diff changeset
3007 { Label L;
a61af66fc99e Initial load
duke
parents:
diff changeset
3008 jint lh_prim_tag_in_place = (Klass::_lh_array_tag_type_value << Klass::_lh_array_tag_shift);
a61af66fc99e Initial load
duke
parents:
diff changeset
3009 __ set(lh_prim_tag_in_place, O5_temp);
a61af66fc99e Initial load
duke
parents:
diff changeset
3010 __ cmp(G5_lh, O5_temp);
a61af66fc99e Initial load
duke
parents:
diff changeset
3011 __ br(Assembler::greaterEqual, false, Assembler::pt, L);
a61af66fc99e Initial load
duke
parents:
diff changeset
3012 __ delayed()->nop();
a61af66fc99e Initial load
duke
parents:
diff changeset
3013 __ stop("must be a primitive array");
a61af66fc99e Initial load
duke
parents:
diff changeset
3014 __ bind(L);
a61af66fc99e Initial load
duke
parents:
diff changeset
3015 }
a61af66fc99e Initial load
duke
parents:
diff changeset
3016 #else
a61af66fc99e Initial load
duke
parents:
diff changeset
3017 __ delayed(); // match next insn to prev branch
a61af66fc99e Initial load
duke
parents:
diff changeset
3018 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
3019
a61af66fc99e Initial load
duke
parents:
diff changeset
3020 arraycopy_range_checks(src, src_pos, dst, dst_pos, length,
a61af66fc99e Initial load
duke
parents:
diff changeset
3021 O5_temp, G4_dst_klass, L_failed);
a61af66fc99e Initial load
duke
parents:
diff changeset
3022
6831
d8ce2825b193 8000213: NPG: Should have renamed arrayKlass and typeArrayKlass
coleenp
parents: 6725
diff changeset
3023 // TypeArrayKlass
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3024 //
a61af66fc99e Initial load
duke
parents:
diff changeset
3025 // src_addr = (src + array_header_in_bytes()) + (src_pos << log2elemsize);
a61af66fc99e Initial load
duke
parents:
diff changeset
3026 // dst_addr = (dst + array_header_in_bytes()) + (dst_pos << log2elemsize);
a61af66fc99e Initial load
duke
parents:
diff changeset
3027 //
a61af66fc99e Initial load
duke
parents:
diff changeset
3028
a61af66fc99e Initial load
duke
parents:
diff changeset
3029 const Register G4_offset = G4_dst_klass; // array offset
a61af66fc99e Initial load
duke
parents:
diff changeset
3030 const Register G3_elsize = G3_src_klass; // log2 element size
a61af66fc99e Initial load
duke
parents:
diff changeset
3031
a61af66fc99e Initial load
duke
parents:
diff changeset
3032 __ srl(G5_lh, Klass::_lh_header_size_shift, G4_offset);
a61af66fc99e Initial load
duke
parents:
diff changeset
3033 __ and3(G4_offset, Klass::_lh_header_size_mask, G4_offset); // array_offset
a61af66fc99e Initial load
duke
parents:
diff changeset
3034 __ add(src, G4_offset, src); // src array offset
a61af66fc99e Initial load
duke
parents:
diff changeset
3035 __ add(dst, G4_offset, dst); // dst array offset
a61af66fc99e Initial load
duke
parents:
diff changeset
3036 __ and3(G5_lh, Klass::_lh_log2_element_size_mask, G3_elsize); // log2 element size
a61af66fc99e Initial load
duke
parents:
diff changeset
3037
a61af66fc99e Initial load
duke
parents:
diff changeset
3038 // next registers should be set before the jump to corresponding stub
a61af66fc99e Initial load
duke
parents:
diff changeset
3039 const Register from = O0; // source array address
a61af66fc99e Initial load
duke
parents:
diff changeset
3040 const Register to = O1; // destination array address
a61af66fc99e Initial load
duke
parents:
diff changeset
3041 const Register count = O2; // elements count
a61af66fc99e Initial load
duke
parents:
diff changeset
3042
a61af66fc99e Initial load
duke
parents:
diff changeset
3043 // 'from', 'to', 'count' registers should be set in this order
a61af66fc99e Initial load
duke
parents:
diff changeset
3044 // since they are the same as 'src', 'src_pos', 'dst'.
a61af66fc99e Initial load
duke
parents:
diff changeset
3045
a61af66fc99e Initial load
duke
parents:
diff changeset
3046 BLOCK_COMMENT("scale indexes to element size");
a61af66fc99e Initial load
duke
parents:
diff changeset
3047 __ sll_ptr(src_pos, G3_elsize, src_pos);
a61af66fc99e Initial load
duke
parents:
diff changeset
3048 __ sll_ptr(dst_pos, G3_elsize, dst_pos);
a61af66fc99e Initial load
duke
parents:
diff changeset
3049 __ add(src, src_pos, from); // src_addr
a61af66fc99e Initial load
duke
parents:
diff changeset
3050 __ add(dst, dst_pos, to); // dst_addr
a61af66fc99e Initial load
duke
parents:
diff changeset
3051
a61af66fc99e Initial load
duke
parents:
diff changeset
3052 BLOCK_COMMENT("choose copy loop based on element size");
a61af66fc99e Initial load
duke
parents:
diff changeset
3053 __ cmp(G3_elsize, 0);
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3054 __ br(Assembler::equal, true, Assembler::pt, entry_jbyte_arraycopy);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3055 __ delayed()->signx(length, count); // length
a61af66fc99e Initial load
duke
parents:
diff changeset
3056
a61af66fc99e Initial load
duke
parents:
diff changeset
3057 __ cmp(G3_elsize, LogBytesPerShort);
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3058 __ br(Assembler::equal, true, Assembler::pt, entry_jshort_arraycopy);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3059 __ delayed()->signx(length, count); // length
a61af66fc99e Initial load
duke
parents:
diff changeset
3060
a61af66fc99e Initial load
duke
parents:
diff changeset
3061 __ cmp(G3_elsize, LogBytesPerInt);
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3062 __ br(Assembler::equal, true, Assembler::pt, entry_jint_arraycopy);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3063 __ delayed()->signx(length, count); // length
a61af66fc99e Initial load
duke
parents:
diff changeset
3064 #ifdef ASSERT
a61af66fc99e Initial load
duke
parents:
diff changeset
3065 { Label L;
3839
3d42f82cd811 7063628: Use cbcond on T4
kvn
parents: 3451
diff changeset
3066 __ cmp_and_br_short(G3_elsize, LogBytesPerLong, Assembler::equal, Assembler::pt, L);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3067 __ stop("must be long copy, but elsize is wrong");
a61af66fc99e Initial load
duke
parents:
diff changeset
3068 __ bind(L);
a61af66fc99e Initial load
duke
parents:
diff changeset
3069 }
a61af66fc99e Initial load
duke
parents:
diff changeset
3070 #endif
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3071 __ br(Assembler::always, false, Assembler::pt, entry_jlong_arraycopy);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3072 __ delayed()->signx(length, count); // length
a61af66fc99e Initial load
duke
parents:
diff changeset
3073
6831
d8ce2825b193 8000213: NPG: Should have renamed arrayKlass and typeArrayKlass
coleenp
parents: 6725
diff changeset
3074 // ObjArrayKlass
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3075 __ BIND(L_objArray);
a61af66fc99e Initial load
duke
parents:
diff changeset
3076 // live at this point: G3_src_klass, G4_dst_klass, src[_pos], dst[_pos], length
a61af66fc99e Initial load
duke
parents:
diff changeset
3077
a61af66fc99e Initial load
duke
parents:
diff changeset
3078 Label L_plain_copy, L_checkcast_copy;
a61af66fc99e Initial load
duke
parents:
diff changeset
3079 // test array classes for subtyping
a61af66fc99e Initial load
duke
parents:
diff changeset
3080 __ cmp(G3_src_klass, G4_dst_klass); // usual case is exact equality
a61af66fc99e Initial load
duke
parents:
diff changeset
3081 __ brx(Assembler::notEqual, true, Assembler::pn, L_checkcast_copy);
a61af66fc99e Initial load
duke
parents:
diff changeset
3082 __ delayed()->lduw(G4_dst_klass, lh_offset, O5_temp); // hoisted from below
a61af66fc99e Initial load
duke
parents:
diff changeset
3083
a61af66fc99e Initial load
duke
parents:
diff changeset
3084 // Identically typed arrays can be copied without element-wise checks.
a61af66fc99e Initial load
duke
parents:
diff changeset
3085 arraycopy_range_checks(src, src_pos, dst, dst_pos, length,
a61af66fc99e Initial load
duke
parents:
diff changeset
3086 O5_temp, G5_lh, L_failed);
a61af66fc99e Initial load
duke
parents:
diff changeset
3087
a61af66fc99e Initial load
duke
parents:
diff changeset
3088 __ add(src, arrayOopDesc::base_offset_in_bytes(T_OBJECT), src); //src offset
a61af66fc99e Initial load
duke
parents:
diff changeset
3089 __ add(dst, arrayOopDesc::base_offset_in_bytes(T_OBJECT), dst); //dst offset
113
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
3090 __ sll_ptr(src_pos, LogBytesPerHeapOop, src_pos);
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
3091 __ sll_ptr(dst_pos, LogBytesPerHeapOop, dst_pos);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3092 __ add(src, src_pos, from); // src_addr
a61af66fc99e Initial load
duke
parents:
diff changeset
3093 __ add(dst, dst_pos, to); // dst_addr
a61af66fc99e Initial load
duke
parents:
diff changeset
3094 __ BIND(L_plain_copy);
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3095 __ br(Assembler::always, false, Assembler::pt, entry_oop_arraycopy);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3096 __ delayed()->signx(length, count); // length
a61af66fc99e Initial load
duke
parents:
diff changeset
3097
a61af66fc99e Initial load
duke
parents:
diff changeset
3098 __ BIND(L_checkcast_copy);
a61af66fc99e Initial load
duke
parents:
diff changeset
3099 // live at this point: G3_src_klass, G4_dst_klass
a61af66fc99e Initial load
duke
parents:
diff changeset
3100 {
a61af66fc99e Initial load
duke
parents:
diff changeset
3101 // Before looking at dst.length, make sure dst is also an objArray.
a61af66fc99e Initial load
duke
parents:
diff changeset
3102 // lduw(G4_dst_klass, lh_offset, O5_temp); // hoisted to delay slot
a61af66fc99e Initial load
duke
parents:
diff changeset
3103 __ cmp(G5_lh, O5_temp);
a61af66fc99e Initial load
duke
parents:
diff changeset
3104 __ br(Assembler::notEqual, false, Assembler::pn, L_failed);
a61af66fc99e Initial load
duke
parents:
diff changeset
3105
a61af66fc99e Initial load
duke
parents:
diff changeset
3106 // It is safe to examine both src.length and dst.length.
a61af66fc99e Initial load
duke
parents:
diff changeset
3107 __ delayed(); // match next insn to prev branch
a61af66fc99e Initial load
duke
parents:
diff changeset
3108 arraycopy_range_checks(src, src_pos, dst, dst_pos, length,
a61af66fc99e Initial load
duke
parents:
diff changeset
3109 O5_temp, G5_lh, L_failed);
a61af66fc99e Initial load
duke
parents:
diff changeset
3110
a61af66fc99e Initial load
duke
parents:
diff changeset
3111 // Marshal the base address arguments now, freeing registers.
a61af66fc99e Initial load
duke
parents:
diff changeset
3112 __ add(src, arrayOopDesc::base_offset_in_bytes(T_OBJECT), src); //src offset
a61af66fc99e Initial load
duke
parents:
diff changeset
3113 __ add(dst, arrayOopDesc::base_offset_in_bytes(T_OBJECT), dst); //dst offset
113
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
3114 __ sll_ptr(src_pos, LogBytesPerHeapOop, src_pos);
ba764ed4b6f2 6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
coleenp
parents: 16
diff changeset
3115 __ sll_ptr(dst_pos, LogBytesPerHeapOop, dst_pos);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3116 __ add(src, src_pos, from); // src_addr
a61af66fc99e Initial load
duke
parents:
diff changeset
3117 __ add(dst, dst_pos, to); // dst_addr
a61af66fc99e Initial load
duke
parents:
diff changeset
3118 __ signx(length, count); // length (reloaded)
a61af66fc99e Initial load
duke
parents:
diff changeset
3119
a61af66fc99e Initial load
duke
parents:
diff changeset
3120 Register sco_temp = O3; // this register is free now
a61af66fc99e Initial load
duke
parents:
diff changeset
3121 assert_different_registers(from, to, count, sco_temp,
a61af66fc99e Initial load
duke
parents:
diff changeset
3122 G4_dst_klass, G3_src_klass);
a61af66fc99e Initial load
duke
parents:
diff changeset
3123
a61af66fc99e Initial load
duke
parents:
diff changeset
3124 // Generate the type check.
4762
069ab3f976d3 7118863: Move sizeof(klassOopDesc) into the *Klass::*_offset_in_bytes() functions
stefank
parents: 3961
diff changeset
3125 int sco_offset = in_bytes(Klass::super_check_offset_offset());
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3126 __ lduw(G4_dst_klass, sco_offset, sco_temp);
a61af66fc99e Initial load
duke
parents:
diff changeset
3127 generate_type_check(G3_src_klass, sco_temp, G4_dst_klass,
a61af66fc99e Initial load
duke
parents:
diff changeset
3128 O5_temp, L_plain_copy);
a61af66fc99e Initial load
duke
parents:
diff changeset
3129
6831
d8ce2825b193 8000213: NPG: Should have renamed arrayKlass and typeArrayKlass
coleenp
parents: 6725
diff changeset
3130 // Fetch destination element klass from the ObjArrayKlass header.
d8ce2825b193 8000213: NPG: Should have renamed arrayKlass and typeArrayKlass
coleenp
parents: 6725
diff changeset
3131 int ek_offset = in_bytes(ObjArrayKlass::element_klass_offset());
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3132
a61af66fc99e Initial load
duke
parents:
diff changeset
3133 // the checkcast_copy loop needs two extra arguments:
a61af66fc99e Initial load
duke
parents:
diff changeset
3134 __ ld_ptr(G4_dst_klass, ek_offset, O4); // dest elem klass
a61af66fc99e Initial load
duke
parents:
diff changeset
3135 // lduw(O4, sco_offset, O3); // sco of elem klass
a61af66fc99e Initial load
duke
parents:
diff changeset
3136
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3137 __ br(Assembler::always, false, Assembler::pt, entry_checkcast_arraycopy);
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3138 __ delayed()->lduw(O4, sco_offset, O3);
a61af66fc99e Initial load
duke
parents:
diff changeset
3139 }
a61af66fc99e Initial load
duke
parents:
diff changeset
3140
a61af66fc99e Initial load
duke
parents:
diff changeset
3141 __ BIND(L_failed);
a61af66fc99e Initial load
duke
parents:
diff changeset
3142 __ retl();
a61af66fc99e Initial load
duke
parents:
diff changeset
3143 __ delayed()->sub(G0, 1, O0); // return -1
a61af66fc99e Initial load
duke
parents:
diff changeset
3144 return start;
a61af66fc99e Initial load
duke
parents:
diff changeset
3145 }
a61af66fc99e Initial load
duke
parents:
diff changeset
3146
3892
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3147 //
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3148 // Generate stub for heap zeroing.
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3149 // "to" address is aligned to jlong (8 bytes).
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3150 //
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3151 // Arguments for generated stub:
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3152 // to: O0
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3153 // count: O1 treated as signed (count of HeapWord)
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3154 // count could be 0
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3155 //
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3156 address generate_zero_aligned_words(const char* name) {
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3157 __ align(CodeEntryAlignment);
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3158 StubCodeMark mark(this, "StubRoutines", name);
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3159 address start = __ pc();
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3160
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3161 const Register to = O0; // source array address
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3162 const Register count = O1; // HeapWords count
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3163 const Register temp = O2; // scratch
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3164
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3165 Label Ldone;
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3166 __ sllx(count, LogHeapWordSize, count); // to bytes count
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3167 // Use BIS for zeroing
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3168 __ bis_zeroing(to, count, temp, Ldone);
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3169 __ bind(Ldone);
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3170 __ retl();
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3171 __ delayed()->nop();
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3172 return start;
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3173 }
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3174
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3175 void generate_arraycopy_stubs() {
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3176 address entry;
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3177 address entry_jbyte_arraycopy;
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3178 address entry_jshort_arraycopy;
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3179 address entry_jint_arraycopy;
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3180 address entry_oop_arraycopy;
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3181 address entry_jlong_arraycopy;
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3182 address entry_checkcast_arraycopy;
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3183
2324
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3184 //*** jbyte
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3185 // Always need aligned and unaligned versions
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3186 StubRoutines::_jbyte_disjoint_arraycopy = generate_disjoint_byte_copy(false, &entry,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3187 "jbyte_disjoint_arraycopy");
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3188 StubRoutines::_jbyte_arraycopy = generate_conjoint_byte_copy(false, entry,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3189 &entry_jbyte_arraycopy,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3190 "jbyte_arraycopy");
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3191 StubRoutines::_arrayof_jbyte_disjoint_arraycopy = generate_disjoint_byte_copy(true, &entry,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3192 "arrayof_jbyte_disjoint_arraycopy");
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3193 StubRoutines::_arrayof_jbyte_arraycopy = generate_conjoint_byte_copy(true, entry, NULL,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3194 "arrayof_jbyte_arraycopy");
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3195
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3196 //*** jshort
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3197 // Always need aligned and unaligned versions
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3198 StubRoutines::_jshort_disjoint_arraycopy = generate_disjoint_short_copy(false, &entry,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3199 "jshort_disjoint_arraycopy");
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3200 StubRoutines::_jshort_arraycopy = generate_conjoint_short_copy(false, entry,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3201 &entry_jshort_arraycopy,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3202 "jshort_arraycopy");
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3203 StubRoutines::_arrayof_jshort_disjoint_arraycopy = generate_disjoint_short_copy(true, &entry,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3204 "arrayof_jshort_disjoint_arraycopy");
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3205 StubRoutines::_arrayof_jshort_arraycopy = generate_conjoint_short_copy(true, entry, NULL,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3206 "arrayof_jshort_arraycopy");
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3207
2324
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3208 //*** jint
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3209 // Aligned versions
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3210 StubRoutines::_arrayof_jint_disjoint_arraycopy = generate_disjoint_int_copy(true, &entry,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3211 "arrayof_jint_disjoint_arraycopy");
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3212 StubRoutines::_arrayof_jint_arraycopy = generate_conjoint_int_copy(true, entry, &entry_jint_arraycopy,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3213 "arrayof_jint_arraycopy");
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3214 #ifdef _LP64
2324
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3215 // In 64 bit we need both aligned and unaligned versions of jint arraycopy.
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3216 // entry_jint_arraycopy always points to the unaligned version (notice that we overwrite it).
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3217 StubRoutines::_jint_disjoint_arraycopy = generate_disjoint_int_copy(false, &entry,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3218 "jint_disjoint_arraycopy");
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3219 StubRoutines::_jint_arraycopy = generate_conjoint_int_copy(false, entry,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3220 &entry_jint_arraycopy,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3221 "jint_arraycopy");
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3222 #else
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3223 // In 32 bit jints are always HeapWordSize aligned, so always use the aligned version
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3224 // (in fact in 32bit we always have a pre-loop part even in the aligned version,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3225 // because it uses 64-bit loads/stores, so the aligned flag is actually ignored).
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3226 StubRoutines::_jint_disjoint_arraycopy = StubRoutines::_arrayof_jint_disjoint_arraycopy;
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3227 StubRoutines::_jint_arraycopy = StubRoutines::_arrayof_jint_arraycopy;
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3228 #endif
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3229
2324
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3230
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3231 //*** jlong
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3232 // It is always aligned
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3233 StubRoutines::_arrayof_jlong_disjoint_arraycopy = generate_disjoint_long_copy(true, &entry,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3234 "arrayof_jlong_disjoint_arraycopy");
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3235 StubRoutines::_arrayof_jlong_arraycopy = generate_conjoint_long_copy(true, entry, &entry_jlong_arraycopy,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3236 "arrayof_jlong_arraycopy");
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3237 StubRoutines::_jlong_disjoint_arraycopy = StubRoutines::_arrayof_jlong_disjoint_arraycopy;
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3238 StubRoutines::_jlong_arraycopy = StubRoutines::_arrayof_jlong_arraycopy;
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3239
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3240
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3241 //*** oops
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3242 // Aligned versions
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3243 StubRoutines::_arrayof_oop_disjoint_arraycopy = generate_disjoint_oop_copy(true, &entry,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3244 "arrayof_oop_disjoint_arraycopy");
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3245 StubRoutines::_arrayof_oop_arraycopy = generate_conjoint_oop_copy(true, entry, &entry_oop_arraycopy,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3246 "arrayof_oop_arraycopy");
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3247 // Aligned versions without pre-barriers
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3248 StubRoutines::_arrayof_oop_disjoint_arraycopy_uninit = generate_disjoint_oop_copy(true, &entry,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3249 "arrayof_oop_disjoint_arraycopy_uninit",
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3250 /*dest_uninitialized*/true);
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3251 StubRoutines::_arrayof_oop_arraycopy_uninit = generate_conjoint_oop_copy(true, entry, NULL,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3252 "arrayof_oop_arraycopy_uninit",
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3253 /*dest_uninitialized*/true);
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3254 #ifdef _LP64
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3255 if (UseCompressedOops) {
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3256 // With compressed oops we need unaligned versions, notice that we overwrite entry_oop_arraycopy.
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3257 StubRoutines::_oop_disjoint_arraycopy = generate_disjoint_oop_copy(false, &entry,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3258 "oop_disjoint_arraycopy");
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3259 StubRoutines::_oop_arraycopy = generate_conjoint_oop_copy(false, entry, &entry_oop_arraycopy,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3260 "oop_arraycopy");
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3261 // Unaligned versions without pre-barriers
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3262 StubRoutines::_oop_disjoint_arraycopy_uninit = generate_disjoint_oop_copy(false, &entry,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3263 "oop_disjoint_arraycopy_uninit",
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3264 /*dest_uninitialized*/true);
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3265 StubRoutines::_oop_arraycopy_uninit = generate_conjoint_oop_copy(false, entry, NULL,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3266 "oop_arraycopy_uninit",
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3267 /*dest_uninitialized*/true);
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3268 } else
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3269 #endif
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3270 {
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3271 // oop arraycopy is always aligned on 32bit and 64bit without compressed oops
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3272 StubRoutines::_oop_disjoint_arraycopy = StubRoutines::_arrayof_oop_disjoint_arraycopy;
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3273 StubRoutines::_oop_arraycopy = StubRoutines::_arrayof_oop_arraycopy;
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3274 StubRoutines::_oop_disjoint_arraycopy_uninit = StubRoutines::_arrayof_oop_disjoint_arraycopy_uninit;
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3275 StubRoutines::_oop_arraycopy_uninit = StubRoutines::_arrayof_oop_arraycopy_uninit;
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3276 }
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3277
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3278 StubRoutines::_checkcast_arraycopy = generate_checkcast_copy("checkcast_arraycopy", &entry_checkcast_arraycopy);
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3279 StubRoutines::_checkcast_arraycopy_uninit = generate_checkcast_copy("checkcast_arraycopy_uninit", NULL,
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3280 /*dest_uninitialized*/true);
0ac769a57c64 6627983: G1: Bad oop deference during marking
iveresov
parents: 2313
diff changeset
3281
2313
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3282 StubRoutines::_unsafe_arraycopy = generate_unsafe_copy("unsafe_arraycopy",
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3283 entry_jbyte_arraycopy,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3284 entry_jshort_arraycopy,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3285 entry_jint_arraycopy,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3286 entry_jlong_arraycopy);
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3287 StubRoutines::_generic_arraycopy = generate_generic_copy("generic_arraycopy",
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3288 entry_jbyte_arraycopy,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3289 entry_jshort_arraycopy,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3290 entry_jint_arraycopy,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3291 entry_oop_arraycopy,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3292 entry_jlong_arraycopy,
d89a22843c62 7020521: arraycopy stubs place prebarriers incorrectly
iveresov
parents: 1972
diff changeset
3293 entry_checkcast_arraycopy);
1763
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
3294
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
3295 StubRoutines::_jbyte_fill = generate_fill(T_BYTE, false, "jbyte_fill");
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
3296 StubRoutines::_jshort_fill = generate_fill(T_SHORT, false, "jshort_fill");
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
3297 StubRoutines::_jint_fill = generate_fill(T_INT, false, "jint_fill");
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
3298 StubRoutines::_arrayof_jbyte_fill = generate_fill(T_BYTE, true, "arrayof_jbyte_fill");
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
3299 StubRoutines::_arrayof_jshort_fill = generate_fill(T_SHORT, true, "arrayof_jshort_fill");
d6f45b55c972 4809552: Optimize Arrays.fill(...)
never
parents: 1655
diff changeset
3300 StubRoutines::_arrayof_jint_fill = generate_fill(T_INT, true, "arrayof_jint_fill");
3892
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3301
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3302 if (UseBlockZeroing) {
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3303 StubRoutines::_zero_aligned_words = generate_zero_aligned_words("zero_aligned_words");
baf763f388e6 7059037: Use BIS for zeroing on T4
kvn
parents: 3839
diff changeset
3304 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
3305 }
a61af66fc99e Initial load
duke
parents:
diff changeset
3306
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3307 address generate_aescrypt_encryptBlock() {
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3308 // required since we read expanded key 'int' array starting first element without alignment considerations
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3309 assert((arrayOopDesc::base_offset_in_bytes(T_INT) & 7) == 0,
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3310 "the following code assumes that first element of an int array is aligned to 8 bytes");
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3311 __ align(CodeEntryAlignment);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3312 StubCodeMark mark(this, "StubRoutines", "aescrypt_encryptBlock");
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3313 Label L_load_misaligned_input, L_load_expanded_key, L_doLast128bit, L_storeOutput, L_store_misaligned_output;
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3314 address start = __ pc();
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3315 Register from = O0; // source byte array
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3316 Register to = O1; // destination byte array
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3317 Register key = O2; // expanded key array
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3318 const Register keylen = O4; //reg for storing expanded key array length
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3319
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3320 // read expanded key length
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3321 __ ldsw(Address(key, arrayOopDesc::length_offset_in_bytes() - arrayOopDesc::base_offset_in_bytes(T_INT)), keylen, 0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3322
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3323 // Method to address arbitrary alignment for load instructions:
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3324 // Check last 3 bits of 'from' address to see if it is aligned to 8-byte boundary
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3325 // If zero/aligned then continue with double FP load instructions
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3326 // If not zero/mis-aligned then alignaddr will set GSR.align with number of bytes to skip during faligndata
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3327 // alignaddr will also convert arbitrary aligned 'from' address to nearest 8-byte aligned address
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3328 // load 3 * 8-byte components (to read 16 bytes input) in 3 different FP regs starting at this aligned address
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3329 // faligndata will then extract (based on GSR.align value) the appropriate 8 bytes from the 2 source regs
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3330
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3331 // check for 8-byte alignment since source byte array may have an arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3332 __ andcc(from, 7, G0);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3333 __ br(Assembler::notZero, true, Assembler::pn, L_load_misaligned_input);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3334 __ delayed()->alignaddr(from, G0, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3335
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3336 // aligned case: load input into F54-F56
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3337 __ ldf(FloatRegisterImpl::D, from, 0, F54);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3338 __ ldf(FloatRegisterImpl::D, from, 8, F56);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3339 __ ba_short(L_load_expanded_key);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3340
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3341 __ BIND(L_load_misaligned_input);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3342 __ ldf(FloatRegisterImpl::D, from, 0, F54);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3343 __ ldf(FloatRegisterImpl::D, from, 8, F56);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3344 __ ldf(FloatRegisterImpl::D, from, 16, F58);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3345 __ faligndata(F54, F56, F54);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3346 __ faligndata(F56, F58, F56);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3347
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3348 __ BIND(L_load_expanded_key);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3349 // Since we load expanded key buffers starting first element, 8-byte alignment is guaranteed
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3350 for ( int i = 0; i <= 38; i += 2 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3351 __ ldf(FloatRegisterImpl::D, key, i*4, as_FloatRegister(i));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3352 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3353
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3354 // perform cipher transformation
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3355 __ fxor(FloatRegisterImpl::D, F0, F54, F54);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3356 __ fxor(FloatRegisterImpl::D, F2, F56, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3357 // rounds 1 through 8
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3358 for ( int i = 4; i <= 28; i += 8 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3359 __ aes_eround01(as_FloatRegister(i), F54, F56, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3360 __ aes_eround23(as_FloatRegister(i+2), F54, F56, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3361 __ aes_eround01(as_FloatRegister(i+4), F58, F60, F54);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3362 __ aes_eround23(as_FloatRegister(i+6), F58, F60, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3363 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3364 __ aes_eround01(F36, F54, F56, F58); //round 9
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3365 __ aes_eround23(F38, F54, F56, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3366
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3367 // 128-bit original key size
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3368 __ cmp_and_brx_short(keylen, 44, Assembler::equal, Assembler::pt, L_doLast128bit);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3369
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3370 for ( int i = 40; i <= 50; i += 2 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3371 __ ldf(FloatRegisterImpl::D, key, i*4, as_FloatRegister(i) );
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3372 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3373 __ aes_eround01(F40, F58, F60, F54); //round 10
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3374 __ aes_eround23(F42, F58, F60, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3375 __ aes_eround01(F44, F54, F56, F58); //round 11
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3376 __ aes_eround23(F46, F54, F56, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3377
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3378 // 192-bit original key size
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3379 __ cmp_and_brx_short(keylen, 52, Assembler::equal, Assembler::pt, L_storeOutput);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3380
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3381 __ ldf(FloatRegisterImpl::D, key, 208, F52);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3382 __ aes_eround01(F48, F58, F60, F54); //round 12
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3383 __ aes_eround23(F50, F58, F60, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3384 __ ldf(FloatRegisterImpl::D, key, 216, F46);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3385 __ ldf(FloatRegisterImpl::D, key, 224, F48);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3386 __ ldf(FloatRegisterImpl::D, key, 232, F50);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3387 __ aes_eround01(F52, F54, F56, F58); //round 13
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3388 __ aes_eround23(F46, F54, F56, F60);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3389 __ ba_short(L_storeOutput);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3390
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3391 __ BIND(L_doLast128bit);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3392 __ ldf(FloatRegisterImpl::D, key, 160, F48);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3393 __ ldf(FloatRegisterImpl::D, key, 168, F50);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3394
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3395 __ BIND(L_storeOutput);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3396 // perform last round of encryption common for all key sizes
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3397 __ aes_eround01_l(F48, F58, F60, F54); //last round
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3398 __ aes_eround23_l(F50, F58, F60, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3399
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3400 // Method to address arbitrary alignment for store instructions:
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3401 // Check last 3 bits of 'dest' address to see if it is aligned to 8-byte boundary
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3402 // If zero/aligned then continue with double FP store instructions
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3403 // If not zero/mis-aligned then edge8n will generate edge mask in result reg (O3 in below case)
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3404 // Example: If dest address is 0x07 and nearest 8-byte aligned address is 0x00 then edge mask will be 00000001
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3405 // Compute (8-n) where n is # of bytes skipped by partial store(stpartialf) inst from edge mask, n=7 in this case
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3406 // We get the value of n from the andcc that checks 'dest' alignment. n is available in O5 in below case.
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3407 // Set GSR.align to (8-n) using alignaddr
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3408 // Circular byte shift store values by n places so that the original bytes are at correct position for stpartialf
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3409 // Set the arbitrarily aligned 'dest' address to nearest 8-byte aligned address
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3410 // Store (partial) the original first (8-n) bytes starting at the original 'dest' address
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3411 // Negate the edge mask so that the subsequent stpartialf can store the original (8-n-1)th through 8th bytes at appropriate address
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3412 // We need to execute this process for both the 8-byte result values
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3413
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3414 // check for 8-byte alignment since dest byte array may have arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3415 __ andcc(to, 7, O5);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3416 __ br(Assembler::notZero, true, Assembler::pn, L_store_misaligned_output);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3417 __ delayed()->edge8n(to, G0, O3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3418
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3419 // aligned case: store output into the destination array
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3420 __ stf(FloatRegisterImpl::D, F54, to, 0);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3421 __ retl();
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3422 __ delayed()->stf(FloatRegisterImpl::D, F56, to, 8);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3423
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3424 __ BIND(L_store_misaligned_output);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3425 __ add(to, 8, O4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3426 __ mov(8, O2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3427 __ sub(O2, O5, O2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3428 __ alignaddr(O2, G0, O2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3429 __ faligndata(F54, F54, F54);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3430 __ faligndata(F56, F56, F56);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3431 __ and3(to, -8, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3432 __ and3(O4, -8, O4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3433 __ stpartialf(to, O3, F54, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3434 __ stpartialf(O4, O3, F56, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3435 __ add(to, 8, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3436 __ add(O4, 8, O4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3437 __ orn(G0, O3, O3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3438 __ stpartialf(to, O3, F54, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3439 __ retl();
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3440 __ delayed()->stpartialf(O4, O3, F56, Assembler::ASI_PST8_PRIMARY);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3441
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3442 return start;
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3443 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3444
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3445 address generate_aescrypt_decryptBlock() {
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3446 assert((arrayOopDesc::base_offset_in_bytes(T_INT) & 7) == 0,
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3447 "the following code assumes that first element of an int array is aligned to 8 bytes");
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3448 // required since we read original key 'byte' array as well in the decryption stubs
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3449 assert((arrayOopDesc::base_offset_in_bytes(T_BYTE) & 7) == 0,
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3450 "the following code assumes that first element of a byte array is aligned to 8 bytes");
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3451 __ align(CodeEntryAlignment);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3452 StubCodeMark mark(this, "StubRoutines", "aescrypt_decryptBlock");
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3453 address start = __ pc();
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3454 Label L_load_misaligned_input, L_load_original_key, L_expand192bit, L_expand256bit, L_reload_misaligned_input;
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3455 Label L_256bit_transform, L_common_transform, L_store_misaligned_output;
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3456 Register from = O0; // source byte array
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3457 Register to = O1; // destination byte array
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3458 Register key = O2; // expanded key array
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3459 Register original_key = O3; // original key array only required during decryption
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3460 const Register keylen = O4; // reg for storing expanded key array length
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3461
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3462 // read expanded key array length
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3463 __ ldsw(Address(key, arrayOopDesc::length_offset_in_bytes() - arrayOopDesc::base_offset_in_bytes(T_INT)), keylen, 0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3464
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3465 // save 'from' since we may need to recheck alignment in case of 256-bit decryption
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3466 __ mov(from, G1);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3467
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3468 // check for 8-byte alignment since source byte array may have an arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3469 __ andcc(from, 7, G0);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3470 __ br(Assembler::notZero, true, Assembler::pn, L_load_misaligned_input);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3471 __ delayed()->alignaddr(from, G0, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3472
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3473 // aligned case: load input into F52-F54
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3474 __ ldf(FloatRegisterImpl::D, from, 0, F52);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3475 __ ldf(FloatRegisterImpl::D, from, 8, F54);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3476 __ ba_short(L_load_original_key);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3477
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3478 __ BIND(L_load_misaligned_input);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3479 __ ldf(FloatRegisterImpl::D, from, 0, F52);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3480 __ ldf(FloatRegisterImpl::D, from, 8, F54);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3481 __ ldf(FloatRegisterImpl::D, from, 16, F56);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3482 __ faligndata(F52, F54, F52);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3483 __ faligndata(F54, F56, F54);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3484
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3485 __ BIND(L_load_original_key);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3486 // load original key from SunJCE expanded decryption key
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3487 // Since we load original key buffer starting first element, 8-byte alignment is guaranteed
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3488 for ( int i = 0; i <= 3; i++ ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3489 __ ldf(FloatRegisterImpl::S, original_key, i*4, as_FloatRegister(i));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3490 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3491
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3492 // 256-bit original key size
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3493 __ cmp_and_brx_short(keylen, 60, Assembler::equal, Assembler::pn, L_expand256bit);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3494
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3495 // 192-bit original key size
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3496 __ cmp_and_brx_short(keylen, 52, Assembler::equal, Assembler::pn, L_expand192bit);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3497
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3498 // 128-bit original key size
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3499 // perform key expansion since SunJCE decryption-key expansion is not compatible with SPARC crypto instructions
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3500 for ( int i = 0; i <= 36; i += 4 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3501 __ aes_kexpand1(as_FloatRegister(i), as_FloatRegister(i+2), i/4, as_FloatRegister(i+4));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3502 __ aes_kexpand2(as_FloatRegister(i+2), as_FloatRegister(i+4), as_FloatRegister(i+6));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3503 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3504
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3505 // perform 128-bit key specific inverse cipher transformation
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3506 __ fxor(FloatRegisterImpl::D, F42, F54, F54);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3507 __ fxor(FloatRegisterImpl::D, F40, F52, F52);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3508 __ ba_short(L_common_transform);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3509
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3510 __ BIND(L_expand192bit);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3511
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3512 // start loading rest of the 192-bit key
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3513 __ ldf(FloatRegisterImpl::S, original_key, 16, F4);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3514 __ ldf(FloatRegisterImpl::S, original_key, 20, F5);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3515
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3516 // perform key expansion since SunJCE decryption-key expansion is not compatible with SPARC crypto instructions
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3517 for ( int i = 0; i <= 36; i += 6 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3518 __ aes_kexpand1(as_FloatRegister(i), as_FloatRegister(i+4), i/6, as_FloatRegister(i+6));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3519 __ aes_kexpand2(as_FloatRegister(i+2), as_FloatRegister(i+6), as_FloatRegister(i+8));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3520 __ aes_kexpand2(as_FloatRegister(i+4), as_FloatRegister(i+8), as_FloatRegister(i+10));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3521 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3522 __ aes_kexpand1(F42, F46, 7, F48);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3523 __ aes_kexpand2(F44, F48, F50);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3524
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3525 // perform 192-bit key specific inverse cipher transformation
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3526 __ fxor(FloatRegisterImpl::D, F50, F54, F54);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3527 __ fxor(FloatRegisterImpl::D, F48, F52, F52);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3528 __ aes_dround23(F46, F52, F54, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3529 __ aes_dround01(F44, F52, F54, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3530 __ aes_dround23(F42, F56, F58, F54);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3531 __ aes_dround01(F40, F56, F58, F52);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3532 __ ba_short(L_common_transform);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3533
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3534 __ BIND(L_expand256bit);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3535
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3536 // load rest of the 256-bit key
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3537 for ( int i = 4; i <= 7; i++ ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3538 __ ldf(FloatRegisterImpl::S, original_key, i*4, as_FloatRegister(i));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3539 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3540
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3541 // perform key expansion since SunJCE decryption-key expansion is not compatible with SPARC crypto instructions
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3542 for ( int i = 0; i <= 40; i += 8 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3543 __ aes_kexpand1(as_FloatRegister(i), as_FloatRegister(i+6), i/8, as_FloatRegister(i+8));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3544 __ aes_kexpand2(as_FloatRegister(i+2), as_FloatRegister(i+8), as_FloatRegister(i+10));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3545 __ aes_kexpand0(as_FloatRegister(i+4), as_FloatRegister(i+10), as_FloatRegister(i+12));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3546 __ aes_kexpand2(as_FloatRegister(i+6), as_FloatRegister(i+12), as_FloatRegister(i+14));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3547 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3548 __ aes_kexpand1(F48, F54, 6, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3549 __ aes_kexpand2(F50, F56, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3550
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3551 for ( int i = 0; i <= 6; i += 2 ) {
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3552 __ fsrc2(FloatRegisterImpl::D, as_FloatRegister(58-i), as_FloatRegister(i));
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3553 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3554
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3555 // reload original 'from' address
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3556 __ mov(G1, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3557
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3558 // re-check 8-byte alignment
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3559 __ andcc(from, 7, G0);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3560 __ br(Assembler::notZero, true, Assembler::pn, L_reload_misaligned_input);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3561 __ delayed()->alignaddr(from, G0, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3562
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3563 // aligned case: load input into F52-F54
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3564 __ ldf(FloatRegisterImpl::D, from, 0, F52);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3565 __ ldf(FloatRegisterImpl::D, from, 8, F54);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3566 __ ba_short(L_256bit_transform);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3567
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3568 __ BIND(L_reload_misaligned_input);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3569 __ ldf(FloatRegisterImpl::D, from, 0, F52);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3570 __ ldf(FloatRegisterImpl::D, from, 8, F54);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3571 __ ldf(FloatRegisterImpl::D, from, 16, F56);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3572 __ faligndata(F52, F54, F52);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3573 __ faligndata(F54, F56, F54);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3574
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3575 // perform 256-bit key specific inverse cipher transformation
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3576 __ BIND(L_256bit_transform);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3577 __ fxor(FloatRegisterImpl::D, F0, F54, F54);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3578 __ fxor(FloatRegisterImpl::D, F2, F52, F52);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3579 __ aes_dround23(F4, F52, F54, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3580 __ aes_dround01(F6, F52, F54, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3581 __ aes_dround23(F50, F56, F58, F54);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3582 __ aes_dround01(F48, F56, F58, F52);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3583 __ aes_dround23(F46, F52, F54, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3584 __ aes_dround01(F44, F52, F54, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3585 __ aes_dround23(F42, F56, F58, F54);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3586 __ aes_dround01(F40, F56, F58, F52);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3587
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3588 for ( int i = 0; i <= 7; i++ ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3589 __ ldf(FloatRegisterImpl::S, original_key, i*4, as_FloatRegister(i));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3590 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3591
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3592 // perform inverse cipher transformations common for all key sizes
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3593 __ BIND(L_common_transform);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3594 for ( int i = 38; i >= 6; i -= 8 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3595 __ aes_dround23(as_FloatRegister(i), F52, F54, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3596 __ aes_dround01(as_FloatRegister(i-2), F52, F54, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3597 if ( i != 6) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3598 __ aes_dround23(as_FloatRegister(i-4), F56, F58, F54);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3599 __ aes_dround01(as_FloatRegister(i-6), F56, F58, F52);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3600 } else {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3601 __ aes_dround23_l(as_FloatRegister(i-4), F56, F58, F54);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3602 __ aes_dround01_l(as_FloatRegister(i-6), F56, F58, F52);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3603 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3604 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3605
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3606 // check for 8-byte alignment since dest byte array may have arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3607 __ andcc(to, 7, O5);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3608 __ br(Assembler::notZero, true, Assembler::pn, L_store_misaligned_output);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3609 __ delayed()->edge8n(to, G0, O3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3610
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3611 // aligned case: store output into the destination array
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3612 __ stf(FloatRegisterImpl::D, F52, to, 0);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3613 __ retl();
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3614 __ delayed()->stf(FloatRegisterImpl::D, F54, to, 8);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3615
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3616 __ BIND(L_store_misaligned_output);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3617 __ add(to, 8, O4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3618 __ mov(8, O2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3619 __ sub(O2, O5, O2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3620 __ alignaddr(O2, G0, O2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3621 __ faligndata(F52, F52, F52);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3622 __ faligndata(F54, F54, F54);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3623 __ and3(to, -8, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3624 __ and3(O4, -8, O4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3625 __ stpartialf(to, O3, F52, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3626 __ stpartialf(O4, O3, F54, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3627 __ add(to, 8, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3628 __ add(O4, 8, O4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3629 __ orn(G0, O3, O3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3630 __ stpartialf(to, O3, F52, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3631 __ retl();
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3632 __ delayed()->stpartialf(O4, O3, F54, Assembler::ASI_PST8_PRIMARY);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3633
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3634 return start;
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3635 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3636
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3637 address generate_cipherBlockChaining_encryptAESCrypt() {
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3638 assert((arrayOopDesc::base_offset_in_bytes(T_INT) & 7) == 0,
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3639 "the following code assumes that first element of an int array is aligned to 8 bytes");
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3640 assert((arrayOopDesc::base_offset_in_bytes(T_BYTE) & 7) == 0,
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3641 "the following code assumes that first element of a byte array is aligned to 8 bytes");
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3642 __ align(CodeEntryAlignment);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3643 StubCodeMark mark(this, "StubRoutines", "cipherBlockChaining_encryptAESCrypt");
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3644 Label L_cbcenc128, L_load_misaligned_input_128bit, L_128bit_transform, L_store_misaligned_output_128bit;
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3645 Label L_check_loop_end_128bit, L_cbcenc192, L_load_misaligned_input_192bit, L_192bit_transform;
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3646 Label L_store_misaligned_output_192bit, L_check_loop_end_192bit, L_cbcenc256, L_load_misaligned_input_256bit;
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3647 Label L_256bit_transform, L_store_misaligned_output_256bit, L_check_loop_end_256bit;
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3648 address start = __ pc();
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3649 Register from = I0; // source byte array
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3650 Register to = I1; // destination byte array
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3651 Register key = I2; // expanded key array
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3652 Register rvec = I3; // init vector
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3653 const Register len_reg = I4; // cipher length
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3654 const Register keylen = I5; // reg for storing expanded key array length
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3655
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3656 __ save_frame(0);
17954
0342d80559e0 8043274: Test compiler/7184394/TestAESMain.java gets NPE on solaris
kvn
parents: 17939
diff changeset
3657 // save cipher len to return in the end
0342d80559e0 8043274: Test compiler/7184394/TestAESMain.java gets NPE on solaris
kvn
parents: 17939
diff changeset
3658 __ mov(len_reg, L0);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3659
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3660 // read expanded key length
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3661 __ ldsw(Address(key, arrayOopDesc::length_offset_in_bytes() - arrayOopDesc::base_offset_in_bytes(T_INT)), keylen, 0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3662
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3663 // load initial vector, 8-byte alignment is guranteed
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3664 __ ldf(FloatRegisterImpl::D, rvec, 0, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3665 __ ldf(FloatRegisterImpl::D, rvec, 8, F62);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3666 // load key, 8-byte alignment is guranteed
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3667 __ ldx(key,0,G1);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3668 __ ldx(key,8,G5);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3669
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3670 // start loading expanded key, 8-byte alignment is guranteed
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3671 for ( int i = 0, j = 16; i <= 38; i += 2, j += 8 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3672 __ ldf(FloatRegisterImpl::D, key, j, as_FloatRegister(i));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3673 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3674
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3675 // 128-bit original key size
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3676 __ cmp_and_brx_short(keylen, 44, Assembler::equal, Assembler::pt, L_cbcenc128);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3677
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3678 for ( int i = 40, j = 176; i <= 46; i += 2, j += 8 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3679 __ ldf(FloatRegisterImpl::D, key, j, as_FloatRegister(i));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3680 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3681
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3682 // 192-bit original key size
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3683 __ cmp_and_brx_short(keylen, 52, Assembler::equal, Assembler::pt, L_cbcenc192);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3684
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3685 for ( int i = 48, j = 208; i <= 54; i += 2, j += 8 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3686 __ ldf(FloatRegisterImpl::D, key, j, as_FloatRegister(i));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3687 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3688
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3689 // 256-bit original key size
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3690 __ ba_short(L_cbcenc256);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3691
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3692 __ align(OptoLoopAlignment);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3693 __ BIND(L_cbcenc128);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3694 // check for 8-byte alignment since source byte array may have an arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3695 __ andcc(from, 7, G0);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3696 __ br(Assembler::notZero, true, Assembler::pn, L_load_misaligned_input_128bit);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3697 __ delayed()->mov(from, L1); // save original 'from' address before alignaddr
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3698
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3699 // aligned case: load input into G3 and G4
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3700 __ ldx(from,0,G3);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3701 __ ldx(from,8,G4);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3702 __ ba_short(L_128bit_transform);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3703
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3704 __ BIND(L_load_misaligned_input_128bit);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3705 // can clobber F48, F50 and F52 as they are not used in 128 and 192-bit key encryption
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3706 __ alignaddr(from, G0, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3707 __ ldf(FloatRegisterImpl::D, from, 0, F48);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3708 __ ldf(FloatRegisterImpl::D, from, 8, F50);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3709 __ ldf(FloatRegisterImpl::D, from, 16, F52);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3710 __ faligndata(F48, F50, F48);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3711 __ faligndata(F50, F52, F50);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3712 __ movdtox(F48, G3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3713 __ movdtox(F50, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3714 __ mov(L1, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3715
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3716 __ BIND(L_128bit_transform);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3717 __ xor3(G1,G3,G3);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3718 __ xor3(G5,G4,G4);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3719 __ movxtod(G3,F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3720 __ movxtod(G4,F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3721 __ fxor(FloatRegisterImpl::D, F60, F56, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3722 __ fxor(FloatRegisterImpl::D, F62, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3723
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3724 // TEN_EROUNDS
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3725 for ( int i = 0; i <= 32; i += 8 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3726 __ aes_eround01(as_FloatRegister(i), F60, F62, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3727 __ aes_eround23(as_FloatRegister(i+2), F60, F62, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3728 if (i != 32 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3729 __ aes_eround01(as_FloatRegister(i+4), F56, F58, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3730 __ aes_eround23(as_FloatRegister(i+6), F56, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3731 } else {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3732 __ aes_eround01_l(as_FloatRegister(i+4), F56, F58, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3733 __ aes_eround23_l(as_FloatRegister(i+6), F56, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3734 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3735 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3736
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3737 // check for 8-byte alignment since dest byte array may have arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3738 __ andcc(to, 7, L1);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3739 __ br(Assembler::notZero, true, Assembler::pn, L_store_misaligned_output_128bit);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3740 __ delayed()->edge8n(to, G0, L2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3741
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3742 // aligned case: store output into the destination array
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3743 __ stf(FloatRegisterImpl::D, F60, to, 0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3744 __ stf(FloatRegisterImpl::D, F62, to, 8);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3745 __ ba_short(L_check_loop_end_128bit);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3746
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3747 __ BIND(L_store_misaligned_output_128bit);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3748 __ add(to, 8, L3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3749 __ mov(8, L4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3750 __ sub(L4, L1, L4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3751 __ alignaddr(L4, G0, L4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3752 // save cipher text before circular right shift
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3753 // as it needs to be stored as iv for next block (see code before next retl)
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3754 __ movdtox(F60, L6);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3755 __ movdtox(F62, L7);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3756 __ faligndata(F60, F60, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3757 __ faligndata(F62, F62, F62);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3758 __ mov(to, L5);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3759 __ and3(to, -8, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3760 __ and3(L3, -8, L3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3761 __ stpartialf(to, L2, F60, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3762 __ stpartialf(L3, L2, F62, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3763 __ add(to, 8, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3764 __ add(L3, 8, L3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3765 __ orn(G0, L2, L2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3766 __ stpartialf(to, L2, F60, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3767 __ stpartialf(L3, L2, F62, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3768 __ mov(L5, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3769 __ movxtod(L6, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3770 __ movxtod(L7, F62);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3771
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3772 __ BIND(L_check_loop_end_128bit);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3773 __ add(from, 16, from);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3774 __ add(to, 16, to);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3775 __ subcc(len_reg, 16, len_reg);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3776 __ br(Assembler::notEqual, false, Assembler::pt, L_cbcenc128);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3777 __ delayed()->nop();
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3778 // re-init intial vector for next block, 8-byte alignment is guaranteed
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3779 __ stf(FloatRegisterImpl::D, F60, rvec, 0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3780 __ stf(FloatRegisterImpl::D, F62, rvec, 8);
17954
0342d80559e0 8043274: Test compiler/7184394/TestAESMain.java gets NPE on solaris
kvn
parents: 17939
diff changeset
3781 __ mov(L0, I0);
0342d80559e0 8043274: Test compiler/7184394/TestAESMain.java gets NPE on solaris
kvn
parents: 17939
diff changeset
3782 __ ret();
0342d80559e0 8043274: Test compiler/7184394/TestAESMain.java gets NPE on solaris
kvn
parents: 17939
diff changeset
3783 __ delayed()->restore();
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3784
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3785 __ align(OptoLoopAlignment);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3786 __ BIND(L_cbcenc192);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3787 // check for 8-byte alignment since source byte array may have an arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3788 __ andcc(from, 7, G0);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3789 __ br(Assembler::notZero, true, Assembler::pn, L_load_misaligned_input_192bit);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3790 __ delayed()->mov(from, L1); // save original 'from' address before alignaddr
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3791
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3792 // aligned case: load input into G3 and G4
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3793 __ ldx(from,0,G3);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3794 __ ldx(from,8,G4);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3795 __ ba_short(L_192bit_transform);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3796
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3797 __ BIND(L_load_misaligned_input_192bit);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3798 // can clobber F48, F50 and F52 as they are not used in 128 and 192-bit key encryption
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3799 __ alignaddr(from, G0, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3800 __ ldf(FloatRegisterImpl::D, from, 0, F48);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3801 __ ldf(FloatRegisterImpl::D, from, 8, F50);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3802 __ ldf(FloatRegisterImpl::D, from, 16, F52);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3803 __ faligndata(F48, F50, F48);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3804 __ faligndata(F50, F52, F50);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3805 __ movdtox(F48, G3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3806 __ movdtox(F50, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3807 __ mov(L1, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3808
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3809 __ BIND(L_192bit_transform);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3810 __ xor3(G1,G3,G3);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3811 __ xor3(G5,G4,G4);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3812 __ movxtod(G3,F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3813 __ movxtod(G4,F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3814 __ fxor(FloatRegisterImpl::D, F60, F56, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3815 __ fxor(FloatRegisterImpl::D, F62, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3816
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3817 // TWELEVE_EROUNDS
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3818 for ( int i = 0; i <= 40; i += 8 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3819 __ aes_eround01(as_FloatRegister(i), F60, F62, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3820 __ aes_eround23(as_FloatRegister(i+2), F60, F62, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3821 if (i != 40 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3822 __ aes_eround01(as_FloatRegister(i+4), F56, F58, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3823 __ aes_eround23(as_FloatRegister(i+6), F56, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3824 } else {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3825 __ aes_eround01_l(as_FloatRegister(i+4), F56, F58, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3826 __ aes_eround23_l(as_FloatRegister(i+6), F56, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3827 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3828 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3829
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3830 // check for 8-byte alignment since dest byte array may have arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3831 __ andcc(to, 7, L1);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3832 __ br(Assembler::notZero, true, Assembler::pn, L_store_misaligned_output_192bit);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3833 __ delayed()->edge8n(to, G0, L2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3834
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3835 // aligned case: store output into the destination array
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3836 __ stf(FloatRegisterImpl::D, F60, to, 0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3837 __ stf(FloatRegisterImpl::D, F62, to, 8);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3838 __ ba_short(L_check_loop_end_192bit);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3839
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3840 __ BIND(L_store_misaligned_output_192bit);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3841 __ add(to, 8, L3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3842 __ mov(8, L4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3843 __ sub(L4, L1, L4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3844 __ alignaddr(L4, G0, L4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3845 __ movdtox(F60, L6);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3846 __ movdtox(F62, L7);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3847 __ faligndata(F60, F60, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3848 __ faligndata(F62, F62, F62);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3849 __ mov(to, L5);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3850 __ and3(to, -8, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3851 __ and3(L3, -8, L3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3852 __ stpartialf(to, L2, F60, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3853 __ stpartialf(L3, L2, F62, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3854 __ add(to, 8, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3855 __ add(L3, 8, L3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3856 __ orn(G0, L2, L2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3857 __ stpartialf(to, L2, F60, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3858 __ stpartialf(L3, L2, F62, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3859 __ mov(L5, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3860 __ movxtod(L6, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3861 __ movxtod(L7, F62);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3862
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3863 __ BIND(L_check_loop_end_192bit);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3864 __ add(from, 16, from);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3865 __ subcc(len_reg, 16, len_reg);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3866 __ add(to, 16, to);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3867 __ br(Assembler::notEqual, false, Assembler::pt, L_cbcenc192);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3868 __ delayed()->nop();
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3869 // re-init intial vector for next block, 8-byte alignment is guaranteed
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3870 __ stf(FloatRegisterImpl::D, F60, rvec, 0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3871 __ stf(FloatRegisterImpl::D, F62, rvec, 8);
17954
0342d80559e0 8043274: Test compiler/7184394/TestAESMain.java gets NPE on solaris
kvn
parents: 17939
diff changeset
3872 __ mov(L0, I0);
0342d80559e0 8043274: Test compiler/7184394/TestAESMain.java gets NPE on solaris
kvn
parents: 17939
diff changeset
3873 __ ret();
0342d80559e0 8043274: Test compiler/7184394/TestAESMain.java gets NPE on solaris
kvn
parents: 17939
diff changeset
3874 __ delayed()->restore();
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3875
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3876 __ align(OptoLoopAlignment);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3877 __ BIND(L_cbcenc256);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3878 // check for 8-byte alignment since source byte array may have an arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3879 __ andcc(from, 7, G0);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3880 __ br(Assembler::notZero, true, Assembler::pn, L_load_misaligned_input_256bit);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3881 __ delayed()->mov(from, L1); // save original 'from' address before alignaddr
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3882
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3883 // aligned case: load input into G3 and G4
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3884 __ ldx(from,0,G3);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3885 __ ldx(from,8,G4);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3886 __ ba_short(L_256bit_transform);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3887
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3888 __ BIND(L_load_misaligned_input_256bit);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3889 // cannot clobber F48, F50 and F52. F56, F58 can be used though
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3890 __ alignaddr(from, G0, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3891 __ movdtox(F60, L2); // save F60 before overwriting
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3892 __ ldf(FloatRegisterImpl::D, from, 0, F56);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3893 __ ldf(FloatRegisterImpl::D, from, 8, F58);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3894 __ ldf(FloatRegisterImpl::D, from, 16, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3895 __ faligndata(F56, F58, F56);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3896 __ faligndata(F58, F60, F58);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3897 __ movdtox(F56, G3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3898 __ movdtox(F58, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3899 __ mov(L1, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3900 __ movxtod(L2, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3901
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3902 __ BIND(L_256bit_transform);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3903 __ xor3(G1,G3,G3);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3904 __ xor3(G5,G4,G4);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3905 __ movxtod(G3,F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3906 __ movxtod(G4,F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3907 __ fxor(FloatRegisterImpl::D, F60, F56, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3908 __ fxor(FloatRegisterImpl::D, F62, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3909
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3910 // FOURTEEN_EROUNDS
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3911 for ( int i = 0; i <= 48; i += 8 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3912 __ aes_eround01(as_FloatRegister(i), F60, F62, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3913 __ aes_eround23(as_FloatRegister(i+2), F60, F62, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3914 if (i != 48 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3915 __ aes_eround01(as_FloatRegister(i+4), F56, F58, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3916 __ aes_eround23(as_FloatRegister(i+6), F56, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3917 } else {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3918 __ aes_eround01_l(as_FloatRegister(i+4), F56, F58, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3919 __ aes_eround23_l(as_FloatRegister(i+6), F56, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3920 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3921 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3922
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3923 // check for 8-byte alignment since dest byte array may have arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3924 __ andcc(to, 7, L1);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3925 __ br(Assembler::notZero, true, Assembler::pn, L_store_misaligned_output_256bit);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3926 __ delayed()->edge8n(to, G0, L2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3927
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3928 // aligned case: store output into the destination array
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3929 __ stf(FloatRegisterImpl::D, F60, to, 0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3930 __ stf(FloatRegisterImpl::D, F62, to, 8);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3931 __ ba_short(L_check_loop_end_256bit);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3932
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3933 __ BIND(L_store_misaligned_output_256bit);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3934 __ add(to, 8, L3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3935 __ mov(8, L4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3936 __ sub(L4, L1, L4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3937 __ alignaddr(L4, G0, L4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3938 __ movdtox(F60, L6);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3939 __ movdtox(F62, L7);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3940 __ faligndata(F60, F60, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3941 __ faligndata(F62, F62, F62);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3942 __ mov(to, L5);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3943 __ and3(to, -8, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3944 __ and3(L3, -8, L3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3945 __ stpartialf(to, L2, F60, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3946 __ stpartialf(L3, L2, F62, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3947 __ add(to, 8, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3948 __ add(L3, 8, L3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3949 __ orn(G0, L2, L2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3950 __ stpartialf(to, L2, F60, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3951 __ stpartialf(L3, L2, F62, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3952 __ mov(L5, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3953 __ movxtod(L6, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3954 __ movxtod(L7, F62);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3955
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3956 __ BIND(L_check_loop_end_256bit);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3957 __ add(from, 16, from);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3958 __ subcc(len_reg, 16, len_reg);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3959 __ add(to, 16, to);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3960 __ br(Assembler::notEqual, false, Assembler::pt, L_cbcenc256);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3961 __ delayed()->nop();
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3962 // re-init intial vector for next block, 8-byte alignment is guaranteed
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3963 __ stf(FloatRegisterImpl::D, F60, rvec, 0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3964 __ stf(FloatRegisterImpl::D, F62, rvec, 8);
17954
0342d80559e0 8043274: Test compiler/7184394/TestAESMain.java gets NPE on solaris
kvn
parents: 17939
diff changeset
3965 __ mov(L0, I0);
0342d80559e0 8043274: Test compiler/7184394/TestAESMain.java gets NPE on solaris
kvn
parents: 17939
diff changeset
3966 __ ret();
0342d80559e0 8043274: Test compiler/7184394/TestAESMain.java gets NPE on solaris
kvn
parents: 17939
diff changeset
3967 __ delayed()->restore();
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3968
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3969 return start;
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3970 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3971
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3972 address generate_cipherBlockChaining_decryptAESCrypt_Parallel() {
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3973 assert((arrayOopDesc::base_offset_in_bytes(T_INT) & 7) == 0,
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3974 "the following code assumes that first element of an int array is aligned to 8 bytes");
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3975 assert((arrayOopDesc::base_offset_in_bytes(T_BYTE) & 7) == 0,
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3976 "the following code assumes that first element of a byte array is aligned to 8 bytes");
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3977 __ align(CodeEntryAlignment);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3978 StubCodeMark mark(this, "StubRoutines", "cipherBlockChaining_decryptAESCrypt");
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3979 Label L_cbcdec_end, L_expand192bit, L_expand256bit, L_dec_first_block_start;
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3980 Label L_dec_first_block128, L_dec_first_block192, L_dec_next2_blocks128, L_dec_next2_blocks192, L_dec_next2_blocks256;
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3981 Label L_load_misaligned_input_first_block, L_transform_first_block, L_load_misaligned_next2_blocks128, L_transform_next2_blocks128;
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3982 Label L_load_misaligned_next2_blocks192, L_transform_next2_blocks192, L_load_misaligned_next2_blocks256, L_transform_next2_blocks256;
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3983 Label L_store_misaligned_output_first_block, L_check_decrypt_end, L_store_misaligned_output_next2_blocks128;
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3984 Label L_check_decrypt_loop_end128, L_store_misaligned_output_next2_blocks192, L_check_decrypt_loop_end192;
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
3985 Label L_store_misaligned_output_next2_blocks256, L_check_decrypt_loop_end256;
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3986 address start = __ pc();
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3987 Register from = I0; // source byte array
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3988 Register to = I1; // destination byte array
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3989 Register key = I2; // expanded key array
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3990 Register rvec = I3; // init vector
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3991 const Register len_reg = I4; // cipher length
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3992 const Register original_key = I5; // original key array only required during decryption
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3993 const Register keylen = L6; // reg for storing expanded key array length
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3994
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3995 __ save_frame(0); //args are read from I* registers since we save the frame in the beginning
17954
0342d80559e0 8043274: Test compiler/7184394/TestAESMain.java gets NPE on solaris
kvn
parents: 17939
diff changeset
3996 // save cipher len to return in the end
0342d80559e0 8043274: Test compiler/7184394/TestAESMain.java gets NPE on solaris
kvn
parents: 17939
diff changeset
3997 __ mov(len_reg, L7);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3998
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
3999 // load original key from SunJCE expanded decryption key
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4000 // Since we load original key buffer starting first element, 8-byte alignment is guaranteed
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4001 for ( int i = 0; i <= 3; i++ ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4002 __ ldf(FloatRegisterImpl::S, original_key, i*4, as_FloatRegister(i));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4003 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4004
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4005 // load initial vector, 8-byte alignment is guaranteed
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4006 __ ldx(rvec,0,L0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4007 __ ldx(rvec,8,L1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4008
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4009 // read expanded key array length
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4010 __ ldsw(Address(key, arrayOopDesc::length_offset_in_bytes() - arrayOopDesc::base_offset_in_bytes(T_INT)), keylen, 0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4011
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4012 // 256-bit original key size
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4013 __ cmp_and_brx_short(keylen, 60, Assembler::equal, Assembler::pn, L_expand256bit);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4014
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4015 // 192-bit original key size
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4016 __ cmp_and_brx_short(keylen, 52, Assembler::equal, Assembler::pn, L_expand192bit);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4017
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4018 // 128-bit original key size
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4019 // perform key expansion since SunJCE decryption-key expansion is not compatible with SPARC crypto instructions
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4020 for ( int i = 0; i <= 36; i += 4 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4021 __ aes_kexpand1(as_FloatRegister(i), as_FloatRegister(i+2), i/4, as_FloatRegister(i+4));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4022 __ aes_kexpand2(as_FloatRegister(i+2), as_FloatRegister(i+4), as_FloatRegister(i+6));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4023 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4024
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4025 // load expanded key[last-1] and key[last] elements
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4026 __ movdtox(F40,L2);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4027 __ movdtox(F42,L3);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4028
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4029 __ and3(len_reg, 16, L4);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4030 __ br_null_short(L4, Assembler::pt, L_dec_next2_blocks128);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4031 __ nop();
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4032
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4033 __ ba_short(L_dec_first_block_start);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4034
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4035 __ BIND(L_expand192bit);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4036 // load rest of the 192-bit key
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4037 __ ldf(FloatRegisterImpl::S, original_key, 16, F4);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4038 __ ldf(FloatRegisterImpl::S, original_key, 20, F5);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4039
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4040 // perform key expansion since SunJCE decryption-key expansion is not compatible with SPARC crypto instructions
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4041 for ( int i = 0; i <= 36; i += 6 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4042 __ aes_kexpand1(as_FloatRegister(i), as_FloatRegister(i+4), i/6, as_FloatRegister(i+6));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4043 __ aes_kexpand2(as_FloatRegister(i+2), as_FloatRegister(i+6), as_FloatRegister(i+8));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4044 __ aes_kexpand2(as_FloatRegister(i+4), as_FloatRegister(i+8), as_FloatRegister(i+10));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4045 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4046 __ aes_kexpand1(F42, F46, 7, F48);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4047 __ aes_kexpand2(F44, F48, F50);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4048
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4049 // load expanded key[last-1] and key[last] elements
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4050 __ movdtox(F48,L2);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4051 __ movdtox(F50,L3);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4052
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4053 __ and3(len_reg, 16, L4);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4054 __ br_null_short(L4, Assembler::pt, L_dec_next2_blocks192);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4055 __ nop();
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4056
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4057 __ ba_short(L_dec_first_block_start);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4058
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4059 __ BIND(L_expand256bit);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4060 // load rest of the 256-bit key
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4061 for ( int i = 4; i <= 7; i++ ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4062 __ ldf(FloatRegisterImpl::S, original_key, i*4, as_FloatRegister(i));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4063 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4064
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4065 // perform key expansion since SunJCE decryption-key expansion is not compatible with SPARC crypto instructions
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4066 for ( int i = 0; i <= 40; i += 8 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4067 __ aes_kexpand1(as_FloatRegister(i), as_FloatRegister(i+6), i/8, as_FloatRegister(i+8));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4068 __ aes_kexpand2(as_FloatRegister(i+2), as_FloatRegister(i+8), as_FloatRegister(i+10));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4069 __ aes_kexpand0(as_FloatRegister(i+4), as_FloatRegister(i+10), as_FloatRegister(i+12));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4070 __ aes_kexpand2(as_FloatRegister(i+6), as_FloatRegister(i+12), as_FloatRegister(i+14));
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4071 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4072 __ aes_kexpand1(F48, F54, 6, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4073 __ aes_kexpand2(F50, F56, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4074
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4075 // load expanded key[last-1] and key[last] elements
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4076 __ movdtox(F56,L2);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4077 __ movdtox(F58,L3);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4078
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4079 __ and3(len_reg, 16, L4);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4080 __ br_null_short(L4, Assembler::pt, L_dec_next2_blocks256);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4081
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4082 __ BIND(L_dec_first_block_start);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4083 // check for 8-byte alignment since source byte array may have an arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4084 __ andcc(from, 7, G0);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4085 __ br(Assembler::notZero, true, Assembler::pn, L_load_misaligned_input_first_block);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4086 __ delayed()->mov(from, G1); // save original 'from' address before alignaddr
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4087
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4088 // aligned case: load input into L4 and L5
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4089 __ ldx(from,0,L4);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4090 __ ldx(from,8,L5);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4091 __ ba_short(L_transform_first_block);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4092
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4093 __ BIND(L_load_misaligned_input_first_block);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4094 __ alignaddr(from, G0, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4095 // F58, F60, F62 can be clobbered
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4096 __ ldf(FloatRegisterImpl::D, from, 0, F58);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4097 __ ldf(FloatRegisterImpl::D, from, 8, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4098 __ ldf(FloatRegisterImpl::D, from, 16, F62);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4099 __ faligndata(F58, F60, F58);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4100 __ faligndata(F60, F62, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4101 __ movdtox(F58, L4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4102 __ movdtox(F60, L5);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4103 __ mov(G1, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4104
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4105 __ BIND(L_transform_first_block);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4106 __ xor3(L2,L4,G1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4107 __ movxtod(G1,F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4108 __ xor3(L3,L5,G1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4109 __ movxtod(G1,F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4110
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4111 // 128-bit original key size
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4112 __ cmp_and_brx_short(keylen, 44, Assembler::equal, Assembler::pn, L_dec_first_block128);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4113
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4114 // 192-bit original key size
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4115 __ cmp_and_brx_short(keylen, 52, Assembler::equal, Assembler::pn, L_dec_first_block192);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4116
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4117 __ aes_dround23(F54, F60, F62, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4118 __ aes_dround01(F52, F60, F62, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4119 __ aes_dround23(F50, F56, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4120 __ aes_dround01(F48, F56, F58, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4121
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4122 __ BIND(L_dec_first_block192);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4123 __ aes_dround23(F46, F60, F62, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4124 __ aes_dround01(F44, F60, F62, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4125 __ aes_dround23(F42, F56, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4126 __ aes_dround01(F40, F56, F58, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4127
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4128 __ BIND(L_dec_first_block128);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4129 for ( int i = 38; i >= 6; i -= 8 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4130 __ aes_dround23(as_FloatRegister(i), F60, F62, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4131 __ aes_dround01(as_FloatRegister(i-2), F60, F62, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4132 if ( i != 6) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4133 __ aes_dround23(as_FloatRegister(i-4), F56, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4134 __ aes_dround01(as_FloatRegister(i-6), F56, F58, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4135 } else {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4136 __ aes_dround23_l(as_FloatRegister(i-4), F56, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4137 __ aes_dround01_l(as_FloatRegister(i-6), F56, F58, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4138 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4139 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4140
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4141 __ movxtod(L0,F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4142 __ movxtod(L1,F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4143 __ mov(L4,L0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4144 __ mov(L5,L1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4145 __ fxor(FloatRegisterImpl::D, F56, F60, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4146 __ fxor(FloatRegisterImpl::D, F58, F62, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4147
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4148 // check for 8-byte alignment since dest byte array may have arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4149 __ andcc(to, 7, G1);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4150 __ br(Assembler::notZero, true, Assembler::pn, L_store_misaligned_output_first_block);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4151 __ delayed()->edge8n(to, G0, G2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4152
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4153 // aligned case: store output into the destination array
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4154 __ stf(FloatRegisterImpl::D, F60, to, 0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4155 __ stf(FloatRegisterImpl::D, F62, to, 8);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4156 __ ba_short(L_check_decrypt_end);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4157
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4158 __ BIND(L_store_misaligned_output_first_block);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4159 __ add(to, 8, G3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4160 __ mov(8, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4161 __ sub(G4, G1, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4162 __ alignaddr(G4, G0, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4163 __ faligndata(F60, F60, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4164 __ faligndata(F62, F62, F62);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4165 __ mov(to, G1);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4166 __ and3(to, -8, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4167 __ and3(G3, -8, G3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4168 __ stpartialf(to, G2, F60, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4169 __ stpartialf(G3, G2, F62, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4170 __ add(to, 8, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4171 __ add(G3, 8, G3);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4172 __ orn(G0, G2, G2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4173 __ stpartialf(to, G2, F60, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4174 __ stpartialf(G3, G2, F62, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4175 __ mov(G1, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4176
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4177 __ BIND(L_check_decrypt_end);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4178 __ add(from, 16, from);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4179 __ add(to, 16, to);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4180 __ subcc(len_reg, 16, len_reg);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4181 __ br(Assembler::equal, false, Assembler::pt, L_cbcdec_end);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4182 __ delayed()->nop();
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4183
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4184 // 256-bit original key size
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4185 __ cmp_and_brx_short(keylen, 60, Assembler::equal, Assembler::pn, L_dec_next2_blocks256);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4186
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4187 // 192-bit original key size
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4188 __ cmp_and_brx_short(keylen, 52, Assembler::equal, Assembler::pn, L_dec_next2_blocks192);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4189
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4190 __ align(OptoLoopAlignment);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4191 __ BIND(L_dec_next2_blocks128);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4192 __ nop();
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4193
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4194 // check for 8-byte alignment since source byte array may have an arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4195 __ andcc(from, 7, G0);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4196 __ br(Assembler::notZero, true, Assembler::pn, L_load_misaligned_next2_blocks128);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4197 __ delayed()->mov(from, G1); // save original 'from' address before alignaddr
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4198
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4199 // aligned case: load input into G4, G5, L4 and L5
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4200 __ ldx(from,0,G4);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4201 __ ldx(from,8,G5);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4202 __ ldx(from,16,L4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4203 __ ldx(from,24,L5);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4204 __ ba_short(L_transform_next2_blocks128);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4205
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4206 __ BIND(L_load_misaligned_next2_blocks128);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4207 __ alignaddr(from, G0, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4208 // F40, F42, F58, F60, F62 can be clobbered
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4209 __ ldf(FloatRegisterImpl::D, from, 0, F40);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4210 __ ldf(FloatRegisterImpl::D, from, 8, F42);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4211 __ ldf(FloatRegisterImpl::D, from, 16, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4212 __ ldf(FloatRegisterImpl::D, from, 24, F62);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4213 __ ldf(FloatRegisterImpl::D, from, 32, F58);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4214 __ faligndata(F40, F42, F40);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4215 __ faligndata(F42, F60, F42);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4216 __ faligndata(F60, F62, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4217 __ faligndata(F62, F58, F62);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4218 __ movdtox(F40, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4219 __ movdtox(F42, G5);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4220 __ movdtox(F60, L4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4221 __ movdtox(F62, L5);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4222 __ mov(G1, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4223
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4224 __ BIND(L_transform_next2_blocks128);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4225 // F40:F42 used for first 16-bytes
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4226 __ xor3(L2,G4,G1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4227 __ movxtod(G1,F40);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4228 __ xor3(L3,G5,G1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4229 __ movxtod(G1,F42);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4230
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4231 // F60:F62 used for next 16-bytes
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4232 __ xor3(L2,L4,G1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4233 __ movxtod(G1,F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4234 __ xor3(L3,L5,G1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4235 __ movxtod(G1,F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4236
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4237 for ( int i = 38; i >= 6; i -= 8 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4238 __ aes_dround23(as_FloatRegister(i), F40, F42, F44);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4239 __ aes_dround01(as_FloatRegister(i-2), F40, F42, F46);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4240 __ aes_dround23(as_FloatRegister(i), F60, F62, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4241 __ aes_dround01(as_FloatRegister(i-2), F60, F62, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4242 if (i != 6 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4243 __ aes_dround23(as_FloatRegister(i-4), F46, F44, F42);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4244 __ aes_dround01(as_FloatRegister(i-6), F46, F44, F40);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4245 __ aes_dround23(as_FloatRegister(i-4), F56, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4246 __ aes_dround01(as_FloatRegister(i-6), F56, F58, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4247 } else {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4248 __ aes_dround23_l(as_FloatRegister(i-4), F46, F44, F42);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4249 __ aes_dround01_l(as_FloatRegister(i-6), F46, F44, F40);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4250 __ aes_dround23_l(as_FloatRegister(i-4), F56, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4251 __ aes_dround01_l(as_FloatRegister(i-6), F56, F58, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4252 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4253 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4254
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4255 __ movxtod(L0,F46);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4256 __ movxtod(L1,F44);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4257 __ fxor(FloatRegisterImpl::D, F46, F40, F40);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4258 __ fxor(FloatRegisterImpl::D, F44, F42, F42);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4259
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4260 __ movxtod(G4,F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4261 __ movxtod(G5,F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4262 __ mov(L4,L0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4263 __ mov(L5,L1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4264 __ fxor(FloatRegisterImpl::D, F56, F60, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4265 __ fxor(FloatRegisterImpl::D, F58, F62, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4266
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4267 // For mis-aligned store of 32 bytes of result we can do:
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4268 // Circular right-shift all 4 FP registers so that 'head' and 'tail'
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4269 // parts that need to be stored starting at mis-aligned address are in a FP reg
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4270 // the other 3 FP regs can thus be stored using regular store
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4271 // we then use the edge + partial-store mechanism to store the 'head' and 'tail' parts
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4272
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4273 // check for 8-byte alignment since dest byte array may have arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4274 __ andcc(to, 7, G1);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4275 __ br(Assembler::notZero, true, Assembler::pn, L_store_misaligned_output_next2_blocks128);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4276 __ delayed()->edge8n(to, G0, G2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4277
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4278 // aligned case: store output into the destination array
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4279 __ stf(FloatRegisterImpl::D, F40, to, 0);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4280 __ stf(FloatRegisterImpl::D, F42, to, 8);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4281 __ stf(FloatRegisterImpl::D, F60, to, 16);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4282 __ stf(FloatRegisterImpl::D, F62, to, 24);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4283 __ ba_short(L_check_decrypt_loop_end128);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4284
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4285 __ BIND(L_store_misaligned_output_next2_blocks128);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4286 __ mov(8, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4287 __ sub(G4, G1, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4288 __ alignaddr(G4, G0, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4289 __ faligndata(F40, F42, F56); // F56 can be clobbered
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4290 __ faligndata(F42, F60, F42);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4291 __ faligndata(F60, F62, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4292 __ faligndata(F62, F40, F40);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4293 __ mov(to, G1);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4294 __ and3(to, -8, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4295 __ stpartialf(to, G2, F40, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4296 __ stf(FloatRegisterImpl::D, F56, to, 8);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4297 __ stf(FloatRegisterImpl::D, F42, to, 16);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4298 __ stf(FloatRegisterImpl::D, F60, to, 24);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4299 __ add(to, 32, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4300 __ orn(G0, G2, G2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4301 __ stpartialf(to, G2, F40, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4302 __ mov(G1, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4303
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4304 __ BIND(L_check_decrypt_loop_end128);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4305 __ add(from, 32, from);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4306 __ add(to, 32, to);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4307 __ subcc(len_reg, 32, len_reg);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4308 __ br(Assembler::notEqual, false, Assembler::pt, L_dec_next2_blocks128);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4309 __ delayed()->nop();
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4310 __ ba_short(L_cbcdec_end);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4311
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4312 __ align(OptoLoopAlignment);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4313 __ BIND(L_dec_next2_blocks192);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4314 __ nop();
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4315
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4316 // check for 8-byte alignment since source byte array may have an arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4317 __ andcc(from, 7, G0);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4318 __ br(Assembler::notZero, true, Assembler::pn, L_load_misaligned_next2_blocks192);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4319 __ delayed()->mov(from, G1); // save original 'from' address before alignaddr
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4320
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4321 // aligned case: load input into G4, G5, L4 and L5
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4322 __ ldx(from,0,G4);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4323 __ ldx(from,8,G5);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4324 __ ldx(from,16,L4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4325 __ ldx(from,24,L5);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4326 __ ba_short(L_transform_next2_blocks192);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4327
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4328 __ BIND(L_load_misaligned_next2_blocks192);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4329 __ alignaddr(from, G0, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4330 // F48, F50, F52, F60, F62 can be clobbered
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4331 __ ldf(FloatRegisterImpl::D, from, 0, F48);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4332 __ ldf(FloatRegisterImpl::D, from, 8, F50);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4333 __ ldf(FloatRegisterImpl::D, from, 16, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4334 __ ldf(FloatRegisterImpl::D, from, 24, F62);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4335 __ ldf(FloatRegisterImpl::D, from, 32, F52);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4336 __ faligndata(F48, F50, F48);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4337 __ faligndata(F50, F60, F50);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4338 __ faligndata(F60, F62, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4339 __ faligndata(F62, F52, F62);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4340 __ movdtox(F48, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4341 __ movdtox(F50, G5);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4342 __ movdtox(F60, L4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4343 __ movdtox(F62, L5);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4344 __ mov(G1, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4345
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4346 __ BIND(L_transform_next2_blocks192);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4347 // F48:F50 used for first 16-bytes
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4348 __ xor3(L2,G4,G1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4349 __ movxtod(G1,F48);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4350 __ xor3(L3,G5,G1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4351 __ movxtod(G1,F50);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4352
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4353 // F60:F62 used for next 16-bytes
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4354 __ xor3(L2,L4,G1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4355 __ movxtod(G1,F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4356 __ xor3(L3,L5,G1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4357 __ movxtod(G1,F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4358
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4359 for ( int i = 46; i >= 6; i -= 8 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4360 __ aes_dround23(as_FloatRegister(i), F48, F50, F52);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4361 __ aes_dround01(as_FloatRegister(i-2), F48, F50, F54);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4362 __ aes_dround23(as_FloatRegister(i), F60, F62, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4363 __ aes_dround01(as_FloatRegister(i-2), F60, F62, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4364 if (i != 6 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4365 __ aes_dround23(as_FloatRegister(i-4), F54, F52, F50);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4366 __ aes_dround01(as_FloatRegister(i-6), F54, F52, F48);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4367 __ aes_dround23(as_FloatRegister(i-4), F56, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4368 __ aes_dround01(as_FloatRegister(i-6), F56, F58, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4369 } else {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4370 __ aes_dround23_l(as_FloatRegister(i-4), F54, F52, F50);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4371 __ aes_dround01_l(as_FloatRegister(i-6), F54, F52, F48);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4372 __ aes_dround23_l(as_FloatRegister(i-4), F56, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4373 __ aes_dround01_l(as_FloatRegister(i-6), F56, F58, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4374 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4375 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4376
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4377 __ movxtod(L0,F54);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4378 __ movxtod(L1,F52);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4379 __ fxor(FloatRegisterImpl::D, F54, F48, F48);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4380 __ fxor(FloatRegisterImpl::D, F52, F50, F50);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4381
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4382 __ movxtod(G4,F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4383 __ movxtod(G5,F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4384 __ mov(L4,L0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4385 __ mov(L5,L1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4386 __ fxor(FloatRegisterImpl::D, F56, F60, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4387 __ fxor(FloatRegisterImpl::D, F58, F62, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4388
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4389 // check for 8-byte alignment since dest byte array may have arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4390 __ andcc(to, 7, G1);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4391 __ br(Assembler::notZero, true, Assembler::pn, L_store_misaligned_output_next2_blocks192);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4392 __ delayed()->edge8n(to, G0, G2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4393
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4394 // aligned case: store output into the destination array
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4395 __ stf(FloatRegisterImpl::D, F48, to, 0);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4396 __ stf(FloatRegisterImpl::D, F50, to, 8);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4397 __ stf(FloatRegisterImpl::D, F60, to, 16);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4398 __ stf(FloatRegisterImpl::D, F62, to, 24);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4399 __ ba_short(L_check_decrypt_loop_end192);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4400
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4401 __ BIND(L_store_misaligned_output_next2_blocks192);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4402 __ mov(8, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4403 __ sub(G4, G1, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4404 __ alignaddr(G4, G0, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4405 __ faligndata(F48, F50, F56); // F56 can be clobbered
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4406 __ faligndata(F50, F60, F50);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4407 __ faligndata(F60, F62, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4408 __ faligndata(F62, F48, F48);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4409 __ mov(to, G1);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4410 __ and3(to, -8, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4411 __ stpartialf(to, G2, F48, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4412 __ stf(FloatRegisterImpl::D, F56, to, 8);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4413 __ stf(FloatRegisterImpl::D, F50, to, 16);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4414 __ stf(FloatRegisterImpl::D, F60, to, 24);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4415 __ add(to, 32, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4416 __ orn(G0, G2, G2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4417 __ stpartialf(to, G2, F48, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4418 __ mov(G1, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4419
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4420 __ BIND(L_check_decrypt_loop_end192);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4421 __ add(from, 32, from);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4422 __ add(to, 32, to);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4423 __ subcc(len_reg, 32, len_reg);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4424 __ br(Assembler::notEqual, false, Assembler::pt, L_dec_next2_blocks192);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4425 __ delayed()->nop();
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4426 __ ba_short(L_cbcdec_end);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4427
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4428 __ align(OptoLoopAlignment);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4429 __ BIND(L_dec_next2_blocks256);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4430 __ nop();
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4431
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4432 // check for 8-byte alignment since source byte array may have an arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4433 __ andcc(from, 7, G0);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4434 __ br(Assembler::notZero, true, Assembler::pn, L_load_misaligned_next2_blocks256);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4435 __ delayed()->mov(from, G1); // save original 'from' address before alignaddr
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4436
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4437 // aligned case: load input into G4, G5, L4 and L5
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4438 __ ldx(from,0,G4);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4439 __ ldx(from,8,G5);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4440 __ ldx(from,16,L4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4441 __ ldx(from,24,L5);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4442 __ ba_short(L_transform_next2_blocks256);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4443
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4444 __ BIND(L_load_misaligned_next2_blocks256);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4445 __ alignaddr(from, G0, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4446 // F0, F2, F4, F60, F62 can be clobbered
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4447 __ ldf(FloatRegisterImpl::D, from, 0, F0);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4448 __ ldf(FloatRegisterImpl::D, from, 8, F2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4449 __ ldf(FloatRegisterImpl::D, from, 16, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4450 __ ldf(FloatRegisterImpl::D, from, 24, F62);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4451 __ ldf(FloatRegisterImpl::D, from, 32, F4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4452 __ faligndata(F0, F2, F0);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4453 __ faligndata(F2, F60, F2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4454 __ faligndata(F60, F62, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4455 __ faligndata(F62, F4, F62);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4456 __ movdtox(F0, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4457 __ movdtox(F2, G5);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4458 __ movdtox(F60, L4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4459 __ movdtox(F62, L5);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4460 __ mov(G1, from);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4461
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4462 __ BIND(L_transform_next2_blocks256);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4463 // F0:F2 used for first 16-bytes
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4464 __ xor3(L2,G4,G1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4465 __ movxtod(G1,F0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4466 __ xor3(L3,G5,G1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4467 __ movxtod(G1,F2);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4468
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4469 // F60:F62 used for next 16-bytes
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4470 __ xor3(L2,L4,G1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4471 __ movxtod(G1,F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4472 __ xor3(L3,L5,G1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4473 __ movxtod(G1,F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4474
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4475 __ aes_dround23(F54, F0, F2, F4);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4476 __ aes_dround01(F52, F0, F2, F6);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4477 __ aes_dround23(F54, F60, F62, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4478 __ aes_dround01(F52, F60, F62, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4479 __ aes_dround23(F50, F6, F4, F2);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4480 __ aes_dround01(F48, F6, F4, F0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4481 __ aes_dround23(F50, F56, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4482 __ aes_dround01(F48, F56, F58, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4483 // save F48:F54 in temp registers
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4484 __ movdtox(F54,G2);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4485 __ movdtox(F52,G3);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4486 __ movdtox(F50,G6);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4487 __ movdtox(F48,G1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4488 for ( int i = 46; i >= 14; i -= 8 ) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4489 __ aes_dround23(as_FloatRegister(i), F0, F2, F4);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4490 __ aes_dround01(as_FloatRegister(i-2), F0, F2, F6);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4491 __ aes_dround23(as_FloatRegister(i), F60, F62, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4492 __ aes_dround01(as_FloatRegister(i-2), F60, F62, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4493 __ aes_dround23(as_FloatRegister(i-4), F6, F4, F2);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4494 __ aes_dround01(as_FloatRegister(i-6), F6, F4, F0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4495 __ aes_dround23(as_FloatRegister(i-4), F56, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4496 __ aes_dround01(as_FloatRegister(i-6), F56, F58, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4497 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4498 // init F48:F54 with F0:F6 values (original key)
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4499 __ ldf(FloatRegisterImpl::D, original_key, 0, F48);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4500 __ ldf(FloatRegisterImpl::D, original_key, 8, F50);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4501 __ ldf(FloatRegisterImpl::D, original_key, 16, F52);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4502 __ ldf(FloatRegisterImpl::D, original_key, 24, F54);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4503 __ aes_dround23(F54, F0, F2, F4);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4504 __ aes_dround01(F52, F0, F2, F6);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4505 __ aes_dround23(F54, F60, F62, F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4506 __ aes_dround01(F52, F60, F62, F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4507 __ aes_dround23_l(F50, F6, F4, F2);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4508 __ aes_dround01_l(F48, F6, F4, F0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4509 __ aes_dround23_l(F50, F56, F58, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4510 __ aes_dround01_l(F48, F56, F58, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4511 // re-init F48:F54 with their original values
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4512 __ movxtod(G2,F54);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4513 __ movxtod(G3,F52);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4514 __ movxtod(G6,F50);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4515 __ movxtod(G1,F48);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4516
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4517 __ movxtod(L0,F6);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4518 __ movxtod(L1,F4);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4519 __ fxor(FloatRegisterImpl::D, F6, F0, F0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4520 __ fxor(FloatRegisterImpl::D, F4, F2, F2);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4521
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4522 __ movxtod(G4,F56);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4523 __ movxtod(G5,F58);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4524 __ mov(L4,L0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4525 __ mov(L5,L1);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4526 __ fxor(FloatRegisterImpl::D, F56, F60, F60);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4527 __ fxor(FloatRegisterImpl::D, F58, F62, F62);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4528
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4529 // check for 8-byte alignment since dest byte array may have arbitrary alignment if offset mod 8 is non-zero
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4530 __ andcc(to, 7, G1);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4531 __ br(Assembler::notZero, true, Assembler::pn, L_store_misaligned_output_next2_blocks256);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4532 __ delayed()->edge8n(to, G0, G2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4533
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4534 // aligned case: store output into the destination array
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4535 __ stf(FloatRegisterImpl::D, F0, to, 0);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4536 __ stf(FloatRegisterImpl::D, F2, to, 8);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4537 __ stf(FloatRegisterImpl::D, F60, to, 16);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4538 __ stf(FloatRegisterImpl::D, F62, to, 24);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4539 __ ba_short(L_check_decrypt_loop_end256);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4540
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4541 __ BIND(L_store_misaligned_output_next2_blocks256);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4542 __ mov(8, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4543 __ sub(G4, G1, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4544 __ alignaddr(G4, G0, G4);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4545 __ faligndata(F0, F2, F56); // F56 can be clobbered
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4546 __ faligndata(F2, F60, F2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4547 __ faligndata(F60, F62, F60);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4548 __ faligndata(F62, F0, F0);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4549 __ mov(to, G1);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4550 __ and3(to, -8, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4551 __ stpartialf(to, G2, F0, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4552 __ stf(FloatRegisterImpl::D, F56, to, 8);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4553 __ stf(FloatRegisterImpl::D, F2, to, 16);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4554 __ stf(FloatRegisterImpl::D, F60, to, 24);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4555 __ add(to, 32, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4556 __ orn(G0, G2, G2);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4557 __ stpartialf(to, G2, F0, Assembler::ASI_PST8_PRIMARY);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4558 __ mov(G1, to);
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4559
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4560 __ BIND(L_check_decrypt_loop_end256);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4561 __ add(from, 32, from);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4562 __ add(to, 32, to);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4563 __ subcc(len_reg, 32, len_reg);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4564 __ br(Assembler::notEqual, false, Assembler::pt, L_dec_next2_blocks256);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4565 __ delayed()->nop();
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4566
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4567 __ BIND(L_cbcdec_end);
17910
03214612e77e 8035936: SIGBUS in StubRoutines::aesencryptBlock, solaris-sparc
kvn
parents: 14261
diff changeset
4568 // re-init intial vector for next block, 8-byte alignment is guaranteed
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4569 __ stx(L0, rvec, 0);
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4570 __ stx(L1, rvec, 8);
17954
0342d80559e0 8043274: Test compiler/7184394/TestAESMain.java gets NPE on solaris
kvn
parents: 17939
diff changeset
4571 __ mov(L7, I0);
0342d80559e0 8043274: Test compiler/7184394/TestAESMain.java gets NPE on solaris
kvn
parents: 17939
diff changeset
4572 __ ret();
0342d80559e0 8043274: Test compiler/7184394/TestAESMain.java gets NPE on solaris
kvn
parents: 17939
diff changeset
4573 __ delayed()->restore();
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4574
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4575 return start;
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4576 }
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4577
20313
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4578 address generate_sha1_implCompress(bool multi_block, const char *name) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4579 __ align(CodeEntryAlignment);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4580 StubCodeMark mark(this, "StubRoutines", name);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4581 address start = __ pc();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4582
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4583 Label L_sha1_loop, L_sha1_unaligned_input, L_sha1_unaligned_input_loop;
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4584 int i;
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4585
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4586 Register buf = O0; // byte[] source+offset
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4587 Register state = O1; // int[] SHA.state
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4588 Register ofs = O2; // int offset
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4589 Register limit = O3; // int limit
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4590
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4591 // load state into F0-F4
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4592 for (i = 0; i < 5; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4593 __ ldf(FloatRegisterImpl::S, state, i*4, as_FloatRegister(i));
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4594 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4595
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4596 __ andcc(buf, 7, G0);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4597 __ br(Assembler::notZero, false, Assembler::pn, L_sha1_unaligned_input);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4598 __ delayed()->nop();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4599
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4600 __ BIND(L_sha1_loop);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4601 // load buf into F8-F22
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4602 for (i = 0; i < 8; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4603 __ ldf(FloatRegisterImpl::D, buf, i*8, as_FloatRegister(i*2 + 8));
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4604 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4605 __ sha1();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4606 if (multi_block) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4607 __ add(ofs, 64, ofs);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4608 __ add(buf, 64, buf);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4609 __ cmp_and_brx_short(ofs, limit, Assembler::lessEqual, Assembler::pt, L_sha1_loop);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4610 __ mov(ofs, O0); // to be returned
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4611 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4612
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4613 // store F0-F4 into state and return
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4614 for (i = 0; i < 4; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4615 __ stf(FloatRegisterImpl::S, as_FloatRegister(i), state, i*4);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4616 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4617 __ retl();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4618 __ delayed()->stf(FloatRegisterImpl::S, F4, state, 0x10);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4619
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4620 __ BIND(L_sha1_unaligned_input);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4621 __ alignaddr(buf, G0, buf);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4622
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4623 __ BIND(L_sha1_unaligned_input_loop);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4624 // load buf into F8-F22
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4625 for (i = 0; i < 9; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4626 __ ldf(FloatRegisterImpl::D, buf, i*8, as_FloatRegister(i*2 + 8));
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4627 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4628 for (i = 0; i < 8; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4629 __ faligndata(as_FloatRegister(i*2 + 8), as_FloatRegister(i*2 + 10), as_FloatRegister(i*2 + 8));
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4630 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4631 __ sha1();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4632 if (multi_block) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4633 __ add(ofs, 64, ofs);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4634 __ add(buf, 64, buf);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4635 __ cmp_and_brx_short(ofs, limit, Assembler::lessEqual, Assembler::pt, L_sha1_unaligned_input_loop);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4636 __ mov(ofs, O0); // to be returned
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4637 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4638
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4639 // store F0-F4 into state and return
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4640 for (i = 0; i < 4; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4641 __ stf(FloatRegisterImpl::S, as_FloatRegister(i), state, i*4);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4642 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4643 __ retl();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4644 __ delayed()->stf(FloatRegisterImpl::S, F4, state, 0x10);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4645
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4646 return start;
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4647 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4648
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4649 address generate_sha256_implCompress(bool multi_block, const char *name) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4650 __ align(CodeEntryAlignment);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4651 StubCodeMark mark(this, "StubRoutines", name);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4652 address start = __ pc();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4653
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4654 Label L_sha256_loop, L_sha256_unaligned_input, L_sha256_unaligned_input_loop;
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4655 int i;
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4656
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4657 Register buf = O0; // byte[] source+offset
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4658 Register state = O1; // int[] SHA2.state
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4659 Register ofs = O2; // int offset
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4660 Register limit = O3; // int limit
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4661
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4662 // load state into F0-F7
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4663 for (i = 0; i < 8; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4664 __ ldf(FloatRegisterImpl::S, state, i*4, as_FloatRegister(i));
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4665 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4666
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4667 __ andcc(buf, 7, G0);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4668 __ br(Assembler::notZero, false, Assembler::pn, L_sha256_unaligned_input);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4669 __ delayed()->nop();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4670
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4671 __ BIND(L_sha256_loop);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4672 // load buf into F8-F22
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4673 for (i = 0; i < 8; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4674 __ ldf(FloatRegisterImpl::D, buf, i*8, as_FloatRegister(i*2 + 8));
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4675 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4676 __ sha256();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4677 if (multi_block) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4678 __ add(ofs, 64, ofs);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4679 __ add(buf, 64, buf);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4680 __ cmp_and_brx_short(ofs, limit, Assembler::lessEqual, Assembler::pt, L_sha256_loop);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4681 __ mov(ofs, O0); // to be returned
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4682 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4683
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4684 // store F0-F7 into state and return
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4685 for (i = 0; i < 7; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4686 __ stf(FloatRegisterImpl::S, as_FloatRegister(i), state, i*4);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4687 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4688 __ retl();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4689 __ delayed()->stf(FloatRegisterImpl::S, F7, state, 0x1c);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4690
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4691 __ BIND(L_sha256_unaligned_input);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4692 __ alignaddr(buf, G0, buf);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4693
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4694 __ BIND(L_sha256_unaligned_input_loop);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4695 // load buf into F8-F22
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4696 for (i = 0; i < 9; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4697 __ ldf(FloatRegisterImpl::D, buf, i*8, as_FloatRegister(i*2 + 8));
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4698 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4699 for (i = 0; i < 8; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4700 __ faligndata(as_FloatRegister(i*2 + 8), as_FloatRegister(i*2 + 10), as_FloatRegister(i*2 + 8));
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4701 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4702 __ sha256();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4703 if (multi_block) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4704 __ add(ofs, 64, ofs);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4705 __ add(buf, 64, buf);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4706 __ cmp_and_brx_short(ofs, limit, Assembler::lessEqual, Assembler::pt, L_sha256_unaligned_input_loop);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4707 __ mov(ofs, O0); // to be returned
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4708 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4709
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4710 // store F0-F7 into state and return
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4711 for (i = 0; i < 7; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4712 __ stf(FloatRegisterImpl::S, as_FloatRegister(i), state, i*4);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4713 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4714 __ retl();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4715 __ delayed()->stf(FloatRegisterImpl::S, F7, state, 0x1c);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4716
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4717 return start;
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4718 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4719
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4720 address generate_sha512_implCompress(bool multi_block, const char *name) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4721 __ align(CodeEntryAlignment);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4722 StubCodeMark mark(this, "StubRoutines", name);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4723 address start = __ pc();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4724
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4725 Label L_sha512_loop, L_sha512_unaligned_input, L_sha512_unaligned_input_loop;
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4726 int i;
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4727
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4728 Register buf = O0; // byte[] source+offset
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4729 Register state = O1; // long[] SHA5.state
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4730 Register ofs = O2; // int offset
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4731 Register limit = O3; // int limit
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4732
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4733 // load state into F0-F14
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4734 for (i = 0; i < 8; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4735 __ ldf(FloatRegisterImpl::D, state, i*8, as_FloatRegister(i*2));
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4736 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4737
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4738 __ andcc(buf, 7, G0);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4739 __ br(Assembler::notZero, false, Assembler::pn, L_sha512_unaligned_input);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4740 __ delayed()->nop();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4741
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4742 __ BIND(L_sha512_loop);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4743 // load buf into F16-F46
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4744 for (i = 0; i < 16; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4745 __ ldf(FloatRegisterImpl::D, buf, i*8, as_FloatRegister(i*2 + 16));
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4746 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4747 __ sha512();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4748 if (multi_block) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4749 __ add(ofs, 128, ofs);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4750 __ add(buf, 128, buf);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4751 __ cmp_and_brx_short(ofs, limit, Assembler::lessEqual, Assembler::pt, L_sha512_loop);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4752 __ mov(ofs, O0); // to be returned
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4753 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4754
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4755 // store F0-F14 into state and return
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4756 for (i = 0; i < 7; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4757 __ stf(FloatRegisterImpl::D, as_FloatRegister(i*2), state, i*8);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4758 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4759 __ retl();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4760 __ delayed()->stf(FloatRegisterImpl::D, F14, state, 0x38);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4761
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4762 __ BIND(L_sha512_unaligned_input);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4763 __ alignaddr(buf, G0, buf);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4764
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4765 __ BIND(L_sha512_unaligned_input_loop);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4766 // load buf into F16-F46
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4767 for (i = 0; i < 17; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4768 __ ldf(FloatRegisterImpl::D, buf, i*8, as_FloatRegister(i*2 + 16));
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4769 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4770 for (i = 0; i < 16; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4771 __ faligndata(as_FloatRegister(i*2 + 16), as_FloatRegister(i*2 + 18), as_FloatRegister(i*2 + 16));
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4772 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4773 __ sha512();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4774 if (multi_block) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4775 __ add(ofs, 128, ofs);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4776 __ add(buf, 128, buf);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4777 __ cmp_and_brx_short(ofs, limit, Assembler::lessEqual, Assembler::pt, L_sha512_unaligned_input_loop);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4778 __ mov(ofs, O0); // to be returned
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4779 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4780
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4781 // store F0-F14 into state and return
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4782 for (i = 0; i < 7; i++) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4783 __ stf(FloatRegisterImpl::D, as_FloatRegister(i*2), state, i*8);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4784 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4785 __ retl();
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4786 __ delayed()->stf(FloatRegisterImpl::D, F14, state, 0x38);
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4787
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4788 return start;
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4789 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4790
0
a61af66fc99e Initial load
duke
parents:
diff changeset
4791 void generate_initial() {
a61af66fc99e Initial load
duke
parents:
diff changeset
4792 // Generates all stubs and initializes the entry points
a61af66fc99e Initial load
duke
parents:
diff changeset
4793
a61af66fc99e Initial load
duke
parents:
diff changeset
4794 //------------------------------------------------------------------------------------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
4795 // entry points that exist in all platforms
a61af66fc99e Initial load
duke
parents:
diff changeset
4796 // Note: This is code that could be shared among different platforms - however the benefit seems to be smaller than
a61af66fc99e Initial load
duke
parents:
diff changeset
4797 // the disadvantage of having a much more complicated generator structure. See also comment in stubRoutines.hpp.
a61af66fc99e Initial load
duke
parents:
diff changeset
4798 StubRoutines::_forward_exception_entry = generate_forward_exception();
a61af66fc99e Initial load
duke
parents:
diff changeset
4799
a61af66fc99e Initial load
duke
parents:
diff changeset
4800 StubRoutines::_call_stub_entry = generate_call_stub(StubRoutines::_call_stub_return_address);
a61af66fc99e Initial load
duke
parents:
diff changeset
4801 StubRoutines::_catch_exception_entry = generate_catch_exception();
a61af66fc99e Initial load
duke
parents:
diff changeset
4802
a61af66fc99e Initial load
duke
parents:
diff changeset
4803 //------------------------------------------------------------------------------------------------------------------------
a61af66fc99e Initial load
duke
parents:
diff changeset
4804 // entry points that are platform specific
a61af66fc99e Initial load
duke
parents:
diff changeset
4805 StubRoutines::Sparc::_test_stop_entry = generate_test_stop();
a61af66fc99e Initial load
duke
parents:
diff changeset
4806
a61af66fc99e Initial load
duke
parents:
diff changeset
4807 StubRoutines::Sparc::_stop_subroutine_entry = generate_stop_subroutine();
a61af66fc99e Initial load
duke
parents:
diff changeset
4808 StubRoutines::Sparc::_flush_callers_register_windows_entry = generate_flush_callers_register_windows();
a61af66fc99e Initial load
duke
parents:
diff changeset
4809
a61af66fc99e Initial load
duke
parents:
diff changeset
4810 #if !defined(COMPILER2) && !defined(_LP64)
a61af66fc99e Initial load
duke
parents:
diff changeset
4811 StubRoutines::_atomic_xchg_entry = generate_atomic_xchg();
a61af66fc99e Initial load
duke
parents:
diff changeset
4812 StubRoutines::_atomic_cmpxchg_entry = generate_atomic_cmpxchg();
a61af66fc99e Initial load
duke
parents:
diff changeset
4813 StubRoutines::_atomic_add_entry = generate_atomic_add();
a61af66fc99e Initial load
duke
parents:
diff changeset
4814 StubRoutines::_atomic_xchg_ptr_entry = StubRoutines::_atomic_xchg_entry;
a61af66fc99e Initial load
duke
parents:
diff changeset
4815 StubRoutines::_atomic_cmpxchg_ptr_entry = StubRoutines::_atomic_cmpxchg_entry;
a61af66fc99e Initial load
duke
parents:
diff changeset
4816 StubRoutines::_atomic_cmpxchg_long_entry = generate_atomic_cmpxchg_long();
a61af66fc99e Initial load
duke
parents:
diff changeset
4817 StubRoutines::_atomic_add_ptr_entry = StubRoutines::_atomic_add_entry;
a61af66fc99e Initial load
duke
parents:
diff changeset
4818 #endif // COMPILER2 !=> _LP64
3451
38fa55e5e792 7055355: JSR 292: crash while throwing WrongMethodTypeException
never
parents: 2324
diff changeset
4819
4743
dca455dea3a7 7116216: StackOverflow GC crash
bdelsart
parents: 3961
diff changeset
4820 // Build this early so it's available for the interpreter.
dca455dea3a7 7116216: StackOverflow GC crash
bdelsart
parents: 3961
diff changeset
4821 StubRoutines::_throw_StackOverflowError_entry = generate_throw_exception("StackOverflowError throw_exception", CAST_FROM_FN_PTR(address, SharedRuntime::throw_StackOverflowError));
0
a61af66fc99e Initial load
duke
parents:
diff changeset
4822 }
a61af66fc99e Initial load
duke
parents:
diff changeset
4823
a61af66fc99e Initial load
duke
parents:
diff changeset
4824
a61af66fc99e Initial load
duke
parents:
diff changeset
4825 void generate_all() {
a61af66fc99e Initial load
duke
parents:
diff changeset
4826 // Generates all stubs and initializes the entry points
a61af66fc99e Initial load
duke
parents:
diff changeset
4827
642
660978a2a31a 6791178: Specialize for zero as the compressed oop vm heap base
kvn
parents: 422
diff changeset
4828 // Generate partial_subtype_check first here since its code depends on
660978a2a31a 6791178: Specialize for zero as the compressed oop vm heap base
kvn
parents: 422
diff changeset
4829 // UseZeroBaseCompressedOops which is defined after heap initialization.
660978a2a31a 6791178: Specialize for zero as the compressed oop vm heap base
kvn
parents: 422
diff changeset
4830 StubRoutines::Sparc::_partial_subtype_check = generate_partial_subtype_check();
0
a61af66fc99e Initial load
duke
parents:
diff changeset
4831 // These entry points require SharedInfo::stack0 to be set up in non-core builds
3937
c565834fb592 7088020: SEGV in JNIHandleBlock::release_block
never
parents: 3903
diff changeset
4832 StubRoutines::_throw_AbstractMethodError_entry = generate_throw_exception("AbstractMethodError throw_exception", CAST_FROM_FN_PTR(address, SharedRuntime::throw_AbstractMethodError));
c565834fb592 7088020: SEGV in JNIHandleBlock::release_block
never
parents: 3903
diff changeset
4833 StubRoutines::_throw_IncompatibleClassChangeError_entry= generate_throw_exception("IncompatibleClassChangeError throw_exception", CAST_FROM_FN_PTR(address, SharedRuntime::throw_IncompatibleClassChangeError));
c565834fb592 7088020: SEGV in JNIHandleBlock::release_block
never
parents: 3903
diff changeset
4834 StubRoutines::_throw_NullPointerException_at_call_entry= generate_throw_exception("NullPointerException at call throw_exception", CAST_FROM_FN_PTR(address, SharedRuntime::throw_NullPointerException_at_call));
0
a61af66fc99e Initial load
duke
parents:
diff changeset
4835
a61af66fc99e Initial load
duke
parents:
diff changeset
4836 StubRoutines::_handler_for_unsafe_access_entry =
a61af66fc99e Initial load
duke
parents:
diff changeset
4837 generate_handler_for_unsafe_access();
a61af66fc99e Initial load
duke
parents:
diff changeset
4838
a61af66fc99e Initial load
duke
parents:
diff changeset
4839 // support for verify_oop (must happen after universe_init)
a61af66fc99e Initial load
duke
parents:
diff changeset
4840 StubRoutines::_verify_oop_subroutine_entry = generate_verify_oop_subroutine();
a61af66fc99e Initial load
duke
parents:
diff changeset
4841
a61af66fc99e Initial load
duke
parents:
diff changeset
4842 // arraycopy stubs used by compilers
a61af66fc99e Initial load
duke
parents:
diff changeset
4843 generate_arraycopy_stubs();
1174
ddb7834449d0 6849984: Value methods for platform dependent math functions constant fold incorrectly
never
parents: 727
diff changeset
4844
ddb7834449d0 6849984: Value methods for platform dependent math functions constant fold incorrectly
never
parents: 727
diff changeset
4845 // Don't initialize the platform math functions since sparc
ddb7834449d0 6849984: Value methods for platform dependent math functions constant fold incorrectly
never
parents: 727
diff changeset
4846 // doesn't have intrinsics for these operations.
11127
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
4847
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
4848 // Safefetch stubs.
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
4849 generate_safefetch("SafeFetch32", sizeof(int), &StubRoutines::_safefetch32_entry,
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
4850 &StubRoutines::_safefetch32_fault_pc,
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
4851 &StubRoutines::_safefetch32_continuation_pc);
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
4852 generate_safefetch("SafeFetchN", sizeof(intptr_t), &StubRoutines::_safefetchN_entry,
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
4853 &StubRoutines::_safefetchN_fault_pc,
980532a806a5 8016697: Use stubs to implement safefetch
goetz
parents: 10997
diff changeset
4854 &StubRoutines::_safefetchN_continuation_pc);
14261
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4855
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4856 // generate AES intrinsics code
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4857 if (UseAESIntrinsics) {
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4858 StubRoutines::_aescrypt_encryptBlock = generate_aescrypt_encryptBlock();
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4859 StubRoutines::_aescrypt_decryptBlock = generate_aescrypt_decryptBlock();
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4860 StubRoutines::_cipherBlockChaining_encryptAESCrypt = generate_cipherBlockChaining_encryptAESCrypt();
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4861 StubRoutines::_cipherBlockChaining_decryptAESCrypt = generate_cipherBlockChaining_decryptAESCrypt_Parallel();
00f5eff62d18 8002074: Support for AES on SPARC
kvn
parents: 14223
diff changeset
4862 }
20313
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4863
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4864 // generate SHA1/SHA256/SHA512 intrinsics code
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4865 if (UseSHA1Intrinsics) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4866 StubRoutines::_sha1_implCompress = generate_sha1_implCompress(false, "sha1_implCompress");
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4867 StubRoutines::_sha1_implCompressMB = generate_sha1_implCompress(true, "sha1_implCompressMB");
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4868 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4869 if (UseSHA256Intrinsics) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4870 StubRoutines::_sha256_implCompress = generate_sha256_implCompress(false, "sha256_implCompress");
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4871 StubRoutines::_sha256_implCompressMB = generate_sha256_implCompress(true, "sha256_implCompressMB");
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4872 }
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4873 if (UseSHA512Intrinsics) {
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4874 StubRoutines::_sha512_implCompress = generate_sha512_implCompress(false, "sha512_implCompress");
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4875 StubRoutines::_sha512_implCompressMB = generate_sha512_implCompress(true, "sha512_implCompressMB");
b20a35eae442 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 17954
diff changeset
4876 }
0
a61af66fc99e Initial load
duke
parents:
diff changeset
4877 }
a61af66fc99e Initial load
duke
parents:
diff changeset
4878
a61af66fc99e Initial load
duke
parents:
diff changeset
4879
a61af66fc99e Initial load
duke
parents:
diff changeset
4880 public:
a61af66fc99e Initial load
duke
parents:
diff changeset
4881 StubGenerator(CodeBuffer* code, bool all) : StubCodeGenerator(code) {
a61af66fc99e Initial load
duke
parents:
diff changeset
4882 // replace the standard masm with a special one:
a61af66fc99e Initial load
duke
parents:
diff changeset
4883 _masm = new MacroAssembler(code);
a61af66fc99e Initial load
duke
parents:
diff changeset
4884
a61af66fc99e Initial load
duke
parents:
diff changeset
4885 _stub_count = !all ? 0x100 : 0x200;
a61af66fc99e Initial load
duke
parents:
diff changeset
4886 if (all) {
a61af66fc99e Initial load
duke
parents:
diff changeset
4887 generate_all();
a61af66fc99e Initial load
duke
parents:
diff changeset
4888 } else {
a61af66fc99e Initial load
duke
parents:
diff changeset
4889 generate_initial();
a61af66fc99e Initial load
duke
parents:
diff changeset
4890 }
a61af66fc99e Initial load
duke
parents:
diff changeset
4891
a61af66fc99e Initial load
duke
parents:
diff changeset
4892 // make sure this stub is available for all local calls
a61af66fc99e Initial load
duke
parents:
diff changeset
4893 if (_atomic_add_stub.is_unbound()) {
a61af66fc99e Initial load
duke
parents:
diff changeset
4894 // generate a second time, if necessary
a61af66fc99e Initial load
duke
parents:
diff changeset
4895 (void) generate_atomic_add();
a61af66fc99e Initial load
duke
parents:
diff changeset
4896 }
a61af66fc99e Initial load
duke
parents:
diff changeset
4897 }
a61af66fc99e Initial load
duke
parents:
diff changeset
4898
a61af66fc99e Initial load
duke
parents:
diff changeset
4899
a61af66fc99e Initial load
duke
parents:
diff changeset
4900 private:
a61af66fc99e Initial load
duke
parents:
diff changeset
4901 int _stub_count;
a61af66fc99e Initial load
duke
parents:
diff changeset
4902 void stub_prolog(StubCodeDesc* cdesc) {
a61af66fc99e Initial load
duke
parents:
diff changeset
4903 # ifdef ASSERT
a61af66fc99e Initial load
duke
parents:
diff changeset
4904 // put extra information in the stub code, to make it more readable
a61af66fc99e Initial load
duke
parents:
diff changeset
4905 #ifdef _LP64
a61af66fc99e Initial load
duke
parents:
diff changeset
4906 // Write the high part of the address
a61af66fc99e Initial load
duke
parents:
diff changeset
4907 // [RGV] Check if there is a dependency on the size of this prolog
a61af66fc99e Initial load
duke
parents:
diff changeset
4908 __ emit_data((intptr_t)cdesc >> 32, relocInfo::none);
a61af66fc99e Initial load
duke
parents:
diff changeset
4909 #endif
a61af66fc99e Initial load
duke
parents:
diff changeset
4910 __ emit_data((intptr_t)cdesc, relocInfo::none);
a61af66fc99e Initial load
duke
parents:
diff changeset
4911 __ emit_data(++_stub_count, relocInfo::none);
a61af66fc99e Initial load
duke
parents:
diff changeset
4912 # endif
a61af66fc99e Initial load
duke
parents:
diff changeset
4913 align(true);
a61af66fc99e Initial load
duke
parents:
diff changeset
4914 }
a61af66fc99e Initial load
duke
parents:
diff changeset
4915
a61af66fc99e Initial load
duke
parents:
diff changeset
4916 void align(bool at_header = false) {
a61af66fc99e Initial load
duke
parents:
diff changeset
4917 // %%%%% move this constant somewhere else
a61af66fc99e Initial load
duke
parents:
diff changeset
4918 // UltraSPARC cache line size is 8 instructions:
a61af66fc99e Initial load
duke
parents:
diff changeset
4919 const unsigned int icache_line_size = 32;
a61af66fc99e Initial load
duke
parents:
diff changeset
4920 const unsigned int icache_half_line_size = 16;
a61af66fc99e Initial load
duke
parents:
diff changeset
4921
a61af66fc99e Initial load
duke
parents:
diff changeset
4922 if (at_header) {
a61af66fc99e Initial load
duke
parents:
diff changeset
4923 while ((intptr_t)(__ pc()) % icache_line_size != 0) {
a61af66fc99e Initial load
duke
parents:
diff changeset
4924 __ emit_data(0, relocInfo::none);
a61af66fc99e Initial load
duke
parents:
diff changeset
4925 }
a61af66fc99e Initial load
duke
parents:
diff changeset
4926 } else {
a61af66fc99e Initial load
duke
parents:
diff changeset
4927 while ((intptr_t)(__ pc()) % icache_half_line_size != 0) {
a61af66fc99e Initial load
duke
parents:
diff changeset
4928 __ nop();
a61af66fc99e Initial load
duke
parents:
diff changeset
4929 }
a61af66fc99e Initial load
duke
parents:
diff changeset
4930 }
a61af66fc99e Initial load
duke
parents:
diff changeset
4931 }
a61af66fc99e Initial load
duke
parents:
diff changeset
4932
a61af66fc99e Initial load
duke
parents:
diff changeset
4933 }; // end class declaration
a61af66fc99e Initial load
duke
parents:
diff changeset
4934
a61af66fc99e Initial load
duke
parents:
diff changeset
4935 void StubGenerator_generate(CodeBuffer* code, bool all) {
a61af66fc99e Initial load
duke
parents:
diff changeset
4936 StubGenerator g(code, all);
a61af66fc99e Initial load
duke
parents:
diff changeset
4937 }