Mercurial > hg > graal-compiler
annotate src/cpu/x86/vm/nativeInst_x86.cpp @ 1172:b2b6a9bf6238

6894779: Loop Predication for Loop Optimizer in C2
Summary: Loop predication implementation
Reviewed-by: never, kvn

author    cfang
date      Tue, 12 Jan 2010 14:37:35 -0800
parents   dc7f315e41f7
children  c18cbe5936b8
/*
 * Copyright 1997-2008 Sun Microsystems, Inc.  All Rights Reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
 * CA 95054 USA or visit www.sun.com if you need additional information or
 * have any questions.
 *
 */

# include "incls/_precompiled.incl"
# include "incls/_nativeInst_x86.cpp.incl"

void NativeInstruction::wrote(int offset) {
  ICache::invalidate_word(addr_at(offset));
}


void NativeCall::verify() {
  // Make sure code pattern is actually a call imm32 instruction.
  int inst = ubyte_at(0);
  if (inst != instruction_code) {
    tty->print_cr("Addr: " INTPTR_FORMAT " Code: 0x%x", instruction_address(),
                  inst);
    fatal("not a call disp32");
  }
}

address NativeCall::destination() const {
  // Getting the destination of a call is not safe, because that call can
  // be getting patched while you are calling this.  There are only special
  // places where this can be called, but they are not automatically
  // verifiable by checking which locks are held.  The real solution is true
  // atomic patching on x86, not yet implemented.
  return return_address() + displacement();
}

void NativeCall::print() {
  tty->print_cr(PTR_FORMAT ": call " PTR_FORMAT,
                instruction_address(), destination());
}

// Inserts a native call instruction at a given pc
void NativeCall::insert(address code_pos, address entry) {
  intptr_t disp = (intptr_t)entry - ((intptr_t)code_pos + 1 + 4);
#ifdef AMD64
  guarantee(disp == (intptr_t)(jint)disp, "must be 32-bit offset");
#endif // AMD64
  *code_pos = instruction_code;
  *((int32_t *)(code_pos+1)) = (int32_t) disp;
  ICache::invalidate_range(code_pos, instruction_size);
}
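// (Note, illustrative: a call rel32 is encoded as 0xE8 followed by a 32-bit
// displacement relative to the end of the 5-byte instruction, hence the
// "code_pos + 1 + 4" above.  For example, a call at 0x1000 targeting 0x2000
// would get disp = 0x2000 - 0x1005 = 0xFFB, i.e. bytes E8 FB 0F 00 00.)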

// MT-safe patching of a call instruction.
// First patches the first word of the instruction with two jmps that jump
// to themselves (a spinlock).  Then patches the last byte, and then atomically
// replaces the jmps with the first 4 bytes of the new instruction.
void NativeCall::replace_mt_safe(address instr_addr, address code_buffer) {
  assert(Patching_lock->is_locked() ||
         SafepointSynchronize::is_at_safepoint(), "concurrent code patching");
  assert (instr_addr != NULL, "illegal address for code patching");

  NativeCall* n_call = nativeCall_at (instr_addr); // checking that it is a call
  if (os::is_MP()) {
    guarantee((intptr_t)instr_addr % BytesPerWord == 0, "must be aligned");
  }

  // Construct the dummy jmp: two 2-byte self-loops
  unsigned char patch[4];
  assert(sizeof(patch)==sizeof(jint), "sanity check");
  patch[0] = 0xEB;       // jmp rel8
  patch[1] = 0xFE;       // jmp to self
  patch[2] = 0xEB;
  patch[3] = 0xFE;
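  // (Note: 0xEB 0xFE is "jmp rel8" with displacement -2; rel8 is relative to
  // the end of the 2-byte instruction, so the jump targets its own first
  // byte and a thread landing here spins until the real bytes are restored.)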

  // First patch dummy jmp in place
  *(jint*)instr_addr = *(jint *)patch;

  // Invalidate.  Opteron requires a flush after every write.
  n_call->wrote(0);

  // Patch the fifth byte (index 4)
  instr_addr[4] = code_buffer[4];
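  // (Note: the self-loop now guards bytes 0-3, so byte 4 can be rewritten:
  // a thread that fetches the first word after this point spins at byte 0
  // and never decodes byte 4, while one that fetched earlier is assumed to
  // have read the complete old instruction.)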

  n_call->wrote(4);

  // Patch bytes 0-3
  *(jint*)instr_addr = *(jint *)code_buffer;

  n_call->wrote(0);

#ifdef ASSERT
  // verify patching
  for ( int i = 0; i < instruction_size; i++) {
    address ptr = (address)((intptr_t)code_buffer + i);
    int a_byte = (*ptr) & 0xFF;
    assert(*((address)((intptr_t)instr_addr + i)) == a_byte, "mt safe patching failed");
  }
#endif

}


// Similar to replace_mt_safe, but just changes the destination.  The
// important thing is that free-running threads are able to execute this
// call instruction at all times.  If the displacement field is aligned
// we can simply rely on atomicity of 32-bit writes to make sure other threads
// will see no intermediate states.  Otherwise, the first two bytes of the
// call are guaranteed to be aligned, and can be atomically patched to a
// self-loop to guard the instruction while we change the other bytes.

// We cannot rely on locks here, since the free-running threads must run at
// full speed.
//
// Used in the runtime linkage of calls; see class CompiledIC.
// (Cf. 4506997 and 4479829, where threads witnessed garbage displacements.)
void NativeCall::set_destination_mt_safe(address dest) {
  debug_only(verify());
  // Make sure patching code is locked.  No two threads can patch at the same
  // time but one may be executing this code.
  assert(Patching_lock->is_locked() ||
         SafepointSynchronize::is_at_safepoint(), "concurrent code patching");
  // Both C1 and C2 should now be generating code which aligns the patched address
  // to be within a single cache line except that C1 does not do the alignment on
  // uniprocessor systems.
  bool is_aligned = ((uintptr_t)displacement_address() + 0) / cache_line_size ==
                    ((uintptr_t)displacement_address() + 3) / cache_line_size;

  guarantee(!os::is_MP() || is_aligned, "destination must be aligned");

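  // (Note, illustrative: with cache_line_size == 64, a 4-byte displacement
  // starting at offset 0x3e in a line fails the test above, since 0x3e/64 == 0
  // but (0x3e + 3)/64 == 1 -- the field straddles two lines, so a single
  // 32-bit store to it would not appear atomic to instruction fetch.)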
  if (is_aligned) {
    // Simple case:  The destination lies within a single cache line.
    set_destination(dest);
  } else if ((uintptr_t)instruction_address() / cache_line_size ==
             ((uintptr_t)instruction_address()+1) / cache_line_size) {
    // Tricky case:  The instruction prefix lies within a single cache line.
    intptr_t disp = dest - return_address();
#ifdef AMD64
    guarantee(disp == (intptr_t)(jint)disp, "must be 32-bit offset");
#endif // AMD64

    int call_opcode = instruction_address()[0];

    // First patch dummy jump in place:
    {
      u_char patch_jump[2];
      patch_jump[0] = 0xEB;       // jmp rel8
      patch_jump[1] = 0xFE;       // jmp to self

      assert(sizeof(patch_jump)==sizeof(short), "sanity check");
      *(short*)instruction_address() = *(short*)patch_jump;
    }
    // Invalidate.  Opteron requires a flush after every write.
    wrote(0);

    // (Note: We assume any reader which has already started to read
    // the unpatched call will completely read the whole unpatched call
    // without seeing the next writes we are about to make.)

    // Next, patch the last three bytes:
    u_char patch_disp[5];
    patch_disp[0] = call_opcode;
    *(int32_t*)&patch_disp[1] = (int32_t)disp;
    assert(sizeof(patch_disp)==instruction_size, "sanity check");
    for (int i = sizeof(short); i < instruction_size; i++)
      instruction_address()[i] = patch_disp[i];

    // Invalidate.  Opteron requires a flush after every write.
    wrote(sizeof(short));

    // (Note: We assume that any reader which reads the opcode we are
    // about to repatch will also read the writes we just made.)

    // Finally, overwrite the jump:
    *(short*)instruction_address() = *(short*)patch_disp;
    // Invalidate.  Opteron requires a flush after every write.
    wrote(0);

    debug_only(verify());
    guarantee(destination() == dest, "patch succeeded");
  } else {
    // Impossible:  One or the other must be atomically writable.
    ShouldNotReachHere();
  }
}


void NativeMovConstReg::verify() {
#ifdef AMD64
  // make sure code pattern is actually a mov reg64, imm64 instruction
  if ((ubyte_at(0) != Assembler::REX_W && ubyte_at(0) != Assembler::REX_WB) ||
      (ubyte_at(1) & (0xff ^ register_mask)) != 0xB8) {
    print();
    fatal("not a REX.W[B] mov reg64, imm64");
  }
#else
  // make sure code pattern is actually a mov reg, imm32 instruction
  u_char test_byte = *(u_char*)instruction_address();
  u_char test_byte_2 = test_byte & ( 0xff ^ register_mask);
  if (test_byte_2 != instruction_code) fatal("not a mov reg, imm32");
#endif // AMD64
}


void NativeMovConstReg::print() {
  tty->print_cr(PTR_FORMAT ": mov reg, " INTPTR_FORMAT,
                instruction_address(), data());
}

//-------------------------------------------------------------------

int NativeMovRegMem::instruction_start() const {
  int off = 0;
  u_char instr_0 = ubyte_at(off);

  // First check to see if we have a (prefixed or not) xor
  if ( instr_0 >= instruction_prefix_wide_lo &&      // 0x40
       instr_0 <= instruction_prefix_wide_hi) {      // 0x4f
    off++;
    instr_0 = ubyte_at(off);
  }

  if (instr_0 == instruction_code_xor) {
    off += 2;
    instr_0 = ubyte_at(off);
  }

  // Now look for the real instruction and the many prefix/size specifiers.

  if (instr_0 == instruction_operandsize_prefix ) {  // 0x66
    off++;               // Not SSE instructions
    instr_0 = ubyte_at(off);
  }

  if ( instr_0 == instruction_code_xmm_ss_prefix ||  // 0xf3
       instr_0 == instruction_code_xmm_sd_prefix) {  // 0xf2
    off++;
    instr_0 = ubyte_at(off);
  }

  if ( instr_0 >= instruction_prefix_wide_lo &&      // 0x40
       instr_0 <= instruction_prefix_wide_hi) {      // 0x4f
    off++;
    instr_0 = ubyte_at(off);
  }

  if (instr_0 == instruction_extended_prefix ) {     // 0x0f
    off++;
  }

  return off;
}
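// (Note, illustrative: for the SSE2 load "movsd xmm0, [rbp+disp32]", encoded
// F2 0F 10 85 xx xx xx xx, the scan above consumes the 0xF2 prefix and the
// 0x0F escape byte and returns 2, so instruction_address() points at the
// 0x10 opcode byte.)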

address NativeMovRegMem::instruction_address() const {
  return addr_at(instruction_start());
}

address NativeMovRegMem::next_instruction_address() const {
  address ret = instruction_address() + instruction_size;
  u_char instr_0 = *(u_char*) instruction_address();
  switch (instr_0) {
  case instruction_operandsize_prefix:
    fatal("should have skipped instruction_operandsize_prefix");
    break;

  case instruction_extended_prefix:
    fatal("should have skipped instruction_extended_prefix");
    break;

  case instruction_code_mem2reg_movslq: // 0x63
  case instruction_code_mem2reg_movzxb: // 0xB6
  case instruction_code_mem2reg_movsxb: // 0xBE
  case instruction_code_mem2reg_movzxw: // 0xB7
  case instruction_code_mem2reg_movsxw: // 0xBF
  case instruction_code_reg2mem:        // 0x89 (q/l)
  case instruction_code_mem2reg:        // 0x8B (q/l)
  case instruction_code_reg2memb:       // 0x88
  case instruction_code_mem2regb:       // 0x8a

  case instruction_code_float_s:        // 0xd9 fld_s a
  case instruction_code_float_d:        // 0xdd fld_d a

  case instruction_code_xmm_load:       // 0x10
  case instruction_code_xmm_store:      // 0x11
  case instruction_code_xmm_lpd:        // 0x12
    {
      // If there is an SIB then instruction is longer than expected
      u_char mod_rm = *(u_char*)(instruction_address() + 1);
      if ((mod_rm & 7) == 0x4) {
        ret++;
      }
    }
    break;

  case instruction_code_xor:
    fatal("should have skipped xor lead in");
    break;

  default:
    fatal("not a NativeMovRegMem");
  }
  return ret;
}

int NativeMovRegMem::offset() const {
  int off = data_offset + instruction_start();
  u_char mod_rm = *(u_char*)(instruction_address() + 1);
  // nnnn(r12|rsp) isn't coded as simple mod/rm since that is
  // the encoding used to signal an SIB byte, which pushes the
  // displacement field one byte further out.
  if ((mod_rm & 7) == 0x4) {
    off++;
  }
  return int_at(off);
}
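// (Note, illustrative: "mov eax, [rsp+0x10]" with a 32-bit displacement is
// encoded 8B 84 24 10 00 00 00; the ModRM byte 0x84 has rm == 100b, which
// signals an SIB byte (here 0x24), so the displacement starts one byte
// later than in the plain ModRM form.)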

void NativeMovRegMem::set_offset(int x) {
  int off = data_offset + instruction_start();
  u_char mod_rm = *(u_char*)(instruction_address() + 1);
  // nnnn(r12|rsp) isn't coded as simple mod/rm since that is
  // the encoding used to signal an SIB byte, which pushes the
  // displacement field one byte further out.
  if ((mod_rm & 7) == 0x4) {
    off++;
  }
  set_int_at(off, x);
}

void NativeMovRegMem::verify() {
  // make sure code pattern is actually a mov [reg+offset], reg instruction
  u_char test_byte = *(u_char*)instruction_address();
  switch (test_byte) {
    case instruction_code_reg2memb:  // 0x88 movb a, r
    case instruction_code_reg2mem:   // 0x89 movl a, r (can be movq in 64bit)
    case instruction_code_mem2regb:  // 0x8a movb r, a
    case instruction_code_mem2reg:   // 0x8b movl r, a (can be movq in 64bit)
      break;

    case instruction_code_mem2reg_movslq: // 0x63 movsql r, a
    case instruction_code_mem2reg_movzxb: // 0xb6 movzbl r, a (movzxb)
    case instruction_code_mem2reg_movzxw: // 0xb7 movzwl r, a (movzxw)
    case instruction_code_mem2reg_movsxb: // 0xbe movsbl r, a (movsxb)
    case instruction_code_mem2reg_movsxw: // 0xbf movswl r, a (movsxw)
      break;

    case instruction_code_float_s:   // 0xd9 fld_s a
    case instruction_code_float_d:   // 0xdd fld_d a
    case instruction_code_xmm_load:  // 0x10 movsd xmm, a
    case instruction_code_xmm_store: // 0x11 movsd a, xmm
    case instruction_code_xmm_lpd:   // 0x12 movlpd xmm, a
      break;

    default:
      fatal ("not a mov [reg+offs], reg instruction");
  }
}


void NativeMovRegMem::print() {
  tty->print_cr("0x%x: mov reg, [reg + %x]", instruction_address(), offset());
}

//-------------------------------------------------------------------

void NativeLoadAddress::verify() {
  // make sure code pattern is actually a lea reg, [reg+offset] instruction
  u_char test_byte = *(u_char*)instruction_address();
#ifdef _LP64
  if ( (test_byte == instruction_prefix_wide ||
        test_byte == instruction_prefix_wide_extended) ) {
    test_byte = *(u_char*)(instruction_address() + 1);
  }
#endif // _LP64
  if ( ! ((test_byte == lea_instruction_code)
          LP64_ONLY(|| (test_byte == mov64_instruction_code) ))) {
    fatal ("not a lea reg, [reg+offs] instruction");
  }
}


void NativeLoadAddress::print() {
  tty->print_cr("0x%x: lea [reg + %x], reg", instruction_address(), offset());
}

//--------------------------------------------------------------------------------

void NativeJump::verify() {
  if (*(u_char*)instruction_address() != instruction_code) {
    fatal("not a jump instruction");
  }
}


void NativeJump::insert(address code_pos, address entry) {
  intptr_t disp = (intptr_t)entry - ((intptr_t)code_pos + 1 + 4);
#ifdef AMD64
  guarantee(disp == (intptr_t)(int32_t)disp, "must be 32-bit offset");
#endif // AMD64

  *code_pos = instruction_code;
  *((int32_t*)(code_pos + 1)) = (int32_t)disp;

  ICache::invalidate_range(code_pos, instruction_size);
}
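// (Note: the displacement math is identical to NativeCall::insert above;
// only the opcode differs -- 0xE9 for jmp rel32 versus 0xE8 for call rel32.)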

void NativeJump::check_verified_entry_alignment(address entry, address verified_entry) {
  // Patching to not_entrant can happen while activations of the method are
  // in use.  The patching in that instance must happen only when certain
  // alignment restrictions are true.  These guarantees check those
  // conditions.
#ifdef AMD64
  const int linesize = 64;
#else
  const int linesize = 32;
#endif // AMD64

  // Must be wordSize aligned
  guarantee(((uintptr_t) verified_entry & (wordSize -1)) == 0,
            "illegal address for code patching 2");
  // First 5 bytes must be within the same cache line - 4827828
  guarantee((uintptr_t) verified_entry / linesize ==
            ((uintptr_t) verified_entry + 4) / linesize,
            "illegal address for code patching 3");
}


// MT-safe inserting of a jump over an unknown instruction sequence (used by nmethod::makeZombie)
// The problem: jmp <dest> is a 5-byte instruction, but writes can be atomic only for 4 bytes.
// First patches the first word atomically to be a jump to itself.
// Then patches the last byte, and then atomically patches the first word (4 bytes),
// thus inserting the desired jump.
// This code is mt-safe with the following conditions: the entry point is 4-byte aligned,
// the entry point is in the same cache line as the unverified entry point, and the
// instruction being patched is >= 5 bytes (the size of the patch).
//
// In C2 the 5+ byte sized instruction is enforced by code in MachPrologNode::emit.
// In C1 the restriction is enforced by CodeEmitter::method_entry.
//
void NativeJump::patch_verified_entry(address entry, address verified_entry, address dest) {
  // complete jump instruction (to be inserted) is in code_buffer;
  unsigned char code_buffer[5];
  code_buffer[0] = instruction_code;
  intptr_t disp = (intptr_t)dest - ((intptr_t)verified_entry + 1 + 4);
#ifdef AMD64
  guarantee(disp == (intptr_t)(int32_t)disp, "must be 32-bit offset");
#endif // AMD64
  *(int32_t*)(code_buffer + 1) = (int32_t)disp;

  check_verified_entry_alignment(entry, verified_entry);

  // Can't call nativeJump_at() because it asserts that a jump exists
  NativeJump* n_jump = (NativeJump*) verified_entry;

  // Construct the dummy jmp: two 2-byte self-loops
  unsigned char patch[4];
  assert(sizeof(patch)==sizeof(int32_t), "sanity check");
  patch[0] = 0xEB;       // jmp rel8
  patch[1] = 0xFE;       // jmp to self
  patch[2] = 0xEB;
  patch[3] = 0xFE;

  // First patch dummy jmp in place
  *(int32_t*)verified_entry = *(int32_t *)patch;

  n_jump->wrote(0);

  // Patch the fifth byte (from the jump instruction)
  verified_entry[4] = code_buffer[4];

  n_jump->wrote(4);

  // Patch bytes 0-3 (from the jump instruction)
  *(int32_t*)verified_entry = *(int32_t *)code_buffer;
  // Invalidate.  Opteron requires a flush after every write.
  n_jump->wrote(0);

}
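
// (Note: this is the same three-step protocol as NativeCall::replace_mt_safe
// above -- self-loop, flush, write the byte outside the guarded word, flush,
// then atomically restore the first word from the new instruction bytes.)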

void NativePopReg::insert(address code_pos, Register reg) {
  assert(reg->encoding() < 8, "no space for REX");
  assert(NativePopReg::instruction_size == sizeof(char), "right address unit for update");
  *code_pos = (u_char)(instruction_code | reg->encoding());
  ICache::invalidate_range(code_pos, instruction_size);
}


void NativeIllegalInstruction::insert(address code_pos) {
  assert(NativeIllegalInstruction::instruction_size == sizeof(short), "right address unit for update");
  *(short *)code_pos = instruction_code;
  ICache::invalidate_range(code_pos, instruction_size);
}

void NativeGeneralJump::verify() {
  assert(((NativeInstruction *)this)->is_jump() ||
         ((NativeInstruction *)this)->is_cond_jump(), "not a general jump instruction");
}


void NativeGeneralJump::insert_unconditional(address code_pos, address entry) {
  intptr_t disp = (intptr_t)entry - ((intptr_t)code_pos + 1 + 4);
#ifdef AMD64
  guarantee(disp == (intptr_t)(int32_t)disp, "must be 32-bit offset");
#endif // AMD64

  *code_pos = unconditional_long_jump;
  *((int32_t *)(code_pos+1)) = (int32_t) disp;
  ICache::invalidate_range(code_pos, instruction_size);
}


// MT-safe patching of a long jump instruction.
// First patches the first word of the instruction with two jmps that jump
// to themselves (a spinlock).  Then patches the last byte, and then atomically
// replaces the jmps with the first 4 bytes of the new instruction.
void NativeGeneralJump::replace_mt_safe(address instr_addr, address code_buffer) {
  assert (instr_addr != NULL, "illegal address for code patching (4)");
  NativeGeneralJump* n_jump = nativeGeneralJump_at (instr_addr); // checking that it is a jump

  // Temporary code: a dummy jmp made of two 2-byte self-loops
  unsigned char patch[4];
  assert(sizeof(patch)==sizeof(int32_t), "sanity check");
  patch[0] = 0xEB;       // jmp rel8
  patch[1] = 0xFE;       // jmp to self
  patch[2] = 0xEB;
  patch[3] = 0xFE;

  // First patch dummy jmp in place
  *(int32_t*)instr_addr = *(int32_t *)patch;
  n_jump->wrote(0);

  // Patch the fifth byte (index 4)
  instr_addr[4] = code_buffer[4];

  n_jump->wrote(4);

  // Patch bytes 0-3
  *(jint*)instr_addr = *(jint *)code_buffer;

  n_jump->wrote(0);

#ifdef ASSERT
  // verify patching
  for ( int i = 0; i < instruction_size; i++) {
    address ptr = (address)((intptr_t)code_buffer + i);
    int a_byte = (*ptr) & 0xFF;
    assert(*((address)((intptr_t)instr_addr + i)) == a_byte, "mt safe patching failed");
  }
#endif

}


address NativeGeneralJump::jump_destination() const {
  int op_code = ubyte_at(0);
  bool is_rel32off = (op_code == 0xE9 || op_code == 0x0F);
  int offset = (op_code == 0x0F) ? 2 : 1;
  int length = offset + ((is_rel32off) ? 4 : 1);

  if (is_rel32off)
    return addr_at(0) + length + int_at(offset);
  else
    return addr_at(0) + length + sbyte_at(offset);
}
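// (Note, illustrative: 0xE9 is jmp rel32 (5 bytes, displacement at offset 1),
// 0x0F introduces a two-byte jcc rel32 (6 bytes, displacement at offset 2),
// and anything else is treated as a short jump with a signed 8-bit
// displacement at offset 1; in each case the destination is the address of
// the next instruction plus the displacement.)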
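
// (Note: 0xcc is the one-byte int3 breakpoint opcode; the expression below
// reads a 32-bit word at the instruction address and masks the low byte to
// test just the first instruction byte.)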
bool NativeInstruction::is_dtrace_trap() {
  return (*(int32_t*)this & 0xff) == 0xcc;
}