Thu, 27 May 2010 18:01:56 -0700
6916623: Align object to 16 bytes to use Compressed Oops with java heap up to 64Gb
Summary: Added new product ObjectAlignmentInBytes flag to control object alignment.
Reviewed-by: twisti, ysr, iveresov
1 /*
2 * Copyright 1997-2010 Sun Microsystems, Inc. All Rights Reserved.
3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4 *
5 * This code is free software; you can redistribute it and/or modify it
6 * under the terms of the GNU General Public License version 2 only, as
7 * published by the Free Software Foundation.
8 *
9 * This code is distributed in the hope that it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
12 * version 2 for more details (a copy is included in the LICENSE file that
13 * accompanied this code).
14 *
15 * You should have received a copy of the GNU General Public License version
16 * 2 along with this work; if not, write to the Free Software Foundation,
17 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
18 *
19 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
20 * CA 95054 USA or visit www.sun.com if you need additional information or
21 * have any questions.
22 *
23 */
25 typedef class BytecodeInterpreter* interpreterState;
27 class CodeBlob;
30 // A frame represents a physical stack frame (an activation). Frames
31 // can be C or Java frames, and the Java frames can be interpreted or
32 // compiled. In contrast, vframes represent source-level activations,
33 // so that one physical frame can correspond to multiple source level
34 // frames because of inlining.
36 class frame VALUE_OBJ_CLASS_SPEC {
37 private:
38 // Instance variables:
39 intptr_t* _sp; // stack pointer (from Thread::last_Java_sp)
40 address _pc; // program counter (the next instruction after the call)
42 CodeBlob* _cb; // CodeBlob that "owns" pc
43 enum deopt_state {
44 not_deoptimized,
45 is_deoptimized,
46 unknown
47 };
49 deopt_state _deopt_state;
51 public:
52 // Constructors
53 frame();
55 // Accessors
57 // pc: Returns the pc at which this frame will continue normally.
58 // It must point at the beginning of the next instruction to execute.
59 address pc() const { return _pc; }
61 // This returns the pc that if you were in the debugger you'd see. Not
62 // the idealized value in the frame object. This undoes the magic conversion
63 // that happens for deoptimized frames. In addition it makes the value the
64 // hardware would want to see in the native frame. The only user (at this point)
65 // is deoptimization. It likely no one else should ever use it.
66 address raw_pc() const;
68 void set_pc( address newpc );
70 intptr_t* sp() const { return _sp; }
71 void set_sp( intptr_t* newsp ) { _sp = newsp; }
74 CodeBlob* cb() const { return _cb; }
76 // patching operations
77 void patch_pc(Thread* thread, address pc);
79 // Every frame needs to return a unique id which distinguishes it from all other frames.
80 // For sparc and ia32 use sp. ia64 can have memory frames that are empty so multiple frames
81 // will have identical sp values. For ia64 the bsp (fp) value will serve. No real frame
82 // should have an id() of NULL so it is a distinguishing value for an unmatchable frame.
83 // We also have relationals which allow comparing a frame to anoth frame's id() allow
84 // us to distinguish younger (more recent activation) from older (less recent activations)
85 // A NULL id is only valid when comparing for equality.
87 intptr_t* id(void) const;
88 bool is_younger(intptr_t* id) const;
89 bool is_older(intptr_t* id) const;
91 // testers
93 // Compares for strict equality. Rarely used or needed.
94 // It can return a different result than f1.id() == f2.id()
95 bool equal(frame other) const;
97 // type testers
98 bool is_interpreted_frame() const;
99 bool is_java_frame() const;
100 bool is_entry_frame() const; // Java frame called from C?
101 bool is_native_frame() const;
102 bool is_runtime_frame() const;
103 bool is_compiled_frame() const;
104 bool is_safepoint_blob_frame() const;
105 bool is_deoptimized_frame() const;
107 // testers
108 bool is_first_frame() const; // oldest frame? (has no sender)
109 bool is_first_java_frame() const; // same for Java frame
111 bool is_interpreted_frame_valid(JavaThread* thread) const; // performs sanity checks on interpreted frames.
113 // tells whether this frame is marked for deoptimization
114 bool should_be_deoptimized() const;
116 // tells whether this frame can be deoptimized
117 bool can_be_deoptimized() const;
119 // returns the frame size in stack slots
120 int frame_size(RegisterMap* map) const;
122 // returns the sending frame
123 frame sender(RegisterMap* map) const;
125 // for Profiling - acting on another frame. walks sender frames
126 // if valid.
127 frame profile_find_Java_sender_frame(JavaThread *thread);
128 bool safe_for_sender(JavaThread *thread);
130 // returns the sender, but skips conversion frames
131 frame real_sender(RegisterMap* map) const;
133 // returns the the sending Java frame, skipping any intermediate C frames
134 // NB: receiver must not be first frame
135 frame java_sender() const;
137 private:
138 // Helper methods for better factored code in frame::sender
139 frame sender_for_compiled_frame(RegisterMap* map) const;
140 frame sender_for_entry_frame(RegisterMap* map) const;
141 frame sender_for_interpreter_frame(RegisterMap* map) const;
142 frame sender_for_native_frame(RegisterMap* map) const;
144 // All frames:
146 // A low-level interface for vframes:
148 public:
150 intptr_t* addr_at(int index) const { return &fp()[index]; }
151 intptr_t at(int index) const { return *addr_at(index); }
153 // accessors for locals
154 oop obj_at(int offset) const { return *obj_at_addr(offset); }
155 void obj_at_put(int offset, oop value) { *obj_at_addr(offset) = value; }
157 jint int_at(int offset) const { return *int_at_addr(offset); }
158 void int_at_put(int offset, jint value) { *int_at_addr(offset) = value; }
160 oop* obj_at_addr(int offset) const { return (oop*) addr_at(offset); }
162 oop* adjusted_obj_at_addr(methodOop method, int index) { return obj_at_addr(adjust_offset(method, index)); }
164 private:
165 jint* int_at_addr(int offset) const { return (jint*) addr_at(offset); }
167 public:
168 // Link (i.e., the pointer to the previous frame)
169 intptr_t* link() const;
170 void set_link(intptr_t* addr);
172 // Return address
173 address sender_pc() const;
175 // Support for deoptimization
176 void deoptimize(JavaThread* thread, bool thread_is_known_safe = false);
178 // The frame's original SP, before any extension by an interpreted callee;
179 // used for packing debug info into vframeArray objects and vframeArray lookup.
180 intptr_t* unextended_sp() const;
182 // returns the stack pointer of the calling frame
183 intptr_t* sender_sp() const;
186 // Interpreter frames:
188 private:
189 intptr_t** interpreter_frame_locals_addr() const;
190 intptr_t* interpreter_frame_bcx_addr() const;
191 intptr_t* interpreter_frame_mdx_addr() const;
193 public:
194 // Locals
196 // The _at version returns a pointer because the address is used for GC.
197 intptr_t* interpreter_frame_local_at(int index) const;
199 void interpreter_frame_set_locals(intptr_t* locs);
201 // byte code index/pointer (use these functions for unchecked frame access only!)
202 intptr_t interpreter_frame_bcx() const { return *interpreter_frame_bcx_addr(); }
203 void interpreter_frame_set_bcx(intptr_t bcx);
205 // byte code index
206 jint interpreter_frame_bci() const;
207 void interpreter_frame_set_bci(jint bci);
209 // byte code pointer
210 address interpreter_frame_bcp() const;
211 void interpreter_frame_set_bcp(address bcp);
213 // Unchecked access to the method data index/pointer.
214 // Only use this if you know what you are doing.
215 intptr_t interpreter_frame_mdx() const { return *interpreter_frame_mdx_addr(); }
216 void interpreter_frame_set_mdx(intptr_t mdx);
218 // method data pointer
219 address interpreter_frame_mdp() const;
220 void interpreter_frame_set_mdp(address dp);
222 // Find receiver out of caller's (compiled) argument list
223 oop retrieve_receiver(RegisterMap *reg_map);
225 // Return the monitor owner and BasicLock for compiled synchronized
226 // native methods so that biased locking can revoke the receiver's
227 // bias if necessary. Takes optional nmethod for this frame as
228 // argument to avoid performing repeated lookups in code cache.
229 BasicLock* compiled_synchronized_native_monitor (nmethod* nm = NULL);
230 oop compiled_synchronized_native_monitor_owner(nmethod* nm = NULL);
232 // Find receiver for an invoke when arguments are just pushed on stack (i.e., callee stack-frame is
233 // not setup)
234 oop interpreter_callee_receiver(symbolHandle signature) { return *interpreter_callee_receiver_addr(signature); }
237 oop* interpreter_callee_receiver_addr(symbolHandle signature);
240 // expression stack (may go up or down, direction == 1 or -1)
241 public:
242 intptr_t* interpreter_frame_expression_stack() const;
243 static jint interpreter_frame_expression_stack_direction();
245 // The _at version returns a pointer because the address is used for GC.
246 intptr_t* interpreter_frame_expression_stack_at(jint offset) const;
248 // top of expression stack
249 intptr_t* interpreter_frame_tos_at(jint offset) const;
250 intptr_t* interpreter_frame_tos_address() const;
253 jint interpreter_frame_expression_stack_size() const;
255 intptr_t* interpreter_frame_sender_sp() const;
257 #ifndef CC_INTERP
258 // template based interpreter deoptimization support
259 void set_interpreter_frame_sender_sp(intptr_t* sender_sp);
260 void interpreter_frame_set_monitor_end(BasicObjectLock* value);
261 #endif // CC_INTERP
263 // BasicObjectLocks:
264 //
265 // interpreter_frame_monitor_begin is higher in memory than interpreter_frame_monitor_end
266 // Interpreter_frame_monitor_begin points to one element beyond the oldest one,
267 // interpreter_frame_monitor_end points to the youngest one, or if there are none,
268 // it points to one beyond where the first element will be.
269 // interpreter_frame_monitor_size reports the allocation size of a monitor in the interpreter stack.
270 // this value is >= BasicObjectLock::size(), and may be rounded up
272 BasicObjectLock* interpreter_frame_monitor_begin() const;
273 BasicObjectLock* interpreter_frame_monitor_end() const;
274 BasicObjectLock* next_monitor_in_interpreter_frame(BasicObjectLock* current) const;
275 BasicObjectLock* previous_monitor_in_interpreter_frame(BasicObjectLock* current) const;
276 static int interpreter_frame_monitor_size();
278 void interpreter_frame_verify_monitor(BasicObjectLock* value) const;
280 // Tells whether the current interpreter_frame frame pointer
281 // corresponds to the old compiled/deoptimized fp
282 // The receiver used to be a top level frame
283 bool interpreter_frame_equals_unpacked_fp(intptr_t* fp);
285 // Return/result value from this interpreter frame
286 // If the method return type is T_OBJECT or T_ARRAY populates oop_result
287 // For other (non-T_VOID) the appropriate field in the jvalue is populated
288 // with the result value.
289 // Should only be called when at method exit when the method is not
290 // exiting due to an exception.
291 BasicType interpreter_frame_result(oop* oop_result, jvalue* value_result);
293 public:
294 // Method & constant pool cache
295 methodOop interpreter_frame_method() const;
296 void interpreter_frame_set_method(methodOop method);
297 methodOop* interpreter_frame_method_addr() const;
298 constantPoolCacheOop* interpreter_frame_cache_addr() const;
300 public:
301 // Entry frames
302 JavaCallWrapper* entry_frame_call_wrapper() const;
303 intptr_t* entry_frame_argument_at(int offset) const;
305 // tells whether there is another chunk of Delta stack above
306 bool entry_frame_is_first() const;
308 // Compiled frames:
310 public:
311 // Given the index of a local, and the number of argument words
312 // in this stack frame, tell which word of the stack frame to find
313 // the local in. Arguments are stored above the ofp/rpc pair,
314 // while other locals are stored below it.
315 // Since monitors (BasicLock blocks) are also assigned indexes,
316 // but may have different storage requirements, their presence
317 // can also affect the calculation of offsets.
318 static int local_offset_for_compiler(int local_index, int nof_args, int max_nof_locals, int max_nof_monitors);
320 // Given the index of a monitor, etc., tell which word of the
321 // stack frame contains the start of the BasicLock block.
322 // Note that the local index by convention is the __higher__
323 // of the two indexes allocated to the block.
324 static int monitor_offset_for_compiler(int local_index, int nof_args, int max_nof_locals, int max_nof_monitors);
326 // Tell the smallest value that local_offset_for_compiler will attain.
327 // This is used to help determine how much stack frame to allocate.
328 static int min_local_offset_for_compiler(int nof_args, int max_nof_locals, int max_nof_monitors);
330 // Tells if this register must be spilled during a call.
331 // On Intel, all registers are smashed by calls.
332 static bool volatile_across_calls(Register reg);
335 // Safepoints
337 public:
338 oop saved_oop_result(RegisterMap* map) const;
339 void set_saved_oop_result(RegisterMap* map, oop obj);
341 // For debugging
342 private:
343 const char* print_name() const;
345 public:
346 void print_value() const { print_value_on(tty,NULL); }
347 void print_value_on(outputStream* st, JavaThread *thread) const;
348 void print_on(outputStream* st) const;
349 void interpreter_frame_print_on(outputStream* st) const;
350 void print_on_error(outputStream* st, char* buf, int buflen, bool verbose = false) const;
352 // Conversion from an VMReg to physical stack location
353 oop* oopmapreg_to_location(VMReg reg, const RegisterMap* regmap) const;
355 // Oops-do's
356 void oops_compiled_arguments_do(symbolHandle signature, bool has_receiver, const RegisterMap* reg_map, OopClosure* f);
357 void oops_interpreted_do(OopClosure* f, const RegisterMap* map, bool query_oop_map_cache = true);
359 private:
360 void oops_interpreted_arguments_do(symbolHandle signature, bool has_receiver, OopClosure* f);
362 // Iteration of oops
363 void oops_do_internal(OopClosure* f, CodeBlobClosure* cf, RegisterMap* map, bool use_interpreter_oop_map_cache);
364 void oops_entry_do(OopClosure* f, const RegisterMap* map);
365 void oops_code_blob_do(OopClosure* f, CodeBlobClosure* cf, const RegisterMap* map);
366 int adjust_offset(methodOop method, int index); // helper for above fn
367 public:
368 // Memory management
369 void oops_do(OopClosure* f, CodeBlobClosure* cf, RegisterMap* map) { oops_do_internal(f, cf, map, true); }
370 void nmethods_do(CodeBlobClosure* cf);
372 void gc_prologue();
373 void gc_epilogue();
374 void pd_gc_epilog();
376 # ifdef ENABLE_ZAP_DEAD_LOCALS
377 private:
378 class CheckValueClosure: public OopClosure {
379 public:
380 void do_oop(oop* p);
381 void do_oop(narrowOop* p) { ShouldNotReachHere(); }
382 };
383 static CheckValueClosure _check_value;
385 class CheckOopClosure: public OopClosure {
386 public:
387 void do_oop(oop* p);
388 void do_oop(narrowOop* p) { ShouldNotReachHere(); }
389 };
390 static CheckOopClosure _check_oop;
392 static void check_derived_oop(oop* base, oop* derived);
394 class ZapDeadClosure: public OopClosure {
395 public:
396 void do_oop(oop* p);
397 void do_oop(narrowOop* p) { ShouldNotReachHere(); }
398 };
399 static ZapDeadClosure _zap_dead;
401 public:
402 // Zapping
403 void zap_dead_locals (JavaThread* thread, const RegisterMap* map);
404 void zap_dead_interpreted_locals(JavaThread* thread, const RegisterMap* map);
405 void zap_dead_compiled_locals (JavaThread* thread, const RegisterMap* map);
406 void zap_dead_entry_locals (JavaThread* thread, const RegisterMap* map);
407 void zap_dead_deoptimized_locals(JavaThread* thread, const RegisterMap* map);
408 # endif
409 // Verification
410 void verify(const RegisterMap* map);
411 static bool verify_return_pc(address x);
412 static bool is_bci(intptr_t bcx);
413 // Usage:
414 // assert(frame::verify_return_pc(return_address), "must be a return pc");
416 int pd_oop_map_offset_adjustment() const;
418 # include "incls/_frame_pd.hpp.incl"
419 };
422 //
423 // StackFrameStream iterates through the frames of a thread starting from
424 // top most frame. It automatically takes care of updating the location of
425 // all (callee-saved) registers. Notice: If a thread is stopped at
426 // a safepoint, all registers are saved, not only the callee-saved ones.
427 //
428 // Use:
429 //
430 // for(StackFrameStream fst(thread); !fst.is_done(); fst.next()) {
431 // ...
432 // }
433 //
434 class StackFrameStream : public StackObj {
435 private:
436 frame _fr;
437 RegisterMap _reg_map;
438 bool _is_done;
439 public:
440 StackFrameStream(JavaThread *thread, bool update = true);
442 // Iteration
443 bool is_done() { return (_is_done) ? true : (_is_done = _fr.is_first_frame(), false); }
444 void next() { if (!_is_done) _fr = _fr.sender(&_reg_map); }
446 // Query
447 frame *current() { return &_fr; }
448 RegisterMap* register_map() { return &_reg_map; }
449 };