2007-12-01 00:00:00 +00:00
/*
2015-02-13 14:37:35 +01:00
* Copyright ( c ) 1997 , 2015 , Oracle and / or its affiliates . All rights reserved .
2007-12-01 00:00:00 +00:00
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER .
*
* This code is free software ; you can redistribute it and / or modify it
* under the terms of the GNU General Public License version 2 only , as
* published by the Free Software Foundation .
*
* This code is distributed in the hope that it will be useful , but WITHOUT
* ANY WARRANTY ; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE . See the GNU General Public License
* version 2 for more details ( a copy is included in the LICENSE file that
* accompanied this code ) .
*
* You should have received a copy of the GNU General Public License version
* 2 along with this work ; if not , write to the Free Software Foundation ,
* Inc . , 51 Franklin St , Fifth Floor , Boston , MA 02110 - 1301 USA .
*
2010-05-27 19:08:38 -07:00
* Please contact Oracle , 500 Oracle Parkway , Redwood Shores , CA 94065 USA
* or visit www . oracle . com if you need additional information or have any
* questions .
2007-12-01 00:00:00 +00:00
*
*/
2010-11-23 13:22:55 -08:00
# include "precompiled.hpp"
2012-11-30 15:23:16 -08:00
# include "asm/macroAssembler.hpp"
# include "asm/macroAssembler.inline.hpp"
2014-01-08 10:25:50 -08:00
# include "ci/ciReplay.hpp"
2010-11-23 13:22:55 -08:00
# include "classfile/systemDictionary.hpp"
# include "code/exceptionHandlerTable.hpp"
# include "code/nmethod.hpp"
2014-07-03 08:46:44 +02:00
# include "compiler/compileBroker.hpp"
2010-11-23 13:22:55 -08:00
# include "compiler/compileLog.hpp"
2012-11-30 15:23:16 -08:00
# include "compiler/disassembler.hpp"
2010-11-23 13:22:55 -08:00
# include "compiler/oopMap.hpp"
# include "opto/addnode.hpp"
# include "opto/block.hpp"
# include "opto/c2compiler.hpp"
# include "opto/callGenerator.hpp"
# include "opto/callnode.hpp"
# include "opto/cfgnode.hpp"
# include "opto/chaitin.hpp"
# include "opto/compile.hpp"
# include "opto/connode.hpp"
2015-02-18 18:14:07 +01:00
# include "opto/convertnode.hpp"
2010-11-23 13:22:55 -08:00
# include "opto/divnode.hpp"
# include "opto/escape.hpp"
# include "opto/idealGraphPrinter.hpp"
# include "opto/loopnode.hpp"
# include "opto/machnode.hpp"
# include "opto/macro.hpp"
# include "opto/matcher.hpp"
2013-10-11 12:06:14 +02:00
# include "opto/mathexactnode.hpp"
2010-11-23 13:22:55 -08:00
# include "opto/memnode.hpp"
# include "opto/mulnode.hpp"
2014-04-01 09:05:20 -07:00
# include "opto/narrowptrnode.hpp"
2010-11-23 13:22:55 -08:00
# include "opto/node.hpp"
# include "opto/opcodes.hpp"
# include "opto/output.hpp"
# include "opto/parse.hpp"
# include "opto/phaseX.hpp"
# include "opto/rootnode.hpp"
# include "opto/runtime.hpp"
# include "opto/stringopts.hpp"
# include "opto/type.hpp"
# include "opto/vectornode.hpp"
# include "runtime/arguments.hpp"
2015-02-13 14:37:35 +01:00
# include "runtime/sharedRuntime.hpp"
2010-11-23 13:22:55 -08:00
# include "runtime/signature.hpp"
# include "runtime/stubRoutines.hpp"
# include "runtime/timer.hpp"
# include "utilities/copy.hpp"
2007-12-01 00:00:00 +00:00
2010-12-03 01:34:31 -08:00
// -------------------- Compile::mach_constant_base_node -----------------------
// Constant table base node singleton.
// Returns the MachConstantBaseNode cached in _mach_constant_base_node.
// The node is created on the first call, at which point C->root() is passed
// to add_req() on the new node; later calls return the same pointer.
MachConstantBaseNode * Compile : : mach_constant_base_node ( ) {
if ( _mach_constant_base_node = = NULL ) {
2014-06-02 08:07:29 +02:00
// First request: allocate the node and remember it.
_mach_constant_base_node = new MachConstantBaseNode ( ) ;
2010-12-03 01:34:31 -08:00
_mach_constant_base_node - > add_req ( C - > root ( ) ) ;
}
return _mach_constant_base_node ;
}
2007-12-01 00:00:00 +00:00
/// Support for intrinsics.
// Return the index at which m must be inserted (or already exists).
// The sort order is by the address of the ciMethod, with is_virtual as minor key.
int Compile : : intrinsic_insertion_index ( ciMethod * m , bool is_virtual ) {
# ifdef ASSERT
for ( int i = 1 ; i < _intrinsics - > length ( ) ; i + + ) {
CallGenerator * cg1 = _intrinsics - > at ( i - 1 ) ;
CallGenerator * cg2 = _intrinsics - > at ( i ) ;
assert ( cg1 - > method ( ) ! = cg2 - > method ( )
? cg1 - > method ( ) < cg2 - > method ( )
: cg1 - > is_virtual ( ) < cg2 - > is_virtual ( ) ,
" compiler intrinsics list must stay sorted " ) ;
}
# endif
// Binary search sorted list, in decreasing intervals [lo, hi].
int lo = 0 , hi = _intrinsics - > length ( ) - 1 ;
while ( lo < = hi ) {
int mid = ( uint ) ( hi + lo ) / 2 ;
ciMethod * mid_m = _intrinsics - > at ( mid ) - > method ( ) ;
if ( m < mid_m ) {
hi = mid - 1 ;
} else if ( m > mid_m ) {
lo = mid + 1 ;
} else {
// look at minor sort key
bool mid_virt = _intrinsics - > at ( mid ) - > is_virtual ( ) ;
if ( is_virtual < mid_virt ) {
hi = mid - 1 ;
} else if ( is_virtual > mid_virt ) {
lo = mid + 1 ;
} else {
return mid ; // exact match
}
}
}
return lo ; // inexact match
}
// Adds cg to the _intrinsics list at the slot computed by
// intrinsic_insertion_index(), so the list keeps the order that function's
// binary search depends on. The list itself is allocated here on first use.
// In ASSERT builds, registering a second generator with the same method and
// is_virtual value as the entry already at that slot trips an assert.
void Compile : : register_intrinsic ( CallGenerator * cg ) {
if ( _intrinsics = = NULL ) {
2012-12-23 17:08:22 +01:00
_intrinsics = new ( comp_arena ( ) ) GrowableArray < CallGenerator * > ( comp_arena ( ) , 60 , 0 , NULL ) ;
2007-12-01 00:00:00 +00:00
}
// This code is stolen from ciObjectFactory::insert.
// Really, GrowableArray should have methods for
// insert_at, remove_at, and binary_search.
int len = _intrinsics - > length ( ) ;
int index = intrinsic_insertion_index ( cg - > method ( ) , cg - > is_virtual ( ) ) ;
if ( index = = len ) {
// Insertion point is one past the last element: a plain append is enough.
_intrinsics - > append ( cg ) ;
} else {
# ifdef ASSERT
CallGenerator * oldcg = _intrinsics - > at ( index ) ;
assert ( oldcg - > method ( ) ! = cg - > method ( ) | | oldcg - > is_virtual ( ) ! = cg - > is_virtual ( ) , " don't register twice " ) ;
# endif
// Grow the list by one by re-appending its last element, then move the
// elements in [index, len-2] up one slot and store cg in the freed slot.
_intrinsics - > append ( _intrinsics - > at ( len - 1 ) ) ;
int pos ;
for ( pos = len - 2 ; pos > = index ; pos - - ) {
_intrinsics - > at_put ( pos + 1 , _intrinsics - > at ( pos ) ) ;
}
_intrinsics - > at_put ( index , cg ) ;
}
// Sanity check: a lookup with the same key must now return cg.
assert ( find_intrinsic ( cg - > method ( ) , cg - > is_virtual ( ) ) = = cg , " registration worked " ) ;
}
// Looks up the CallGenerator registered for (m, is_virtual).
// Order of attempts:
//   1. an entry already present in _intrinsics with the same method and
//      is_virtual value;
//   2. if m's intrinsic id is not _none and is <= LAST_COMPILER_INLINE, a
//      generator obtained from make_vm_intrinsic(), which is then registered
//      so that later lookups hit case 1.
// Returns NULL when neither attempt yields a generator. When
// make_vm_intrinsic() returns NULL, the miss is recorded through
// gather_intrinsic_statistics() with the _intrinsic_disabled flag.
CallGenerator * Compile : : find_intrinsic ( ciMethod * m , bool is_virtual ) {
assert ( m - > is_loaded ( ) , " don't try this on unloaded methods " ) ;
if ( _intrinsics ! = NULL ) {
int index = intrinsic_insertion_index ( m , is_virtual ) ;
// The returned index may be only an insertion point, so verify that the
// entry found there really matches both keys.
if ( index < _intrinsics - > length ( )
& & _intrinsics - > at ( index ) - > method ( ) = = m
& & _intrinsics - > at ( index ) - > is_virtual ( ) = = is_virtual ) {
return _intrinsics - > at ( index ) ;
}
}
// Lazily create intrinsics for intrinsic IDs well-known in the runtime.
2009-07-21 16:56:06 -07:00
if ( m - > intrinsic_id ( ) ! = vmIntrinsics : : _none & &
m - > intrinsic_id ( ) < = vmIntrinsics : : LAST_COMPILER_INLINE ) {
2007-12-01 00:00:00 +00:00
CallGenerator * cg = make_vm_intrinsic ( m , is_virtual ) ;
if ( cg ! = NULL ) {
// Save it for next time:
register_intrinsic ( cg ) ;
return cg ;
} else {
gather_intrinsic_statistics ( m - > intrinsic_id ( ) , is_virtual , _intrinsic_disabled ) ;
}
}
return NULL ;
}
// Compile:: register_library_intrinsics and make_vm_intrinsic are defined
// in library_call.cpp.
# ifndef PRODUCT
// statistics gathering...
// Histogram tables indexed by vmIntrinsics::ID, zero-initialized.
// _intrinsic_hist_count holds a counter per id and _intrinsic_hist_flags a
// byte of _intrinsic_* flag bits per id. gather_intrinsic_statistics() also
// accumulates overall totals in the slot for vmIntrinsics::_none.
juint Compile : : _intrinsic_hist_count [ vmIntrinsics : : ID_LIMIT ] = { 0 } ;
jubyte Compile : : _intrinsic_hist_flags [ vmIntrinsics : : ID_LIMIT ] = { 0 } ;
bool Compile : : gather_intrinsic_statistics ( vmIntrinsics : : ID id , bool is_virtual , int flags ) {
assert ( id > vmIntrinsics : : _none & & id < vmIntrinsics : : ID_LIMIT , " oob " ) ;
int oflags = _intrinsic_hist_flags [ id ] ;
assert ( flags ! = 0 , " what happened? " ) ;
if ( is_virtual ) {
flags | = _intrinsic_virtual ;
}
bool changed = ( flags ! = oflags ) ;
if ( ( flags & _intrinsic_worked ) ! = 0 ) {
juint count = ( _intrinsic_hist_count [ id ] + = 1 ) ;
if ( count = = 1 ) {
changed = true ; // first time
}
// increment the overall count also:
_intrinsic_hist_count [ vmIntrinsics : : _none ] + = 1 ;
}
if ( changed ) {
if ( ( ( oflags ^ flags ) & _intrinsic_virtual ) ! = 0 ) {
// Something changed about the intrinsic's virtuality.
if ( ( flags & _intrinsic_virtual ) ! = 0 ) {
// This is the first use of this intrinsic as a virtual call.
if ( oflags ! = 0 ) {
// We already saw it as a non-virtual, so note both cases.
flags | = _intrinsic_both ;
}
} else if ( ( oflags & _intrinsic_both ) = = 0 ) {
// This is the first use of this intrinsic as a non-virtual
flags | = _intrinsic_both ;
}
}
_intrinsic_hist_flags [ id ] = ( jubyte ) ( oflags | flags ) ;
}
// update the overall flags also:
_intrinsic_hist_flags [ vmIntrinsics : : _none ] | = ( jubyte ) flags ;
return changed ;
}
// Writes a textual list of the Compile::_intrinsic_* bits set in 'flags' into
// 'buf' and returns a pointer to the second character of 'buf' (the first
// character is expected to be the leading separator and is skipped).
//   flags - bit set to describe
//   buf   - caller-supplied output buffer; the text is built with strcat()
//           and no length is checked here, so the caller must size it for
//           all five names
// If no known bit is set, a lone separator is stored so that the returned
// string is empty.
static char * format_flags ( int flags , char * buf ) {
buf [ 0 ] = 0 ;
if ( ( flags & Compile : : _intrinsic_worked ) ! = 0 ) strcat ( buf , " ,worked " ) ;
if ( ( flags & Compile : : _intrinsic_failed ) ! = 0 ) strcat ( buf , " ,failed " ) ;
if ( ( flags & Compile : : _intrinsic_disabled ) ! = 0 ) strcat ( buf , " ,disabled " ) ;
if ( ( flags & Compile : : _intrinsic_virtual ) ! = 0 ) strcat ( buf , " ,virtual " ) ;
// Note: the _intrinsic_both bit is reported under the name "nonvirtual".
if ( ( flags & Compile : : _intrinsic_both ) ! = 0 ) strcat ( buf , " ,nonvirtual " ) ;
if ( buf [ 0 ] = = 0 ) strcat ( buf , " , " ) ;
assert ( buf [ 0 ] = = ' , ' , " must be " ) ;
return & buf [ 1 ] ;
}
// Prints the intrinsic usage histogram to tty: one line per intrinsic id
// whose flag byte or count is non-zero, followed by a "total" line built from
// the vmIntrinsics::_none slot. When xtty is non-NULL the output is bracketed
// by xtty->head()/xtty->tail() calls. A ttyLocker is held for the whole body.
void Compile : : print_intrinsic_statistics ( ) {
// Scratch buffer handed to format_flags() for each printed line.
char flagsbuf [ 100 ] ;
ttyLocker ttyl ;
if ( xtty ! = NULL ) xtty - > head ( " statistics type='intrinsic' " ) ;
tty - > print_cr ( " Compiler intrinsic usage: " ) ;
juint total = _intrinsic_hist_count [ vmIntrinsics : : _none ] ;
if ( total = = 0 ) total = 1 ; // avoid div0 in case of no successes
// PRINT_STAT_LINE prints count, percentage of 'total', name and flag text.
// It reads the local 'total' and is not #undef'ed after this function.
# define PRINT_STAT_LINE(name, c, f) \
tty - > print_cr ( " %4d (%4.1f%%) %s (%s) " , ( int ) ( c ) , ( ( c ) * 100.0 ) / total , name , f ) ;
// Walk every id after _none; the _none slot itself is printed last as the total.
for ( int index = 1 + ( int ) vmIntrinsics : : _none ; index < ( int ) vmIntrinsics : : ID_LIMIT ; index + + ) {
vmIntrinsics : : ID id = ( vmIntrinsics : : ID ) index ;
int flags = _intrinsic_hist_flags [ id ] ;
juint count = _intrinsic_hist_count [ id ] ;
// Skip ids for which nothing was ever recorded.
if ( ( flags | count ) ! = 0 ) {
PRINT_STAT_LINE ( vmIntrinsics : : name_at ( id ) , count , format_flags ( flags , flagsbuf ) ) ;
}
}
PRINT_STAT_LINE ( " total " , total , format_flags ( _intrinsic_hist_flags [ vmIntrinsics : : _none ] , flagsbuf ) ) ;
if ( xtty ! = NULL ) xtty - > tail ( " statistics " ) ;
}
void Compile : : print_statistics ( ) {
{ ttyLocker ttyl ;
if ( xtty ! = NULL ) xtty - > head ( " statistics type='opto' " ) ;
Parse : : print_statistics ( ) ;
PhaseCCP : : print_statistics ( ) ;
PhaseRegAlloc : : print_statistics ( ) ;
Scheduling : : print_statistics ( ) ;
PhasePeephole : : print_statistics ( ) ;
PhaseIdealLoop : : print_statistics ( ) ;
if ( xtty ! = NULL ) xtty - > tail ( " statistics " ) ;
}
if ( _intrinsic_hist_flags [ vmIntrinsics : : _none ] ! = 0 ) {
// put this under its own <statistics> element.
print_intrinsic_statistics ( ) ;
}
}
# endif //PRODUCT
// Support for bundling info
// Return the address of the Bundle slot for node n, i.e. the element of
// _node_bundling_base at position n->_idx. Asserts that n has valid bundle
// info first.
Bundle* Compile::node_bundling(const Node* n) {
  assert(valid_bundle_info(n), " oob ");
  return _node_bundling_base + n->_idx;
}
bool Compile : : valid_bundle_info ( const Node * n ) {
return ( _node_bundling_limit > n - > _idx ) ;
}
2009-11-12 09:24:21 -08:00
void Compile : : gvn_replace_by ( Node * n , Node * nn ) {
for ( DUIterator_Last imin , i = n - > last_outs ( imin ) ; i > = imin ; ) {
Node * use = n - > last_out ( i ) ;
bool is_in_table = initial_gvn ( ) - > hash_delete ( use ) ;
uint uses_found = 0 ;
for ( uint j = 0 ; j < use - > len ( ) ; j + + ) {
if ( use - > in ( j ) = = n ) {
if ( j < use - > req ( ) )
use - > set_req ( j , nn ) ;
else
use - > set_prec ( j , nn ) ;
uses_found + + ;
}
}
if ( is_in_table ) {
// reinsert into table
initial_gvn ( ) - > hash_find_insert ( use ) ;
}
record_for_igvn ( use ) ;
i - = uses_found ; // we deleted 1 or more copies of this edge
}
}
2012-11-27 17:24:15 -08:00
// True when n cannot be treated as a live Node: it is NULL, its address has
// the low bit set (uninitialized, etc.), or its first word equals badAddress
// (killed by Node::destruct). The checks run in that order and stop at the
// first one that holds, so n is only dereferenced after the first two pass.
static inline bool not_a_node(const Node* n) {
  return n == NULL
      || ((intptr_t)n & 1) != 0
      || *(address*)n == badAddress;
}
2009-11-12 09:24:21 -08:00
2007-12-01 00:00:00 +00:00
// Identify all nodes that are reachable from below, useful.
// Uses a breadth-first pass that records state in a Unique_Node_List;
// a recursive traversal is slower.
// Fills 'useful' with the nodes reachable from root() and from the cached top
// node by following input edges.
//   useful - worklist and result; it is iterated by index while new entries
//            are pushed onto it, so it grows during the loop
// NOTE(review): the loop relies on useful.push() not adding a node that is
// already present (presumably guaranteed by Unique_Node_List) - confirm.
void Compile : : identify_useful_nodes ( Unique_Node_List & useful ) {
2015-10-08 12:10:19 +02:00
int estimated_worklist_size = live_nodes ( ) ;
2007-12-01 00:00:00 +00:00
useful . map ( estimated_worklist_size , NULL ) ; // preallocate space
// Initialize worklist
if ( root ( ) ! = NULL ) { useful . push ( root ( ) ) ; }
// If 'top' is cached, declare it useful to preserve cached node
if ( cached_top_node ( ) ) { useful . push ( cached_top_node ( ) ) ; }
// Push all useful nodes onto the list, breadthfirst
for ( uint next = 0 ; next < useful . size ( ) ; + + next ) {
assert ( next < unique ( ) , " Unique useful nodes < total nodes " ) ;
Node * n = useful . at ( next ) ;
// Visit all len() input slots of n.
uint max = n - > len ( ) ;
for ( uint i = 0 ; i < max ; + + i ) {
Node * m = n - > in ( i ) ;
2012-11-27 17:24:15 -08:00
// Skip slots for which not_a_node() reports no usable node.
if ( not_a_node ( m ) ) continue ;
2007-12-01 00:00:00 +00:00
useful . push ( m ) ;
}
}
}
2012-11-27 17:24:15 -08:00
// Update dead_node_list with any missing dead nodes using useful
// list. Consider all non-useful nodes to be useless i.e., dead nodes.
void Compile : : update_dead_node_list ( Unique_Node_List & useful ) {
uint max_idx = unique ( ) ;
VectorSet & useful_node_set = useful . member_set ( ) ;
for ( uint node_idx = 0 ; node_idx < max_idx ; node_idx + + ) {
// If node with index node_idx is not in useful set,
// mark it as dead in dead node list.
if ( ! useful_node_set . test ( node_idx ) ) {
record_dead_node ( node_idx ) ;
}
}
}
2012-12-23 17:08:22 +01:00
void Compile : : remove_useless_late_inlines ( GrowableArray < CallGenerator * > * inlines , Unique_Node_List & useful ) {
int shift = 0 ;
for ( int i = 0 ; i < inlines - > length ( ) ; i + + ) {
CallGenerator * cg = inlines - > at ( i ) ;
CallNode * call = cg - > call_node ( ) ;
if ( shift > 0 ) {
inlines - > at_put ( i - shift , cg ) ;
}
if ( ! useful . member ( call ) ) {
shift + + ;
}
}
inlines - > trunc_to ( inlines - > length ( ) - shift ) ;
}
2007-12-01 00:00:00 +00:00
// Disconnect all useless nodes by disconnecting those at the boundary.
// Detaches everything that is not in 'useful' from the nodes that are:
//   1. for each useful node, removes its out-edges to non-useful nodes (and,
//      for SafePoint nodes, deletes their replaced-nodes info);
//   2. removes macro nodes and expensive nodes that are not useful;
//   3. prunes the three late-inline lists of generators whose call node is
//      not useful.
// Debug builds finish with verify_graph_edges().
void Compile : : remove_useless_nodes ( Unique_Node_List & useful ) {
uint next = 0 ;
2011-11-09 07:25:51 -08:00
while ( next < useful . size ( ) ) {
2007-12-01 00:00:00 +00:00
Node * n = useful . at ( next + + ) ;
2014-06-10 13:37:16 +02:00
if ( n - > is_SafePoint ( ) ) {
// We're done with a parsing phase. Replaced nodes are not valid
// beyond that point.
n - > as_SafePoint ( ) - > delete_replaced_nodes ( ) ;
}
2007-12-01 00:00:00 +00:00
// Use raw traversal of out edges since this code removes out edges
int max = n - > outcnt ( ) ;
2011-11-09 07:25:51 -08:00
for ( int j = 0 ; j < max ; + + j ) {
2007-12-01 00:00:00 +00:00
Node * child = n - > raw_out ( j ) ;
2011-11-09 07:25:51 -08:00
if ( ! useful . member ( child ) ) {
assert ( ! child - > is_top ( ) | | child ! = top ( ) ,
" If top is cached in Compile object it is in useful list " ) ;
2007-12-01 00:00:00 +00:00
// Only need to remove this out-edge to the useless node
n - > raw_del_out ( j ) ;
// Re-examine slot j and shrink the bound, since one out-edge is gone.
- - j ;
- - max ;
}
}
// A node left with a single, special user gets that user queued for IGVN.
if ( n - > outcnt ( ) = = 1 & & n - > has_special_unique_user ( ) ) {
2011-11-09 07:25:51 -08:00
record_for_igvn ( n - > unique_out ( ) ) ;
}
}
// Remove useless macro and predicate opaq nodes
// (iterating from the end, so removals do not disturb unvisited indices)
for ( int i = C - > macro_count ( ) - 1 ; i > = 0 ; i - - ) {
Node * n = C - > macro_node ( i ) ;
if ( ! useful . member ( n ) ) {
remove_macro_node ( n ) ;
2007-12-01 00:00:00 +00:00
}
}
2013-02-12 12:56:11 +01:00
// Remove useless expensive node
for ( int i = C - > expensive_count ( ) - 1 ; i > = 0 ; i - - ) {
Node * n = C - > expensive_node ( i ) ;
if ( ! useful . member ( n ) ) {
remove_expensive_node ( n ) ;
}
}
2012-12-23 17:08:22 +01:00
// clean up the late inline lists
remove_useless_late_inlines ( & _string_late_inlines , useful ) ;
2013-05-08 15:08:01 -07:00
remove_useless_late_inlines ( & _boxing_late_inlines , useful ) ;
2012-12-23 17:08:22 +01:00
remove_useless_late_inlines ( & _late_inlines , useful ) ;
2007-12-01 00:00:00 +00:00
debug_only ( verify_graph_edges ( true /*check for no_dead_code*/ ) ; )
}
//------------------------------frame_size_in_words-----------------------------
// frame_slots in units of words
int Compile : : frame_size_in_words ( ) const {
// shift is 0 in LP32 and 1 in LP64
const int shift = ( LogBytesPerWord - LogBytesPerInt ) ;
int words = _frame_slots > > shift ;
assert ( words < < shift = = _frame_slots , " frame size must be properly aligned in LP64 " ) ;
return words ;
}
2014-04-01 09:36:49 +02:00
// To bang the stack of this compiled method we use the stack size
// that the interpreter would need in case of a deoptimization. This
// removes the need to bang the stack in the deoptimization blob which
// in turn simplifies stack overflow handling.
// Returns the larger of (frame_size_in_bytes() + os::extra_bang_size_in_bytes())
// and _interpreter_frame_size.
int Compile : : bang_size_in_bytes ( ) const {
2014-09-04 13:11:25 +04:00
return MAX2 ( frame_size_in_bytes ( ) + os : : extra_bang_size_in_bytes ( ) , _interpreter_frame_size ) ;
2014-04-01 09:36:49 +02:00
}
2007-12-01 00:00:00 +00:00
// ============================================================================
//------------------------------CompileWrapper---------------------------------
// Stack-allocated scope object wrapped around one Compile.
// The constructor installs the Compile in the current ciEnv and resets its
// per-compilation state; the destructor ends the method, frees the scratch
// buffer blob if one exists, and clears the ciEnv's compiler data.
class CompileWrapper : public StackObj {
// The compilation this wrapper brackets.
Compile * const _compile ;
public :
CompileWrapper ( Compile * compile ) ;
~ CompileWrapper ( ) ;
} ;
// Makes 'compile' the active compilation of its ciEnv and initializes its
// per-compilation state.
//   compile - the Compile to activate; its env() must be ciEnv::current() and
//             that env must not already have compiler data set (asserted)
CompileWrapper : : CompileWrapper ( Compile * compile ) : _compile ( compile ) {
// the Compile* pointer is stored in the current ciEnv:
ciEnv * env = compile - > env ( ) ;
assert ( env = = ciEnv : : current ( ) , " must already be a ciEnv active " ) ;
assert ( env - > compiler_data ( ) = = NULL , " compile already active? " ) ;
env - > set_compiler_data ( compile ) ;
assert ( compile = = Compile : : current ( ) , " sanity " ) ;
// Reset the type dictionary and install a fresh clone map allocated in the
// compile arena.
compile - > set_type_dict ( NULL ) ;
2015-05-05 12:33:57 -07:00
compile - > set_clone_map ( new Dict ( cmpkey , hashkey , _compile - > comp_arena ( ) ) ) ;
compile - > clone_map ( ) . set_clone_idx ( 0 ) ;
2007-12-01 00:00:00 +00:00
// Clear the remaining cached type and index-set state before
// initializing the type arena and the Type system for this compile.
compile - > set_type_hwm ( NULL ) ;
compile - > set_type_last_size ( 0 ) ;
compile - > set_last_tf ( NULL , NULL ) ;
compile - > set_indexSet_arena ( NULL ) ;
compile - > set_indexSet_free_block_list ( NULL ) ;
compile - > init_type_arena ( ) ;
Type : : Initialize ( compile ) ;
// No scratch buffer yet; the destructor frees one if it was set later.
_compile - > set_scratch_buffer_blob ( NULL ) ;
_compile - > begin_method ( ) ;
2015-10-20 18:07:28 +02:00
// Clone-map debugging is enabled only when there is a method and the
// directive's CloneMapDebugOption is set.
_compile - > clone_map ( ) . set_debug ( _compile - > has_method ( ) & & _compile - > directive ( ) - > CloneMapDebugOption ) ;
2007-12-01 00:00:00 +00:00
}
// Tear down the compilation scope: end the method, release the scratch
// buffer blob when one was allocated, and detach the Compile from its ciEnv.
CompileWrapper::~CompileWrapper() {
  _compile->end_method();
  if (_compile->scratch_buffer_blob() != NULL) {
    BufferBlob::free(_compile->scratch_buffer_blob());
  }
  _compile->env()->set_compiler_data(NULL);
}
//----------------------------print_compile_messages---------------------------
// Emits diagnostic output at the start of a compilation. The whole body is
// compiled only in non-PRODUCT builds. With PrintOpto set it prints a banner
// for each optimization that this compile has turned off relative to the
// global flag (load subsuming, escape analysis, boxing elimination) and the
// compile id. Independently of PrintOpto, it triggers BREAKPOINT when the
// directive's BreakAtCompileOption is set.
void Compile : : print_compile_messages ( ) {
# ifndef PRODUCT
// Check if recompiling
if ( _subsume_loads = = false & & PrintOpto ) {
// Recompiling without allowing machine instructions to subsume loads
tty - > print_cr ( " ********************************************************* " ) ;
tty - > print_cr ( " ** Bailout: Recompile without subsuming loads ** " ) ;
tty - > print_cr ( " ********************************************************* " ) ;
}
2008-03-06 10:30:17 -08:00
if ( _do_escape_analysis ! = DoEscapeAnalysis & & PrintOpto ) {
// Recompiling without escape analysis
tty - > print_cr ( " ********************************************************* " ) ;
tty - > print_cr ( " ** Bailout: Recompile without escape analysis ** " ) ;
tty - > print_cr ( " ********************************************************* " ) ;
}
2013-05-08 15:08:01 -07:00
if ( _eliminate_boxing ! = EliminateAutoBox & & PrintOpto ) {
// Recompiling without boxing elimination
tty - > print_cr ( " ********************************************************* " ) ;
tty - > print_cr ( " ** Bailout: Recompile without boxing elimination ** " ) ;
tty - > print_cr ( " ********************************************************* " ) ;
}
2015-10-20 18:07:28 +02:00
if ( C - > directive ( ) - > BreakAtCompileOption ) {
2009-02-27 13:27:09 -08:00
// Open the debugger when compiling this method.
2007-12-01 00:00:00 +00:00
tty - > print ( " ### Breaking when compiling: " ) ;
method ( ) - > print_short_name ( ) ;
tty - > cr ( ) ;
BREAKPOINT ;
}
if ( PrintOpto ) {
// Print the compile id, prefixed with an OSR marker for OSR compilations.
if ( is_osr_compilation ( ) ) {
tty - > print ( " [OSR]%3d " , _compile_id ) ;
} else {
tty - > print ( " %3d " , _compile_id ) ;
}
}
# endif
}
2010-12-29 10:41:43 -08:00
//-----------------------init_scratch_buffer_blob------------------------------
// Construct a temporary BufferBlob and cache it for this compile.
2010-12-03 01:34:31 -08:00
// Ensures a scratch BufferBlob is cached for this compile and points the
// scratch relocation memory at its tail.
//   const_size - required size of the constant section
// An existing blob is reused when const_size fits within
// _scratch_const_size; otherwise it is freed and a new blob of
// MAX_inst_size + MAX_stubs_size + const_size bytes is created. If creation
// fails, a failure is recorded and the function returns without setting the
// scratch locs memory.
void Compile : : init_scratch_buffer_blob ( int const_size ) {
2010-12-29 10:41:43 -08:00
// If there is already a scratch buffer blob allocated and the
// constant section is big enough, use it. Otherwise free the
// current and allocate a new one.
BufferBlob * blob = scratch_buffer_blob ( ) ;
if ( ( blob ! = NULL ) & & ( const_size < = _scratch_const_size ) ) {
// Use the current blob.
} else {
if ( blob ! = NULL ) {
BufferBlob : : free ( blob ) ;
}
ResourceMark rm ;
_scratch_const_size = const_size ;
int size = ( MAX_inst_size + MAX_stubs_size + _scratch_const_size ) ;
blob = BufferBlob : : create ( " Compile::scratch_buffer " , size ) ;
// Record the buffer blob for next time.
set_scratch_buffer_blob ( blob ) ;
// Have we run out of code space?
if ( scratch_buffer_blob ( ) = = NULL ) {
// Let CompileBroker disable further compilations.
record_failure ( " Not enough space for scratch buffer in CodeCache " ) ;
return ;
}
2008-05-21 10:45:07 -07:00
}
2007-12-01 00:00:00 +00:00
// Initialize the relocation buffers
2010-08-25 05:27:54 -07:00
// The cast applies before the subtraction, so this steps back
// MAX_locs_size relocInfo elements from the end of the blob's content.
relocInfo * locs_buf = ( relocInfo * ) blob - > content_end ( ) - MAX_locs_size ;
2007-12-01 00:00:00 +00:00
set_scratch_locs_memory ( locs_buf ) ;
}
//-----------------------scratch_emit_size-------------------------------------
// Helper function that computes size by emitting code
// Computes the size of node n's code by emitting it into the scratch buffer.
//   n - node to measure; for a MachBranch its label is temporarily replaced
//       by a local fake label and restored afterwards
// Returns buf.insts_size() of the temporary CodeBuffer after emission.
// Requires that the scratch buffer blob and scratch locs memory have already
// been set up (asserted). The in_scratch_emit_size flag is set for the
// duration of the call.
uint Compile : : scratch_emit_size ( const Node * n ) {
2010-12-03 01:34:31 -08:00
// Start scratch_emit_size section.
set_in_scratch_emit_size ( true ) ;
2007-12-01 00:00:00 +00:00
// Emit into a trash buffer and count bytes emitted.
// This is a pretty expensive way to compute a size,
// but it works well enough if seldom used.
// All common fixed-size instructions are given a size
// method by the AD file.
// Note that the scratch buffer blob and locs memory are
// allocated at the beginning of the compile task, and
// may be shared by several calls to scratch_emit_size.
// The allocation of the scratch buffer blob is particularly
// expensive, since it has to grab the code cache lock.
BufferBlob * blob = this - > scratch_buffer_blob ( ) ;
assert ( blob ! = NULL , " Initialize BufferBlob at start " ) ;
assert ( blob - > size ( ) > MAX_inst_size , " sanity " ) ;
relocInfo * locs_buf = scratch_locs_memory ( ) ;
2010-08-25 05:27:54 -07:00
address blob_begin = blob - > content_begin ( ) ;
2007-12-01 00:00:00 +00:00
// The code area ends where the relocation memory begins.
address blob_end = ( address ) locs_buf ;
2010-08-25 05:27:54 -07:00
assert ( blob - > content_contains ( blob_end ) , " sanity " ) ;
2007-12-01 00:00:00 +00:00
CodeBuffer buf ( blob_begin , blob_end - blob_begin ) ;
2010-12-03 01:34:31 -08:00
buf . initialize_consts_size ( _scratch_const_size ) ;
2007-12-01 00:00:00 +00:00
buf . initialize_stubs_size ( MAX_stubs_size ) ;
assert ( locs_buf ! = NULL , " sanity " ) ;
2010-12-03 01:34:31 -08:00
// Split the relocation memory into three equal parts, one each for the
// consts, insts and stubs sections.
int lsize = MAX_locs_size / 3 ;
buf . consts ( ) - > initialize_shared_locs ( & locs_buf [ lsize * 0 ] , lsize ) ;
buf . insts ( ) - > initialize_shared_locs ( & locs_buf [ lsize * 1 ] , lsize ) ;
buf . stubs ( ) - > initialize_shared_locs ( & locs_buf [ lsize * 2 ] , lsize ) ;
// Do the emission.
2011-07-21 11:25:07 -07:00
Label fakeL ; // Fake label for branch instructions.
2011-08-16 11:53:57 -07:00
Label * saveL = NULL ;
uint save_bnum = 0 ;
bool is_branch = n - > is_MachBranch ( ) ;
2011-07-21 11:25:07 -07:00
if ( is_branch ) {
// Bind the fake label in the scratch buffer, save the branch's real
// label and block number, and point the branch at the fake label.
MacroAssembler masm ( & buf ) ;
masm . bind ( fakeL ) ;
2011-08-16 11:53:57 -07:00
n - > as_MachBranch ( ) - > save_label ( & saveL , & save_bnum ) ;
n - > as_MachBranch ( ) - > label_set ( & fakeL , 0 ) ;
2011-07-21 11:25:07 -07:00
}
2007-12-01 00:00:00 +00:00
n - > emit ( buf , this - > regalloc ( ) ) ;
2015-07-29 08:05:21 +02:00
// Emitting into the scratch buffer should not fail
2015-09-29 11:02:08 +02:00
assert ( ! failing ( ) , " Must not have pending failure. Reason is: %s " , failure_reason ( ) ) ;
2015-07-29 08:05:21 +02:00
2011-08-16 11:53:57 -07:00
if ( is_branch ) // Restore label.
n - > as_MachBranch ( ) - > label_set ( saveL , save_bnum ) ;
2010-12-03 01:34:31 -08:00
// End scratch_emit_size section.
set_in_scratch_emit_size ( false ) ;
2010-08-25 05:27:54 -07:00
return buf . insts_size ( ) ;
2007-12-01 00:00:00 +00:00
}
// ============================================================================
//------------------------------Compile standard-------------------------------
// Definition of the static Compile::_debug_idx, initialized to 100000.
// It is wrapped in debug_only(), so it is only present where that macro
// expands its argument.
debug_only ( int Compile : : _debug_idx = 100000 ; )
// Compile a method. entry_bci is -1 for normal compilations and indicates
// the continuation bci for on stack replacement.
2013-05-08 15:08:01 -07:00
Compile : : Compile ( ciEnv * ci_env , C2Compiler * compiler , ciMethod * target , int osr_bci ,
2015-10-20 18:07:28 +02:00
bool subsume_loads , bool do_escape_analysis , bool eliminate_boxing , DirectiveSet * directive )
2007-12-01 00:00:00 +00:00
: Phase ( Compiler ) ,
_env ( ci_env ) ,
2015-10-20 18:07:28 +02:00
_directive ( directive ) ,
2007-12-01 00:00:00 +00:00
_log ( ci_env - > log ( ) ) ,
_compile_id ( ci_env - > compile_id ( ) ) ,
_save_argument_registers ( false ) ,
_stub_name ( NULL ) ,
_stub_function ( NULL ) ,
_stub_entry_point ( NULL ) ,
_method ( target ) ,
_entry_bci ( osr_bci ) ,
_initial_gvn ( NULL ) ,
_for_igvn ( NULL ) ,
_warm_calls ( NULL ) ,
_subsume_loads ( subsume_loads ) ,
2008-03-06 10:30:17 -08:00
_do_escape_analysis ( do_escape_analysis ) ,
2013-05-08 15:08:01 -07:00
_eliminate_boxing ( eliminate_boxing ) ,
2007-12-01 00:00:00 +00:00
_failure_reason ( NULL ) ,
_code_buffer ( " Compile::Fill_buffer " ) ,
_orig_pc_slot ( 0 ) ,
_orig_pc_slot_offset_in_bytes ( 0 ) ,
2010-02-18 11:35:41 +01:00
_has_method_handle_invokes ( false ) ,
2010-12-03 01:34:31 -08:00
_mach_constant_base_node ( NULL ) ,
2007-12-01 00:00:00 +00:00
_node_bundling_limit ( 0 ) ,
_node_bundling_base ( NULL ) ,
2009-07-23 14:53:56 -07:00
_java_calls ( 0 ) ,
_inner_loops ( 0 ) ,
2010-12-03 01:34:31 -08:00
_scratch_const_size ( - 1 ) ,
_in_scratch_emit_size ( false ) ,
2012-11-27 17:24:15 -08:00
_dead_node_list ( comp_arena ( ) ) ,
_dead_node_count ( 0 ) ,
2007-12-01 00:00:00 +00:00
# ifndef PRODUCT
2015-10-20 18:07:28 +02:00
_trace_opto_output ( directive - > TraceOptoOutputOption ) ,
2013-11-22 12:14:09 -08:00
_in_dump_cnt ( 0 ) ,
2007-12-01 00:00:00 +00:00
_printer ( IdealGraphPrinter : : printer ( ) ) ,
# endif
2012-12-18 14:55:25 +01:00
_congraph ( NULL ) ,
2014-08-07 12:18:58 -07:00
_comp_arena ( mtCompiler ) ,
_node_arena ( mtCompiler ) ,
_old_arena ( mtCompiler ) ,
_Compile_types ( mtCompiler ) ,
2014-01-08 10:25:50 -08:00
_replay_inline_data ( NULL ) ,
2012-12-23 17:08:22 +01:00
_late_inlines ( comp_arena ( ) , 2 , 0 , NULL ) ,
_string_late_inlines ( comp_arena ( ) , 2 , 0 , NULL ) ,
2013-05-08 15:08:01 -07:00
_boxing_late_inlines ( comp_arena ( ) , 2 , 0 , NULL ) ,
2012-12-23 17:08:22 +01:00
_late_inlines_pos ( 0 ) ,
_number_of_mh_late_inlines ( 0 ) ,
_inlining_progress ( false ) ,
_inlining_incrementally ( false ) ,
2012-12-18 14:55:25 +01:00
_print_inlining_list ( NULL ) ,
2014-04-09 09:17:43 +02:00
_print_inlining_stream ( NULL ) ,
2013-10-19 12:16:43 +02:00
_print_inlining_idx ( 0 ) ,
2014-05-26 14:27:01 +02:00
_print_inlining_output ( NULL ) ,
2014-11-24 07:29:03 -08:00
_interpreter_frame_size ( 0 ) ,
_max_node_limit ( MaxNodeLimit ) {
2007-12-01 00:00:00 +00:00
C = this ;
2015-10-20 18:07:28 +02:00
# ifndef PRODUCT
if ( _printer ! = NULL ) {
_printer - > set_compile ( this ) ;
}
# endif
2007-12-01 00:00:00 +00:00
CompileWrapper cw ( this ) ;
2014-09-25 12:10:57 +04:00
if ( CITimeVerbose ) {
2007-12-01 00:00:00 +00:00
tty - > print ( " " ) ;
target - > holder ( ) - > name ( ) - > print ( ) ;
tty - > print ( " . " ) ;
target - > print_short_name ( ) ;
tty - > print ( " " ) ;
}
2014-09-25 12:10:57 +04:00
TraceTime t1 ( " Total compilation time " , & _t_totalCompilation , CITime , CITimeVerbose ) ;
TraceTime t2 ( NULL , & _t_methodCompilation , CITime , false ) ;
# ifndef PRODUCT
2015-10-20 18:07:28 +02:00
bool print_opto_assembly = directive - > PrintOptoAssemblyOption ;
2008-04-02 12:09:59 -07:00
if ( ! print_opto_assembly ) {
2015-10-20 18:07:28 +02:00
bool print_assembly = directive - > PrintAssemblyOption ;
2008-04-02 12:09:59 -07:00
if ( print_assembly & & ! Disassembler : : can_decode ( ) ) {
tty - > print_cr ( " PrintAssembly request changed to PrintOptoAssembly " ) ;
print_opto_assembly = true ;
}
}
set_print_assembly ( print_opto_assembly ) ;
2008-09-17 12:59:52 -07:00
set_parsed_irreducible_loop ( false ) ;
2014-01-08 10:25:50 -08:00
2015-10-20 18:07:28 +02:00
if ( directive - > ReplayInlineOption ) {
2014-01-08 10:25:50 -08:00
_replay_inline_data = ciReplay : : load_inline_data ( method ( ) , entry_bci ( ) , ci_env - > comp_level ( ) ) ;
}
2007-12-01 00:00:00 +00:00
# endif
2015-10-20 18:07:28 +02:00
set_print_inlining ( directive - > PrintInliningOption NOT_PRODUCT ( | | PrintOptoInlining ) ) ;
set_print_intrinsics ( directive - > PrintIntrinsicsOption ) ;
2014-05-02 16:44:54 -07:00
set_has_irreducible_loop ( true ) ; // conservative until build_loop_tree() reset it
2007-12-01 00:00:00 +00:00
2014-03-20 17:49:27 -07:00
if ( ProfileTraps RTM_OPT_ONLY ( | | UseRTMLocking ) ) {
2007-12-01 00:00:00 +00:00
// Make sure the method being compiled gets its own MDO,
// so we can at least track the decompile_count().
2014-03-20 17:49:27 -07:00
// Need MDO to record RTM code generation state.
2010-12-02 17:21:12 -08:00
method ( ) - > ensure_method_data ( ) ;
2007-12-01 00:00:00 +00:00
}
Init ( : : AliasLevel ) ;
print_compile_messages ( ) ;
2014-01-24 15:26:56 +04:00
_ilt = InlineTree : : build_inline_tree_root ( ) ;
2007-12-01 00:00:00 +00:00
// Even if NO memory addresses are used, MergeMem nodes must have at least 1 slice
assert ( num_alias_types ( ) > = AliasIdxRaw , " " ) ;
# define MINIMUM_NODE_HASH 1023
// Node list that Iterative GVN will start with
Unique_Node_List for_igvn ( comp_arena ( ) ) ;
set_for_igvn ( & for_igvn ) ;
// GVN that will be run immediately on new nodes
uint estimated_size = method ( ) - > code_size ( ) * 4 + 64 ;
estimated_size = ( estimated_size < MINIMUM_NODE_HASH ? MINIMUM_NODE_HASH : estimated_size ) ;
PhaseGVN gvn ( node_arena ( ) , estimated_size ) ;
set_initial_gvn ( & gvn ) ;
2014-04-09 09:17:43 +02:00
print_inlining_init ( ) ;
2007-12-01 00:00:00 +00:00
{ // Scope for timing the parser
2014-09-25 12:10:57 +04:00
TracePhase tp ( " parse " , & timers [ _t_parser ] ) ;
2007-12-01 00:00:00 +00:00
// Put top into the hash table ASAP.
initial_gvn ( ) - > transform_no_reclaim ( top ( ) ) ;
// Set up tf(), start(), and find a CallGenerator.
2011-04-07 09:53:20 -07:00
CallGenerator * cg = NULL ;
2007-12-01 00:00:00 +00:00
if ( is_osr_compilation ( ) ) {
const TypeTuple * domain = StartOSRNode : : osr_domain ( ) ;
const TypeTuple * range = TypeTuple : : make_range ( method ( ) - > signature ( ) ) ;
init_tf ( TypeFunc : : make ( domain , range ) ) ;
2014-06-02 08:07:29 +02:00
StartNode * s = new StartOSRNode ( root ( ) , domain ) ;
2007-12-01 00:00:00 +00:00
initial_gvn ( ) - > set_type_bottom ( s ) ;
init_start ( s ) ;
cg = CallGenerator : : for_osr ( method ( ) , entry_bci ( ) ) ;
} else {
// Normal case.
init_tf ( TypeFunc : : make ( method ( ) ) ) ;
2014-06-02 08:07:29 +02:00
StartNode * s = new StartNode ( root ( ) , tf ( ) - > domain ( ) ) ;
2007-12-01 00:00:00 +00:00
initial_gvn ( ) - > set_type_bottom ( s ) ;
init_start ( s ) ;
2011-04-07 09:53:20 -07:00
if ( method ( ) - > intrinsic_id ( ) = = vmIntrinsics : : _Reference_get & & UseG1GC ) {
// With java.lang.ref.Reference.get() we must go through the
// intrinsic when G1 is enabled - even when get() is the root
// method of the compile - so that, if necessary, the value in
// the referent field of the reference object gets recorded by
// the pre-barrier code.
// Specifically, if G1 is enabled, the value in the referent
// field is recorded by the G1 SATB pre barrier. This will
// result in the referent being marked live and the reference
// object removed from the list of discovered references during
// reference processing.
cg = find_intrinsic ( method ( ) , false ) ;
}
if ( cg = = NULL ) {
float past_uses = method ( ) - > interpreter_invocation_count ( ) ;
float expected_uses = past_uses ;
cg = CallGenerator : : for_inline ( method ( ) , expected_uses ) ;
}
2007-12-01 00:00:00 +00:00
}
if ( failing ( ) ) return ;
if ( cg = = NULL ) {
record_method_not_compilable_all_tiers ( " cannot parse method " ) ;
return ;
}
JVMState * jvms = build_start_state ( start ( ) , tf ( ) ) ;
2014-06-10 13:37:16 +02:00
if ( ( jvms = cg - > generate ( jvms ) ) = = NULL ) {
2014-12-22 11:21:20 +01:00
if ( ! failure_reason_is ( C2Compiler : : retry_class_loading_during_parsing ( ) ) ) {
record_method_not_compilable ( " method parse failed " ) ;
}
2007-12-01 00:00:00 +00:00
return ;
}
GraphKit kit ( jvms ) ;
if ( ! kit . stopped ( ) ) {
// Accept return values, and transfer control we know not where.
// This is done by a special, unique ReturnNode bound to root.
return_values ( kit . jvms ( ) ) ;
}
if ( kit . has_exceptions ( ) ) {
// Any exceptions that escape from this call must be rethrown
// to whatever caller is dynamically above us on the stack.
// This is done by a special, unique RethrowNode bound to root.
rethrow_exceptions ( kit . transfer_exceptions_into_jvms ( ) ) ;
}
2012-12-23 17:08:22 +01:00
assert ( IncrementalInline | | ( _late_inlines . length ( ) = = 0 & & ! has_mh_late_inlines ( ) ) , " incremental inlining is off " ) ;
2009-11-12 09:24:21 -08:00
2012-12-23 17:08:22 +01:00
if ( _late_inlines . length ( ) = = 0 & & ! has_mh_late_inlines ( ) & & ! failing ( ) & & has_stringbuilder ( ) ) {
inline_string_calls ( true ) ;
2009-11-12 09:24:21 -08:00
}
2012-12-23 17:08:22 +01:00
if ( failing ( ) ) return ;
2009-11-12 09:24:21 -08:00
2013-06-10 11:30:51 +02:00
print_method ( PHASE_BEFORE_REMOVEUSELESS , 3 ) ;
2008-09-17 12:59:52 -07:00
2007-12-01 00:00:00 +00:00
// Remove clutter produced by parsing.
if ( ! failing ( ) ) {
ResourceMark rm ;
PhaseRemoveUseless pru ( initial_gvn ( ) , & for_igvn ) ;
}
}
// Note: Large methods are capped off in do_one_bytecode().
if ( failing ( ) ) return ;
// After parsing, node notes are no longer automagic.
// They must be propagated by register_new_node_with_optimizer(),
// clone(), or the like.
set_default_node_notes ( NULL ) ;
for ( ; ; ) {
int successes = Inline_Warm ( ) ;
if ( failing ( ) ) return ;
if ( successes = = 0 ) break ;
}
// Drain the list.
Finish_Warm ( ) ;
# ifndef PRODUCT
2015-10-20 18:07:28 +02:00
if ( _printer & & _printer - > should_print ( 1 ) ) {
_printer - > print_inlining ( ) ;
2007-12-01 00:00:00 +00:00
}
# endif
if ( failing ( ) ) return ;
NOT_PRODUCT ( verify_graph_edges ( ) ; )
// Now optimize
Optimize ( ) ;
if ( failing ( ) ) return ;
NOT_PRODUCT ( verify_graph_edges ( ) ; )
# ifndef PRODUCT
if ( PrintIdeal ) {
ttyLocker ttyl ; // keep the following output all in one block
// This output goes directly to the tty, not the compiler log.
// To enable tools to match it up with the compilation activity,
// be sure to tag this tty output with the compile ID.
if ( xtty ! = NULL ) {
xtty - > head ( " ideal compile_id='%d'%s " , compile_id ( ) ,
is_osr_compilation ( ) ? " compile_kind='osr' " :
" " ) ;
}
root ( ) - > dump ( 9999 ) ;
if ( xtty ! = NULL ) {
xtty - > tail ( " ideal " ) ;
}
}
# endif
2013-11-05 01:57:18 -08:00
NOT_PRODUCT ( verify_barriers ( ) ; )
2014-01-08 10:25:50 -08:00
// Dump compilation data to replay it.
2015-10-20 18:07:28 +02:00
if ( directive - > DumpReplayOption ) {
2014-01-08 10:25:50 -08:00
env ( ) - > dump_replay_data ( _compile_id ) ;
}
2015-10-20 18:07:28 +02:00
if ( directive - > DumpInlineOption & & ( ilt ( ) ! = NULL ) ) {
2014-01-08 10:25:50 -08:00
env ( ) - > dump_inline_data ( _compile_id ) ;
}
2007-12-01 00:00:00 +00:00
// Now that we know the size of all the monitors we can add a fixed slot
// for the original deopt pc.
_orig_pc_slot = fixed_slots ( ) ;
int next_slot = _orig_pc_slot + ( sizeof ( address ) / VMRegImpl : : stack_slot_size ) ;
set_fixed_slots ( next_slot ) ;
2013-11-27 16:16:21 -08:00
// Compute when to use implicit null checks. Used by matching trap based
// nodes and NullCheck optimization.
set_allowed_deopt_reasons ( ) ;
2007-12-01 00:00:00 +00:00
// Now generate code
Code_Gen ( ) ;
if ( failing ( ) ) return ;
// Check if we want to skip execution of all compiled code.
{
# ifndef PRODUCT
if ( OptoNoExecute ) {
record_method_not_compilable ( " +OptoNoExecute " ) ; // Flag as failed
return ;
}
# endif
2014-09-25 12:10:57 +04:00
TracePhase tp ( " install_code " , & timers [ _t_registerMethod ] ) ;
2007-12-01 00:00:00 +00:00
if ( is_osr_compilation ( ) ) {
_code_offsets . set_value ( CodeOffsets : : Verified_Entry , 0 ) ;
_code_offsets . set_value ( CodeOffsets : : OSR_Entry , _first_block_size ) ;
} else {
_code_offsets . set_value ( CodeOffsets : : Verified_Entry , _first_block_size ) ;
_code_offsets . set_value ( CodeOffsets : : OSR_Entry , 0 ) ;
}
env ( ) - > register_method ( _method , _entry_bci ,
& _code_offsets ,
_orig_pc_slot_offset_in_bytes ,
code_buffer ( ) ,
frame_size_in_words ( ) , _oop_map_set ,
& _handler_table , & _inc_table ,
compiler ,
2012-09-17 19:39:07 -07:00
has_unsafe_access ( ) ,
2014-03-20 17:49:27 -07:00
SharedRuntime : : is_wide_vector ( max_vector_size ( ) ) ,
2015-10-20 18:07:28 +02:00
_directive ,
2014-03-20 17:49:27 -07:00
rtm_state ( )
2007-12-01 00:00:00 +00:00
) ;
2012-10-05 18:57:10 -07:00
if ( log ( ) ! = NULL ) // Print code cache state into compiler log
log ( ) - > code_cache_state ( ) ;
2007-12-01 00:00:00 +00:00
}
}
//------------------------------Compile----------------------------------------
// Compile a runtime stub.
//
// Builds the stub's ideal graph with GraphKit::gen_stub(), runs Code_Gen(),
// and, unless the compilation is failing, wraps the generated code in a
// RuntimeStub whose entry point is stored in _stub_entry_point.
//
//   ci_env             - compilation environment; stored in _env, and its
//                        log() is stored in _log
//   generator          - invoked once; its result is handed to init_tf()
//   stub_function      - stored in _stub_function and forwarded to gen_stub()
//   stub_name          - stored in _stub_name; forwarded to gen_stub() and
//                        to RuntimeStub::new_runtime_stub()
//   is_fancy_jump      - forwarded unchanged to gen_stub()
//   pass_tls           - forwarded unchanged to gen_stub()
//   save_arg_registers - stored in _save_argument_registers and passed to
//                        RuntimeStub::new_runtime_stub()
//   return_pc          - forwarded unchanged to gen_stub()
//   directive          - stored in _directive, which Init() reads
Compile : : Compile ( ciEnv * ci_env ,
TypeFunc_generator generator ,
address stub_function ,
const char * stub_name ,
int is_fancy_jump ,
bool pass_tls ,
bool save_arg_registers ,
2015-10-20 18:07:28 +02:00
bool return_pc ,
DirectiveSet * directive )
2007-12-01 00:00:00 +00:00
: Phase ( Compiler ) ,
_env ( ci_env ) ,
2015-10-20 18:07:28 +02:00
_directive ( directive ) ,
2007-12-01 00:00:00 +00:00
_log ( ci_env - > log ( ) ) ,
2013-02-13 10:25:09 +01:00
_compile_id ( 0 ) ,
2007-12-01 00:00:00 +00:00
_save_argument_registers ( save_arg_registers ) ,
_method ( NULL ) ,
_stub_name ( stub_name ) ,
_stub_function ( stub_function ) ,
_stub_entry_point ( NULL ) ,
_entry_bci ( InvocationEntryBci ) ,
_initial_gvn ( NULL ) ,
_for_igvn ( NULL ) ,
_warm_calls ( NULL ) ,
_orig_pc_slot ( 0 ) ,
_orig_pc_slot_offset_in_bytes ( 0 ) ,
_subsume_loads ( true ) ,
2008-03-06 10:30:17 -08:00
_do_escape_analysis ( false ) ,
2013-05-08 15:08:01 -07:00
_eliminate_boxing ( false ) ,
2007-12-01 00:00:00 +00:00
_failure_reason ( NULL ) ,
_code_buffer ( " Compile::Fill_buffer " ) ,
2010-02-18 11:35:41 +01:00
_has_method_handle_invokes ( false ) ,
2010-12-03 01:34:31 -08:00
_mach_constant_base_node ( NULL ) ,
2007-12-01 00:00:00 +00:00
_node_bundling_limit ( 0 ) ,
_node_bundling_base ( NULL ) ,
2009-07-23 14:53:56 -07:00
_java_calls ( 0 ) ,
_inner_loops ( 0 ) ,
2007-12-01 00:00:00 +00:00
# ifndef PRODUCT
_trace_opto_output ( TraceOptoOutput ) ,
2013-11-22 12:14:09 -08:00
_in_dump_cnt ( 0 ) ,
2007-12-01 00:00:00 +00:00
_printer ( NULL ) ,
# endif
2014-08-07 12:18:58 -07:00
_comp_arena ( mtCompiler ) ,
_node_arena ( mtCompiler ) ,
_old_arena ( mtCompiler ) ,
_Compile_types ( mtCompiler ) ,
2012-11-27 17:24:15 -08:00
_dead_node_list ( comp_arena ( ) ) ,
_dead_node_count ( 0 ) ,
2012-12-18 14:55:25 +01:00
_congraph ( NULL ) ,
2014-01-08 10:25:50 -08:00
_replay_inline_data ( NULL ) ,
2012-12-23 17:08:22 +01:00
_number_of_mh_late_inlines ( 0 ) ,
_inlining_progress ( false ) ,
_inlining_incrementally ( false ) ,
2012-12-18 14:55:25 +01:00
_print_inlining_list ( NULL ) ,
2014-04-09 09:17:43 +02:00
_print_inlining_stream ( NULL ) ,
2013-10-19 12:16:43 +02:00
_print_inlining_idx ( 0 ) ,
2014-05-26 14:27:01 +02:00
_print_inlining_output ( NULL ) ,
2014-04-01 09:36:49 +02:00
_allowed_reasons ( 0 ) ,
2014-11-24 07:29:03 -08:00
_interpreter_frame_size ( 0 ) ,
_max_node_limit ( MaxNodeLimit ) {
2007-12-01 00:00:00 +00:00
C = this ;
2014-09-25 12:10:57 +04:00
TraceTime t1 ( NULL , & _t_totalCompilation , CITime , false ) ;
TraceTime t2 ( NULL , & _t_stubCompilation , CITime , false ) ;
2007-12-01 00:00:00 +00:00
# ifndef PRODUCT
set_print_assembly ( PrintFrameConverterAssembly ) ;
2008-09-17 12:59:52 -07:00
set_parsed_irreducible_loop ( false ) ;
2007-12-01 00:00:00 +00:00
# endif
2014-05-02 16:44:54 -07:00
set_has_irreducible_loop ( false ) ; // no loops
2007-12-01 00:00:00 +00:00
CompileWrapper cw ( this ) ;
Init ( /*AliasLevel=*/ 0 ) ;
// The stub's signature comes from the caller-supplied generator.
init_tf ( ( * generator ) ( ) ) ;
{
// The following is a dummy for the sake of GraphKit::gen_stub
// (for_igvn and gvn are locals of this scope, so they only exist while the
// stub graph is being built).
Unique_Node_List for_igvn ( comp_arena ( ) ) ;
set_for_igvn ( & for_igvn ) ; // not used, but some GraphKit guys push on this
PhaseGVN gvn ( Thread : : current ( ) - > resource_area ( ) , 255 ) ;
set_initial_gvn ( & gvn ) ; // not significant, but GraphKit guys use it pervasively
gvn . transform_no_reclaim ( top ( ) ) ;
GraphKit kit ;
kit . gen_stub ( stub_function , stub_name , is_fancy_jump , pass_tls , return_pc ) ;
}
NOT_PRODUCT ( verify_graph_edges ( ) ; )
Code_Gen ( ) ;
// On failure _stub_entry_point keeps the NULL it was initialized with.
if ( failing ( ) ) return ;
// Entry point will be accessed using compile->stub_entry_point();
if ( code_buffer ( ) = = NULL ) {
Matcher : : soft_match_failure ( ) ;
} else {
if ( PrintAssembly & & ( WizardMode | | Verbose ) )
tty - > print_cr ( " ### Stub::%s " , stub_name ) ;
if ( ! failing ( ) ) {
assert ( _fixed_slots = = 0 , " no fixed slots used for runtime stubs " ) ;
// Make the NMethod
// For now we mark the frame as never safe for profile stackwalking
RuntimeStub * rs = RuntimeStub : : new_runtime_stub ( stub_name ,
code_buffer ( ) ,
CodeOffsets : : frame_never_safe ,
// _code_offsets.value(CodeOffsets::Frame_Complete),
frame_size_in_words ( ) ,
_oop_map_set ,
save_arg_registers ) ;
assert ( rs ! = NULL & & rs - > is_runtime_stub ( ) , " sanity check " ) ;
// Publish the stub's entry point for stub_entry_point() callers.
_stub_entry_point = rs - > entry_point ( ) ;
}
}
}
//------------------------------Init-------------------------------------------
// Prepare for a single compilation.
//
// Resets the per-compilation fields, creates the Root and TOP nodes, installs
// a fresh OopRecorder, DebugInformationRecorder and Dependencies on env(),
// seeds the optimization settings from global settings (LoopOptsCount, Inline,
// MaxInlineSize, ...) and from _directive, and builds the initial alias-type
// table with its first three entries (Top, Bot, Raw).
//
//   aliaslevel - requested alias analysis level. A request for level 3 is
//                lowered to 2 when _do_escape_analysis is false; the
//                resulting value is stored in _AliasLevel.
void Compile : : Init ( int aliaslevel ) {
_unique = 0 ;
_regalloc = NULL ;
_tf = NULL ; // filled in later
_top = NULL ; // cached later
_matcher = NULL ; // filled in later
_cfg = NULL ; // filled in later
set_24_bit_selection_and_mode ( Use24BitFP , false ) ;
_node_note_array = NULL ;
_default_node_notes = NULL ;
2014-07-25 10:06:17 +02:00
DEBUG_ONLY ( _modified_nodes = NULL ; ) // Used in Optimize()
2007-12-01 00:00:00 +00:00
_immutable_memory = NULL ; // filled in at first inquiry
// Globally visible Nodes
// First set TOP to NULL to give safe behavior during creation of RootNode
set_cached_top_node ( NULL ) ;
2014-06-02 08:07:29 +02:00
set_root ( new RootNode ( ) ) ;
2007-12-01 00:00:00 +00:00
// Now that you have a Root to point to, create the real TOP
2014-06-02 08:07:29 +02:00
set_cached_top_node ( new ConNode ( Type : : TOP ) ) ;
2007-12-01 00:00:00 +00:00
set_recent_alloc ( NULL , NULL ) ;
// Create Debug Information Recorder to record scopes, oopmaps, etc.
6964458: Reimplement class meta-data storage to use native memory
Remove PermGen, allocate meta-data in metaspace linked to class loaders, rewrite GC walking, rewrite and rename metadata to be C++ classes
Co-authored-by: Stefan Karlsson <stefan.karlsson@oracle.com>
Co-authored-by: Mikael Gerdin <mikael.gerdin@oracle.com>
Co-authored-by: Tom Rodriguez <tom.rodriguez@oracle.com>
Reviewed-by: jmasa, stefank, never, coleenp, kvn, brutisso, mgerdin, dholmes, jrose, twisti, roland
2012-09-01 13:25:18 -04:00
env ( ) - > set_oop_recorder ( new OopRecorder ( env ( ) - > arena ( ) ) ) ;
2007-12-01 00:00:00 +00:00
// The debug info recorder is built on top of the oop recorder installed above.
env ( ) - > set_debug_info ( new DebugInformationRecorder ( env ( ) - > oop_recorder ( ) ) ) ;
env ( ) - > set_dependencies ( new Dependencies ( env ( ) ) ) ;
_fixed_slots = 0 ;
set_has_split_ifs ( false ) ;
set_has_loops ( has_method ( ) & & method ( ) - > has_loops ( ) ) ; // first approximation
2009-11-12 09:24:21 -08:00
set_has_stringbuilder ( false ) ;
2013-05-08 15:08:01 -07:00
set_has_boxed_value ( false ) ;
2007-12-01 00:00:00 +00:00
_trap_can_recompile = false ; // no traps emitted yet
_major_progress = true ; // start out assuming good things will happen
set_has_unsafe_access ( false ) ;
2012-09-17 19:39:07 -07:00
set_max_vector_size ( 0 ) ;
2007-12-01 00:00:00 +00:00
Copy : : zero_to_bytes ( _trap_hist , sizeof ( _trap_hist ) ) ;
set_decompile_count ( 0 ) ;
2015-10-20 18:07:28 +02:00
set_do_freq_based_layout ( _directive - > BlockLayoutByFrequencyOption ) ;
2010-09-03 17:51:07 -07:00
set_num_loop_opts ( LoopOptsCount ) ;
set_do_inlining ( Inline ) ;
set_max_inline_size ( MaxInlineSize ) ;
set_freq_inline_size ( FreqInlineSize ) ;
set_do_scheduling ( OptoScheduling ) ;
set_do_count_invocations ( false ) ;
set_do_method_data_update ( false ) ;
2015-05-05 12:33:57 -07:00
// Vector-loop handling is off unless AllowVectorizeOnDemand is set and either
// the directive asks for it or the method is the _forEachRemaining intrinsic.
set_do_vector_loop ( false ) ;
if ( AllowVectorizeOnDemand ) {
2015-10-20 18:07:28 +02:00
if ( has_method ( ) & & ( _directive - > VectorizeOption | | _directive - > VectorizeDebugOption ) ) {
2015-05-05 12:33:57 -07:00
set_do_vector_loop ( true ) ;
2015-10-26 19:33:31 -07:00
NOT_PRODUCT ( if ( do_vector_loop ( ) & & Verbose ) { tty - > print ( " Compile::Init: do vectorized loops (SIMD like) for method %s \n " , method ( ) - > name ( ) - > as_quoted_ascii ( ) ) ; } )
2015-05-05 12:33:57 -07:00
} else if ( has_method ( ) & & method ( ) - > name ( ) ! = 0 & &
method ( ) - > intrinsic_id ( ) = = vmIntrinsics : : _forEachRemaining ) {
set_do_vector_loop ( true ) ;
}
}
2015-10-26 19:33:31 -07:00
set_use_cmove ( UseCMoveUnconditionally /* || do_vector_loop()*/ ) ; //TODO: consider do_vector_loop() mandate use_cmove unconditionally
NOT_PRODUCT ( if ( use_cmove ( ) & & Verbose & & has_method ( ) ) { tty - > print ( " Compile::Init: use CMove without profitability tests for method %s \n " , method ( ) - > name ( ) - > as_quoted_ascii ( ) ) ; } )
2015-05-05 12:33:57 -07:00
2014-05-13 11:32:10 -07:00
set_age_code ( has_method ( ) & & method ( ) - > profile_aging ( ) ) ;
2014-03-20 17:49:27 -07:00
set_rtm_state ( NoRTM ) ; // No RTM lock eliding by default
2015-10-20 18:07:28 +02:00
_max_node_limit = _directive - > MaxNodeLimitOption ;
2014-03-20 17:49:27 -07:00
# if INCLUDE_RTM_OPT
// The RTM state is only refined when the method already has method data
// (method_data_or_null() != NULL); otherwise the NoRTM default above stands.
if ( UseRTMLocking & & has_method ( ) & & ( method ( ) - > method_data_or_null ( ) ! = NULL ) ) {
int rtm_state = method ( ) - > method_data ( ) - > rtm_state ( ) ;
if ( method_has_option ( " NoRTMLockEliding " ) | | ( ( rtm_state & NoRTM ) ! = 0 ) ) {
// Don't generate RTM lock eliding code.
set_rtm_state ( NoRTM ) ;
} else if ( method_has_option ( " UseRTMLockEliding " ) | | ( ( rtm_state & UseRTM ) ! = 0 ) | | ! UseRTMDeopt ) {
// Generate RTM lock eliding code without abort ratio calculation code.
set_rtm_state ( UseRTM ) ;
} else if ( UseRTMDeopt ) {
// Generate RTM lock eliding code and include abort ratio calculation
// code if UseRTMDeopt is on.
set_rtm_state ( ProfileRTM ) ;
}
}
# endif
2007-12-01 00:00:00 +00:00
// Node notes are only set up when the debug info recorder is recording
// non-safepoints.
if ( debug_info ( ) - > recording_non_safepoints ( ) ) {
set_node_note_array ( new ( comp_arena ( ) ) GrowableArray < Node_Notes * >
( comp_arena ( ) , 8 , 0 , NULL ) ) ;
set_default_node_notes ( Node_Notes : : make ( this ) ) ;
}
// // -- Initialize types before each compile --
// // Update cached type information
// if( _method && _method->constants() )
// Type::update_loaded_types(_method, _method->constants());
// Init alias_type map.
2008-03-06 10:30:17 -08:00
if ( ! _do_escape_analysis & & aliaslevel = = 3 )
2007-12-01 00:00:00 +00:00
aliaslevel = 2 ; // No unique types without escape analysis
_AliasLevel = aliaslevel ;
// Start with room for grow_ats alias types: 'ats' is the zero-filled backing
// storage and each _alias_types[i] points at ats[i].
const int grow_ats = 16 ;
_max_alias_types = grow_ats ;
_alias_types = NEW_ARENA_ARRAY ( comp_arena ( ) , AliasType * , grow_ats ) ;
AliasType * ats = NEW_ARENA_ARRAY ( comp_arena ( ) , AliasType , grow_ats ) ;
Copy : : zero_to_bytes ( ats , sizeof ( AliasType ) * grow_ats ) ;
{
for ( int i = 0 ; i < grow_ats ; i + + ) _alias_types [ i ] = & ats [ i ] ;
}
// Initialize the first few types.
_alias_types [ AliasIdxTop ] - > Init ( AliasIdxTop , NULL ) ;
_alias_types [ AliasIdxBot ] - > Init ( AliasIdxBot , TypePtr : : BOTTOM ) ;
_alias_types [ AliasIdxRaw ] - > Init ( AliasIdxRaw , TypeRawPtr : : BOTTOM ) ;
_num_alias_types = AliasIdxRaw + 1 ;
// Zero out the alias type cache.
Copy : : zero_to_bytes ( _alias_cache , sizeof ( _alias_cache ) ) ;
// A NULL adr_type hits in the cache right away. Preload the right answer.
probe_alias_cache ( NULL ) - > _index = AliasIdxTop ;
_intrinsics = NULL ;
2010-08-03 15:55:03 -07:00
_macro_nodes = new ( comp_arena ( ) ) GrowableArray < Node * > ( comp_arena ( ) , 8 , 0 , NULL ) ;
_predicate_opaqs = new ( comp_arena ( ) ) GrowableArray < Node * > ( comp_arena ( ) , 8 , 0 , NULL ) ;
2013-02-12 12:56:11 +01:00
_expensive_nodes = new ( comp_arena ( ) ) GrowableArray < Node * > ( comp_arena ( ) , 8 , 0 , NULL ) ;
2007-12-01 00:00:00 +00:00
register_library_intrinsics ( ) ;
}
//---------------------------init_start----------------------------------------
// Install the StartNode on this compile object.
void Compile : : init_start ( StartNode * s ) {
if ( failing ( ) )
return ; // already failing
assert ( s = = start ( ) , " " ) ;
}
2014-10-06 06:51:37 -07:00
/**
* Return the ' StartNode ' . We must not have a pending failure , since the ideal graph
* can be in an inconsistent state , i . e . , we can get segmentation faults when traversing
* the ideal graph .
*/
2007-12-01 00:00:00 +00:00
StartNode * Compile : : start ( ) const {
2015-09-29 11:02:08 +02:00
assert ( ! failing ( ) , " Must not have pending failure. Reason is: %s " , failure_reason ( ) ) ;
2007-12-01 00:00:00 +00:00
for ( DUIterator_Fast imax , i = root ( ) - > fast_outs ( imax ) ; i < imax ; i + + ) {
Node * start = root ( ) - > fast_out ( i ) ;
2014-10-06 06:51:37 -07:00
if ( start - > is_Start ( ) ) {
2007-12-01 00:00:00 +00:00
return start - > as_Start ( ) ;
2014-10-06 06:51:37 -07:00
}
2007-12-01 00:00:00 +00:00
}
2014-05-02 16:44:54 -07:00
fatal ( " Did not find Start node! " ) ;
2007-12-01 00:00:00 +00:00
return NULL ;
}
//-------------------------------immutable_memory-------------------------------------
// Access immutable memory: the out-edge of the StartNode that is a projection
// with _con == TypeFunc::Memory. The node is looked up on first use and cached
// in _immutable_memory; later calls return the cached node.
Node* Compile::immutable_memory() {
  if (_immutable_memory != NULL) {
    return _immutable_memory;
  }
  StartNode* s = start();
  // Bound the scan by imax (as start() does) so that a missing Memory
  // projection falls through to ShouldNotReachHere() instead of indexing
  // past the end of the StartNode's out-edges.
  for (DUIterator_Fast imax, i = s->fast_outs(imax); i < imax; i++) {
    Node* p = s->fast_out(i);
    // Rule out a self-edge before treating the out as a projection.
    if (p != s && p->as_Proj()->_con == TypeFunc::Memory) {
      _immutable_memory = p;
      return _immutable_memory;
    }
  }
  ShouldNotReachHere();
  return NULL;
}
//----------------------set_cached_top_node------------------------------------
// Install the cached top node, and make sure Node::is_top works correctly.
void Compile : : set_cached_top_node ( Node * tn ) {
if ( tn ! = NULL ) verify_top ( tn ) ;
Node * old_top = _top ;
_top = tn ;
// Calling Node::setup_is_top allows the nodes the chance to adjust
// their _out arrays.
if ( _top ! = NULL ) _top - > setup_is_top ( ) ;
if ( old_top ! = NULL ) old_top - > setup_is_top ( ) ;
assert ( _top = = NULL | | top ( ) - > is_top ( ) , " " ) ;
}
2012-11-27 17:24:15 -08:00
# ifdef ASSERT
// Count the nodes that identify_useful_nodes() collects by walking the graph.
uint Compile::count_live_nodes_by_graph_walk() {
  Unique_Node_List reachable(comp_arena());
  identify_useful_nodes(reachable);
  const uint live_count = reachable.size();
  return live_count;
}
void Compile : : print_missing_nodes ( ) {
// Return if CompileLog is NULL and PrintIdealNodeCount is false.
if ( ( _log = = NULL ) & & ( ! PrintIdealNodeCount ) ) {
return ;
}
// This is an expensive function. It is executed only when the user
// specifies VerifyIdealNodeCount option or otherwise knows the
// additional work that needs to be done to identify reachable nodes
// by walking the flow graph and find the missing ones using
// _dead_node_list.
Unique_Node_List useful ( comp_arena ( ) ) ;
// Get useful node list by walking the graph.
identify_useful_nodes ( useful ) ;
uint l_nodes = C - > live_nodes ( ) ;
uint l_nodes_by_walk = useful . size ( ) ;
if ( l_nodes ! = l_nodes_by_walk ) {
if ( _log ! = NULL ) {
_log - > begin_head ( " mismatched_nodes count='%d' " , abs ( ( int ) ( l_nodes - l_nodes_by_walk ) ) ) ;
_log - > stamp ( ) ;
_log - > end_head ( ) ;
}
VectorSet & useful_member_set = useful . member_set ( ) ;
int last_idx = l_nodes_by_walk ;
for ( int i = 0 ; i < last_idx ; i + + ) {
if ( useful_member_set . test ( i ) ) {
if ( _dead_node_list . test ( i ) ) {
if ( _log ! = NULL ) {
_log - > elem ( " mismatched_node_info node_idx='%d' type='both live and dead' " , i ) ;
}
if ( PrintIdealNodeCount ) {
// Print the log message to tty
tty - > print_cr ( " mismatched_node idx='%d' both live and dead' " , i ) ;
useful . at ( i ) - > dump ( ) ;
}
}
}
else if ( ! _dead_node_list . test ( i ) ) {
if ( _log ! = NULL ) {
_log - > elem ( " mismatched_node_info node_idx='%d' type='neither live nor dead' " , i ) ;
}
if ( PrintIdealNodeCount ) {
// Print the log message to tty
tty - > print_cr ( " mismatched_node idx='%d' type='neither live nor dead' " , i ) ;
}
}
}
if ( _log ! = NULL ) {
_log - > tail ( " mismatched_nodes " ) ;
}
}
}
2014-07-25 10:06:17 +02:00
void Compile : : record_modified_node ( Node * n ) {
if ( _modified_nodes ! = NULL & & ! _inlining_incrementally & &
n - > outcnt ( ) ! = 0 & & ! n - > is_Con ( ) ) {
_modified_nodes - > push ( n ) ;
}
}
void Compile : : remove_modified_node ( Node * n ) {
if ( _modified_nodes ! = NULL ) {
_modified_nodes - > remove ( n ) ;
}
}
2012-11-27 17:24:15 -08:00
# endif
2007-12-01 00:00:00 +00:00
# ifndef PRODUCT
void Compile : : verify_top ( Node * tn ) const {
if ( tn ! = NULL ) {
assert ( tn - > is_Con ( ) , " top node must be a constant " ) ;
assert ( ( ( ConNode * ) tn ) - > type ( ) = = Type : : TOP , " top node must have correct type " ) ;
assert ( tn - > in ( 0 ) ! = NULL , " must have live top node " ) ;
}
}
# endif
///-------------------Managing Per-Node Debug & Profile Info-------------------
void Compile : : grow_node_notes ( GrowableArray < Node_Notes * > * arr , int grow_by ) {
guarantee ( arr ! = NULL , " " ) ;
int num_blocks = arr - > length ( ) ;
if ( grow_by < num_blocks ) grow_by = num_blocks ;
int num_notes = grow_by * _node_notes_block_size ;
Node_Notes * notes = NEW_ARENA_ARRAY ( node_arena ( ) , Node_Notes , num_notes ) ;
Copy : : zero_to_bytes ( notes , num_notes * sizeof ( Node_Notes ) ) ;
while ( num_notes > 0 ) {
arr - > append ( notes ) ;
notes + = _node_notes_block_size ;
num_notes - = _node_notes_block_size ;
}
assert ( num_notes = = 0 , " exact multiple, please " ) ;
}
bool Compile : : copy_node_notes_to ( Node * dest , Node * source ) {
if ( source = = NULL | | dest = = NULL ) return false ;
if ( dest - > is_Con ( ) )
return false ; // Do not push debug info onto constants.
# ifdef ASSERT
// Leave a bread crumb trail pointing to the original node:
if ( dest ! = NULL & & dest ! = source & & dest - > debug_orig ( ) = = NULL ) {
dest - > set_debug_orig ( source ) ;
}
# endif
if ( node_note_array ( ) = = NULL )
return false ; // Not collecting any notes now.
// This is a copy onto a pre-existing node, which may already have notes.
// If both nodes have notes, do not overwrite any pre-existing notes.
Node_Notes * source_notes = node_notes_at ( source - > _idx ) ;
if ( source_notes = = NULL | | source_notes - > is_clear ( ) ) return false ;
Node_Notes * dest_notes = node_notes_at ( dest - > _idx ) ;
if ( dest_notes = = NULL | | dest_notes - > is_clear ( ) ) {
return set_node_notes_at ( dest - > _idx , source_notes ) ;
}
Node_Notes merged_notes = ( * source_notes ) ;
// The order of operations here ensures that dest notes will win...
merged_notes . update_from ( dest_notes ) ;
return set_node_notes_at ( dest - > _idx , & merged_notes ) ;
}
//--------------------------allow_range_check_smearing-------------------------
// Gating condition for coalescing similar range checks.
// Sometimes we try 'speculatively' replacing a series of a range checks by a
// single covering check that is at least as strong as any of them.
// If the optimization succeeds, the simplified (strengthened) range check
// will always succeed. If it fails, we will deopt, and then give up
// on the optimization.
bool Compile : : allow_range_check_smearing ( ) const {
// If this method has already thrown a range-check,
// assume it was because we already tried range smearing
// and it failed.
uint already_trapped = trap_count ( Deoptimization : : Reason_range_check ) ;
return ! already_trapped ;
}
//------------------------------flatten_alias_type-----------------------------
const TypePtr * Compile : : flatten_alias_type ( const TypePtr * tj ) const {
int offset = tj - > offset ( ) ;
TypePtr : : PTR ptr = tj - > ptr ( ) ;
2008-07-16 16:04:39 -07:00
// Known instance (scalarizable allocation) alias only with itself.
bool is_known_inst = tj - > isa_oopptr ( ) ! = NULL & &
tj - > is_oopptr ( ) - > is_known_instance ( ) ;
2007-12-01 00:00:00 +00:00
// Process weird unsafe references.
if ( offset = = Type : : OffsetBot & & ( tj - > isa_instptr ( ) /*|| tj->isa_klassptr()*/ ) ) {
assert ( InlineUnsafeOps , " indeterminate pointers come only from unsafe ops " ) ;
2008-07-16 16:04:39 -07:00
assert ( ! is_known_inst , " scalarizable allocation should not have unsafe references " ) ;
2007-12-01 00:00:00 +00:00
tj = TypeOopPtr : : BOTTOM ;
ptr = tj - > ptr ( ) ;
offset = tj - > offset ( ) ;
}
// Array pointers need some flattening
const TypeAryPtr * ta = tj - > isa_aryptr ( ) ;
2013-09-10 14:51:48 -07:00
if ( ta & & ta - > is_stable ( ) ) {
// Erase stability property for alias analysis.
tj = ta = ta - > cast_to_stable ( false ) ;
}
2008-07-16 16:04:39 -07:00
if ( ta & & is_known_inst ) {
if ( offset ! = Type : : OffsetBot & &
offset > arrayOopDesc : : length_offset_in_bytes ( ) ) {
offset = Type : : OffsetBot ; // Flatten constant access into array body only
tj = ta = TypeAryPtr : : make ( ptr , ta - > ary ( ) , ta - > klass ( ) , true , offset , ta - > instance_id ( ) ) ;
}
} else if ( ta & & _AliasLevel > = 2 ) {
2007-12-01 00:00:00 +00:00
// For arrays indexed by constant indices, we flatten the alias
// space to include all of the array body. Only the header, klass
// and array length can be accessed un-aliased.
if ( offset ! = Type : : OffsetBot ) {
6964458: Reimplement class meta-data storage to use native memory
Remove PermGen, allocate meta-data in metaspace linked to class loaders, rewrite GC walking, rewrite and rename metadata to be C++ classes
Co-authored-by: Stefan Karlsson <stefan.karlsson@oracle.com>
Co-authored-by: Mikael Gerdin <mikael.gerdin@oracle.com>
Co-authored-by: Tom Rodriguez <tom.rodriguez@oracle.com>
Reviewed-by: jmasa, stefank, never, coleenp, kvn, brutisso, mgerdin, dholmes, jrose, twisti, roland
2012-09-01 13:25:18 -04:00
if ( ta - > const_oop ( ) ) { // MethodData* or Method*
2007-12-01 00:00:00 +00:00
offset = Type : : OffsetBot ; // Flatten constant access into array body
2008-07-16 16:04:39 -07:00
tj = ta = TypeAryPtr : : make ( ptr , ta - > const_oop ( ) , ta - > ary ( ) , ta - > klass ( ) , false , offset ) ;
2007-12-01 00:00:00 +00:00
} else if ( offset = = arrayOopDesc : : length_offset_in_bytes ( ) ) {
// range is OK as-is.
tj = ta = TypeAryPtr : : RANGE ;
} else if ( offset = = oopDesc : : klass_offset_in_bytes ( ) ) {
tj = TypeInstPtr : : KLASS ; // all klass loads look alike
ta = TypeAryPtr : : RANGE ; // generic ignored junk
ptr = TypePtr : : BotPTR ;
} else if ( offset = = oopDesc : : mark_offset_in_bytes ( ) ) {
tj = TypeInstPtr : : MARK ;
ta = TypeAryPtr : : RANGE ; // generic ignored junk
ptr = TypePtr : : BotPTR ;
} else { // Random constant offset into array body
offset = Type : : OffsetBot ; // Flatten constant access into array body
2008-07-16 16:04:39 -07:00
tj = ta = TypeAryPtr : : make ( ptr , ta - > ary ( ) , ta - > klass ( ) , false , offset ) ;
2007-12-01 00:00:00 +00:00
}
}
// Arrays of fixed size alias with arrays of unknown size.
if ( ta - > size ( ) ! = TypeInt : : POS ) {
const TypeAry * tary = TypeAry : : make ( ta - > elem ( ) , TypeInt : : POS ) ;
2008-07-16 16:04:39 -07:00
tj = ta = TypeAryPtr : : make ( ptr , ta - > const_oop ( ) , tary , ta - > klass ( ) , false , offset ) ;
2007-12-01 00:00:00 +00:00
}
// Arrays of known objects become arrays of unknown objects.
6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
Compressed oops in instances, arrays, and headers. Code contributors are coleenp, phh, never, swamyv
Reviewed-by: jmasa, kamg, acorn, tbell, kvn, rasbold
2008-04-13 17:43:42 -04:00
if ( ta - > elem ( ) - > isa_narrowoop ( ) & & ta - > elem ( ) ! = TypeNarrowOop : : BOTTOM ) {
const TypeAry * tary = TypeAry : : make ( TypeNarrowOop : : BOTTOM , ta - > size ( ) ) ;
2008-07-16 16:04:39 -07:00
tj = ta = TypeAryPtr : : make ( ptr , ta - > const_oop ( ) , tary , NULL , false , offset ) ;
6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
Compressed oops in instances, arrays, and headers. Code contributors are coleenp, phh, never, swamyv
Reviewed-by: jmasa, kamg, acorn, tbell, kvn, rasbold
2008-04-13 17:43:42 -04:00
}
2007-12-01 00:00:00 +00:00
if ( ta - > elem ( ) - > isa_oopptr ( ) & & ta - > elem ( ) ! = TypeInstPtr : : BOTTOM ) {
const TypeAry * tary = TypeAry : : make ( TypeInstPtr : : BOTTOM , ta - > size ( ) ) ;
2008-07-16 16:04:39 -07:00
tj = ta = TypeAryPtr : : make ( ptr , ta - > const_oop ( ) , tary , NULL , false , offset ) ;
2007-12-01 00:00:00 +00:00
}
// Arrays of bytes and of booleans both use 'bastore' and 'baload' so
// cannot be distinguished by bytecode alone.
if ( ta - > elem ( ) = = TypeInt : : BOOL ) {
const TypeAry * tary = TypeAry : : make ( TypeInt : : BYTE , ta - > size ( ) ) ;
ciKlass * aklass = ciTypeArrayKlass : : make ( T_BYTE ) ;
2008-07-16 16:04:39 -07:00
tj = ta = TypeAryPtr : : make ( ptr , ta - > const_oop ( ) , tary , aklass , false , offset ) ;
2007-12-01 00:00:00 +00:00
}
// During the 2nd round of IterGVN, NotNull castings are removed.
// Make sure the Bottom and NotNull variants alias the same.
// Also, make sure exact and non-exact variants alias the same.
2013-10-23 12:40:23 +02:00
if ( ptr = = TypePtr : : NotNull | | ta - > klass_is_exact ( ) | | ta - > speculative ( ) ! = NULL ) {
2011-06-28 15:50:07 -07:00
tj = ta = TypeAryPtr : : make ( TypePtr : : BotPTR , ta - > ary ( ) , ta - > klass ( ) , false , offset ) ;
2007-12-01 00:00:00 +00:00
}
}
// Oop pointers need some flattening
const TypeInstPtr * to = tj - > isa_instptr ( ) ;
if ( to & & _AliasLevel > = 2 & & to ! = TypeOopPtr : : BOTTOM ) {
2011-03-18 16:00:34 -07:00
ciInstanceKlass * k = to - > klass ( ) - > as_instance_klass ( ) ;
2007-12-01 00:00:00 +00:00
if ( ptr = = TypePtr : : Constant ) {
2011-03-18 16:00:34 -07:00
if ( to - > klass ( ) ! = ciEnv : : current ( ) - > Class_klass ( ) | |
offset < k - > size_helper ( ) * wordSize ) {
// No constant oop pointers (such as Strings); they alias with
// unknown strings.
assert ( ! is_known_inst , " not scalarizable allocation " ) ;
tj = to = TypeInstPtr : : make ( TypePtr : : BotPTR , to - > klass ( ) , false , 0 , offset ) ;
}
2008-07-16 16:04:39 -07:00
} else if ( is_known_inst ) {
2008-05-21 10:45:07 -07:00
tj = to ; // Keep NotNull and klass_is_exact for instance type
2007-12-01 00:00:00 +00:00
} else if ( ptr = = TypePtr : : NotNull | | to - > klass_is_exact ( ) ) {
// During the 2nd round of IterGVN, NotNull castings are removed.
// Make sure the Bottom and NotNull variants alias the same.
// Also, make sure exact and non-exact variants alias the same.
2008-07-16 16:04:39 -07:00
tj = to = TypeInstPtr : : make ( TypePtr : : BotPTR , to - > klass ( ) , false , 0 , offset ) ;
2007-12-01 00:00:00 +00:00
}
2013-10-23 12:40:23 +02:00
if ( to - > speculative ( ) ! = NULL ) {
tj = to = TypeInstPtr : : make ( to - > ptr ( ) , to - > klass ( ) , to - > klass_is_exact ( ) , to - > const_oop ( ) , to - > offset ( ) , to - > instance_id ( ) ) ;
}
2007-12-01 00:00:00 +00:00
// Canonicalize the holder of this field
6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
Compressed oops in instances, arrays, and headers. Code contributors are coleenp, phh, never, swamyv
Reviewed-by: jmasa, kamg, acorn, tbell, kvn, rasbold
2008-04-13 17:43:42 -04:00
if ( offset > = 0 & & offset < instanceOopDesc : : base_offset_in_bytes ( ) ) {
2007-12-01 00:00:00 +00:00
// First handle header references such as a LoadKlassNode, even if the
// object's klass is unloaded at compile time (4965979).
2008-07-16 16:04:39 -07:00
if ( ! is_known_inst ) { // Do it only for non-instance types
tj = to = TypeInstPtr : : make ( TypePtr : : BotPTR , env ( ) - > Object_klass ( ) , false , NULL , offset ) ;
}
2007-12-01 00:00:00 +00:00
} else if ( offset < 0 | | offset > = k - > size_helper ( ) * wordSize ) {
2011-03-18 16:00:34 -07:00
// Static fields are in the space above the normal instance
// fields in the java.lang.Class instance.
if ( to - > klass ( ) ! = ciEnv : : current ( ) - > Class_klass ( ) ) {
to = NULL ;
tj = TypeOopPtr : : BOTTOM ;
offset = tj - > offset ( ) ;
}
2007-12-01 00:00:00 +00:00
} else {
ciInstanceKlass * canonical_holder = k - > get_canonical_holder ( offset ) ;
if ( ! k - > equals ( canonical_holder ) | | tj - > offset ( ) ! = offset ) {
2008-07-16 16:04:39 -07:00
if ( is_known_inst ) {
tj = to = TypeInstPtr : : make ( to - > ptr ( ) , canonical_holder , true , NULL , offset , to - > instance_id ( ) ) ;
} else {
tj = to = TypeInstPtr : : make ( to - > ptr ( ) , canonical_holder , false , NULL , offset ) ;
}
2007-12-01 00:00:00 +00:00
}
}
}
// Klass pointers to object array klasses need some flattening
const TypeKlassPtr * tk = tj - > isa_klassptr ( ) ;
if ( tk ) {
// If we are referencing a field within a Klass, we need
// to assume the worst case of an Object. Both exact and
2011-12-19 14:16:23 -08:00
// inexact types must flatten to the same alias class so
// use NotNull as the PTR.
2007-12-01 00:00:00 +00:00
if ( offset = = Type : : OffsetBot | | ( offset > = 0 & & ( size_t ) offset < sizeof ( Klass ) ) ) {
2011-12-19 14:16:23 -08:00
tj = tk = TypeKlassPtr : : make ( TypePtr : : NotNull ,
2007-12-01 00:00:00 +00:00
TypeKlassPtr : : OBJECT - > klass ( ) ,
offset ) ;
}
ciKlass * klass = tk - > klass ( ) ;
if ( klass - > is_obj_array_klass ( ) ) {
ciKlass * k = TypeAryPtr : : OOPS - > klass ( ) ;
if ( ! k | | ! k - > is_loaded ( ) ) // Only fails for some -Xcomp runs
k = TypeInstPtr : : BOTTOM - > klass ( ) ;
tj = tk = TypeKlassPtr : : make ( TypePtr : : NotNull , k , offset ) ;
}
// Check for precise loads from the primary supertype array and force them
// to the supertype cache alias index. Check for generic array loads from
// the primary supertype array and also force them to the supertype cache
// alias index. Since the same load can reach both, we need to merge
// these 2 disparate memories into the same alias class. Since the
// primary supertype array is read-only, there's no chance of confusion
// where we bypass an array load and an array store.
2011-12-07 11:35:03 +01:00
int primary_supers_offset = in_bytes ( Klass : : primary_supers_offset ( ) ) ;
2011-12-19 14:16:23 -08:00
if ( offset = = Type : : OffsetBot | |
( offset > = primary_supers_offset & &
offset < ( int ) ( primary_supers_offset + Klass : : primary_super_limit ( ) * wordSize ) ) | |
2011-12-07 11:35:03 +01:00
offset = = ( int ) in_bytes ( Klass : : secondary_super_cache_offset ( ) ) ) {
offset = in_bytes ( Klass : : secondary_super_cache_offset ( ) ) ;
2007-12-01 00:00:00 +00:00
tj = tk = TypeKlassPtr : : make ( TypePtr : : NotNull , tk - > klass ( ) , offset ) ;
}
}
// Flatten all Raw pointers together.
if ( tj - > base ( ) = = Type : : RawPtr )
tj = TypeRawPtr : : BOTTOM ;
if ( tj - > base ( ) = = Type : : AnyPtr )
tj = TypePtr : : BOTTOM ; // An error, which the caller must check for.
// Flatten all to bottom for now
switch ( _AliasLevel ) {
case 0 :
tj = TypePtr : : BOTTOM ;
break ;
case 1 : // Flatten to: oop, static, field or array
switch ( tj - > base ( ) ) {
//case Type::AryPtr: tj = TypeAryPtr::RANGE; break;
case Type : : RawPtr : tj = TypeRawPtr : : BOTTOM ; break ;
case Type : : AryPtr : // do not distinguish arrays at all
case Type : : InstPtr : tj = TypeInstPtr : : BOTTOM ; break ;
case Type : : KlassPtr : tj = TypeKlassPtr : : OBJECT ; break ;
case Type : : AnyPtr : tj = TypePtr : : BOTTOM ; break ; // caller checks it
default : ShouldNotReachHere ( ) ;
}
break ;
2009-02-27 13:27:09 -08:00
case 2 : // No collapsing at level 2; keep all splits
case 3 : // No collapsing at level 3; keep all splits
2007-12-01 00:00:00 +00:00
break ;
default :
Unimplemented ( ) ;
}
offset = tj - > offset ( ) ;
assert ( offset ! = Type : : OffsetTop , " Offset has fallen from constant " ) ;
assert ( ( offset ! = Type : : OffsetBot & & tj - > base ( ) ! = Type : : AryPtr ) | |
( offset = = Type : : OffsetBot & & tj - > base ( ) = = Type : : AryPtr ) | |
( offset = = Type : : OffsetBot & & tj = = TypeOopPtr : : BOTTOM ) | |
( offset = = Type : : OffsetBot & & tj = = TypePtr : : BOTTOM ) | |
( offset = = oopDesc : : mark_offset_in_bytes ( ) & & tj - > base ( ) = = Type : : AryPtr ) | |
( offset = = oopDesc : : klass_offset_in_bytes ( ) & & tj - > base ( ) = = Type : : AryPtr ) | |
( offset = = arrayOopDesc : : length_offset_in_bytes ( ) & & tj - > base ( ) = = Type : : AryPtr ) ,
" For oops, klasses, raw offset must be constant; for arrays the offset is never known " ) ;
assert ( tj - > ptr ( ) ! = TypePtr : : TopPTR & &
tj - > ptr ( ) ! = TypePtr : : AnyNull & &
tj - > ptr ( ) ! = TypePtr : : Null , " No imprecise addresses " ) ;
// assert( tj->ptr() != TypePtr::Constant ||
// tj->base() == Type::RawPtr ||
// tj->base() == Type::KlassPtr, "No constant oop addresses" );
return tj ;
}
void Compile : : AliasType : : Init ( int i , const TypePtr * at ) {
_index = i ;
_adr_type = at ;
_field = NULL ;
2013-09-10 14:51:48 -07:00
_element = NULL ;
2007-12-01 00:00:00 +00:00
_is_rewritable = true ; // default
const TypeOopPtr * atoop = ( at ! = NULL ) ? at - > isa_oopptr ( ) : NULL ;
2008-06-26 13:34:00 -07:00
if ( atoop ! = NULL & & atoop - > is_known_instance ( ) ) {
const TypeOopPtr * gt = atoop - > cast_to_instance_id ( TypeOopPtr : : InstanceBot ) ;
2007-12-01 00:00:00 +00:00
_general_index = Compile : : current ( ) - > get_alias_index ( gt ) ;
} else {
_general_index = 0 ;
}
}
//---------------------------------print_on------------------------------------
# ifndef PRODUCT
// Print a one-line description of this alias type on 'st': the alias index,
// an "RO" marker when the type is not rewritable, the offset of the address
// type (or "+any" when the offset is Type::OffsetBot), and the address type
// itself.  When a field is recorded and the address type is an oop pointer
// whose klass or offset disagrees with the field's holder or offset, the field
// is printed as well, followed by a "***" marker.
void Compile : : AliasType : : print_on ( outputStream * st ) {
// NOTE(review): both branches pass the same format text as shown here;
// presumably they differ only in padding used to align one- and two-digit
// indices -- confirm before merging them.
if ( index ( ) < 10 )
st - > print ( " @ <%d> " , index ( ) ) ;
else st - > print ( " @ <%d> " , index ( ) ) ;
st - > print ( is_rewritable ( ) ? " " : " RO " ) ;
int offset = adr_type ( ) - > offset ( ) ;
if ( offset = = Type : : OffsetBot )
st - > print ( " +any " ) ;
else st - > print ( " +%-3d " , offset ) ;
st - > print ( " in " ) ;
adr_type ( ) - > dump_on ( st ) ;
const TypeOopPtr * tjp = adr_type ( ) - > isa_oopptr ( ) ;
// Only report the field when it does not match the address type.
if ( field ( ) ! = NULL & & tjp ) {
if ( tjp - > klass ( ) ! = field ( ) - > holder ( ) | |
tjp - > offset ( ) ! = field ( ) - > offset_in_bytes ( ) ) {
st - > print ( " != " ) ;
// NOTE(review): print() is called without a stream argument, so presumably
// the field text does not go to 'st' -- confirm.
field ( ) - > print ( ) ;
st - > print ( " *** " ) ;
}
}
}
void print_alias_types ( ) {
Compile * C = Compile : : current ( ) ;
tty - > print_cr ( " --- Alias types, AliasIdxBot .. %d " , C - > num_alias_types ( ) - 1 ) ;
for ( int idx = Compile : : AliasIdxBot ; idx < C - > num_alias_types ( ) ; idx + + ) {
C - > alias_type ( idx ) - > print_on ( tty ) ;
tty - > cr ( ) ;
}
}
# endif
//----------------------------probe_alias_cache--------------------------------
// Return the alias cache slot that 'adr_type' maps to.  The slot is chosen
// from the pointer value alone: the pointer is XOR-folded with itself shifted
// right by logAliasCacheSize and the low logAliasCacheSize bits select the
// entry.  The caller must compare the slot's _adr_type to detect a hit.
Compile::AliasCacheEntry* Compile::probe_alias_cache(const TypePtr* adr_type) {
  const intptr_t raw   = (intptr_t) adr_type;
  const intptr_t mixed = raw ^ (raw >> logAliasCacheSize);
  return &_alias_cache[mixed & right_n_bits(logAliasCacheSize)];
}
//-----------------------------grow_alias_types--------------------------------
void Compile : : grow_alias_types ( ) {
const int old_ats = _max_alias_types ; // how many before?
const int new_ats = old_ats ; // how many more?
const int grow_ats = old_ats + new_ats ; // how many now?
_max_alias_types = grow_ats ;
_alias_types = REALLOC_ARENA_ARRAY ( comp_arena ( ) , AliasType * , _alias_types , old_ats , grow_ats ) ;
AliasType * ats = NEW_ARENA_ARRAY ( comp_arena ( ) , AliasType , new_ats ) ;
Copy : : zero_to_bytes ( ats , sizeof ( AliasType ) * new_ats ) ;
for ( int i = 0 ; i < new_ats ; i + + ) _alias_types [ old_ats + i ] = & ats [ i ] ;
}
//--------------------------------find_alias_type------------------------------
2011-03-18 16:00:34 -07:00
// Return the alias type for 'adr_type'.
//
// The address type is first looked up in the alias cache; on a miss it is
// flattened with flatten_alias_type() and the existing alias types are
// searched for one with the same flattened address type.  If none exists and
// 'no_create' is false, a new alias type is appended (growing the table when
// full), initialized, and annotated: some address types are marked
// non-rewritable, array body references record their element type, and
// instance field references record the ciField found at that offset.
//
// Returns NULL only when no matching alias type exists and 'no_create' is
// true.  'original_field' is used solely by an assert that cross-checks the
// field found by offset; it may be NULL.
Compile : : AliasType * Compile : : find_alias_type ( const TypePtr * adr_type , bool no_create , ciField * original_field ) {
2007-12-01 00:00:00 +00:00
// At alias level 0 everything maps to the AliasIdxBot alias type.
if ( _AliasLevel = = 0 )
return alias_type ( AliasIdxBot ) ;
// Fast path: the cache slot for this pointer already holds adr_type.
AliasCacheEntry * ace = probe_alias_cache ( adr_type ) ;
if ( ace - > _adr_type = = adr_type ) {
return alias_type ( ace - > _index ) ;
}
// Handle special cases.
if ( adr_type = = NULL ) return alias_type ( AliasIdxTop ) ;
if ( adr_type = = TypePtr : : BOTTOM ) return alias_type ( AliasIdxBot ) ;
// Do it the slow way.
const TypePtr * flat = flatten_alias_type ( adr_type ) ;
# ifdef ASSERT
// Debug-only sanity checks on the flattening: it must be idempotent and must
// not depend on the exactness of the klass.
assert ( flat = = flatten_alias_type ( flat ) , " idempotent " ) ;
assert ( flat ! = TypePtr : : BOTTOM , " cannot alias-analyze an untyped ptr " ) ;
if ( flat - > isa_oopptr ( ) & & ! flat - > isa_klassptr ( ) ) {
const TypeOopPtr * foop = flat - > is_oopptr ( ) ;
2008-07-16 16:04:39 -07:00
// Scalarizable allocations have exact klass always.
bool exact = ! foop - > klass_is_exact ( ) | | foop - > is_known_instance ( ) ;
const TypePtr * xoop = foop - > cast_to_exactness ( exact ) - > is_ptr ( ) ;
2007-12-01 00:00:00 +00:00
assert ( foop = = flatten_alias_type ( xoop ) , " exactness must not affect alias type " ) ;
}
assert ( flat = = flatten_alias_type ( flat ) , " exact bit doesn't matter " ) ;
# endif
// Linear search for an existing alias type with the same flattened address
// type.  idx keeps its initial value AliasIdxTop when nothing matches.
int idx = AliasIdxTop ;
for ( int i = 0 ; i < num_alias_types ( ) ; i + + ) {
if ( alias_type ( i ) - > adr_type ( ) = = flat ) {
idx = i ;
break ;
}
}
// idx == AliasIdxTop is treated as "not found": create a new alias type
// unless the caller asked for a lookup only.
if ( idx = = AliasIdxTop ) {
if ( no_create ) return NULL ;
// Grow the array if necessary.
if ( _num_alias_types = = _max_alias_types ) grow_alias_types ( ) ;
// Add a new alias type.
idx = _num_alias_types + + ;
_alias_types [ idx ] - > Init ( idx , flat ) ;
// Mark the address types below as not rewritable.
if ( flat = = TypeInstPtr : : KLASS ) alias_type ( idx ) - > set_rewritable ( false ) ;
if ( flat = = TypeAryPtr : : RANGE ) alias_type ( idx ) - > set_rewritable ( false ) ;
if ( flat - > isa_instptr ( ) ) {
if ( flat - > offset ( ) = = java_lang_Class : : klass_offset_in_bytes ( )
& & flat - > is_instptr ( ) - > klass ( ) = = env ( ) - > Class_klass ( ) )
alias_type ( idx ) - > set_rewritable ( false ) ;
}
2013-09-10 14:51:48 -07:00
if ( flat - > isa_aryptr ( ) ) {
# ifdef ASSERT
const int header_size_min = arrayOopDesc : : base_offset_in_bytes ( T_BYTE ) ;
// (T_BYTE has the weakest alignment and size restrictions...)
assert ( flat - > offset ( ) < header_size_min , " array body reference must be OffsetBot " ) ;
# endif
// An OffsetBot array reference records the array's element type.
if ( flat - > offset ( ) = = TypePtr : : OffsetBot ) {
alias_type ( idx ) - > set_element ( flat - > is_aryptr ( ) - > elem ( ) ) ;
}
}
2007-12-01 00:00:00 +00:00
// The Klass fields at the offsets tested below are marked not rewritable.
if ( flat - > isa_klassptr ( ) ) {
2011-12-07 11:35:03 +01:00
if ( flat - > offset ( ) = = in_bytes ( Klass : : super_check_offset_offset ( ) ) )
2007-12-01 00:00:00 +00:00
alias_type ( idx ) - > set_rewritable ( false ) ;
2011-12-07 11:35:03 +01:00
if ( flat - > offset ( ) = = in_bytes ( Klass : : modifier_flags_offset ( ) ) )
2007-12-01 00:00:00 +00:00
alias_type ( idx ) - > set_rewritable ( false ) ;
2011-12-07 11:35:03 +01:00
if ( flat - > offset ( ) = = in_bytes ( Klass : : access_flags_offset ( ) ) )
2007-12-01 00:00:00 +00:00
alias_type ( idx ) - > set_rewritable ( false ) ;
2011-12-07 11:35:03 +01:00
if ( flat - > offset ( ) = = in_bytes ( Klass : : java_mirror_offset ( ) ) )
2007-12-01 00:00:00 +00:00
alias_type ( idx ) - > set_rewritable ( false ) ;
}
// %%% (We would like to finalize JavaThread::threadObj_offset(),
// but the base pointer type is not distinctive enough to identify
// references into JavaThread.)
2011-03-18 16:00:34 -07:00
// Check for final fields.
2007-12-01 00:00:00 +00:00
const TypeInstPtr * tinst = flat - > isa_instptr ( ) ;
6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
Compressed oops in instances, arrays, and headers. Code contributors are coleenp, phh, never, swamyv
Reviewed-by: jmasa, kamg, acorn, tbell, kvn, rasbold
2008-04-13 17:43:42 -04:00
// Only offsets at or beyond the instance header can name a field.
if ( tinst & & tinst - > offset ( ) > = instanceOopDesc : : base_offset_in_bytes ( ) ) {
2011-03-18 16:00:34 -07:00
ciField * field ;
// A constant java.lang.Class instance with an offset past the normal
// instance size is looked up as a static field of the mirrored klass;
// anything else is looked up as an instance field of the pointer's klass.
if ( tinst - > const_oop ( ) ! = NULL & &
tinst - > klass ( ) = = ciEnv : : current ( ) - > Class_klass ( ) & &
tinst - > offset ( ) > = ( tinst - > klass ( ) - > as_instance_klass ( ) - > size_helper ( ) * wordSize ) ) {
// static field
ciInstanceKlass * k = tinst - > const_oop ( ) - > as_instance ( ) - > java_lang_Class_klass ( ) - > as_instance_klass ( ) ;
field = k - > get_field_by_offset ( tinst - > offset ( ) , true ) ;
} else {
ciInstanceKlass * k = tinst - > klass ( ) - > as_instance_klass ( ) ;
field = k - > get_field_by_offset ( tinst - > offset ( ) , false ) ;
}
// When the caller supplied a field, the one found by offset must agree
// with it in holder, offset and staticness.
assert ( field = = NULL | |
original_field = = NULL | |
( field - > holder ( ) = = original_field - > holder ( ) & &
field - > offset ( ) = = original_field - > offset ( ) & &
field - > is_static ( ) = = original_field - > is_static ( ) ) , " wrong field? " ) ;
2007-12-01 00:00:00 +00:00
// Set field() and is_rewritable() attributes.
if ( field ! = NULL ) alias_type ( idx ) - > set_field ( field ) ;
}
}
// Fill the cache for next time.
ace - > _adr_type = adr_type ;
ace - > _index = idx ;
assert ( alias_type ( adr_type ) = = alias_type ( idx ) , " type must be installed " ) ;
// Might as well try to fill the cache for the flattened version, too.
// (Only an empty slot is filled; an occupied one is left alone.)
AliasCacheEntry * face = probe_alias_cache ( flat ) ;
if ( face - > _adr_type = = NULL ) {
face - > _adr_type = flat ;
face - > _index = idx ;
assert ( alias_type ( flat ) = = alias_type ( idx ) , " flat type must work too " ) ;
}
return alias_type ( idx ) ;
}
// Return the alias type for 'field'.  The base address type is the holder's
// java mirror for a static field and the holder klass itself for an instance
// field; the field's byte offset is then added before the lookup.  In debug
// builds the result is checked: the alias type must be non-rewritable exactly
// when the field is final or stable.
Compile::AliasType* Compile::alias_type(ciField* field) {
  const TypeOopPtr* base_type;
  if (!field->is_static()) {
    base_type = TypeOopPtr::make_from_klass_raw(field->holder());
  } else {
    base_type = TypeInstPtr::make(field->holder()->java_mirror());
  }

  AliasType* result = alias_type(base_type->add_offset(field->offset_in_bytes()), field);
  assert((field->is_final() || field->is_stable()) == !result->is_rewritable(), " must get the rewritable bits correct ");
  return result;
}
//------------------------------have_alias_type--------------------------------
bool Compile : : have_alias_type ( const TypePtr * adr_type ) {
AliasCacheEntry * ace = probe_alias_cache ( adr_type ) ;
if ( ace - > _adr_type = = adr_type ) {
return true ;
}
// Handle special cases.
if ( adr_type = = NULL ) return true ;
if ( adr_type = = TypePtr : : BOTTOM ) return true ;
2011-03-18 16:00:34 -07:00
return find_alias_type ( adr_type , true , NULL ) ! = NULL ;
2007-12-01 00:00:00 +00:00
}
//-----------------------------must_alias--------------------------------------
// True if all values of the given address type are in the given alias category.
bool Compile : : must_alias ( const TypePtr * adr_type , int alias_idx ) {
if ( alias_idx = = AliasIdxBot ) return true ; // the universal category
if ( adr_type = = NULL ) return true ; // NULL serves as TypePtr::TOP
if ( alias_idx = = AliasIdxTop ) return false ; // the empty category
if ( adr_type - > base ( ) = = Type : : AnyPtr ) return false ; // TypePtr::BOTTOM or its twins
// the only remaining possible overlap is identity
int adr_idx = get_alias_index ( adr_type ) ;
assert ( adr_idx ! = AliasIdxBot & & adr_idx ! = AliasIdxTop , " " ) ;
assert ( adr_idx = = alias_idx | |
( alias_type ( alias_idx ) - > adr_type ( ) ! = TypeOopPtr : : BOTTOM
& & adr_type ! = TypeOopPtr : : BOTTOM ) ,
" should not be testing for overlap with an unsafe pointer " ) ;
return adr_idx = = alias_idx ;
}
//------------------------------can_alias--------------------------------------
// True if any values of the given address type are in the given alias category.
bool Compile : : can_alias ( const TypePtr * adr_type , int alias_idx ) {
if ( alias_idx = = AliasIdxTop ) return false ; // the empty category
if ( adr_type = = NULL ) return false ; // NULL serves as TypePtr::TOP
if ( alias_idx = = AliasIdxBot ) return true ; // the universal category
if ( adr_type - > base ( ) = = Type : : AnyPtr ) return true ; // TypePtr::BOTTOM or its twins
// the only remaining possible overlap is identity
int adr_idx = get_alias_index ( adr_type ) ;
assert ( adr_idx ! = AliasIdxBot & & adr_idx ! = AliasIdxTop , " " ) ;
return adr_idx = = alias_idx ;
}
//---------------------------pop_warm_call-------------------------------------
// Detach and return the first entry of the warm call list, or NULL when the
// list is empty.  The list head is updated to whatever remove_from() returns.
WarmCallInfo* Compile::pop_warm_call() {
  WarmCallInfo* head = _warm_calls;
  if (head == NULL) {
    return NULL;
  }
  _warm_calls = head->remove_from(head);
  return head;
}
//----------------------------Inline_Warm--------------------------------------
int Compile : : Inline_Warm ( ) {
// If there is room, try to inline some more warm call sites.
// %%% Do a graph index compaction pass when we think we're out of space?
if ( ! InlineWarmCalls ) return 0 ;
int calls_made_hot = 0 ;
int room_to_grow = NodeCountInliningCutoff - unique ( ) ;
int amount_to_grow = MIN2 ( room_to_grow , ( int ) NodeCountInliningStep ) ;
int amount_grown = 0 ;
WarmCallInfo * call ;
while ( amount_to_grow > 0 & & ( call = pop_warm_call ( ) ) ! = NULL ) {
int est_size = ( int ) call - > size ( ) ;
if ( est_size > ( room_to_grow - amount_grown ) ) {
// This one won't fit anyway. Get rid of it.
call - > make_cold ( ) ;
continue ;
}
call - > make_hot ( ) ;
calls_made_hot + + ;
amount_grown + = est_size ;
amount_to_grow - = est_size ;
}
if ( calls_made_hot > 0 ) set_major_progress ( ) ;
return calls_made_hot ;
}
//----------------------------Finish_Warm--------------------------------------
void Compile : : Finish_Warm ( ) {
if ( ! InlineWarmCalls ) return ;
if ( failing ( ) ) return ;
if ( warm_calls ( ) = = NULL ) return ;
// Clean up loose ends, if we are out of space for inlining.
WarmCallInfo * call ;
while ( ( call = pop_warm_call ( ) ) ! = NULL ) {
call - > make_cold ( ) ;
}
}
2010-01-12 14:37:35 -08:00
//---------------------cleanup_loop_predicates-----------------------
// Remove the opaque nodes that protect the predicates so that all unused
// checks and uncommon_traps will be eliminated from the ideal graph
void Compile : : cleanup_loop_predicates ( PhaseIterGVN & igvn ) {
if ( predicate_count ( ) = = 0 ) return ;
for ( int i = predicate_count ( ) ; i > 0 ; i - - ) {
Node * n = predicate_opaque1_node ( i - 1 ) ;
assert ( n - > Opcode ( ) = = Op_Opaque1 , " must be " ) ;
igvn . replace_node ( n , n - > in ( 1 ) ) ;
}
assert ( predicate_count ( ) = = 0 , " should be clean! " ) ;
}
2007-12-01 00:00:00 +00:00
2012-12-23 17:08:22 +01:00
// StringOpts and late inlining of string methods
void Compile : : inline_string_calls ( bool parse_time ) {
{
// remove useless nodes to make the usage analysis simpler
ResourceMark rm ;
PhaseRemoveUseless pru ( initial_gvn ( ) , for_igvn ( ) ) ;
}
{
ResourceMark rm ;
2013-06-10 11:30:51 +02:00
print_method ( PHASE_BEFORE_STRINGOPTS , 3 ) ;
2012-12-23 17:08:22 +01:00
PhaseStringOpts pso ( initial_gvn ( ) , for_igvn ( ) ) ;
2013-06-10 11:30:51 +02:00
print_method ( PHASE_AFTER_STRINGOPTS , 3 ) ;
2012-12-23 17:08:22 +01:00
}
// now inline anything that we skipped the first time around
if ( ! parse_time ) {
_late_inlines_pos = _late_inlines . length ( ) ;
}
while ( _string_late_inlines . length ( ) > 0 ) {
CallGenerator * cg = _string_late_inlines . pop ( ) ;
cg - > do_late_inline ( ) ;
if ( failing ( ) ) return ;
}
_string_late_inlines . trunc_to ( 0 ) ;
}
2013-05-08 15:08:01 -07:00
// Late inlining of boxing methods
void Compile : : inline_boxing_calls ( PhaseIterGVN & igvn ) {
if ( _boxing_late_inlines . length ( ) > 0 ) {
assert ( has_boxed_value ( ) , " inconsistent " ) ;
PhaseGVN * gvn = initial_gvn ( ) ;
set_inlining_incrementally ( true ) ;
assert ( igvn . _worklist . size ( ) = = 0 , " should be done with igvn " ) ;
for_igvn ( ) - > clear ( ) ;
gvn - > replace_with ( & igvn ) ;
2014-06-10 13:37:16 +02:00
_late_inlines_pos = _late_inlines . length ( ) ;
2013-05-08 15:08:01 -07:00
while ( _boxing_late_inlines . length ( ) > 0 ) {
CallGenerator * cg = _boxing_late_inlines . pop ( ) ;
cg - > do_late_inline ( ) ;
if ( failing ( ) ) return ;
}
_boxing_late_inlines . trunc_to ( 0 ) ;
{
ResourceMark rm ;
PhaseRemoveUseless pru ( gvn , for_igvn ( ) ) ;
}
igvn = PhaseIterGVN ( gvn ) ;
igvn . optimize ( ) ;
set_inlining_progress ( false ) ;
set_inlining_incrementally ( false ) ;
}
}
2012-12-23 17:08:22 +01:00
void Compile : : inline_incrementally_one ( PhaseIterGVN & igvn ) {
assert ( IncrementalInline , " incremental inlining should be on " ) ;
PhaseGVN * gvn = initial_gvn ( ) ;
set_inlining_progress ( false ) ;
for_igvn ( ) - > clear ( ) ;
gvn - > replace_with ( & igvn ) ;
2014-09-25 12:10:57 +04:00
{
TracePhase tp ( " incrementalInline_inline " , & timers [ _t_incrInline_inline ] ) ;
int i = 0 ;
for ( ; i < _late_inlines . length ( ) & & ! inlining_progress ( ) ; i + + ) {
CallGenerator * cg = _late_inlines . at ( i ) ;
_late_inlines_pos = i + 1 ;
cg - > do_late_inline ( ) ;
if ( failing ( ) ) return ;
}
int j = 0 ;
for ( ; i < _late_inlines . length ( ) ; i + + , j + + ) {
_late_inlines . at_put ( j , _late_inlines . at ( i ) ) ;
}
_late_inlines . trunc_to ( j ) ;
2012-12-23 17:08:22 +01:00
}
{
2014-09-25 12:10:57 +04:00
TracePhase tp ( " incrementalInline_pru " , & timers [ _t_incrInline_pru ] ) ;
2012-12-23 17:08:22 +01:00
ResourceMark rm ;
2013-05-08 15:08:01 -07:00
PhaseRemoveUseless pru ( gvn , for_igvn ( ) ) ;
2012-12-23 17:08:22 +01:00
}
2014-09-25 12:10:57 +04:00
{
TracePhase tp ( " incrementalInline_igvn " , & timers [ _t_incrInline_igvn ] ) ;
igvn = PhaseIterGVN ( gvn ) ;
}
2012-12-23 17:08:22 +01:00
}
// Perform incremental inlining until bound on number of live nodes is reached
void Compile : : inline_incrementally ( PhaseIterGVN & igvn ) {
2014-09-25 12:10:57 +04:00
TracePhase tp ( " incrementalInline " , & timers [ _t_incrInline ] ) ;
2012-12-23 17:08:22 +01:00
PhaseGVN * gvn = initial_gvn ( ) ;
set_inlining_incrementally ( true ) ;
set_inlining_progress ( true ) ;
uint low_live_nodes = 0 ;
while ( inlining_progress ( ) & & _late_inlines . length ( ) > 0 ) {
if ( live_nodes ( ) > ( uint ) LiveNodeCountInliningCutoff ) {
if ( low_live_nodes < ( uint ) LiveNodeCountInliningCutoff * 8 / 10 ) {
2014-09-25 12:10:57 +04:00
TracePhase tp ( " incrementalInline_ideal " , & timers [ _t_incrInline_ideal ] ) ;
2012-12-23 17:08:22 +01:00
// PhaseIdealLoop is expensive so we only try it once we are
2014-06-10 13:37:16 +02:00
// out of live nodes and we only try it again if the previous
// helped got the number of nodes down significantly
2012-12-23 17:08:22 +01:00
PhaseIdealLoop ideal_loop ( igvn , false , true ) ;
if ( failing ( ) ) return ;
low_live_nodes = live_nodes ( ) ;
_major_progress = true ;
}
if ( live_nodes ( ) > ( uint ) LiveNodeCountInliningCutoff ) {
break ;
}
}
inline_incrementally_one ( igvn ) ;
if ( failing ( ) ) return ;
2014-09-25 12:10:57 +04:00
{
TracePhase tp ( " incrementalInline_igvn " , & timers [ _t_incrInline_igvn ] ) ;
igvn . optimize ( ) ;
}
2012-12-23 17:08:22 +01:00
if ( failing ( ) ) return ;
}
assert ( igvn . _worklist . size ( ) = = 0 , " should be done with igvn " ) ;
if ( _string_late_inlines . length ( ) > 0 ) {
assert ( has_stringbuilder ( ) , " inconsistent " ) ;
for_igvn ( ) - > clear ( ) ;
initial_gvn ( ) - > replace_with ( & igvn ) ;
inline_string_calls ( false ) ;
if ( failing ( ) ) return ;
{
2014-09-25 12:10:57 +04:00
TracePhase tp ( " incrementalInline_pru " , & timers [ _t_incrInline_pru ] ) ;
2012-12-23 17:08:22 +01:00
ResourceMark rm ;
PhaseRemoveUseless pru ( initial_gvn ( ) , for_igvn ( ) ) ;
}
2014-09-25 12:10:57 +04:00
{
TracePhase tp ( " incrementalInline_igvn " , & timers [ _t_incrInline_igvn ] ) ;
igvn = PhaseIterGVN ( gvn ) ;
igvn . optimize ( ) ;
}
2012-12-23 17:08:22 +01:00
}
set_inlining_incrementally ( false ) ;
}
2007-12-01 00:00:00 +00:00
//------------------------------Optimize---------------------------------------
// Given a graph, optimize it.
void Compile : : Optimize ( ) {
2014-09-25 12:10:57 +04:00
TracePhase tp ( " optimizer " , & timers [ _t_optimizer ] ) ;
2007-12-01 00:00:00 +00:00
# ifndef PRODUCT
2015-10-20 18:07:28 +02:00
if ( _directive - > BreakAtCompileOption ) {
2007-12-01 00:00:00 +00:00
BREAKPOINT ;
}
# endif
ResourceMark rm ;
int loop_opts_cnt ;
2014-04-09 09:17:43 +02:00
print_inlining_reinit ( ) ;
2007-12-01 00:00:00 +00:00
NOT_PRODUCT ( verify_graph_edges ( ) ; )
2013-06-10 11:30:51 +02:00
print_method ( PHASE_AFTER_PARSING ) ;
2007-12-01 00:00:00 +00:00
{
// Iterative Global Value Numbering, including ideal transforms
// Initialize IterGVN with types and values from parse-time GVN
PhaseIterGVN igvn ( initial_gvn ( ) ) ;
2014-07-25 10:06:17 +02:00
# ifdef ASSERT
_modified_nodes = new ( comp_arena ( ) ) Unique_Node_List ( comp_arena ( ) ) ;
# endif
2007-12-01 00:00:00 +00:00
{
2014-09-25 12:10:57 +04:00
TracePhase tp ( " iterGVN " , & timers [ _t_iterGVN ] ) ;
2007-12-01 00:00:00 +00:00
igvn . optimize ( ) ;
}
2013-06-10 11:30:51 +02:00
print_method ( PHASE_ITER_GVN1 , 2 ) ;
2007-12-01 00:00:00 +00:00
if ( failing ( ) ) return ;
2014-09-25 12:10:57 +04:00
inline_incrementally ( igvn ) ;
2012-12-23 17:08:22 +01:00
2013-06-10 11:30:51 +02:00
print_method ( PHASE_INCREMENTAL_INLINE , 2 ) ;
2012-12-23 17:08:22 +01:00
if ( failing ( ) ) return ;
2013-05-08 15:08:01 -07:00
if ( eliminate_boxing ( ) ) {
// Inline valueOf() methods now.
inline_boxing_calls ( igvn ) ;
2014-06-10 13:37:16 +02:00
if ( AlwaysIncrementalInline ) {
inline_incrementally ( igvn ) ;
}
2013-06-10 11:30:51 +02:00
print_method ( PHASE_INCREMENTAL_BOXING_INLINE , 2 ) ;
2013-05-08 15:08:01 -07:00
if ( failing ( ) ) return ;
}
2013-10-23 12:40:23 +02:00
// Remove the speculative part of types and clean up the graph from
// the extra CastPP nodes whose only purpose is to carry them. Do
// that early so that optimizations are not disrupted by the extra
// CastPP nodes.
remove_speculative_types ( igvn ) ;
2013-02-12 12:56:11 +01:00
// No more new expensive nodes will be added to the list from here
// so keep only the actual candidates for optimizations.
cleanup_expensive_nodes ( igvn ) ;
2010-07-02 17:30:30 -07:00
// Perform escape analysis
if ( _do_escape_analysis & & ConnectionGraph : : has_candidates ( this ) ) {
2011-11-09 07:25:51 -08:00
if ( has_loops ( ) ) {
// Cleanup graph (remove dead nodes).
2014-09-25 12:10:57 +04:00
TracePhase tp ( " idealLoop " , & timers [ _t_idealLoop ] ) ;
2011-11-09 07:25:51 -08:00
PhaseIdealLoop ideal_loop ( igvn , false , true ) ;
2013-06-10 11:30:51 +02:00
if ( major_progress ( ) ) print_method ( PHASE_PHASEIDEAL_BEFORE_EA , 2 ) ;
2011-11-09 07:25:51 -08:00
if ( failing ( ) ) return ;
}
2010-07-02 17:30:30 -07:00
ConnectionGraph : : do_analysis ( this , & igvn ) ;
if ( failing ( ) ) return ;
2011-11-16 09:13:57 -08:00
// Optimize out fields loads from scalar replaceable allocations.
2010-07-02 17:30:30 -07:00
igvn . optimize ( ) ;
2013-06-10 11:30:51 +02:00
print_method ( PHASE_ITER_GVN_AFTER_EA , 2 ) ;
2010-07-02 17:30:30 -07:00
if ( failing ( ) ) return ;
2011-11-16 09:13:57 -08:00
if ( congraph ( ) ! = NULL & & macro_count ( ) > 0 ) {
2014-09-25 12:10:57 +04:00
TracePhase tp ( " macroEliminate " , & timers [ _t_macroEliminate ] ) ;
2011-11-16 09:13:57 -08:00
PhaseMacroExpand mexp ( igvn ) ;
mexp . eliminate_macro_nodes ( ) ;
igvn . set_delay_transform ( false ) ;
igvn . optimize ( ) ;
2013-06-10 11:30:51 +02:00
print_method ( PHASE_ITER_GVN_AFTER_ELIMINATION , 2 ) ;
2011-11-16 09:13:57 -08:00
if ( failing ( ) ) return ;
}
2010-07-02 17:30:30 -07:00
}
2007-12-01 00:00:00 +00:00
// Loop transforms on the ideal graph. Range Check Elimination,
// peeling, unrolling, etc.
// Set loop opts counter
loop_opts_cnt = num_loop_opts ( ) ;
if ( ( loop_opts_cnt > 0 ) & & ( has_loops ( ) | | has_split_ifs ( ) ) ) {
{
2014-09-25 12:10:57 +04:00
TracePhase tp ( " idealLoop " , & timers [ _t_idealLoop ] ) ;
2011-04-02 10:54:15 -07:00
PhaseIdealLoop ideal_loop ( igvn , true ) ;
2007-12-01 00:00:00 +00:00
loop_opts_cnt - - ;
2013-06-10 11:30:51 +02:00
if ( major_progress ( ) ) print_method ( PHASE_PHASEIDEALLOOP1 , 2 ) ;
2007-12-01 00:00:00 +00:00
if ( failing ( ) ) return ;
}
// Loop opts pass if partial peeling occurred in previous pass
if ( PartialPeelLoop & & major_progress ( ) & & ( loop_opts_cnt > 0 ) ) {
2014-09-25 12:10:57 +04:00
TracePhase tp ( " idealLoop " , & timers [ _t_idealLoop ] ) ;
2011-04-02 10:54:15 -07:00
PhaseIdealLoop ideal_loop ( igvn , false ) ;
2007-12-01 00:00:00 +00:00
loop_opts_cnt - - ;
2013-06-10 11:30:51 +02:00
if ( major_progress ( ) ) print_method ( PHASE_PHASEIDEALLOOP2 , 2 ) ;
2007-12-01 00:00:00 +00:00
if ( failing ( ) ) return ;
}
// Loop opts pass for loop-unrolling before CCP
if ( major_progress ( ) & & ( loop_opts_cnt > 0 ) ) {
2014-09-25 12:10:57 +04:00
TracePhase tp ( " idealLoop " , & timers [ _t_idealLoop ] ) ;
2011-04-02 10:54:15 -07:00
PhaseIdealLoop ideal_loop ( igvn , false ) ;
2007-12-01 00:00:00 +00:00
loop_opts_cnt - - ;
2013-06-10 11:30:51 +02:00
if ( major_progress ( ) ) print_method ( PHASE_PHASEIDEALLOOP3 , 2 ) ;
2007-12-01 00:00:00 +00:00
}
2009-08-14 00:02:12 -07:00
if ( ! failing ( ) ) {
// Verify that last round of loop opts produced a valid graph
2014-09-25 12:10:57 +04:00
TracePhase tp ( " idealLoopVerify " , & timers [ _t_idealLoopVerify ] ) ;
2009-08-14 00:02:12 -07:00
PhaseIdealLoop : : verify ( igvn ) ;
}
2007-12-01 00:00:00 +00:00
}
if ( failing ( ) ) return ;
// Conditional Constant Propagation;
PhaseCCP ccp ( & igvn ) ;
assert ( true , " Break here to ccp.dump_nodes_and_types(_root,999,1) " ) ;
{
2014-09-25 12:10:57 +04:00
TracePhase tp ( " ccp " , & timers [ _t_ccp ] ) ;
2007-12-01 00:00:00 +00:00
ccp . do_transform ( ) ;
}
2013-06-10 11:30:51 +02:00
print_method ( PHASE_CPP1 , 2 ) ;
2007-12-01 00:00:00 +00:00
assert ( true , " Break here to ccp.dump_old2new_map() " ) ;
// Iterative Global Value Numbering, including ideal transforms
{
2014-09-25 12:10:57 +04:00
TracePhase tp ( " iterGVN2 " , & timers [ _t_iterGVN2 ] ) ;
2007-12-01 00:00:00 +00:00
igvn = ccp ;
igvn . optimize ( ) ;
}
2013-06-10 11:30:51 +02:00
print_method ( PHASE_ITER_GVN2 , 2 ) ;
2007-12-01 00:00:00 +00:00
if ( failing ( ) ) return ;
// Loop transforms on the ideal graph. Range Check Elimination,
// peeling, unrolling, etc.
if ( loop_opts_cnt > 0 ) {
debug_only ( int cnt = 0 ; ) ;
while ( major_progress ( ) & & ( loop_opts_cnt > 0 ) ) {
2014-09-25 12:10:57 +04:00
TracePhase tp ( " idealLoop " , & timers [ _t_idealLoop ] ) ;
2007-12-01 00:00:00 +00:00
assert ( cnt + + < 40 , " infinite cycle in loop optimization " ) ;
2011-04-02 10:54:15 -07:00
PhaseIdealLoop ideal_loop ( igvn , true ) ;
2007-12-01 00:00:00 +00:00
loop_opts_cnt - - ;
2013-06-10 11:30:51 +02:00
if ( major_progress ( ) ) print_method ( PHASE_PHASEIDEALLOOP_ITERATIONS , 2 ) ;
2007-12-01 00:00:00 +00:00
if ( failing ( ) ) return ;
}
}
2015-10-08 12:49:30 -10:00
// Ensure that major progress is now clear
C - > clear_major_progress ( ) ;
2009-08-14 00:02:12 -07:00
{
// Verify that all previous optimizations produced a valid graph
// at least to this point, even if no loop optimizations were done.
2014-09-25 12:10:57 +04:00
TracePhase tp ( " idealLoopVerify " , & timers [ _t_idealLoopVerify ] ) ;
2009-08-14 00:02:12 -07:00
PhaseIdealLoop : : verify ( igvn ) ;
}
2007-12-01 00:00:00 +00:00
{
2014-09-25 12:10:57 +04:00
TracePhase tp ( " macroExpand " , & timers [ _t_macroExpand ] ) ;
2007-12-01 00:00:00 +00:00
PhaseMacroExpand mex ( igvn ) ;
if ( mex . expand_macro_nodes ( ) ) {
assert ( failing ( ) , " must bail out w/ explicit message " ) ;
return ;
}
}
2014-07-25 10:06:17 +02:00
DEBUG_ONLY ( _modified_nodes = NULL ; )
2007-12-01 00:00:00 +00:00
} // (End scope of igvn; run destructor if necessary for asserts.)
2014-05-26 14:27:01 +02:00
process_print_inlining ( ) ;
2007-12-01 00:00:00 +00:00
// A method with only infinite loops has no edges entering loops from root
{
2014-09-25 12:10:57 +04:00
TracePhase tp ( " graphReshape " , & timers [ _t_graphReshaping ] ) ;
2007-12-01 00:00:00 +00:00
if ( final_graph_reshaping ( ) ) {
assert ( failing ( ) , " must bail out w/ explicit message " ) ;
return ;
}
}
2013-06-10 11:30:51 +02:00
print_method ( PHASE_OPTIMIZE_FINISHED , 2 ) ;
2007-12-01 00:00:00 +00:00
}
//------------------------------Code_Gen---------------------------------------
// Given a graph, generate code for it.
//
// Runs the back-end phases in a fixed order and leaves with a plain return as
// soon as one of them reports a problem:
//   1. instruction selection            (Matcher::match)
//   2. CFG build + global code motion   (PhaseCFG::do_global_code_motion)
//   3. register allocation              (PhaseChaitin::Register_Allocate)
//   4. empty-block removal, block layout or loop alignment, flow fixup
//   5. peephole pass                    (only if OptoPeephole)
//   6. post-allocation expand           (only if Matcher::require_postalloc_expand)
//   7. Output()
// Takes no arguments and returns nothing.
//
// The Matcher, PhaseCFG and PhaseChaitin objects are locals of this function;
// their addresses are published through _matcher, _cfg and _regalloc while the
// phases run.
// NOTE(review): only the fall-through exit overwrites _cfg/_regalloc with the
// 0xdeadbeef marker; the early returns leave them (and _matcher on every path)
// pointing at locals of this frame - confirm nothing reads them afterwards.
void Compile : : Code_Gen ( ) {
2013-08-16 10:23:55 +02:00
// Nothing to do if an earlier stage has already failed.
if ( failing ( ) ) {
return ;
}
2007-12-01 00:00:00 +00:00
// Perform instruction selection. You might think we could reclaim Matcher
// memory PDQ, but actually the Matcher is used in generating spill code.
// Internals of the Matcher (including some VectorSets) must remain live
// for awhile - thus I cannot reclaim Matcher memory lest a VectorSet usage
// set a bit in reclaimed memory.
// In debug mode can dump m._nodes.dump() for mapping of ideal to machine
// nodes. Mapping is only valid at the root of each matched subtree.
NOT_PRODUCT ( verify_graph_edges ( ) ; )
2013-08-16 10:23:55 +02:00
// The matcher is declared at function scope (not inside the timing block
// below) because it is passed on to the PhaseCFG and PhaseChaitin constructors.
Matcher matcher ;
_matcher = & matcher ;
2007-12-01 00:00:00 +00:00
{
2014-09-25 12:10:57 +04:00
// tp is scoped to this block; presumably it attributes the elapsed time of
// the block to timers[_t_matcher] - confirm in TracePhase.
TracePhase tp ( " matcher " , & timers [ _t_matcher ] ) ;
2013-08-16 10:23:55 +02:00
matcher . match ( ) ;
2007-12-01 00:00:00 +00:00
}
// In debug mode can dump m._nodes.dump() for mapping of ideal to machine
// nodes. Mapping is only valid at the root of each matched subtree.
NOT_PRODUCT ( verify_graph_edges ( ) ; )
// If you have too many nodes, or if matching has failed, bail out
check_node_count ( 0 , " out of nodes matching instructions " ) ;
2013-08-16 10:23:55 +02:00
if ( failing ( ) ) {
return ;
}
2007-12-01 00:00:00 +00:00
// Build a proper-looking CFG
2013-08-16 10:23:55 +02:00
PhaseCFG cfg ( node_arena ( ) , root ( ) , matcher ) ;
2007-12-01 00:00:00 +00:00
_cfg = & cfg ;
{
2014-09-25 12:10:57 +04:00
TracePhase tp ( " scheduler " , & timers [ _t_scheduler ] ) ;
2013-08-16 10:23:55 +02:00
// Global code motion reports failure through its return value; stop here
// without running the verification steps below.
bool success = cfg . do_global_code_motion ( ) ;
if ( ! success ) {
return ;
}
2007-12-01 00:00:00 +00:00
2013-06-10 11:30:51 +02:00
print_method ( PHASE_GLOBAL_CODE_MOTION , 2 ) ;
2007-12-01 00:00:00 +00:00
NOT_PRODUCT ( verify_graph_edges ( ) ; )
debug_only ( cfg . verify ( ) ; )
}
2015-09-16 13:16:17 -07:00
// The allocator is built from the current unique() value, the CFG and the matcher.
PhaseChaitin regalloc ( unique ( ) , cfg , matcher , false ) ;
2007-12-01 00:00:00 +00:00
_regalloc = & regalloc ;
{
2014-09-25 12:10:57 +04:00
TracePhase tp ( " regalloc " , & timers [ _t_registerAllocation ] ) ;
2007-12-01 00:00:00 +00:00
// Perform register allocation. After Chaitin, use-def chains are
// no longer accurate (at spill code) and so must be ignored.
// Node->LRG->reg mappings are still accurate.
_regalloc - > Register_Allocate ( ) ;
// Bail out if the allocator builds too many nodes
2013-04-16 10:08:41 +02:00
if ( failing ( ) ) {
return ;
}
2007-12-01 00:00:00 +00:00
}
// Prior to register allocation we kept empty basic blocks in case
// the allocator needed a place to spill. After register allocation we
// are not adding any new instructions. If any basic block is empty, we
// can now safely remove it.
{
2014-09-25 12:10:57 +04:00
TracePhase tp ( " blockOrdering " , & timers [ _t_blockOrdering ] ) ;
2013-08-16 10:23:55 +02:00
cfg . remove_empty_blocks ( ) ;
2008-11-06 14:59:10 -08:00
if ( do_freq_based_layout ( ) ) {
// 'layout' is constructed and never referenced again; presumably the
// constructor performs the frequency-based layout as a side effect.
PhaseBlockLayout layout ( cfg ) ;
} else {
cfg . set_loop_alignment ( ) ;
}
cfg . fixup_flow ( ) ;
2007-12-01 00:00:00 +00:00
}
// Apply peephole optimizations
if ( OptoPeephole ) {
2014-09-25 12:10:57 +04:00
TracePhase tp ( " peephole " , & timers [ _t_peephole ] ) ;
2007-12-01 00:00:00 +00:00
PhasePeephole peep ( _regalloc , cfg ) ;
peep . do_transform ( ) ;
}
2013-11-14 19:24:59 -08:00
// Do late expand if CPU requires this.
if ( Matcher : : require_postalloc_expand ) {
2014-09-25 12:10:57 +04:00
TracePhase tp ( " postalloc_expand " , & timers [ _t_postalloc_expand ] ) ;
2013-11-14 19:24:59 -08:00
cfg . postalloc_expand ( _regalloc ) ;
}
2007-12-01 00:00:00 +00:00
// Convert Nodes to instruction bits in a buffer
{
2014-09-25 12:10:57 +04:00
// Unlike the phases above this one uses TraceTime with an explicit CITime
// argument rather than TracePhase.
TraceTime tp ( " output " , & timers [ _t_output ] , CITime ) ;
2007-12-01 00:00:00 +00:00
Output ( ) ;
}
2013-06-10 11:30:51 +02:00
print_method ( PHASE_FINAL_CODE ) ;
2007-12-01 00:00:00 +00:00
// He's dead, Jim.
// cfg and regalloc are locals that go out of scope at the closing brace, so
// the member pointers are overwritten with a recognizable marker value.
_cfg = ( PhaseCFG * ) 0xdeadbeef ;
_regalloc = ( PhaseChaitin * ) 0xdeadbeef ;
}
//------------------------------dump_asm---------------------------------------
// Dump formatted assembly to tty. Compiled only when PRODUCT is not defined.
//
// pcs      - optional table indexed by Node::_idx. When non-NULL, the entry
//            for a node is printed in hex in front of that node (presumably
//            the node's code offset - confirm against the caller). May be NULL.
// pc_limit - exclusive upper bound on the node indices looked up in pcs;
//            a node with _idx >= pc_limit gets blank padding instead.
//
// Walks every block of _cfg and every node of each block, printing nodes with
// Node::format(). Both loops poll VMThread::should_terminate(); when it
// reports true the walk stops and a "cut short" notice is printed at the end.
# ifndef PRODUCT
void Compile : : dump_asm ( int * pcs , uint pc_limit ) {
// Set when the walk is abandoned because the VM thread wants to terminate.
bool cut_short = false ;
// Header: the method's type/signature (_tf) framed by comment lines.
tty - > print_cr ( " # " ) ;
tty - > print ( " # " ) ; _tf - > dump ( ) ; tty - > cr ( ) ;
tty - > print_cr ( " # " ) ;
// For all blocks
// NOTE(review): pc is never modified after this initialization, so the
// print_subtable_for(pc) call further down always receives 0 - confirm
// whether that is intended.
int pc = 0x0 ; // Program counter
// Marker character printed in front of an instruction; reset after each use.
char starts_bundle = ' ' ;
_regalloc - > dump_frame ( ) ;
// Most recently visited node; also read after the inner loop for the
// per-block trailer line.
Node * n = NULL ;
2013-08-16 10:23:55 +02:00
for ( uint i = 0 ; i < _cfg - > number_of_blocks ( ) ; i + + ) {
if ( VMThread : : should_terminate ( ) ) {
cut_short = true ;
break ;
}
Block * block = _cfg - > get_block ( i ) ;
// Connector blocks are only shown when Verbose is set.
if ( block - > is_connector ( ) & & ! Verbose ) {
continue ;
}
2013-08-26 12:50:23 +02:00
n = block - > head ( ) ;
2013-08-16 10:23:55 +02:00
// Prefix the block header with the pcs entry of the block's head node, or
// with padding when no entry is available.
if ( pcs & & n - > _idx < pc_limit ) {
2007-12-01 00:00:00 +00:00
tty - > print ( " %3.3x " , pcs [ n - > _idx ] ) ;
2013-08-16 10:23:55 +02:00
} else {
2007-12-01 00:00:00 +00:00
tty - > print ( " " ) ;
2013-08-16 10:23:55 +02:00
}
block - > dump_head ( _cfg ) ;
if ( block - > is_connector ( ) ) {
2007-12-01 00:00:00 +00:00
tty - > print_cr ( " # Empty connector block " ) ;
2013-08-16 10:23:55 +02:00
// Two predecessors where pred(1) is the fall-through CatchProj.
} else if ( block - > num_preds ( ) = = 2 & & block - > pred ( 1 ) - > is_CatchProj ( ) & & block - > pred ( 1 ) - > as_CatchProj ( ) - > _con = = CatchProjNode : : fall_through_index ) {
2007-12-01 00:00:00 +00:00
tty - > print_cr ( " # Block is sole successor of call " ) ;
}
// For all instructions
// Node held back because it sits in an unconditional delay slot; it is
// printed after the instruction that uses the delay slot.
Node * delay = NULL ;
2013-08-26 12:50:23 +02:00
for ( uint j = 0 ; j < block - > number_of_nodes ( ) ; j + + ) {
2013-08-16 10:23:55 +02:00
// This break only leaves the inner loop; the outer loop re-checks
// should_terminate() at the top of its next iteration.
if ( VMThread : : should_terminate ( ) ) {
cut_short = true ;
break ;
}
2013-08-26 12:50:23 +02:00
n = block - > get_node ( j ) ;
2007-12-01 00:00:00 +00:00
if ( valid_bundle_info ( n ) ) {
2013-08-16 10:23:55 +02:00
Bundle * bundle = node_bundling ( n ) ;
2007-12-01 00:00:00 +00:00
// Defer delay-slot nodes; nothing is printed for them on this iteration.
if ( bundle - > used_in_unconditional_delay ( ) ) {
delay = n ;
continue ;
}
2013-08-16 10:23:55 +02:00
if ( bundle - > starts_bundle ( ) ) {
2007-12-01 00:00:00 +00:00
starts_bundle = ' + ' ;
2013-08-16 10:23:55 +02:00
}
2007-12-01 00:00:00 +00:00
}
2013-08-16 10:23:55 +02:00
// WizardMode additionally dumps the raw node before the formatted line.
if ( WizardMode ) {
n - > dump ( ) ;
}
6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
Compressed oops in instances, arrays, and headers. Code contributors are coleenp, phh, never, swamyv
Reviewed-by: jmasa, kamg, acorn, tbell, kvn, rasbold
2008-04-13 17:43:42 -04:00
2007-12-01 00:00:00 +00:00
if ( ! n - > is_Region ( ) & & // Don't print in the assembly
! n - > is_Phi ( ) & & // a few noisy, useless nodes
! n - > is_Proj ( ) & &
! n - > is_MachTemp ( ) & &
2009-12-09 16:40:45 -08:00
! n - > is_SafePointScalarObject ( ) & &
2007-12-01 00:00:00 +00:00
! n - > is_Catch ( ) & & // Would be nice to print exception table targets
! n - > is_MergeMem ( ) & & // Not very interesting
! n - > is_top ( ) & & // Debug info table constants
! ( n - > is_Con ( ) & & ! n - > is_Mach ( ) ) // Debug info table constants
) {
// One line per printed node: pcs entry (or padding), bundle marker, tab,
// then the formatted instruction.
if ( pcs & & n - > _idx < pc_limit )
tty - > print ( " %3.3x " , pcs [ n - > _idx ] ) ;
else
tty - > print ( " " ) ;
tty - > print ( " %c " , starts_bundle ) ;
starts_bundle = ' ' ;
tty - > print ( " \t " ) ;
n - > format ( _regalloc , tty ) ;
tty - > cr ( ) ;
}
// If we have an instruction with a delay slot, and have seen a delay,
// then back up and print it
if ( valid_bundle_info ( n ) & & node_bundling ( n ) - > use_unconditional_delay ( ) ) {
assert ( delay ! = NULL , " no unconditional delay instruction " ) ;
6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
Compressed oops in instances, arrays, and headers. Code contributors are coleenp, phh, never, swamyv
Reviewed-by: jmasa, kamg, acorn, tbell, kvn, rasbold
2008-04-13 17:43:42 -04:00
if ( WizardMode ) delay - > dump ( ) ;
2007-12-01 00:00:00 +00:00
if ( node_bundling ( delay ) - > starts_bundle ( ) )
starts_bundle = ' + ' ;
// NOTE(review): the prefix printed for the delay-slot line is looked up
// with n->_idx (the instruction using the slot), not delay->_idx -
// confirm that this is intended.
if ( pcs & & n - > _idx < pc_limit )
tty - > print ( " %3.3x " , pcs [ n - > _idx ] ) ;
else
tty - > print ( " " ) ;
tty - > print ( " %c " , starts_bundle ) ;
starts_bundle = ' ' ;
tty - > print ( " \t " ) ;
delay - > format ( _regalloc , tty ) ;
2014-05-09 16:50:54 -04:00
tty - > cr ( ) ;
2007-12-01 00:00:00 +00:00
// The held-back node has been printed; forget it.
delay = NULL ;
}
// Dump the exception table as well
if ( n - > is_Catch ( ) & & ( Verbose | | WizardMode ) ) {
// Print the exception table for this offset
_handler_table . print_subtable_for ( pc ) ;
}
}
// Block trailer: the pcs entry of the node last assigned to n, or just a
// newline when no entry is available.
if ( pcs & & n - > _idx < pc_limit )
tty - > print_cr ( " %3.3x " , pcs [ n - > _idx ] ) ;
else
2014-05-09 16:50:54 -04:00
tty - > cr ( ) ;
2007-12-01 00:00:00 +00:00
// A held-back delay-slot node must have been printed by now, unless the
// walk was interrupted.
assert ( cut_short | | delay = = NULL , " no unconditional delay branch " ) ;
} // End of per-block dump
2014-05-09 16:50:54 -04:00
tty - > cr ( ) ;
2007-12-01 00:00:00 +00:00
if ( cut_short ) tty - > print_cr ( " *** disassembly is cut short *** " ) ;
}
# endif
//------------------------------Final_Reshape_Counts---------------------------
// This class defines counters to help identify when a method
// may/must be executed using hardware with only 24-bit precision.
struct Final_Reshape_Counts : public StackObj {
int _call_count ; // count non-inlined 'common' calls
int _float_count ; // count float ops requiring 24-bit precision
int _double_count ; // count double ops requiring more precision
int _java_call_count ; // count non-inlined 'java' calls
2009-07-23 14:53:56 -07:00
int _inner_loop_count ; // count loops which need alignment
2007-12-01 00:00:00 +00:00
VectorSet _visited ; // Visitation flags
Node_List _tests ; // Set of IfNodes & PCTableNodes
Final_Reshape_Counts ( ) :
2009-07-23 14:53:56 -07:00
_call_count ( 0 ) , _float_count ( 0 ) , _double_count ( 0 ) ,
_java_call_count ( 0 ) , _inner_loop_count ( 0 ) ,
2007-12-01 00:00:00 +00:00
_visited ( Thread : : current ( ) - > resource_area ( ) ) { }
void inc_call_count ( ) { _call_count + + ; }
void inc_float_count ( ) { _float_count + + ; }
void inc_double_count ( ) { _double_count + + ; }
void inc_java_call_count ( ) { _java_call_count + + ; }
2009-07-23 14:53:56 -07:00
void inc_inner_loop_count ( ) { _inner_loop_count + + ; }
2007-12-01 00:00:00 +00:00
int get_call_count ( ) const { return _call_count ; }
int get_float_count ( ) const { return _float_count ; }
int get_double_count ( ) const { return _double_count ; }
int get_java_call_count ( ) const { return _java_call_count ; }
2009-07-23 14:53:56 -07:00
int get_inner_loop_count ( ) const { return _inner_loop_count ; }
2007-12-01 00:00:00 +00:00
} ;
2013-04-04 10:01:26 -07:00
# ifdef ASSERT
2007-12-01 00:00:00 +00:00
static bool oop_offset_is_sane ( const TypeInstPtr * tp ) {
ciInstanceKlass * k = tp - > klass ( ) - > as_instance_klass ( ) ;
// Make sure the offset goes inside the instance layout.
6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
Compressed oops in instances, arrays, and headers. Code contributors are coleenp, phh, never, swamyv
Reviewed-by: jmasa, kamg, acorn, tbell, kvn, rasbold
2008-04-13 17:43:42 -04:00
return k - > contains_field_offset ( tp - > offset ( ) ) ;
2007-12-01 00:00:00 +00:00
// Note that OffsetBot and OffsetTop are very negative.
}
2013-04-04 10:01:26 -07:00
# endif
2007-12-01 00:00:00 +00:00
2011-04-05 19:14:03 -07:00
// Eliminate trivially redundant StoreCMs and accumulate their
// precedence edges.
2012-11-27 17:24:15 -08:00
void Compile : : eliminate_redundant_card_marks ( Node * n ) {
2011-04-05 19:14:03 -07:00
assert ( n - > Opcode ( ) = = Op_StoreCM , " expected StoreCM " ) ;
if ( n - > in ( MemNode : : Address ) - > outcnt ( ) > 1 ) {
// There are multiple users of the same address so it might be
// possible to eliminate some of the StoreCMs
Node * mem = n - > in ( MemNode : : Memory ) ;
Node * adr = n - > in ( MemNode : : Address ) ;
Node * val = n - > in ( MemNode : : ValueIn ) ;
Node * prev = n ;
bool done = false ;
// Walk the chain of StoreCMs eliminating ones that match. As
// long as it's a chain of single users then the optimization is
// safe. Eliminating partially redundant StoreCMs would require
// cloning copies down the other paths.
while ( mem - > Opcode ( ) = = Op_StoreCM & & mem - > outcnt ( ) = = 1 & & ! done ) {
if ( adr = = mem - > in ( MemNode : : Address ) & &
val = = mem - > in ( MemNode : : ValueIn ) ) {
// redundant StoreCM
if ( mem - > req ( ) > MemNode : : OopStore ) {
// Hasn't been processed by this code yet.
n - > add_prec ( mem - > in ( MemNode : : OopStore ) ) ;
} else {
// Already converted to precedence edge
for ( uint i = mem - > req ( ) ; i < mem - > len ( ) ; i + + ) {
// Accumulate any precedence edges
if ( mem - > in ( i ) ! = NULL ) {
n - > add_prec ( mem - > in ( i ) ) ;
}
}
// Everything above this point has been processed.
done = true ;
}
// Eliminate the previous StoreCM
prev - > set_req ( MemNode : : Memory , mem - > in ( MemNode : : Memory ) ) ;
assert ( mem - > outcnt ( ) = = 0 , " should be dead " ) ;
2012-11-27 17:24:15 -08:00
mem - > disconnect_inputs ( NULL , this ) ;
2011-04-05 19:14:03 -07:00
} else {
prev = mem ;
}
mem = prev - > in ( MemNode : : Memory ) ;
}
}
}
2007-12-01 00:00:00 +00:00
//------------------------------final_graph_reshaping_impl----------------------
// Implement items 1-5 from final_graph_reshaping below.
2012-11-27 17:24:15 -08:00
void Compile : : final_graph_reshaping_impl ( Node * n , Final_Reshape_Counts & frc ) {
2007-12-01 00:00:00 +00:00
2008-05-29 12:04:14 -07:00
if ( n - > outcnt ( ) = = 0 ) return ; // dead node
2007-12-01 00:00:00 +00:00
uint nop = n - > Opcode ( ) ;
// Check for 2-input instruction with "last use" on right input.
// Swap to left input. Implements item (2).
if ( n - > req ( ) = = 3 & & // two-input instruction
n - > in ( 1 ) - > outcnt ( ) > 1 & & // left use is NOT a last use
( ! n - > in ( 1 ) - > is_Phi ( ) | | n - > in ( 1 ) - > in ( 2 ) ! = n ) & & // it is not data loop
n - > in ( 2 ) - > outcnt ( ) = = 1 & & // right use IS a last use
! n - > in ( 2 ) - > is_Con ( ) ) { // right use is not a constant
// Check for commutative opcode
switch ( nop ) {
case Op_AddI : case Op_AddF : case Op_AddD : case Op_AddL :
case Op_MaxI : case Op_MinI :
case Op_MulI : case Op_MulF : case Op_MulD : case Op_MulL :
case Op_AndL : case Op_XorL : case Op_OrL :
case Op_AndI : case Op_XorI : case Op_OrI : {
// Move "last use" input to left by swapping inputs
n - > swap_edges ( 1 , 2 ) ;
break ;
}
default :
break ;
}
}
2010-06-15 18:07:27 -07:00
# ifdef ASSERT
if ( n - > is_Mem ( ) ) {
2012-11-27 17:24:15 -08:00
int alias_idx = get_alias_index ( n - > as_Mem ( ) - > adr_type ( ) ) ;
2010-06-15 18:07:27 -07:00
assert ( n - > in ( 0 ) ! = NULL | | alias_idx ! = Compile : : AliasIdxRaw | |
// oop will be recorded in oop map if load crosses safepoint
n - > is_Load ( ) & & ( n - > as_Load ( ) - > bottom_type ( ) - > isa_oopptr ( ) | |
LoadNode : : is_immutable_value ( n - > in ( MemNode : : Address ) ) ) ,
" raw memory operations should have control edge " ) ;
}
# endif
2007-12-01 00:00:00 +00:00
// Count FPU ops and common calls, implements item (3)
switch ( nop ) {
// Count all float operations that may use FPU
case Op_AddF :
case Op_SubF :
case Op_MulF :
case Op_DivF :
case Op_NegF :
case Op_ModF :
case Op_ConvI2F :
case Op_ConF :
case Op_CmpF :
case Op_CmpF3 :
// case Op_ConvL2F: // longs are split into 32-bit halves
2009-07-23 14:53:56 -07:00
frc . inc_float_count ( ) ;
2007-12-01 00:00:00 +00:00
break ;
case Op_ConvF2D :
case Op_ConvD2F :
2009-07-23 14:53:56 -07:00
frc . inc_float_count ( ) ;
frc . inc_double_count ( ) ;
2007-12-01 00:00:00 +00:00
break ;
// Count all double operations that may use FPU
case Op_AddD :
case Op_SubD :
case Op_MulD :
case Op_DivD :
case Op_NegD :
case Op_ModD :
case Op_ConvI2D :
case Op_ConvD2I :
// case Op_ConvL2D: // handled by leaf call
// case Op_ConvD2L: // handled by leaf call
case Op_ConD :
case Op_CmpD :
case Op_CmpD3 :
2009-07-23 14:53:56 -07:00
frc . inc_double_count ( ) ;
2007-12-01 00:00:00 +00:00
break ;
case Op_Opaque1 : // Remove Opaque Nodes before matching
case Op_Opaque2 : // Remove Opaque Nodes before matching
2014-03-20 17:49:27 -07:00
case Op_Opaque3 :
2012-11-27 17:24:15 -08:00
n - > subsume_by ( n - > in ( 1 ) , this ) ;
2007-12-01 00:00:00 +00:00
break ;
case Op_CallStaticJava :
case Op_CallJava :
case Op_CallDynamicJava :
2009-07-23 14:53:56 -07:00
frc . inc_java_call_count ( ) ; // Count java call site;
2007-12-01 00:00:00 +00:00
case Op_CallRuntime :
case Op_CallLeaf :
case Op_CallLeafNoFP : {
assert ( n - > is_Call ( ) , " " ) ;
CallNode * call = n - > as_Call ( ) ;
// Count call sites where the FP mode bit would have to be flipped.
// Do not count uncommon runtime calls:
// uncommon_trap, _complete_monitor_locking, _complete_monitor_unlocking,
// _new_Java, _new_typeArray, _new_objArray, _rethrow_Java, ...
if ( ! call - > is_CallStaticJava ( ) | | ! call - > as_CallStaticJava ( ) - > _name ) {
2009-07-23 14:53:56 -07:00
frc . inc_call_count ( ) ; // Count the call site
2007-12-01 00:00:00 +00:00
} else { // See if uncommon argument is shared
Node * n = call - > in ( TypeFunc : : Parms ) ;
int nop = n - > Opcode ( ) ;
// Clone shared simple arguments to uncommon calls, item (1).
if ( n - > outcnt ( ) > 1 & &
! n - > is_Proj ( ) & &
nop ! = Op_CreateEx & &
nop ! = Op_CheckCastPP & &
2008-09-10 18:23:32 -07:00
nop ! = Op_DecodeN & &
2012-10-09 10:11:38 +02:00
nop ! = Op_DecodeNKlass & &
2007-12-01 00:00:00 +00:00
! n - > is_Mem ( ) ) {
Node * x = n - > clone ( ) ;
call - > set_req ( TypeFunc : : Parms , x ) ;
}
}
break ;
}
case Op_StoreD :
case Op_LoadD :
case Op_LoadD_unaligned :
2009-07-23 14:53:56 -07:00
frc . inc_double_count ( ) ;
2007-12-01 00:00:00 +00:00
goto handle_mem ;
case Op_StoreF :
case Op_LoadF :
2009-07-23 14:53:56 -07:00
frc . inc_float_count ( ) ;
2007-12-01 00:00:00 +00:00
goto handle_mem ;
2011-04-05 19:14:03 -07:00
case Op_StoreCM :
{
// Convert OopStore dependence into precedence edge
Node * prec = n - > in ( MemNode : : OopStore ) ;
n - > del_req ( MemNode : : OopStore ) ;
n - > add_prec ( prec ) ;
eliminate_redundant_card_marks ( n ) ;
}
// fall through
2007-12-01 00:00:00 +00:00
case Op_StoreB :
case Op_StoreC :
case Op_StorePConditional :
case Op_StoreI :
case Op_StoreL :
2008-11-07 09:29:38 -08:00
case Op_StoreIConditional :
2007-12-01 00:00:00 +00:00
case Op_StoreLConditional :
case Op_CompareAndSwapI :
case Op_CompareAndSwapL :
case Op_CompareAndSwapP :
6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
Compressed oops in instances, arrays, and headers. Code contributors are coleenp, phh, never, swamyv
Reviewed-by: jmasa, kamg, acorn, tbell, kvn, rasbold
2008-04-13 17:43:42 -04:00
case Op_CompareAndSwapN :
2012-09-20 16:49:17 +02:00
case Op_GetAndAddI :
case Op_GetAndAddL :
case Op_GetAndSetI :
case Op_GetAndSetL :
case Op_GetAndSetP :
case Op_GetAndSetN :
2007-12-01 00:00:00 +00:00
case Op_StoreP :
6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
Compressed oops in instances, arrays, and headers. Code contributors are coleenp, phh, never, swamyv
Reviewed-by: jmasa, kamg, acorn, tbell, kvn, rasbold
2008-04-13 17:43:42 -04:00
case Op_StoreN :
2012-10-09 10:11:38 +02:00
case Op_StoreNKlass :
2007-12-01 00:00:00 +00:00
case Op_LoadB :
2009-03-09 03:17:11 -07:00
case Op_LoadUB :
2009-01-26 16:22:12 +01:00
case Op_LoadUS :
2007-12-01 00:00:00 +00:00
case Op_LoadI :
case Op_LoadKlass :
2008-05-21 13:46:23 -07:00
case Op_LoadNKlass :
2007-12-01 00:00:00 +00:00
case Op_LoadL :
case Op_LoadL_unaligned :
case Op_LoadPLocked :
case Op_LoadP :
6420645: Create a vm that uses compressed oops for up to 32gb heapsizes
Compressed oops in instances, arrays, and headers. Code contributors are coleenp, phh, never, swamyv
Reviewed-by: jmasa, kamg, acorn, tbell, kvn, rasbold
2008-04-13 17:43:42 -04:00
case Op_LoadN :
2007-12-01 00:00:00 +00:00
case Op_LoadRange :
case Op_LoadS : {
handle_mem :
# ifdef ASSERT
if ( VerifyOptoOopOffsets ) {
assert ( n - > is_Mem ( ) , " " ) ;
MemNode * mem = ( MemNode * ) n ;
// Check to see if address types have grounded out somehow.
const TypeInstPtr * tp = mem - > in ( MemNode : : Address ) - > bottom_type ( ) - > isa_instptr ( ) ;
assert ( ! tp | | oop_offset_is_sane ( tp ) , " " ) ;
}
# endif
break ;
}
case Op_AddP : { // Assert sane base pointers
2008-06-05 13:02:51 -07:00
Node * addp = n - > in ( AddPNode : : Address ) ;
2007-12-01 00:00:00 +00:00
assert ( ! addp - > is_AddP ( ) | |
addp - > in ( AddPNode : : Base ) - > is_top ( ) | | // Top OK for allocation
addp - > in ( AddPNode : : Base ) = = n - > in ( AddPNode : : Base ) ,
" Base pointers must match " ) ;
2008-06-05 13:02:51 -07:00
# ifdef _LP64
2013-08-12 17:37:02 +02:00
if ( ( UseCompressedOops | | UseCompressedClassPointers ) & &
2008-06-05 13:02:51 -07:00
addp - > Opcode ( ) = = Op_ConP & &
addp = = n - > in ( AddPNode : : Base ) & &
n - > in ( AddPNode : : Offset ) - > is_Con ( ) ) {
// Use addressing with narrow klass to load with offset on x86.
// On sparc loading 32-bits constant and decoding it have less
// instructions (4) then load 64-bits constant (7).
// Do this transformation here since IGVN will convert ConN back to ConP.
const Type * t = addp - > bottom_type ( ) ;
2012-10-09 10:11:38 +02:00
if ( t - > isa_oopptr ( ) | | t - > isa_klassptr ( ) ) {
2008-06-05 13:02:51 -07:00
Node * nn = NULL ;
2012-10-09 10:11:38 +02:00
int op = t - > isa_oopptr ( ) ? Op_ConN : Op_ConNKlass ;
2008-06-05 13:02:51 -07:00
// Look for existing ConN node of the same exact type.
2012-11-27 17:24:15 -08:00
Node * r = root ( ) ;
2008-06-05 13:02:51 -07:00
uint cnt = r - > outcnt ( ) ;
for ( uint i = 0 ; i < cnt ; i + + ) {
Node * m = r - > raw_out ( i ) ;
2012-10-09 10:11:38 +02:00
if ( m ! = NULL & & m - > Opcode ( ) = = op & &
2008-06-24 10:43:29 -07:00
m - > bottom_type ( ) - > make_ptr ( ) = = t ) {
2008-06-05 13:02:51 -07:00
nn = m ;
break ;
}
}
if ( nn ! = NULL ) {
// Decode a narrow oop to match address
// [R12 + narrow_oop_reg<<3 + offset]
2012-10-09 10:11:38 +02:00
if ( t - > isa_oopptr ( ) ) {
2014-06-02 08:07:29 +02:00
nn = new DecodeNNode ( nn , t ) ;
2012-10-09 10:11:38 +02:00
} else {
2014-06-02 08:07:29 +02:00
nn = new DecodeNKlassNode ( nn , t ) ;
2012-10-09 10:11:38 +02:00
}
2008-06-05 13:02:51 -07:00
n - > set_req ( AddPNode : : Base , nn ) ;
n - > set_req ( AddPNode : : Address , nn ) ;
if ( addp - > outcnt ( ) = = 0 ) {
2012-11-27 17:24:15 -08:00
addp - > disconnect_inputs ( NULL , this ) ;
2008-06-05 13:02:51 -07:00
}
}
}
}
# endif
2007-12-01 00:00:00 +00:00
break ;
}
2015-03-24 10:25:09 +01:00
case Op_CastPP : {
// Remove CastPP nodes to gain more freedom during scheduling but
// keep the dependency they encode as control or precedence edges
// (if control is set already) on memory operations. Some CastPP
// nodes don't have a control (don't carry a dependency): skip
// those.
if ( n - > in ( 0 ) ! = NULL ) {
ResourceMark rm ;
Unique_Node_List wq ;
wq . push ( n ) ;
for ( uint next = 0 ; next < wq . size ( ) ; + + next ) {
Node * m = wq . at ( next ) ;
for ( DUIterator_Fast imax , i = m - > fast_outs ( imax ) ; i < imax ; i + + ) {
Node * use = m - > fast_out ( i ) ;
if ( use - > is_Mem ( ) | | use - > is_EncodeNarrowPtr ( ) ) {
use - > ensure_control_or_add_prec ( n - > in ( 0 ) ) ;
} else if ( use - > in ( 0 ) = = NULL ) {
switch ( use - > Opcode ( ) ) {
case Op_AddP :
case Op_DecodeN :
case Op_DecodeNKlass :
case Op_CheckCastPP :
case Op_CastPP :
wq . push ( use ) ;
break ;
}
}
}
}
}
const bool is_LP64 = LP64_ONLY ( true ) NOT_LP64 ( false ) ;
if ( is_LP64 & & n - > in ( 1 ) - > is_DecodeN ( ) & & Matcher : : gen_narrow_oop_implicit_null_checks ( ) ) {
2008-09-23 12:29:06 -07:00
Node * in1 = n - > in ( 1 ) ;
const Type * t = n - > bottom_type ( ) ;
Node * new_in1 = in1 - > clone ( ) ;
new_in1 - > as_DecodeN ( ) - > set_type ( t ) ;
2010-06-02 09:49:32 -07:00
if ( ! Matcher : : narrow_oop_use_complex_address ( ) ) {
2008-09-23 12:29:06 -07:00
//
// x86, ARM and friends can handle 2 adds in addressing mode
// and Matcher can fold a DecodeN node into address by using
// a narrow oop directly and do implicit NULL check in address:
//
// [R12 + narrow_oop_reg<<3 + offset]
// NullCheck narrow_oop_reg
//
// On other platforms (Sparc) we have to keep new DecodeN node and
// use it to do implicit NULL check in address:
//
// decode_not_null narrow_oop_reg, base_reg
// [base_reg + offset]
// NullCheck base_reg
//
2009-02-27 13:27:09 -08:00
// Pin the new DecodeN node to non-null path on these platform (Sparc)
2008-09-23 12:29:06 -07:00
// to keep the information to which NULL check the new DecodeN node
// corresponds to use it as value in implicit_null_check().
//
new_in1 - > set_req ( 0 , n - > in ( 0 ) ) ;
}
2012-11-27 17:24:15 -08:00
n - > subsume_by ( new_in1 , this ) ;
2008-09-23 12:29:06 -07:00
if ( in1 - > outcnt ( ) = = 0 ) {
2012-11-27 17:24:15 -08:00
in1 - > disconnect_inputs ( NULL , this ) ;
2008-09-23 12:29:06 -07:00
}
2015-03-24 10:25:09 +01:00
} else {
n - > subsume_by ( n - > in ( 1 ) , this ) ;
if ( n - > outcnt ( ) = = 0 ) {
n - > disconnect_inputs ( NULL , this ) ;
}
2008-09-23 12:29:06 -07:00
}
break ;
2015-03-24 10:25:09 +01:00
}
# ifdef _LP64
2008-05-21 13:46:23 -07:00
case Op_CmpP :
2008-05-29 12:04:14 -07:00
// Do this transformation here to preserve CmpPNode::sub() and
// other TypePtr related Ideal optimizations (for example, ptr nullness).
2012-10-09 10:11:38 +02:00
if ( n - > in ( 1 ) - > is_DecodeNarrowPtr ( ) | | n - > in ( 2 ) - > is_DecodeNarrowPtr ( ) ) {
2008-09-10 18:23:32 -07:00
Node * in1 = n - > in ( 1 ) ;
Node * in2 = n - > in ( 2 ) ;
2012-10-09 10:11:38 +02:00
if ( ! in1 - > is_DecodeNarrowPtr ( ) ) {
2008-09-10 18:23:32 -07:00
in2 = in1 ;
in1 = n - > in ( 2 ) ;
}
2012-10-09 10:11:38 +02:00
assert ( in1 - > is_DecodeNarrowPtr ( ) , " sanity " ) ;
2008-09-10 18:23:32 -07:00
Node * new_in2 = NULL ;
2012-10-09 10:11:38 +02:00
if ( in2 - > is_DecodeNarrowPtr ( ) ) {
assert ( in2 - > Opcode ( ) = = in1 - > Opcode ( ) , " must be same node type " ) ;
2008-09-10 18:23:32 -07:00
new_in2 = in2 - > in ( 1 ) ;
} else if ( in2 - > Opcode ( ) = = Op_ConP ) {
const Type * t = in2 - > bottom_type ( ) ;
2010-06-02 09:49:32 -07:00
if ( t = = TypePtr : : NULL_PTR ) {
2012-10-09 10:11:38 +02:00
assert ( in1 - > is_DecodeN ( ) , " compare klass to null? " ) ;
2010-06-02 09:49:32 -07:00
// Don't convert CmpP null check into CmpN if compressed
// oops implicit null check is not generated.
// This will allow to generate normal oop implicit null check.
if ( Matcher : : gen_narrow_oop_implicit_null_checks ( ) )
2014-08-05 09:58:52 +02:00
new_in2 = ConNode : : make ( TypeNarrowOop : : NULL_PTR ) ;
2008-09-23 12:29:06 -07:00
//
// This transformation together with CastPP transformation above
// will generated code for implicit NULL checks for compressed oops.
//
// The original code after Optimize()
//
// LoadN memory, narrow_oop_reg
// decode narrow_oop_reg, base_reg
// CmpP base_reg, NULL
// CastPP base_reg // NotNull
// Load [base_reg + offset], val_reg
//
// after these transformations will be
//
// LoadN memory, narrow_oop_reg
// CmpN narrow_oop_reg, NULL
// decode_not_null narrow_oop_reg, base_reg
// Load [base_reg + offset], val_reg
//
// and the uncommon path (== NULL) will use narrow_oop_reg directly
// since narrow oops can be used in debug info now (see the code in
// final_graph_reshaping_walk()).
//
// At the end the code will be matched to
// on x86:
//
// Load_narrow_oop memory, narrow_oop_reg
// Load [R12 + narrow_oop_reg<<3 + offset], val_reg
// NullCheck narrow_oop_reg
//
// and on sparc:
//
// Load_narrow_oop memory, narrow_oop_reg
// decode_not_null narrow_oop_reg, base_reg
// Load [base_reg + offset], val_reg
// NullCheck base_reg
//
2008-05-21 13:46:23 -07:00
} else if ( t - > isa_oopptr ( ) ) {
2014-08-05 09:58:52 +02:00
new_in2 = ConNode : : make ( t - > make_narrowoop ( ) ) ;
2012-10-09 10:11:38 +02:00
} else if ( t - > isa_klassptr ( ) ) {
2014-08-05 09:58:52 +02:00
new_in2 = ConNode : : make ( t - > make_narrowklass ( ) ) ;
2008-05-21 13:46:23 -07:00
}
}
2008-09-10 18:23:32 -07:00
if ( new_in2 ! = NULL ) {
2014-06-02 08:07:29 +02:00
Node * cmpN = new CmpNNode ( in1 - > in ( 1 ) , new_in2 ) ;
2012-11-27 17:24:15 -08:00
n - > subsume_by ( cmpN , this ) ;
2008-09-10 18:23:32 -07:00
if ( in1 - > outcnt ( ) = = 0 ) {
2012-11-27 17:24:15 -08:00
in1 - > disconnect_inputs ( NULL , this ) ;
2008-09-10 18:23:32 -07:00
}
if ( in2 - > outcnt ( ) = = 0 ) {
2012-11-27 17:24:15 -08:00
in2 - > disconnect_inputs ( NULL , this ) ;
2008-09-10 18:23:32 -07:00
}
2008-05-21 13:46:23 -07:00
}
}
2008-08-01 10:06:45 -07:00
break ;
2008-09-23 12:29:06 -07:00
case Op_DecodeN :
2012-10-09 10:11:38 +02:00
case Op_DecodeNKlass :
assert ( ! n - > in ( 1 ) - > is_EncodeNarrowPtr ( ) , " should be optimized out " ) ;
2010-06-02 09:49:32 -07:00
// DecodeN could be pinned when it can't be fold into
2008-12-18 11:26:22 -08:00
// an address expression, see the code for Op_CastPP above.
2012-10-09 10:11:38 +02:00
assert ( n - > in ( 0 ) = = NULL | | ( UseCompressedOops & & ! Matcher : : narrow_oop_use_complex_address ( ) ) , " no control " ) ;
2008-09-23 12:29:06 -07:00
break ;
2012-10-09 10:11:38 +02:00
case Op_EncodeP :
case Op_EncodePKlass : {
2008-09-23 12:29:06 -07:00
Node * in1 = n - > in ( 1 ) ;
2012-10-09 10:11:38 +02:00
if ( in1 - > is_DecodeNarrowPtr ( ) ) {
2012-11-27 17:24:15 -08:00
n - > subsume_by ( in1 - > in ( 1 ) , this ) ;
2008-09-23 12:29:06 -07:00
} else if ( in1 - > Opcode ( ) = = Op_ConP ) {
const Type * t = in1 - > bottom_type ( ) ;
if ( t = = TypePtr : : NULL_PTR ) {
2012-10-09 10:11:38 +02:00
assert ( t - > isa_oopptr ( ) , " null klass? " ) ;
2014-08-05 09:58:52 +02:00
n - > subsume_by ( ConNode : : make ( TypeNarrowOop : : NULL_PTR ) , this ) ;
2008-09-23 12:29:06 -07:00
} else if ( t - > isa_oopptr ( ) ) {
2014-08-05 09:58:52 +02:00
n - > subsume_by ( ConNode : : make ( t - > make_narrowoop ( ) ) , this ) ;
2012-10-09 10:11:38 +02:00
} else if ( t - > isa_klassptr ( ) ) {
2014-08-05 09:58:52 +02:00
n - > subsume_by ( ConNode : : make ( t - > make_narrowklass ( ) ) , this ) ;
2008-09-23 12:29:06 -07:00
}
}
if ( in1 - > outcnt ( ) = = 0 ) {
2012-11-27 17:24:15 -08:00
in1 - > disconnect_inputs ( NULL , this ) ;
2008-09-23 12:29:06 -07:00
}
break ;
}
2009-11-12 09:24:21 -08:00
case Op_Proj : {
if ( OptimizeStringConcat ) {
ProjNode * p = n - > as_Proj ( ) ;
if ( p - > _is_io_use ) {
// Separate projections were used for the exception path which
// are normally removed by a late inline. If it wasn't inlined
// then they will hang around and should just be replaced with
// the original one.
Node * proj = NULL ;
// Replace with just one
for ( SimpleDUIterator i ( p - > in ( 0 ) ) ; i . has_next ( ) ; i . next ( ) ) {
Node * use = i . get ( ) ;
if ( use - > is_Proj ( ) & & p ! = use & & use - > as_Proj ( ) - > _con = = p - > _con ) {
proj = use ;
break ;
}
}
2011-12-27 15:08:43 -08:00
assert ( proj ! = NULL , " must be found " ) ;
2012-11-27 17:24:15 -08:00
p - > subsume_by ( proj , this ) ;
2009-11-12 09:24:21 -08:00
}
}
break ;
}
2008-09-23 12:29:06 -07:00
case Op_Phi :
2012-10-09 10:11:38 +02:00
if ( n - > as_Phi ( ) - > bottom_type ( ) - > isa_narrowoop ( ) | | n - > as_Phi ( ) - > bottom_type ( ) - > isa_narrowklass ( ) ) {
2008-09-23 12:29:06 -07:00
// The EncodeP optimization may create Phi with the same edges
// for all paths. It is not handled well by Register Allocator.
Node * unique_in = n - > in ( 1 ) ;
assert ( unique_in ! = NULL , " " ) ;
uint cnt = n - > req ( ) ;
for ( uint i = 2 ; i < cnt ; i + + ) {
Node * m = n - > in ( i ) ;
assert ( m ! = NULL , " " ) ;
if ( unique_in ! = m )
unique_in = NULL ;
}
if ( unique_in ! = NULL ) {
2012-11-27 17:24:15 -08:00
n - > subsume_by ( unique_in , this ) ;
2008-09-23 12:29:06 -07:00
}
}
break ;
2008-05-21 13:46:23 -07:00
# endif
2007-12-01 00:00:00 +00:00
case Op_ModI :
if ( UseDivMod ) {
// Check if a%b and a/b both exist
Node * d = n - > find_similar ( Op_DivI ) ;
if ( d ) {
// Replace them with a fused divmod if supported
if ( Matcher : : has_match_rule ( Op_DivModI ) ) {
2014-08-05 09:58:52 +02:00
DivModINode * divmod = DivModINode : : make ( n ) ;
2012-11-27 17:24:15 -08:00
d - > subsume_by ( divmod - > div_proj ( ) , this ) ;
n - > subsume_by ( divmod - > mod_proj ( ) , this ) ;
2007-12-01 00:00:00 +00:00
} else {
// replace a%b with a-((a/b)*b)
2014-06-02 08:07:29 +02:00
Node * mult = new MulINode ( d , d - > in ( 2 ) ) ;
Node * sub = new SubINode ( d - > in ( 1 ) , mult ) ;
2012-11-27 17:24:15 -08:00
n - > subsume_by ( sub , this ) ;
2007-12-01 00:00:00 +00:00
}
}
}
break ;
case Op_ModL :
if ( UseDivMod ) {
// Check if a%b and a/b both exist
Node * d = n - > find_similar ( Op_DivL ) ;
if ( d ) {
// Replace them with a fused divmod if supported
if ( Matcher : : has_match_rule ( Op_DivModL ) ) {
2014-08-05 09:58:52 +02:00
DivModLNode * divmod = DivModLNode : : make ( n ) ;
2012-11-27 17:24:15 -08:00
d - > subsume_by ( divmod - > div_proj ( ) , this ) ;
n - > subsume_by ( divmod - > mod_proj ( ) , this ) ;
2007-12-01 00:00:00 +00:00
} else {
// replace a%b with a-((a/b)*b)
2014-06-02 08:07:29 +02:00
Node * mult = new MulLNode ( d , d - > in ( 2 ) ) ;
Node * sub = new SubLNode ( d - > in ( 1 ) , mult ) ;
2012-11-27 17:24:15 -08:00
n - > subsume_by ( sub , this ) ;
2007-12-01 00:00:00 +00:00
}
}
}
break ;
2012-06-15 01:25:19 -07:00
case Op_LoadVector :
case Op_StoreVector :
2007-12-01 00:00:00 +00:00
break ;
2015-04-01 18:07:50 -07:00
case Op_AddReductionVI :
case Op_AddReductionVL :
case Op_AddReductionVF :
case Op_AddReductionVD :
case Op_MulReductionVI :
2015-05-08 11:49:20 -07:00
case Op_MulReductionVL :
2015-04-01 18:07:50 -07:00
case Op_MulReductionVF :
case Op_MulReductionVD :
break ;
2007-12-01 00:00:00 +00:00
case Op_PackB :
case Op_PackS :
case Op_PackI :
case Op_PackF :
case Op_PackL :
case Op_PackD :
if ( n - > req ( ) - 1 > 2 ) {
// Replace many operand PackNodes with a binary tree for matching
PackNode * p = ( PackNode * ) n ;
2014-08-05 09:58:52 +02:00
Node * btp = p - > binary_tree_pack ( 1 , n - > req ( ) ) ;
2012-11-27 17:24:15 -08:00
n - > subsume_by ( btp , this ) ;
2007-12-01 00:00:00 +00:00
}
break ;
2009-07-23 14:53:56 -07:00
case Op_Loop :
case Op_CountedLoop :
if ( n - > as_Loop ( ) - > is_inner_loop ( ) ) {
frc . inc_inner_loop_count ( ) ;
}
break ;
2011-03-25 09:35:39 +01:00
case Op_LShiftI :
case Op_RShiftI :
case Op_URShiftI :
case Op_LShiftL :
case Op_RShiftL :
case Op_URShiftL :
if ( Matcher : : need_masked_shift_count ) {
// The cpu's shift instructions don't restrict the count to the
// lower 5/6 bits. We need to do the masking ourselves.
Node * in2 = n - > in ( 2 ) ;
juint mask = ( n - > bottom_type ( ) = = TypeInt : : INT ) ? ( BitsPerInt - 1 ) : ( BitsPerLong - 1 ) ;
const TypeInt * t = in2 - > find_int_type ( ) ;
if ( t ! = NULL & & t - > is_con ( ) ) {
juint shift = t - > get_con ( ) ;
if ( shift > mask ) { // Unsigned cmp
2014-08-05 09:58:52 +02:00
n - > set_req ( 2 , ConNode : : make ( TypeInt : : make ( shift & mask ) ) ) ;
2011-03-25 09:35:39 +01:00
}
} else {
if ( t = = NULL | | t - > _lo < 0 | | t - > _hi > ( int ) mask ) {
2014-08-05 09:58:52 +02:00
Node * shift = new AndINode ( in2 , ConNode : : make ( TypeInt : : make ( mask ) ) ) ;
2011-03-25 09:35:39 +01:00
n - > set_req ( 2 , shift ) ;
}
}
if ( in2 - > outcnt ( ) = = 0 ) { // Remove dead node
2012-11-27 17:24:15 -08:00
in2 - > disconnect_inputs ( NULL , this ) ;
2011-03-25 09:35:39 +01:00
}
}
break ;
2013-03-06 10:28:38 +01:00
case Op_MemBarStoreStore :
2013-05-08 15:08:01 -07:00
case Op_MemBarRelease :
2013-03-06 10:28:38 +01:00
// Break the link with AllocateNode: it is no longer useful and
// confuses register allocation.
if ( n - > req ( ) > MemBarNode : : Precedent ) {
n - > set_req ( MemBarNode : : Precedent , top ( ) ) ;
}
break ;
2007-12-01 00:00:00 +00:00
default :
assert ( ! n - > is_Call ( ) , " " ) ;
assert ( ! n - > is_Mem ( ) , " " ) ;
2015-01-29 10:25:59 -08:00
assert ( nop ! = Op_ProfileBoolean , " should be eliminated during IGVN " ) ;
2007-12-01 00:00:00 +00:00
break ;
}
2008-04-24 11:13:03 -07:00
// Collect CFG split points
if ( n - > is_MultiBranch ( ) )
2009-07-23 14:53:56 -07:00
frc . _tests . push ( n ) ;
2007-12-01 00:00:00 +00:00
}
//------------------------------final_graph_reshaping_walk---------------------
// Replacing Opaque nodes with their input in final_graph_reshaping_impl(),
// requires that the walk visits a node's inputs before visiting the node.
2012-11-27 17:24:15 -08:00
void Compile : : final_graph_reshaping_walk ( Node_Stack & nstack , Node * root , Final_Reshape_Counts & frc ) {
2008-09-10 18:23:32 -07:00
ResourceArea * area = Thread : : current ( ) - > resource_area ( ) ;
Unique_Node_List sfpt ( area ) ;
2009-07-23 14:53:56 -07:00
frc . _visited . set ( root - > _idx ) ; // first, mark node as visited
2007-12-01 00:00:00 +00:00
uint cnt = root - > req ( ) ;
Node * n = root ;
uint i = 0 ;
while ( true ) {
if ( i < cnt ) {
// Place all non-visited non-null inputs onto stack
Node * m = n - > in ( i ) ;
+ + i ;
2009-07-23 14:53:56 -07:00
if ( m ! = NULL & & ! frc . _visited . test_set ( m - > _idx ) ) {
2014-04-01 09:36:49 +02:00
if ( m - > is_SafePoint ( ) & & m - > as_SafePoint ( ) - > jvms ( ) ! = NULL ) {
// compute worst case interpreter size in case of a deoptimization
update_interpreter_frame_size ( m - > as_SafePoint ( ) - > jvms ( ) - > interpreter_frame_size ( ) ) ;
2008-09-10 18:23:32 -07:00
sfpt . push ( m ) ;
2014-04-01 09:36:49 +02:00
}
2007-12-01 00:00:00 +00:00
cnt = m - > req ( ) ;
nstack . push ( n , i ) ; // put on stack parent and next input's index
n = m ;
i = 0 ;
}
} else {
// Now do post-visit work
2009-07-23 14:53:56 -07:00
final_graph_reshaping_impl ( n , frc ) ;
2007-12-01 00:00:00 +00:00
if ( nstack . is_empty ( ) )
break ; // finished
n = nstack . node ( ) ; // Get node from stack
cnt = n - > req ( ) ;
i = nstack . index ( ) ;
nstack . pop ( ) ; // Shift to the next node on stack
}
}
2008-09-10 18:23:32 -07:00
2010-06-02 09:49:32 -07:00
// Skip next transformation if compressed oops are not used.
2012-10-09 10:11:38 +02:00
if ( ( UseCompressedOops & & ! Matcher : : gen_narrow_oop_implicit_null_checks ( ) ) | |
2013-08-12 17:37:02 +02:00
( ! UseCompressedOops & & ! UseCompressedClassPointers ) )
2010-06-02 09:49:32 -07:00
return ;
2012-10-09 10:11:38 +02:00
// Go over safepoints nodes to skip DecodeN/DecodeNKlass nodes for debug edges.
2008-09-10 18:23:32 -07:00
// It could be done for an uncommon traps or any safepoints/calls
2012-10-09 10:11:38 +02:00
// if the DecodeN/DecodeNKlass node is referenced only in a debug info.
2008-09-10 18:23:32 -07:00
while ( sfpt . size ( ) > 0 ) {
n = sfpt . pop ( ) ;
JVMState * jvms = n - > as_SafePoint ( ) - > jvms ( ) ;
assert ( jvms ! = NULL , " sanity " ) ;
int start = jvms - > debug_start ( ) ;
int end = n - > req ( ) ;
bool is_uncommon = ( n - > is_CallStaticJava ( ) & &
n - > as_CallStaticJava ( ) - > uncommon_trap_request ( ) ! = 0 ) ;
for ( int j = start ; j < end ; j + + ) {
Node * in = n - > in ( j ) ;
2012-10-09 10:11:38 +02:00
if ( in - > is_DecodeNarrowPtr ( ) ) {
2008-09-10 18:23:32 -07:00
bool safe_to_skip = true ;
if ( ! is_uncommon ) {
// Is it safe to skip?
for ( uint i = 0 ; i < in - > outcnt ( ) ; i + + ) {
Node * u = in - > raw_out ( i ) ;
if ( ! u - > is_SafePoint ( ) | |
u - > is_Call ( ) & & u - > as_Call ( ) - > has_non_debug_use ( n ) ) {
safe_to_skip = false ;
}
}
}
if ( safe_to_skip ) {
n - > set_req ( j , in - > in ( 1 ) ) ;
}
if ( in - > outcnt ( ) = = 0 ) {
2012-11-27 17:24:15 -08:00
in - > disconnect_inputs ( NULL , this ) ;
2008-09-10 18:23:32 -07:00
}
}
}
}
2007-12-01 00:00:00 +00:00
}
//------------------------------final_graph_reshaping--------------------------
// Final Graph Reshaping.
//
// (1) Clone simple inputs to uncommon calls, so they can be scheduled late
// and not commoned up and forced early. Must come after regular
// optimizations to avoid GVN undoing the cloning. Clone constant
// inputs to Loop Phis; these will be split by the allocator anyways.
// Remove Opaque nodes.
// (2) Move last-uses by commutative operations to the left input to encourage
// Intel update-in-place two-address operations and better register usage
// on RISCs. Must come after regular optimizations to avoid GVN Ideal
// calls canonicalizing them back.
// (3) Count the number of double-precision FP ops, single-precision FP ops
// and call sites. On Intel, we can get correct rounding either by
// forcing singles to memory (requires extra stores and loads after each
// FP bytecode) or we can set a rounding mode bit (requires setting and
// clearing the mode bit around call sites). The mode bit is only used
// if the relative frequency of single FP ops to calls is low enough.
// This is a key transform for SPEC mpeg_audio.
// (4) Detect infinite loops; blobs of code reachable from above but not
// below. Several of the Code_Gen algorithms fail on such code shapes,
// so we simply bail out. Happens a lot in ZKM.jar, but also happens
// from time to time in other codes (such as -Xcomp finalizer loops, etc).
// Detection is by looking for IfNodes where only 1 projection is
// reachable from below or CatchNodes missing some targets.
// (5) Assert for insane oop offsets in debug mode.
bool Compile : : final_graph_reshaping ( ) {
// an infinite loop may have been eliminated by the optimizer,
// in which case the graph will be empty.
if ( root ( ) - > req ( ) = = 1 ) {
record_method_not_compilable ( " trivial infinite loop " ) ;
return true ;
}
2013-02-12 12:56:11 +01:00
// Expensive nodes have their control input set to prevent the GVN
// from freely commoning them. There's no GVN beyond this point so
// no need to keep the control input. We want the expensive nodes to
// be freely moved to the least frequent code path by gcm.
assert ( OptimizeExpensiveOps | | expensive_count ( ) = = 0 , " optimization off but list non empty? " ) ;
for ( int i = 0 ; i < expensive_count ( ) ; i + + ) {
_expensive_nodes - > at ( i ) - > set_req ( 0 , NULL ) ;
}
2009-07-23 14:53:56 -07:00
Final_Reshape_Counts frc ;
2007-12-01 00:00:00 +00:00
// Visit everybody reachable!
2015-10-08 12:10:19 +02:00
// Allocate stack of size C->live_nodes()/2 to avoid frequent realloc
2015-08-10 10:39:19 -07:00
Node_Stack nstack ( live_nodes ( ) > > 1 ) ;
2009-07-23 14:53:56 -07:00
final_graph_reshaping_walk ( nstack , root ( ) , frc ) ;
2007-12-01 00:00:00 +00:00
// Check for unreachable (from below) code (i.e., infinite loops).
2009-07-23 14:53:56 -07:00
for ( uint i = 0 ; i < frc . _tests . size ( ) ; i + + ) {
MultiBranchNode * n = frc . _tests [ i ] - > as_MultiBranch ( ) ;
2008-04-24 11:13:03 -07:00
// Get number of CFG targets.
2007-12-01 00:00:00 +00:00
// Note that PCTables include exception targets after calls.
2008-04-24 11:13:03 -07:00
uint required_outcnt = n - > required_outcnt ( ) ;
if ( n - > outcnt ( ) ! = required_outcnt ) {
2007-12-01 00:00:00 +00:00
// Check for a few special cases. Rethrow Nodes never take the
// 'fall-thru' path, so expected kids is 1 less.
if ( n - > is_PCTable ( ) & & n - > in ( 0 ) & & n - > in ( 0 ) - > in ( 0 ) ) {
if ( n - > in ( 0 ) - > in ( 0 ) - > is_Call ( ) ) {
CallNode * call = n - > in ( 0 ) - > in ( 0 ) - > as_Call ( ) ;
if ( call - > entry_point ( ) = = OptoRuntime : : rethrow_stub ( ) ) {
2008-04-24 11:13:03 -07:00
required_outcnt - - ; // Rethrow always has 1 less kid
2007-12-01 00:00:00 +00:00
} else if ( call - > req ( ) > TypeFunc : : Parms & &
call - > is_CallDynamicJava ( ) ) {
// Check for null receiver. In such case, the optimizer has
// detected that the virtual call will always result in a null
// pointer exception. The fall-through projection of this CatchNode
// will not be populated.
Node * arg0 = call - > in ( TypeFunc : : Parms ) ;
if ( arg0 - > is_Type ( ) & &
arg0 - > as_Type ( ) - > type ( ) - > higher_equal ( TypePtr : : NULL_PTR ) ) {
2008-04-24 11:13:03 -07:00
required_outcnt - - ;
2007-12-01 00:00:00 +00:00
}
} else if ( call - > entry_point ( ) = = OptoRuntime : : new_array_Java ( ) & &
call - > req ( ) > TypeFunc : : Parms + 1 & &
call - > is_CallStaticJava ( ) ) {
// Check for negative array length. In such case, the optimizer has
// detected that the allocation attempt will always result in an
// exception. There is no fall-through projection of this CatchNode .
Node * arg1 = call - > in ( TypeFunc : : Parms + 1 ) ;
if ( arg1 - > is_Type ( ) & &
arg1 - > as_Type ( ) - > type ( ) - > join ( TypeInt : : POS ) - > empty ( ) ) {
2008-04-24 11:13:03 -07:00
required_outcnt - - ;
2007-12-01 00:00:00 +00:00
}
}
}
}
2008-04-24 11:13:03 -07:00
// Recheck with a better notion of 'required_outcnt'
if ( n - > outcnt ( ) ! = required_outcnt ) {
2007-12-01 00:00:00 +00:00
record_method_not_compilable ( " malformed control flow " ) ;
return true ; // Not all targets reachable!
}
}
// Check that I actually visited all kids. Unreached kids
// must be infinite loops.
for ( DUIterator_Fast jmax , j = n - > fast_outs ( jmax ) ; j < jmax ; j + + )
2009-07-23 14:53:56 -07:00
if ( ! frc . _visited . test ( n - > fast_out ( j ) - > _idx ) ) {
2007-12-01 00:00:00 +00:00
record_method_not_compilable ( " infinite loop " ) ;
return true ; // Found unvisited kid; must be unreach
}
}
// If original bytecodes contained a mixture of floats and doubles
// check if the optimizer has made it homogenous, item (3).
2009-08-19 18:54:35 -07:00
if ( Use24BitFPMode & & Use24BitFP & & UseSSE = = 0 & &
2009-07-23 14:53:56 -07:00
frc . get_float_count ( ) > 32 & &
frc . get_double_count ( ) = = 0 & &
( 10 * frc . get_call_count ( ) < frc . get_float_count ( ) ) ) {
2007-12-01 00:00:00 +00:00
set_24_bit_selection_and_mode ( false , true ) ;
}
2009-07-23 14:53:56 -07:00
set_java_calls ( frc . get_java_call_count ( ) ) ;
set_inner_loops ( frc . get_inner_loop_count ( ) ) ;
2007-12-01 00:00:00 +00:00
// No infinite loops, no reason to bail out.
return false ;
}
//-----------------------------too_many_traps----------------------------------
// Report if there are too many traps at the current method and bci.
// Return true if there was a trap, and/or PerMethodTrapLimit is exceeded.
bool Compile : : too_many_traps ( ciMethod * method ,
int bci ,
Deoptimization : : DeoptReason reason ) {
ciMethodData * md = method - > method_data ( ) ;
if ( md - > is_empty ( ) ) {
// Assume the trap has not occurred, or that it occurred only
// because of a transient condition during start-up in the interpreter.
return false ;
}
2014-02-25 18:16:24 +01:00
ciMethod * m = Deoptimization : : reason_is_speculate ( reason ) ? this - > method ( ) : NULL ;
if ( md - > has_trap_at ( bci , m , reason ) ! = 0 ) {
2007-12-01 00:00:00 +00:00
// Assume PerBytecodeTrapLimit==0, for a more conservative heuristic.
// Also, if there are multiple reasons, or if there is no per-BCI record,
// assume the worst.
if ( log ( ) )
log ( ) - > elem ( " observe trap='%s' count='%d' " ,
Deoptimization : : trap_reason_name ( reason ) ,
md - > trap_count ( reason ) ) ;
return true ;
} else {
// Ignore method/bci and see if there have been too many globally.
return too_many_traps ( reason , md ) ;
}
}
// Less-accurate variant which does not require a method and bci.
bool Compile : : too_many_traps ( Deoptimization : : DeoptReason reason ,
ciMethodData * logmd ) {
2014-02-25 18:16:24 +01:00
if ( trap_count ( reason ) > = Deoptimization : : per_method_trap_limit ( reason ) ) {
2007-12-01 00:00:00 +00:00
// Too many traps globally.
// Note that we use cumulative trap_count, not just md->trap_count.
if ( log ( ) ) {
int mcount = ( logmd = = NULL ) ? - 1 : ( int ) logmd - > trap_count ( reason ) ;
log ( ) - > elem ( " observe trap='%s' count='0' mcount='%d' ccount='%d' " ,
Deoptimization : : trap_reason_name ( reason ) ,
mcount , trap_count ( reason ) ) ;
}
return true ;
} else {
// The coast is clear.
return false ;
}
}
//--------------------------too_many_recompiles--------------------------------
// Report if there are too many recompiles at the current method and bci.
// Consults PerBytecodeRecompilationCutoff and PerMethodRecompilationCutoff.
// Is not eager to return true, since this will cause the compiler to use
// Action_none for a trap point, to avoid too many recompilations.
bool Compile : : too_many_recompiles ( ciMethod * method ,
int bci ,
Deoptimization : : DeoptReason reason ) {
ciMethodData * md = method - > method_data ( ) ;
if ( md - > is_empty ( ) ) {
// Assume the trap has not occurred, or that it occurred only
// because of a transient condition during start-up in the interpreter.
return false ;
}
// Pick a cutoff point well within PerBytecodeRecompilationCutoff.
uint bc_cutoff = ( uint ) PerBytecodeRecompilationCutoff / 8 ;
uint m_cutoff = ( uint ) PerMethodRecompilationCutoff / 2 + 1 ; // not zero
Deoptimization : : DeoptReason per_bc_reason
= Deoptimization : : reason_recorded_per_bytecode_if_any ( reason ) ;
2014-02-25 18:16:24 +01:00
ciMethod * m = Deoptimization : : reason_is_speculate ( reason ) ? this - > method ( ) : NULL ;
2007-12-01 00:00:00 +00:00
if ( ( per_bc_reason = = Deoptimization : : Reason_none
2014-02-25 18:16:24 +01:00
| | md - > has_trap_at ( bci , m , reason ) ! = 0 )
2007-12-01 00:00:00 +00:00
// The trap frequency measure we care about is the recompile count:
2014-02-25 18:16:24 +01:00
& & md - > trap_recompiled_at ( bci , m )
2007-12-01 00:00:00 +00:00
& & md - > overflow_recompile_count ( ) > = bc_cutoff ) {
// Do not emit a trap here if it has already caused recompilations.
// Also, if there are multiple reasons, or if there is no per-BCI record,
// assume the worst.
if ( log ( ) )
log ( ) - > elem ( " observe trap='%s recompiled' count='%d' recompiles2='%d' " ,
Deoptimization : : trap_reason_name ( reason ) ,
md - > trap_count ( reason ) ,
md - > overflow_recompile_count ( ) ) ;
return true ;
} else if ( trap_count ( reason ) ! = 0
& & decompile_count ( ) > = m_cutoff ) {
// Too many recompiles globally, and we have seen this sort of trap.
// Use cumulative decompile_count, not just md->decompile_count.
if ( log ( ) )
log ( ) - > elem ( " observe trap='%s' count='%d' mcount='%d' decompiles='%d' mdecompiles='%d' " ,
Deoptimization : : trap_reason_name ( reason ) ,
md - > trap_count ( reason ) , trap_count ( reason ) ,
md - > decompile_count ( ) , decompile_count ( ) ) ;
return true ;
} else {
// The coast is clear.
return false ;
}
}
2013-11-27 16:16:21 -08:00
// Compute when not to trap. Used by matching trap based nodes and
// NullCheck optimization.
void Compile : : set_allowed_deopt_reasons ( ) {
_allowed_reasons = 0 ;
if ( is_method_compilation ( ) ) {
for ( int rs = ( int ) Deoptimization : : Reason_none + 1 ; rs < Compile : : trapHistLength ; rs + + ) {
assert ( rs < BitsPerInt , " recode bit map " ) ;
if ( ! too_many_traps ( ( Deoptimization : : DeoptReason ) rs ) ) {
_allowed_reasons | = nth_bit ( rs ) ;
}
}
}
}
2007-12-01 00:00:00 +00:00
# ifndef PRODUCT
//------------------------------verify_graph_edges---------------------------
// Walk the Graph and verify that there is a one-to-one correspondence
// between Use-Def edges and Def-Use edges in the graph.
void Compile : : verify_graph_edges ( bool no_dead_code ) {
if ( VerifyGraphEdges ) {
ResourceArea * area = Thread : : current ( ) - > resource_area ( ) ;
Unique_Node_List visited ( area ) ;
// Call recursive graph walk to check edges
_root - > verify_edges ( visited ) ;
if ( no_dead_code ) {
// Now make sure that no visited node is used by an unvisited node.
2014-06-20 08:14:30 +02:00
bool dead_nodes = false ;
2007-12-01 00:00:00 +00:00
Unique_Node_List checked ( area ) ;
while ( visited . size ( ) > 0 ) {
Node * n = visited . pop ( ) ;
checked . push ( n ) ;
for ( uint i = 0 ; i < n - > outcnt ( ) ; i + + ) {
Node * use = n - > raw_out ( i ) ;
if ( checked . member ( use ) ) continue ; // already checked
if ( visited . member ( use ) ) continue ; // already in the graph
if ( use - > is_Con ( ) ) continue ; // a dead ConNode is OK
// At this point, we have found a dead node which is DU-reachable.
2014-06-20 08:14:30 +02:00
if ( ! dead_nodes ) {
2007-12-01 00:00:00 +00:00
tty - > print_cr ( " *** Dead nodes reachable via DU edges: " ) ;
2014-06-20 08:14:30 +02:00
dead_nodes = true ;
}
2007-12-01 00:00:00 +00:00
use - > dump ( 2 ) ;
tty - > print_cr ( " --- " ) ;
checked . push ( use ) ; // No repeats; pretend it is now checked.
}
}
2014-06-20 08:14:30 +02:00
assert ( ! dead_nodes , " using nodes must be reachable from root " ) ;
2007-12-01 00:00:00 +00:00
}
}
}
2013-11-05 01:57:18 -08:00
// Verify GC barriers consistency
// Currently supported:
// - G1 pre-barriers (see GraphKit::g1_write_barrier_pre())
void Compile : : verify_barriers ( ) {
if ( UseG1GC ) {
// Verify G1 pre-barriers
2015-11-17 16:40:52 -05:00
const int marking_offset = in_bytes ( JavaThread : : satb_mark_queue_offset ( ) + SATBMarkQueue : : byte_offset_of_active ( ) ) ;
2013-11-05 01:57:18 -08:00
ResourceArea * area = Thread : : current ( ) - > resource_area ( ) ;
Unique_Node_List visited ( area ) ;
Node_List worklist ( area ) ;
// We're going to walk control flow backwards starting from the Root
worklist . push ( _root ) ;
while ( worklist . size ( ) > 0 ) {
Node * x = worklist . pop ( ) ;
if ( x = = NULL | | x = = top ( ) ) continue ;
if ( visited . member ( x ) ) {
continue ;
} else {
visited . push ( x ) ;
}
if ( x - > is_Region ( ) ) {
for ( uint i = 1 ; i < x - > req ( ) ; i + + ) {
worklist . push ( x - > in ( i ) ) ;
}
} else {
worklist . push ( x - > in ( 0 ) ) ;
// We are looking for the pattern:
// /->ThreadLocal
// If->Bool->CmpI->LoadB->AddP->ConL(marking_offset)
// \->ConI(0)
// We want to verify that the If and the LoadB have the same control
// See GraphKit::g1_write_barrier_pre()
if ( x - > is_If ( ) ) {
IfNode * iff = x - > as_If ( ) ;
if ( iff - > in ( 1 ) - > is_Bool ( ) & & iff - > in ( 1 ) - > in ( 1 ) - > is_Cmp ( ) ) {
CmpNode * cmp = iff - > in ( 1 ) - > in ( 1 ) - > as_Cmp ( ) ;
if ( cmp - > Opcode ( ) = = Op_CmpI & & cmp - > in ( 2 ) - > is_Con ( ) & & cmp - > in ( 2 ) - > bottom_type ( ) - > is_int ( ) - > get_con ( ) = = 0
& & cmp - > in ( 1 ) - > is_Load ( ) ) {
LoadNode * load = cmp - > in ( 1 ) - > as_Load ( ) ;
if ( load - > Opcode ( ) = = Op_LoadB & & load - > in ( 2 ) - > is_AddP ( ) & & load - > in ( 2 ) - > in ( 2 ) - > Opcode ( ) = = Op_ThreadLocal
& & load - > in ( 2 ) - > in ( 3 ) - > is_Con ( )
& & load - > in ( 2 ) - > in ( 3 ) - > bottom_type ( ) - > is_intptr_t ( ) - > get_con ( ) = = marking_offset ) {
Node * if_ctrl = iff - > in ( 0 ) ;
Node * load_ctrl = load - > in ( 0 ) ;
if ( if_ctrl ! = load_ctrl ) {
// Skip possible CProj->NeverBranch in infinite loops
if ( ( if_ctrl - > is_Proj ( ) & & if_ctrl - > Opcode ( ) = = Op_CProj )
& & ( if_ctrl - > in ( 0 ) - > is_MultiBranch ( ) & & if_ctrl - > in ( 0 ) - > Opcode ( ) = = Op_NeverBranch ) ) {
if_ctrl = if_ctrl - > in ( 0 ) - > in ( 0 ) ;
}
}
assert ( load_ctrl ! = NULL & & if_ctrl = = load_ctrl , " controls must match " ) ;
}
}
}
}
}
}
}
}
2007-12-01 00:00:00 +00:00
# endif
// The Compile object keeps track of failure reasons separately from the ciEnv.
// This is required because there is not quite a 1-1 relation between the
// ciEnv and its compilation task and the Compile object. Note that one
// ciEnv might use two Compile objects, if C2Compiler::compile_method decides
// to backtrack and retry without subsuming loads. Other than this backtracking
// behavior, the Compile's failure reason is quietly copied up to the ciEnv
// by the logic in C2Compiler.
void Compile : : record_failure ( const char * reason ) {
if ( log ( ) ! = NULL ) {
log ( ) - > elem ( " failure reason='%s' phase='compile' " , reason ) ;
}
if ( _failure_reason = = NULL ) {
// Record the first failure reason.
_failure_reason = reason ;
}
2013-06-10 11:30:51 +02:00
2008-06-24 16:00:14 -07:00
if ( ! C - > failure_reason_is ( C2Compiler : : retry_no_subsuming_loads ( ) ) ) {
2013-06-10 11:30:51 +02:00
C - > print_method ( PHASE_FAILURE ) ;
2008-06-24 16:00:14 -07:00
}
2007-12-01 00:00:00 +00:00
_root = NULL ; // flush the graph, too
}
2014-09-25 12:10:57 +04:00
// Begins a traced compilation phase. When CITimeVerbose is set (_dolog),
// the current Compile and its log are cached, and a "phase" head element
// with the node counts is written if that log exists.
Compile::TracePhase::TracePhase(const char* name, elapsedTimer* accumulator)
  : TraceTime(name, accumulator, CITime, CITimeVerbose),
    _phase_name(name), _dolog(CITimeVerbose)
{
  if (!_dolog) {
    C    = NULL;
    _log = NULL;
  } else {
    C    = Compile::current();
    _log = C->log();
  }

  if (_log == NULL) {
    return;
  }
  _log->begin_head(" phase name='%s' nodes='%d' live='%d' ", _phase_name, C->unique(), C->live_nodes());
  _log->stamp();
  _log->end_head();
}
// Ends a traced compilation phase. The current Compile is fetched again
// here; the log is only used when logging was enabled for this phase.
Compile::TracePhase::~TracePhase() {
  C    = Compile::current();
  _log = _dolog ? C->log() : NULL;

#ifdef ASSERT
  // Debug-build diagnostics: node counts and missing-node report.
  if (PrintIdealNodeCount) {
    tty->print_cr(" phase name='%s' nodes='%d' live='%d' live_graph_walk='%d' ",
                  _phase_name, C->unique(), C->live_nodes(), C->count_live_nodes_by_graph_walk());
  }
  if (VerifyIdealNodeCount) {
    Compile::current()->print_missing_nodes();
  }
#endif

  if (_log == NULL) {
    return;
  }
  _log->done(" phase name='%s' nodes='%d' live='%d' ", _phase_name, C->unique(), C->live_nodes());
}
2010-12-03 01:34:31 -08:00
//=============================================================================
// Two Constants are equal when their type, their can_be_reused flag and their value are equal.
bool Compile : : Constant : : operator = = ( const Constant & other ) {
if ( type ( ) ! = other . type ( ) ) return false ;
if ( can_be_reused ( ) ! = other . can_be_reused ( ) ) return false ;
// For floating point values we compare the bit pattern.
switch ( type ( ) ) {
6964458: Reimplement class meta-data storage to use native memory
Remove PermGen, allocate meta-data in metaspace linked to class loaders, rewrite GC walking, rewrite and rename metadata to be C++ classes
Co-authored-by: Stefan Karlsson <stefan.karlsson@oracle.com>
Co-authored-by: Mikael Gerdin <mikael.gerdin@oracle.com>
Co-authored-by: Tom Rodriguez <tom.rodriguez@oracle.com>
Reviewed-by: jmasa, stefank, never, coleenp, kvn, brutisso, mgerdin, dholmes, jrose, twisti, roland
2012-09-01 13:25:18 -04:00
case T_FLOAT : return ( _v . _value . i = = other . _v . _value . i ) ;
2010-12-03 01:34:31 -08:00
case T_LONG :
6964458: Reimplement class meta-data storage to use native memory
Remove PermGen, allocate meta-data in metaspace linked to class loaders, rewrite GC walking, rewrite and rename metadata to be C++ classes
Co-authored-by: Stefan Karlsson <stefan.karlsson@oracle.com>
Co-authored-by: Mikael Gerdin <mikael.gerdin@oracle.com>
Co-authored-by: Tom Rodriguez <tom.rodriguez@oracle.com>
Reviewed-by: jmasa, stefank, never, coleenp, kvn, brutisso, mgerdin, dholmes, jrose, twisti, roland
2012-09-01 13:25:18 -04:00
case T_DOUBLE : return ( _v . _value . j = = other . _v . _value . j ) ;
2010-12-03 01:34:31 -08:00
case T_OBJECT :
6964458: Reimplement class meta-data storage to use native memory
Remove PermGen, allocate meta-data in metaspace linked to class loaders, rewrite GC walking, rewrite and rename metadata to be C++ classes
Co-authored-by: Stefan Karlsson <stefan.karlsson@oracle.com>
Co-authored-by: Mikael Gerdin <mikael.gerdin@oracle.com>
Co-authored-by: Tom Rodriguez <tom.rodriguez@oracle.com>
Reviewed-by: jmasa, stefank, never, coleenp, kvn, brutisso, mgerdin, dholmes, jrose, twisti, roland
2012-09-01 13:25:18 -04:00
case T_ADDRESS : return ( _v . _value . l = = other . _v . _value . l ) ;
case T_VOID : return ( _v . _value . l = = other . _v . _value . l ) ; // jump-table entries
2012-10-17 12:09:32 -07:00
case T_METADATA : return ( _v . _metadata = = other . _v . _metadata ) ;
2010-12-03 01:34:31 -08:00
default : ShouldNotReachHere ( ) ;
}
return false ;
}
// Size in bytes of a constant-table entry of the given basic type.
// Types other than the ones listed hit ShouldNotReachHere(), and -1 is
// returned if execution continues past it.
static int type_to_size_in_bytes(BasicType t) {
  int size = -1;
  switch (t) {
  case T_LONG:
    size = (int) sizeof(jlong);
    break;
  case T_FLOAT:
    size = (int) sizeof(jfloat);
    break;
  case T_DOUBLE:
    size = (int) sizeof(jdouble);
    break;
  case T_METADATA:
    size = (int) sizeof(Metadata*);
    break;
  // We use T_VOID as marker for jump-table entries (labels) which
  // need an internal word relocation.
  case T_VOID:
  case T_ADDRESS:
  case T_OBJECT:
    size = (int) sizeof(jobject);
    break;
  default:
    ShouldNotReachHere();
    break;
  }
  return size;
}
2011-11-16 01:39:50 -08:00
int Compile : : ConstantTable : : qsort_comparator ( Constant * a , Constant * b ) {
// sort descending
if ( a - > freq ( ) > b - > freq ( ) ) return - 1 ;
if ( a - > freq ( ) < b - > freq ( ) ) return 1 ;
return 0 ;
}
2010-12-03 01:34:31 -08:00
void Compile : : ConstantTable : : calculate_offsets_and_size ( ) {
2011-11-16 01:39:50 -08:00
// First, sort the array by frequencies.
_constants . sort ( qsort_comparator ) ;
2010-12-03 01:34:31 -08:00
2011-11-16 01:39:50 -08:00
# ifdef ASSERT
// Make sure all jump-table entries were sorted to the end of the
// array (they have a negative frequency).
bool found_void = false ;
for ( int i = 0 ; i < _constants . length ( ) ; i + + ) {
Constant con = _constants . at ( i ) ;
if ( con . type ( ) = = T_VOID )
found_void = true ; // jump-tables
else
assert ( ! found_void , " wrong sorting " ) ;
}
# endif
2010-12-03 01:34:31 -08:00
2011-11-16 01:39:50 -08:00
int offset = 0 ;
for ( int i = 0 ; i < _constants . length ( ) ; i + + ) {
Constant * con = _constants . adr_at ( i ) ;
2010-12-03 01:34:31 -08:00
2011-11-16 01:39:50 -08:00
// Align offset for type.
int typesize = type_to_size_in_bytes ( con - > type ( ) ) ;
offset = align_size_up ( offset , typesize ) ;
con - > set_offset ( offset ) ; // set constant's offset
2010-12-03 01:34:31 -08:00
2011-11-16 01:39:50 -08:00
if ( con - > type ( ) = = T_VOID ) {
MachConstantNode * n = ( MachConstantNode * ) con - > get_jobject ( ) ;
offset = offset + typesize * n - > outcnt ( ) ; // expand jump-table
} else {
offset = offset + typesize ;
2010-12-03 01:34:31 -08:00
}
}
// Align size up to the next section start (which is insts; see
// CodeBuffer::align_at_start).
assert ( _size = = - 1 , " already set? " ) ;
2011-11-16 01:39:50 -08:00
_size = align_size_up ( offset , CodeEntryAlignment ) ;
2010-12-03 01:34:31 -08:00
}
void Compile : : ConstantTable : : emit ( CodeBuffer & cb ) {
MacroAssembler _masm ( & cb ) ;
2011-11-16 01:39:50 -08:00
for ( int i = 0 ; i < _constants . length ( ) ; i + + ) {
Constant con = _constants . at ( i ) ;
2015-10-22 13:07:10 -04:00
address constant_addr = NULL ;
2011-11-16 01:39:50 -08:00
switch ( con . type ( ) ) {
case T_LONG : constant_addr = _masm . long_constant ( con . get_jlong ( ) ) ; break ;
case T_FLOAT : constant_addr = _masm . float_constant ( con . get_jfloat ( ) ) ; break ;
case T_DOUBLE : constant_addr = _masm . double_constant ( con . get_jdouble ( ) ) ; break ;
case T_OBJECT : {
jobject obj = con . get_jobject ( ) ;
int oop_index = _masm . oop_recorder ( ) - > find_index ( obj ) ;
constant_addr = _masm . address_constant ( ( address ) obj , oop_Relocation : : spec ( oop_index ) ) ;
break ;
}
case T_ADDRESS : {
address addr = ( address ) con . get_jobject ( ) ;
constant_addr = _masm . address_constant ( addr ) ;
break ;
}
// We use T_VOID as marker for jump-table entries (labels) which
// need an internal word relocation.
case T_VOID : {
MachConstantNode * n = ( MachConstantNode * ) con . get_jobject ( ) ;
// Fill the jump-table with a dummy word. The real value is
// filled in later in fill_jump_table.
address dummy = ( address ) n ;
constant_addr = _masm . address_constant ( dummy ) ;
// Expand jump-table
for ( uint i = 1 ; i < n - > outcnt ( ) ; i + + ) {
address temp_addr = _masm . address_constant ( dummy + i ) ;
assert ( temp_addr , " consts section too small " ) ;
2010-12-03 01:34:31 -08:00
}
2011-11-16 01:39:50 -08:00
break ;
}
6964458: Reimplement class meta-data storage to use native memory
Remove PermGen, allocate meta-data in metaspace linked to class loaders, rewrite GC walking, rewrite and rename metadata to be C++ classes
Co-authored-by: Stefan Karlsson <stefan.karlsson@oracle.com>
Co-authored-by: Mikael Gerdin <mikael.gerdin@oracle.com>
Co-authored-by: Tom Rodriguez <tom.rodriguez@oracle.com>
Reviewed-by: jmasa, stefank, never, coleenp, kvn, brutisso, mgerdin, dholmes, jrose, twisti, roland
2012-09-01 13:25:18 -04:00
case T_METADATA : {
Metadata * obj = con . get_metadata ( ) ;
int metadata_index = _masm . oop_recorder ( ) - > find_index ( obj ) ;
constant_addr = _masm . address_constant ( ( address ) obj , metadata_Relocation : : spec ( metadata_index ) ) ;
break ;
}
2011-11-16 01:39:50 -08:00
default : ShouldNotReachHere ( ) ;
2010-12-03 01:34:31 -08:00
}
2011-11-16 01:39:50 -08:00
assert ( constant_addr , " consts section too small " ) ;
2014-05-09 16:50:54 -04:00
assert ( ( constant_addr - _masm . code ( ) - > consts ( ) - > start ( ) ) = = con . offset ( ) ,
2015-09-29 11:02:08 +02:00
" must be: %d == %d " , ( int ) ( constant_addr - _masm . code ( ) - > consts ( ) - > start ( ) ) , ( int ) ( con . offset ( ) ) ) ;
2010-12-03 01:34:31 -08:00
}
}
int Compile : : ConstantTable : : find_offset ( Constant & con ) const {
int idx = _constants . find ( con ) ;
assert ( idx ! = - 1 , " constant must be in constant table " ) ;
int offset = _constants . at ( idx ) . offset ( ) ;
assert ( offset ! = - 1 , " constant table not emitted yet? " ) ;
return offset ;
}
void Compile : : ConstantTable : : add ( Constant & con ) {
if ( con . can_be_reused ( ) ) {
int idx = _constants . find ( con ) ;
if ( idx ! = - 1 & & _constants . at ( idx ) . can_be_reused ( ) ) {
2011-11-16 01:39:50 -08:00
_constants . adr_at ( idx ) - > inc_freq ( con . freq ( ) ) ; // increase the frequency by the current value
2010-12-03 01:34:31 -08:00
return ;
}
}
( void ) _constants . append ( con ) ;
}
2011-11-16 01:39:50 -08:00
// Builds a constant of the given type and value, using the frequency of
// the block that contains 'n', adds it to the table and returns it.
Compile::Constant Compile::ConstantTable::add(MachConstantNode* n, BasicType type, jvalue value) {
  Block* block = Compile::current()->cfg()->get_block_for_node(n);
  Constant result(type, value, block->_freq);
  add(result);
  return result;
}
6964458: Reimplement class meta-data storage to use native memory
Remove PermGen, allocate meta-data in metaspace linked to class loaders, rewrite GC walking, rewrite and rename metadata to be C++ classes
Co-authored-by: Stefan Karlsson <stefan.karlsson@oracle.com>
Co-authored-by: Mikael Gerdin <mikael.gerdin@oracle.com>
Co-authored-by: Tom Rodriguez <tom.rodriguez@oracle.com>
Reviewed-by: jmasa, stefank, never, coleenp, kvn, brutisso, mgerdin, dholmes, jrose, twisti, roland
2012-09-01 13:25:18 -04:00
// Wraps 'metadata' in a Constant, adds it to the table and returns it.
Compile::Constant Compile::ConstantTable::add(Metadata* metadata) {
  Constant result(metadata);
  add(result);
  return result;
}
2011-11-16 01:39:50 -08:00
// Adds the constant carried by operand 'oper' of node 'n' to the table.
// Metadata operands go through add(Metadata*); long, float, double,
// object and address operands are packed into a jvalue.  Any other
// basic type trips the guarantee().
Compile::Constant Compile::ConstantTable::add(MachConstantNode* n, MachOper* oper) {
  BasicType type = oper->type()->basic_type();

  // Metadata constants do not go through a jvalue.
  if (type == T_METADATA) {
    return add((Metadata*) oper->constant());
  }

  jvalue value;
  switch (type) {
  case T_LONG:
    value.j = oper->constantL();
    break;
  case T_FLOAT:
    value.f = oper->constantF();
    break;
  case T_DOUBLE:
    value.d = oper->constantD();
    break;
  case T_OBJECT:
  case T_ADDRESS:
    value.l = (jobject) oper->constant();
    break;
  default:
    guarantee(false, " unhandled type: %s ", type2name(type));
  }
  return add(n, type, value);
}
2011-11-16 01:39:50 -08:00
// Adds a jump-table entry (type T_VOID) for node 'n' and returns it.
Compile::Constant Compile::ConstantTable::add_jump_table(MachConstantNode* n) {
  // We can use the node pointer here to identify the right jump-table
  // as this method is called from Compile::Fill_buffer right before
  // the MachNodes are emitted and the jump-table is filled (means the
  // MachNode pointers do not change anymore).
  jvalue node_ref;
  node_ref.l = (jobject) n;
  // Labels of a jump-table cannot be reused, hence the trailing 'false'.
  Constant table(T_VOID, node_ref, next_jump_table_freq(), false);
  add(table);
  return table;
}
void Compile : : ConstantTable : : fill_jump_table ( CodeBuffer & cb , MachConstantNode * n , GrowableArray < Label * > labels ) const {
// If called from Compile::scratch_emit_size do nothing.
if ( Compile : : current ( ) - > in_scratch_emit_size ( ) ) return ;
assert ( labels . is_nonempty ( ) , " must be " ) ;
2015-09-29 11:02:08 +02:00
assert ( ( uint ) labels . length ( ) = = n - > outcnt ( ) , " must be equal: %d == %d " , labels . length ( ) , n - > outcnt ( ) ) ;
2010-12-03 01:34:31 -08:00
// Since MachConstantNode::constant_offset() also contains
// table_base_offset() we need to subtract the table_base_offset()
// to get the plain offset into the constant table.
int offset = n - > constant_offset ( ) - table_base_offset ( ) ;
MacroAssembler _masm ( & cb ) ;
address * jump_table_base = ( address * ) ( _masm . code ( ) - > consts ( ) - > start ( ) + offset ) ;
2011-11-16 01:39:50 -08:00
for ( uint i = 0 ; i < n - > outcnt ( ) ; i + + ) {
2010-12-03 01:34:31 -08:00
address * constant_addr = & jump_table_base [ i ] ;
2015-09-29 11:02:08 +02:00
assert ( * constant_addr = = ( ( ( address ) n ) + i ) , " all jump-table entries must contain adjusted node pointer: " INTPTR_FORMAT " == " INTPTR_FORMAT , p2i ( * constant_addr ) , p2i ( ( ( address ) n ) + i ) ) ;
2010-12-03 01:34:31 -08:00
* constant_addr = cb . consts ( ) - > target ( * labels . at ( i ) , ( address ) constant_addr ) ;
cb . consts ( ) - > relocate ( ( address ) constant_addr , relocInfo : : internal_word_type ) ;
}
}
2012-12-18 14:55:25 +01:00
2014-08-11 14:12:51 +02:00
//----------------------------static_subtype_check-----------------------------
// Shortcut important common cases when superklass is exact:
// (0) superklass is java.lang.Object (can occur in reflective code)
// (1) subklass is already limited to a subtype of superklass => always ok
// (2) subklass does not overlap with superklass => always fail
// (3) superklass has NO subtypes and we can check with a simple compare.
int Compile : : static_subtype_check ( ciKlass * superk , ciKlass * subk ) {
if ( StressReflectiveCode ) {
return SSC_full_test ; // Let caller generate the general case.
}
if ( superk = = env ( ) - > Object_klass ( ) ) {
return SSC_always_true ; // (0) this test cannot fail
}
ciType * superelem = superk ;
if ( superelem - > is_array_klass ( ) )
superelem = superelem - > as_array_klass ( ) - > base_element_type ( ) ;
if ( ! subk - > is_interface ( ) ) { // cannot trust static interface types yet
if ( subk - > is_subtype_of ( superk ) ) {
return SSC_always_true ; // (1) false path dead; no dynamic test needed
}
if ( ! ( superelem - > is_klass ( ) & & superelem - > as_klass ( ) - > is_interface ( ) ) & &
! superk - > is_subtype_of ( subk ) ) {
return SSC_always_false ;
}
}
// If casting to an instance klass, it must have no subtypes
if ( superk - > is_interface ( ) ) {
// Cannot trust interfaces yet.
// %%% S.B. superk->nof_implementors() == 1
} else if ( superelem - > is_instance_klass ( ) ) {
ciInstanceKlass * ik = superelem - > as_instance_klass ( ) ;
if ( ! ik - > has_subklass ( ) & & ! ik - > is_interface ( ) ) {
if ( ! ik - > is_final ( ) ) {
// Add a dependency if there is a chance of a later subclass.
dependencies ( ) - > assert_leaf_type ( ik ) ;
}
return SSC_easy_test ; // (3) caller can do a simple ptr comparison
}
} else {
// A primitive array type has no subtypes.
return SSC_easy_test ; // (3) caller can do a simple ptr comparison
}
return SSC_full_test ;
}
2015-02-18 18:14:07 +01:00
// On _LP64, wraps 'idx' in a ConvI2L node whose type is limited to
// [0, index_max] and returns the transformed node; otherwise returns
// 'idx' unchanged.  index_max is sizetype->_hi - 1 when 'sizetype' is
// given, max_jint - 1 otherwise.
Node* Compile::conv_I2X_index(PhaseGVN* phase, Node* idx, const TypeInt* sizetype) {
#ifdef _LP64
  // The scaled index operand to AddP must be a clean 64-bit value.
  // Java allows a 32-bit int to be incremented to a negative
  // value, which appears in a 64-bit register as a large
  // positive number.  Using that large positive number as an
  // operand in pointer arithmetic has bad consequences.
  // On the other hand, 32-bit overflow is rare, and the possibility
  // can often be excluded, if we annotate the ConvI2L node with
  // a type assertion that its value is known to be a small positive
  // number.  (The prior range check has ensured this.)
  // This assertion is used by ConvI2LNode::Ideal.
  //
  // Array size is at most max_jint, so the index is one less.
  const int index_max = (sizetype != NULL) ? (sizetype->_hi - 1) : (max_jint - 1);
  const TypeLong* lidxtype = TypeLong::make(CONST64(0), index_max, Type::WidenMax);
  idx = phase->transform(new ConvI2LNode(idx, lidxtype));
#endif
  return idx;
}
2014-04-09 09:17:43 +02:00
// The message about the current inlining is accumulated in
// _print_inlining_stream and transferred into the _print_inlining_list
// once we know whether inlining succeeds or not. For regular
// inlining, messages are appended to the buffer pointed by
// _print_inlining_idx in the _print_inlining_list. For late inlining,
// a new buffer is added after _print_inlining_idx in the list. This
// way we can update the inlining message for late inlining call site
// when the inlining is attempted again.
void Compile : : print_inlining_init ( ) {
if ( print_inlining ( ) | | print_intrinsics ( ) ) {
_print_inlining_stream = new stringStream ( ) ;
_print_inlining_list = new ( comp_arena ( ) ) GrowableArray < PrintInliningBuffer > ( comp_arena ( ) , 1 , 1 , PrintInliningBuffer ( ) ) ;
}
}
void Compile : : print_inlining_reinit ( ) {
if ( print_inlining ( ) | | print_intrinsics ( ) ) {
// Re allocate buffer when we change ResourceMark
_print_inlining_stream = new stringStream ( ) ;
}
}
void Compile : : print_inlining_reset ( ) {
_print_inlining_stream - > reset ( ) ;
}
void Compile : : print_inlining_commit ( ) {
assert ( print_inlining ( ) | | print_intrinsics ( ) , " PrintInlining off? " ) ;
// Transfer the message from _print_inlining_stream to the current
// _print_inlining_list buffer and clear _print_inlining_stream.
_print_inlining_list - > at ( _print_inlining_idx ) . ss ( ) - > write ( _print_inlining_stream - > as_string ( ) , _print_inlining_stream - > size ( ) ) ;
print_inlining_reset ( ) ;
}
void Compile : : print_inlining_push ( ) {
// Add new buffer to the _print_inlining_list at current position
_print_inlining_idx + + ;
_print_inlining_list - > insert_before ( _print_inlining_idx , PrintInliningBuffer ( ) ) ;
}
// Returns the buffer of _print_inlining_list at _print_inlining_idx.
Compile::PrintInliningBuffer& Compile::print_inlining_current() {
  return _print_inlining_list->at(_print_inlining_idx);
}
void Compile : : print_inlining_update ( CallGenerator * cg ) {
2013-09-24 16:08:00 -07:00
if ( print_inlining ( ) | | print_intrinsics ( ) ) {
2014-04-09 09:17:43 +02:00
if ( ! cg - > is_late_inline ( ) ) {
if ( print_inlining_current ( ) . cg ( ) ! = NULL ) {
print_inlining_push ( ) ;
}
print_inlining_commit ( ) ;
} else {
if ( print_inlining_current ( ) . cg ( ) ! = cg & &
( print_inlining_current ( ) . cg ( ) ! = NULL | |
print_inlining_current ( ) . ss ( ) - > size ( ) ! = 0 ) ) {
print_inlining_push ( ) ;
}
print_inlining_commit ( ) ;
print_inlining_current ( ) . set_cg ( cg ) ;
}
}
}
void Compile : : print_inlining_move_to ( CallGenerator * cg ) {
// We resume inlining at a late inlining call site. Locate the
// corresponding inlining buffer so that we can update it.
if ( print_inlining ( ) ) {
for ( int i = 0 ; i < _print_inlining_list - > length ( ) ; i + + ) {
if ( _print_inlining_list - > adr_at ( i ) - > cg ( ) = = cg ) {
_print_inlining_idx = i ;
return ;
}
}
ShouldNotReachHere ( ) ;
}
}
void Compile : : print_inlining_update_delayed ( CallGenerator * cg ) {
if ( print_inlining ( ) ) {
assert ( _print_inlining_stream - > size ( ) > 0 , " missing inlining msg " ) ;
assert ( print_inlining_current ( ) . cg ( ) = = cg , " wrong entry " ) ;
// replace message with new message
_print_inlining_list - > at_put ( _print_inlining_idx , PrintInliningBuffer ( ) ) ;
print_inlining_commit ( ) ;
print_inlining_current ( ) . set_cg ( cg ) ;
}
}
void Compile : : print_inlining_assert_ready ( ) {
assert ( ! _print_inlining | | _print_inlining_stream - > size ( ) = = 0 , " loosing data " ) ;
}
2014-05-26 14:27:01 +02:00
void Compile : : process_print_inlining ( ) {
2014-04-09 09:17:43 +02:00
bool do_print_inlining = print_inlining ( ) | | print_intrinsics ( ) ;
2014-04-10 11:38:12 +02:00
if ( do_print_inlining | | log ( ) ! = NULL ) {
2012-12-23 17:08:22 +01:00
// Print inlining message for candidates that we couldn't inline
2014-04-09 09:17:43 +02:00
// for lack of space
2012-12-23 17:08:22 +01:00
for ( int i = 0 ; i < _late_inlines . length ( ) ; i + + ) {
CallGenerator * cg = _late_inlines . at ( i ) ;
2014-04-09 09:17:43 +02:00
if ( ! cg - > is_mh_late_inline ( ) ) {
const char * msg = " live nodes > LiveNodeCountInliningCutoff " ;
if ( do_print_inlining ) {
cg - > print_inlining_late ( msg ) ;
}
2014-04-10 11:38:12 +02:00
log_late_inline_failure ( cg , msg ) ;
2012-12-23 17:08:22 +01:00
}
}
2014-04-09 09:17:43 +02:00
}
if ( do_print_inlining ) {
2014-05-26 14:27:01 +02:00
ResourceMark rm ;
stringStream ss ;
2012-12-18 14:55:25 +01:00
for ( int i = 0 ; i < _print_inlining_list - > length ( ) ; i + + ) {
2014-05-26 14:27:01 +02:00
ss . print ( " %s " , _print_inlining_list - > adr_at ( i ) - > ss ( ) - > as_string ( ) ) ;
2012-12-18 14:55:25 +01:00
}
2014-05-26 14:27:01 +02:00
size_t end = ss . size ( ) ;
_print_inlining_output = NEW_ARENA_ARRAY ( comp_arena ( ) , char , end + 1 ) ;
strncpy ( _print_inlining_output , ss . base ( ) , end + 1 ) ;
_print_inlining_output [ end ] = 0 ;
}
}
void Compile : : dump_print_inlining ( ) {
if ( _print_inlining_output ! = NULL ) {
tty - > print_raw ( _print_inlining_output ) ;
2012-12-18 14:55:25 +01:00
}
}
2013-02-12 12:56:11 +01:00
2014-04-10 11:38:12 +02:00
void Compile : : log_late_inline ( CallGenerator * cg ) {
if ( log ( ) ! = NULL ) {
log ( ) - > head ( " late_inline method='%d' inline_id=' " JLONG_FORMAT " ' " , log ( ) - > identify ( cg - > method ( ) ) ,
cg - > unique_id ( ) ) ;
JVMState * p = cg - > call_node ( ) - > jvms ( ) ;
while ( p ! = NULL ) {
log ( ) - > elem ( " jvms bci='%d' method='%d' " , p - > bci ( ) , log ( ) - > identify ( p - > method ( ) ) ) ;
p = p - > caller ( ) ;
}
log ( ) - > tail ( " late_inline " ) ;
}
}
void Compile : : log_late_inline_failure ( CallGenerator * cg , const char * msg ) {
log_late_inline ( cg ) ;
if ( log ( ) ! = NULL ) {
log ( ) - > inline_fail ( msg ) ;
}
}
void Compile : : log_inline_id ( CallGenerator * cg ) {
if ( log ( ) ! = NULL ) {
// The LogCompilation tool needs a unique way to identify late
// inline call sites. This id must be unique for this call site in
// this compilation. Try to have it unique across compilations as
// well because it can be convenient when grepping through the log
// file.
// Distinguish OSR compilations from others in case CICountOSR is
// on.
jlong id = ( ( jlong ) unique ( ) ) + ( ( ( jlong ) compile_id ( ) ) < < 33 ) + ( CICountOSR & & is_osr_compilation ( ) ? ( ( jlong ) 1 ) < < 32 : 0 ) ;
cg - > set_unique_id ( id ) ;
log ( ) - > elem ( " inline_id id=' " JLONG_FORMAT " ' " , id ) ;
}
}
void Compile : : log_inline_failure ( const char * msg ) {
if ( C - > log ( ) ! = NULL ) {
C - > log ( ) - > inline_fail ( msg ) ;
}
}
2014-01-08 10:25:50 -08:00
// Dump inlining replay data to the stream.
// Don't change thread state and acquire any locks.
void Compile : : dump_inline_data ( outputStream * out ) {
InlineTree * inl_tree = ilt ( ) ;
if ( inl_tree ! = NULL ) {
out - > print ( " inline %d " , inl_tree - > count ( ) ) ;
inl_tree - > dump_replay_data ( out ) ;
}
}
2013-02-12 12:56:11 +01:00
int Compile : : cmp_expensive_nodes ( Node * n1 , Node * n2 ) {
if ( n1 - > Opcode ( ) < n2 - > Opcode ( ) ) return - 1 ;
else if ( n1 - > Opcode ( ) > n2 - > Opcode ( ) ) return 1 ;
2015-09-29 11:02:08 +02:00
assert ( n1 - > req ( ) = = n2 - > req ( ) , " can't compare %s nodes: n1->req() = %d, n2->req() = %d " , NodeClassNames [ n1 - > Opcode ( ) ] , n1 - > req ( ) , n2 - > req ( ) ) ;
2013-02-12 12:56:11 +01:00
for ( uint i = 1 ; i < n1 - > req ( ) ; i + + ) {
if ( n1 - > in ( i ) < n2 - > in ( i ) ) return - 1 ;
else if ( n1 - > in ( i ) > n2 - > in ( i ) ) return 1 ;
}
return 0 ;
}
int Compile : : cmp_expensive_nodes ( Node * * n1p , Node * * n2p ) {
Node * n1 = * n1p ;
Node * n2 = * n2p ;
return cmp_expensive_nodes ( n1 , n2 ) ;
}
void Compile : : sort_expensive_nodes ( ) {
if ( ! expensive_nodes_sorted ( ) ) {
_expensive_nodes - > sort ( cmp_expensive_nodes ) ;
}
}
bool Compile : : expensive_nodes_sorted ( ) const {
for ( int i = 1 ; i < _expensive_nodes - > length ( ) ; i + + ) {
if ( cmp_expensive_nodes ( _expensive_nodes - > adr_at ( i ) , _expensive_nodes - > adr_at ( i - 1 ) ) < 0 ) {
return false ;
}
}
return true ;
}
bool Compile : : should_optimize_expensive_nodes ( PhaseIterGVN & igvn ) {
if ( _expensive_nodes - > length ( ) = = 0 ) {
return false ;
}
assert ( OptimizeExpensiveOps , " optimization off? " ) ;
// Take this opportunity to remove dead nodes from the list
int j = 0 ;
for ( int i = 0 ; i < _expensive_nodes - > length ( ) ; i + + ) {
Node * n = _expensive_nodes - > at ( i ) ;
if ( ! n - > is_unreachable ( igvn ) ) {
assert ( n - > is_expensive ( ) , " should be expensive " ) ;
_expensive_nodes - > at_put ( j , n ) ;
j + + ;
}
}
_expensive_nodes - > trunc_to ( j ) ;
// Then sort the list so that similar nodes are next to each other
// and check for at least two nodes of identical kind with same data
// inputs.
sort_expensive_nodes ( ) ;
for ( int i = 0 ; i < _expensive_nodes - > length ( ) - 1 ; i + + ) {
if ( cmp_expensive_nodes ( _expensive_nodes - > adr_at ( i ) , _expensive_nodes - > adr_at ( i + 1 ) ) = = 0 ) {
return true ;
}
}
return false ;
}
void Compile : : cleanup_expensive_nodes ( PhaseIterGVN & igvn ) {
if ( _expensive_nodes - > length ( ) = = 0 ) {
return ;
}
assert ( OptimizeExpensiveOps , " optimization off? " ) ;
// Sort to bring similar nodes next to each other and clear the
// control input of nodes for which there's only a single copy.
sort_expensive_nodes ( ) ;
int j = 0 ;
int identical = 0 ;
int i = 0 ;
2014-07-25 10:06:17 +02:00
bool modified = false ;
2013-02-12 12:56:11 +01:00
for ( ; i < _expensive_nodes - > length ( ) - 1 ; i + + ) {
assert ( j < = i , " can't write beyond current index " ) ;
if ( _expensive_nodes - > at ( i ) - > Opcode ( ) = = _expensive_nodes - > at ( i + 1 ) - > Opcode ( ) ) {
identical + + ;
_expensive_nodes - > at_put ( j + + , _expensive_nodes - > at ( i ) ) ;
continue ;
}
if ( identical > 0 ) {
_expensive_nodes - > at_put ( j + + , _expensive_nodes - > at ( i ) ) ;
identical = 0 ;
} else {
Node * n = _expensive_nodes - > at ( i ) ;
2014-07-25 10:06:17 +02:00
igvn . replace_input_of ( n , 0 , NULL ) ;
2013-02-12 12:56:11 +01:00
igvn . hash_insert ( n ) ;
2014-07-25 10:06:17 +02:00
modified = true ;
2013-02-12 12:56:11 +01:00
}
}
if ( identical > 0 ) {
_expensive_nodes - > at_put ( j + + , _expensive_nodes - > at ( i ) ) ;
} else if ( _expensive_nodes - > length ( ) > = 1 ) {
Node * n = _expensive_nodes - > at ( i ) ;
2014-07-25 10:06:17 +02:00
igvn . replace_input_of ( n , 0 , NULL ) ;
2013-02-12 12:56:11 +01:00
igvn . hash_insert ( n ) ;
2014-07-25 10:06:17 +02:00
modified = true ;
2013-02-12 12:56:11 +01:00
}
_expensive_nodes - > trunc_to ( j ) ;
2014-07-25 10:06:17 +02:00
if ( modified ) {
igvn . optimize ( ) ;
}
2013-02-12 12:56:11 +01:00
}
void Compile : : add_expensive_node ( Node * n ) {
assert ( ! _expensive_nodes - > contains ( n ) , " duplicate entry in expensive list " ) ;
assert ( n - > is_expensive ( ) , " expensive nodes with non-null control here only " ) ;
assert ( ! n - > is_CFG ( ) & & ! n - > is_Mem ( ) , " no cfg or memory nodes here " ) ;
if ( OptimizeExpensiveOps ) {
_expensive_nodes - > append ( n ) ;
} else {
// Clear control input and let IGVN optimize expensive nodes if
// OptimizeExpensiveOps is off.
n - > set_req ( 0 , NULL ) ;
}
}
2013-03-05 04:24:50 -08:00
2013-10-23 12:40:23 +02:00
/**
* Remove the speculative part of types and clean up the graph
*/
void Compile : : remove_speculative_types ( PhaseIterGVN & igvn ) {
if ( UseTypeSpeculation ) {
Unique_Node_List worklist ;
worklist . push ( root ( ) ) ;
int modified = 0 ;
// Go over all type nodes that carry a speculative type, drop the
// speculative part of the type and enqueue the node for an igvn
// which may optimize it out.
for ( uint next = 0 ; next < worklist . size ( ) ; + + next ) {
Node * n = worklist . at ( next ) ;
2014-01-24 09:31:53 +01:00
if ( n - > is_Type ( ) ) {
2013-10-23 12:40:23 +02:00
TypeNode * tn = n - > as_Type ( ) ;
2014-01-24 09:31:53 +01:00
const Type * t = tn - > type ( ) ;
const Type * t_no_spec = t - > remove_speculative ( ) ;
if ( t_no_spec ! = t ) {
bool in_hash = igvn . hash_delete ( n ) ;
assert ( in_hash , " node should be in igvn hash table " ) ;
tn - > set_type ( t_no_spec ) ;
igvn . hash_insert ( n ) ;
igvn . _worklist . push ( n ) ; // give it a chance to go away
modified + + ;
}
2013-10-23 12:40:23 +02:00
}
uint max = n - > len ( ) ;
for ( uint i = 0 ; i < max ; + + i ) {
Node * m = n - > in ( i ) ;
if ( not_a_node ( m ) ) continue ;
worklist . push ( m ) ;
}
}
// Drop the speculative part of all types in the igvn's type table
igvn . remove_speculative_types ( ) ;
if ( modified > 0 ) {
igvn . optimize ( ) ;
}
2014-01-24 09:31:53 +01:00
# ifdef ASSERT
// Verify that after the IGVN is over no speculative type has resurfaced
worklist . clear ( ) ;
worklist . push ( root ( ) ) ;
for ( uint next = 0 ; next < worklist . size ( ) ; + + next ) {
Node * n = worklist . at ( next ) ;
2014-04-10 09:26:24 +02:00
const Type * t = igvn . type_or_null ( n ) ;
assert ( ( t = = NULL ) | | ( t = = t - > remove_speculative ( ) ) , " no more speculative types " ) ;
2014-01-24 09:31:53 +01:00
if ( n - > is_Type ( ) ) {
t = n - > as_Type ( ) - > type ( ) ;
assert ( t = = t - > remove_speculative ( ) , " no more speculative types " ) ;
}
uint max = n - > len ( ) ;
for ( uint i = 0 ; i < max ; + + i ) {
Node * m = n - > in ( i ) ;
if ( not_a_node ( m ) ) continue ;
worklist . push ( m ) ;
}
}
igvn . check_no_speculative_types ( ) ;
# endif
2013-10-23 12:40:23 +02:00
}
}
2013-03-05 04:24:50 -08:00
// Auxiliary method to support randomized stressing/fuzzing.
//
// This method can be called an arbitrary number of times, with current count
// as the argument. The logic allows selecting a single candidate from the
// running list of candidates as follows:
// int count = 0;
// Cand* selected = null;
// while(cand = cand->next()) {
// if (randomized_select(++count)) {
// selected = cand;
// }
// }
//
// Including count equalizes the chances any candidate is "selected".
// This is useful when we don't have the complete list of candidates to choose
// from uniformly. In this case, we need to adjust the randomness of the
// selection, or else we will end up biasing the selection towards the latter
// candidates.
//
// Quick back-envelope calculation shows that for the list of n candidates
// the equal probability for the candidate to persist as "best" can be
// achieved by replacing it with "next" k-th candidate with the probability
// of 1/k. It can be easily shown that by the end of the run, the
// probability for any candidate is converged to 1/n, thus giving the
// uniform distribution among all the candidates.
//
// We don't care about the domain size as long as (RANDOMIZED_DOMAIN / count) is large.
# define RANDOMIZED_DOMAIN_POW 29
# define RANDOMIZED_DOMAIN (1 << RANDOMIZED_DOMAIN_POW)
# define RANDOMIZED_DOMAIN_MASK ((1 << (RANDOMIZED_DOMAIN_POW + 1)) - 1)
bool Compile : : randomized_select ( int count ) {
assert ( count > 0 , " only positive " ) ;
return ( os : : random ( ) & RANDOMIZED_DOMAIN_MASK ) < ( RANDOMIZED_DOMAIN / count ) ;
}
2015-05-05 12:33:57 -07:00
// Returns the clone map of this compilation.
CloneMap& Compile::clone_map() {
  return _clone_map;
}
void Compile : : set_clone_map ( Dict * d ) { _clone_map . _dict = d ; }
void NodeCloneInfo : : dump ( ) const {
tty - > print ( " {%d:%d} " , idx ( ) , gen ( ) ) ;
}
void CloneMap : : clone ( Node * old , Node * nnn , int gen ) {
uint64_t val = value ( old - > _idx ) ;
NodeCloneInfo cio ( val ) ;
assert ( val ! = 0 , " old node should be in the map " ) ;
NodeCloneInfo cin ( cio . idx ( ) , gen + cio . gen ( ) ) ;
insert ( nnn - > _idx , cin . get ( ) ) ;
# ifndef PRODUCT
if ( is_debug ( ) ) {
tty - > print_cr ( " CloneMap::clone inserted node %d info {%d:%d} into CloneMap " , nnn - > _idx , cin . idx ( ) , cin . gen ( ) ) ;
}
# endif
}
void CloneMap : : verify_insert_and_clone ( Node * old , Node * nnn , int gen ) {
NodeCloneInfo cio ( value ( old - > _idx ) ) ;
if ( cio . get ( ) = = 0 ) {
cio . set ( old - > _idx , 0 ) ;
insert ( old - > _idx , cio . get ( ) ) ;
# ifndef PRODUCT
if ( is_debug ( ) ) {
tty - > print_cr ( " CloneMap::verify_insert_and_clone inserted node %d info {%d:%d} into CloneMap " , old - > _idx , cio . idx ( ) , cio . gen ( ) ) ;
}
# endif
}
clone ( old , nnn , gen ) ;
}
int CloneMap : : max_gen ( ) const {
int g = 0 ;
DictI di ( _dict ) ;
for ( ; di . test ( ) ; + + di ) {
int t = gen ( di . _key ) ;
if ( g < t ) {
g = t ;
# ifndef PRODUCT
if ( is_debug ( ) ) {
tty - > print_cr ( " CloneMap::max_gen() update max=%d from %d " , g , _2_node_idx_t ( di . _key ) ) ;
}
# endif
}
}
return g ;
}
void CloneMap : : dump ( node_idx_t key ) const {
uint64_t val = value ( key ) ;
if ( val ! = 0 ) {
NodeCloneInfo ni ( val ) ;
ni . dump ( ) ;
}
}