Merge
This commit is contained in:
commit
45f51703ed
@ -342,6 +342,9 @@
|
|||||||
product(bool, SuperWordReductions, true, \
|
product(bool, SuperWordReductions, true, \
|
||||||
"Enable reductions support in superword.") \
|
"Enable reductions support in superword.") \
|
||||||
\
|
\
|
||||||
|
product(bool, DoReserveCopyInSuperWord, true, \
|
||||||
|
"Create reserve copy of graph in SuperWord.") \
|
||||||
|
\
|
||||||
notproduct(bool, TraceSuperWord, false, \
|
notproduct(bool, TraceSuperWord, false, \
|
||||||
"Trace superword transforms") \
|
"Trace superword transforms") \
|
||||||
\
|
\
|
||||||
|
@ -263,3 +263,136 @@ ProjNode* PhaseIdealLoop::create_slow_version_of_loop(IdealLoopTree *loop,
|
|||||||
|
|
||||||
return iffast;
|
return iffast;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
LoopNode* PhaseIdealLoop::create_reserve_version_of_loop(IdealLoopTree *loop, CountedLoopReserveKit* lk) {
|
||||||
|
Node_List old_new;
|
||||||
|
LoopNode* head = loop->_head->as_Loop();
|
||||||
|
bool counted_loop = head->is_CountedLoop();
|
||||||
|
Node* entry = head->in(LoopNode::EntryControl);
|
||||||
|
_igvn.rehash_node_delayed(entry);
|
||||||
|
IdealLoopTree* outer_loop = loop->_parent;
|
||||||
|
|
||||||
|
ConINode* const_1 = _igvn.intcon(1);
|
||||||
|
set_ctrl(const_1, C->root());
|
||||||
|
IfNode* iff = new IfNode(entry, const_1, PROB_MAX, COUNT_UNKNOWN);
|
||||||
|
register_node(iff, outer_loop, entry, dom_depth(entry));
|
||||||
|
ProjNode* iffast = new IfTrueNode(iff);
|
||||||
|
register_node(iffast, outer_loop, iff, dom_depth(iff));
|
||||||
|
ProjNode* ifslow = new IfFalseNode(iff);
|
||||||
|
register_node(ifslow, outer_loop, iff, dom_depth(iff));
|
||||||
|
|
||||||
|
// Clone the loop body. The clone becomes the fast loop. The
|
||||||
|
// original pre-header will (illegally) have 3 control users
|
||||||
|
// (old & new loops & new if).
|
||||||
|
clone_loop(loop, old_new, dom_depth(head), iff);
|
||||||
|
assert(old_new[head->_idx]->is_Loop(), "" );
|
||||||
|
|
||||||
|
LoopNode* slow_head = old_new[head->_idx]->as_Loop();
|
||||||
|
|
||||||
|
#ifndef PRODUCT
|
||||||
|
if (TraceLoopOpts) {
|
||||||
|
tty->print_cr("PhaseIdealLoop::create_reserve_version_of_loop:");
|
||||||
|
tty->print("\t iff = %d, ", iff->_idx); iff->dump();
|
||||||
|
tty->print("\t iffast = %d, ", iffast->_idx); iffast->dump();
|
||||||
|
tty->print("\t ifslow = %d, ", ifslow->_idx); ifslow->dump();
|
||||||
|
tty->print("\t before replace_input_of: head = %d, ", head->_idx); head->dump();
|
||||||
|
tty->print("\t before replace_input_of: slow_head = %d, ", slow_head->_idx); slow_head->dump();
|
||||||
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
|
// Fast (true) control
|
||||||
|
_igvn.replace_input_of(head, LoopNode::EntryControl, iffast);
|
||||||
|
// Slow (false) control
|
||||||
|
_igvn.replace_input_of(slow_head, LoopNode::EntryControl, ifslow);
|
||||||
|
|
||||||
|
recompute_dom_depth();
|
||||||
|
|
||||||
|
lk->set_iff(iff);
|
||||||
|
|
||||||
|
#ifndef PRODUCT
|
||||||
|
if (TraceLoopOpts ) {
|
||||||
|
tty->print("\t after replace_input_of: head = %d, ", head->_idx); head->dump();
|
||||||
|
tty->print("\t after replace_input_of: slow_head = %d, ", slow_head->_idx); slow_head->dump();
|
||||||
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
|
return slow_head->as_Loop();
|
||||||
|
}
|
||||||
|
|
||||||
|
CountedLoopReserveKit::CountedLoopReserveKit(PhaseIdealLoop* phase, IdealLoopTree *loop, bool active = true) :
|
||||||
|
_phase(phase),
|
||||||
|
_lpt(loop),
|
||||||
|
_lp(NULL),
|
||||||
|
_iff(NULL),
|
||||||
|
_lp_reserved(NULL),
|
||||||
|
_has_reserved(false),
|
||||||
|
_use_new(false),
|
||||||
|
_active(active)
|
||||||
|
{
|
||||||
|
create_reserve();
|
||||||
|
};
|
||||||
|
|
||||||
|
CountedLoopReserveKit::~CountedLoopReserveKit() {
|
||||||
|
if (!_active) {
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
|
if (_has_reserved && !_use_new) {
|
||||||
|
// intcon(0)->iff-node reverts CF to the reserved copy
|
||||||
|
ConINode* const_0 = _phase->_igvn.intcon(0);
|
||||||
|
_phase->set_ctrl(const_0, _phase->C->root());
|
||||||
|
_iff->set_req(1, const_0);
|
||||||
|
|
||||||
|
#ifndef PRODUCT
|
||||||
|
if (TraceLoopOpts) {
|
||||||
|
tty->print_cr("CountedLoopReserveKit::~CountedLoopReserveKit()");
|
||||||
|
tty->print("\t discard loop %d and revert to the reserved loop clone %d: ", _lp->_idx, _lp_reserved->_idx);
|
||||||
|
_lp_reserved->dump();
|
||||||
|
}
|
||||||
|
#endif
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
bool CountedLoopReserveKit::create_reserve() {
|
||||||
|
if (!_active) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
if(!_lpt->_head->is_CountedLoop()) {
|
||||||
|
NOT_PRODUCT(if(TraceLoopOpts) {tty->print_cr("CountedLoopReserveKit::create_reserve: %d not counted loop", _lpt->_head->_idx);})
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
CountedLoopNode *cl = _lpt->_head->as_CountedLoop();
|
||||||
|
if (!cl->is_valid_counted_loop()) {
|
||||||
|
NOT_PRODUCT(if(TraceLoopOpts) {tty->print_cr("CountedLoopReserveKit::create_reserve: %d not valid counted loop", cl->_idx);})
|
||||||
|
return false; // skip malformed counted loop
|
||||||
|
}
|
||||||
|
if (!cl->is_main_loop()) {
|
||||||
|
NOT_PRODUCT(if(TraceLoopOpts) {tty->print_cr("CountedLoopReserveKit::create_reserve: %d not main loop", cl->_idx);})
|
||||||
|
return false; // skip normal, pre, and post loops
|
||||||
|
}
|
||||||
|
|
||||||
|
_lp = _lpt->_head->as_Loop();
|
||||||
|
_lp_reserved = _phase->create_reserve_version_of_loop(_lpt, this);
|
||||||
|
|
||||||
|
if (!_lp_reserved->is_CountedLoop()) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
Node* ifslow_pred = _lp_reserved->as_CountedLoop()->in(LoopNode::EntryControl);
|
||||||
|
|
||||||
|
if (!ifslow_pred->is_IfFalse()) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
Node* iff = ifslow_pred->in(0);
|
||||||
|
if (!iff->is_If() || iff != _iff) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
if (iff->in(1)->Opcode() != Op_ConI) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
return _has_reserved = true;
|
||||||
|
}
|
||||||
|
@ -38,6 +38,7 @@ class IdealLoopTree;
|
|||||||
class LoopNode;
|
class LoopNode;
|
||||||
class Node;
|
class Node;
|
||||||
class PhaseIdealLoop;
|
class PhaseIdealLoop;
|
||||||
|
class CountedLoopReserveKit;
|
||||||
class VectorSet;
|
class VectorSet;
|
||||||
class Invariance;
|
class Invariance;
|
||||||
struct small_cache;
|
struct small_cache;
|
||||||
@ -529,6 +530,8 @@ public:
|
|||||||
class PhaseIdealLoop : public PhaseTransform {
|
class PhaseIdealLoop : public PhaseTransform {
|
||||||
friend class IdealLoopTree;
|
friend class IdealLoopTree;
|
||||||
friend class SuperWord;
|
friend class SuperWord;
|
||||||
|
friend class CountedLoopReserveKit;
|
||||||
|
|
||||||
// Pre-computed def-use info
|
// Pre-computed def-use info
|
||||||
PhaseIterGVN &_igvn;
|
PhaseIterGVN &_igvn;
|
||||||
|
|
||||||
@ -965,6 +968,16 @@ public:
|
|||||||
ProjNode* create_slow_version_of_loop(IdealLoopTree *loop,
|
ProjNode* create_slow_version_of_loop(IdealLoopTree *loop,
|
||||||
Node_List &old_new);
|
Node_List &old_new);
|
||||||
|
|
||||||
|
// Clone a loop and return the clone head (clone_loop_head).
|
||||||
|
// Added nodes include int(1), int(0) - disconnected, If, IfTrue, IfFalse,
|
||||||
|
// This routine was created for usage in CountedLoopReserveKit.
|
||||||
|
//
|
||||||
|
// int(1) -> If -> IfTrue -> original_loop_head
|
||||||
|
// |
|
||||||
|
// V
|
||||||
|
// IfFalse -> clone_loop_head (returned by function pointer)
|
||||||
|
//
|
||||||
|
LoopNode* create_reserve_version_of_loop(IdealLoopTree *loop, CountedLoopReserveKit* lk);
|
||||||
// Clone loop with an invariant test (that does not exit) and
|
// Clone loop with an invariant test (that does not exit) and
|
||||||
// insert a clone of the test that selects which version to
|
// insert a clone of the test that selects which version to
|
||||||
// execute.
|
// execute.
|
||||||
@ -1117,6 +1130,68 @@ public:
|
|||||||
#endif
|
#endif
|
||||||
};
|
};
|
||||||
|
|
||||||
|
// This kit may be used for making of a reserved copy of a loop before this loop
|
||||||
|
// goes under non-reversible changes.
|
||||||
|
//
|
||||||
|
// Function create_reserve() creates a reserved copy (clone) of the loop.
|
||||||
|
// The reserved copy is created by calling
|
||||||
|
// PhaseIdealLoop::create_reserve_version_of_loop - see there how
|
||||||
|
// the original and reserved loops are connected in the outer graph.
|
||||||
|
// If create_reserve succeeded, it returns 'true' and _has_reserved is set to 'true'.
|
||||||
|
//
|
||||||
|
// By default the reserved copy (clone) of the loop is created as dead code - it is
|
||||||
|
// dominated in the outer loop by this node chain:
|
||||||
|
// intcon(1)->If->IfFalse->reserved_copy.
|
||||||
|
// The original loop is dominated by the the same node chain but IfTrue projection:
|
||||||
|
// intcon(1)->If->IfTrue->original_loop.
|
||||||
|
//
|
||||||
|
// In this implementation of CountedLoopReserveKit the ctor includes create_reserve()
|
||||||
|
// and the dtor, checks _use_new value.
|
||||||
|
// If _use_new == false, it "switches" control to reserved copy of the loop
|
||||||
|
// by simple replacing of node intcon(1) with node intcon(0).
|
||||||
|
//
|
||||||
|
// Here is a proposed example of usage (see also SuperWord::output in superword.cpp).
|
||||||
|
//
|
||||||
|
// void CountedLoopReserveKit_example()
|
||||||
|
// {
|
||||||
|
// CountedLoopReserveKit lrk((phase, lpt, DoReserveCopy = true); // create local object
|
||||||
|
// if (DoReserveCopy && !lrk.has_reserved()) {
|
||||||
|
// return; //failed to create reserved loop copy
|
||||||
|
// }
|
||||||
|
// ...
|
||||||
|
// //something is wrong, switch to original loop
|
||||||
|
/// if(something_is_wrong) return; // ~CountedLoopReserveKit makes the switch
|
||||||
|
// ...
|
||||||
|
// //everything worked ok, return with the newly modified loop
|
||||||
|
// lrk.use_new();
|
||||||
|
// return; // ~CountedLoopReserveKit does nothing once use_new() was called
|
||||||
|
// }
|
||||||
|
//
|
||||||
|
// Keep in mind, that by default if create_reserve() is not followed by use_new()
|
||||||
|
// the dtor will "switch to the original" loop.
|
||||||
|
// NOTE. You you modify outside of the original loop this class is no help.
|
||||||
|
//
|
||||||
|
class CountedLoopReserveKit {
|
||||||
|
private:
|
||||||
|
PhaseIdealLoop* _phase;
|
||||||
|
IdealLoopTree* _lpt;
|
||||||
|
LoopNode* _lp;
|
||||||
|
IfNode* _iff;
|
||||||
|
LoopNode* _lp_reserved;
|
||||||
|
bool _has_reserved;
|
||||||
|
bool _use_new;
|
||||||
|
const bool _active; //may be set to false in ctor, then the object is dummy
|
||||||
|
|
||||||
|
public:
|
||||||
|
CountedLoopReserveKit(PhaseIdealLoop* phase, IdealLoopTree *loop, bool active);
|
||||||
|
~CountedLoopReserveKit();
|
||||||
|
void use_new() {_use_new = true;}
|
||||||
|
void set_iff(IfNode* x) {_iff = x;}
|
||||||
|
bool has_reserved() const { return _active && _has_reserved;}
|
||||||
|
private:
|
||||||
|
bool create_reserve();
|
||||||
|
};// class CountedLoopReserveKit
|
||||||
|
|
||||||
inline Node* IdealLoopTree::tail() {
|
inline Node* IdealLoopTree::tail() {
|
||||||
// Handle lazy update of _tail field
|
// Handle lazy update of _tail field
|
||||||
Node *n = _tail;
|
Node *n = _tail;
|
||||||
|
@ -81,6 +81,10 @@ SuperWord::SuperWord(PhaseIdealLoop* phase) :
|
|||||||
if (_phase->C->method() != NULL) {
|
if (_phase->C->method() != NULL) {
|
||||||
_phase->C->method()->has_option_value("VectorizeDebug", _vector_loop_debug);
|
_phase->C->method()->has_option_value("VectorizeDebug", _vector_loop_debug);
|
||||||
}
|
}
|
||||||
|
_CountedLoopReserveKit_debug = 0;
|
||||||
|
if (_phase->C->method() != NULL) {
|
||||||
|
_phase->C->method()->has_option_value("DoReserveCopyInSuperWordDebug", _CountedLoopReserveKit_debug);
|
||||||
|
}
|
||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -1763,6 +1767,22 @@ void SuperWord::co_locate_pack(Node_List* pk) {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#ifndef PRODUCT
|
||||||
|
void SuperWord::print_loop(bool whole) {
|
||||||
|
Node_Stack stack(_arena, _phase->C->unique() >> 2);
|
||||||
|
Node_List rpo_list;
|
||||||
|
VectorSet visited(_arena);
|
||||||
|
visited.set(lpt()->_head->_idx);
|
||||||
|
_phase->rpo(lpt()->_head, stack, visited, rpo_list);
|
||||||
|
_phase->dump(lpt(), rpo_list.size(), rpo_list );
|
||||||
|
if(whole) {
|
||||||
|
tty->print_cr("\n Whole loop tree");
|
||||||
|
_phase->dump();
|
||||||
|
tty->print_cr(" End of whole loop tree\n");
|
||||||
|
}
|
||||||
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
//------------------------------output---------------------------
|
//------------------------------output---------------------------
|
||||||
// Convert packs into vector node operations
|
// Convert packs into vector node operations
|
||||||
void SuperWord::output() {
|
void SuperWord::output() {
|
||||||
@ -1770,7 +1790,7 @@ void SuperWord::output() {
|
|||||||
|
|
||||||
#ifndef PRODUCT
|
#ifndef PRODUCT
|
||||||
if (TraceLoopOpts) {
|
if (TraceLoopOpts) {
|
||||||
tty->print("SuperWord ");
|
tty->print("SuperWord::output ");
|
||||||
lpt()->dump_head();
|
lpt()->dump_head();
|
||||||
}
|
}
|
||||||
#endif
|
#endif
|
||||||
@ -1789,6 +1809,18 @@ void SuperWord::output() {
|
|||||||
CountedLoopNode *cl = lpt()->_head->as_CountedLoop();
|
CountedLoopNode *cl = lpt()->_head->as_CountedLoop();
|
||||||
uint max_vlen_in_bytes = 0;
|
uint max_vlen_in_bytes = 0;
|
||||||
uint max_vlen = 0;
|
uint max_vlen = 0;
|
||||||
|
|
||||||
|
NOT_PRODUCT(if(_CountedLoopReserveKit_debug > 0) {tty->print_cr("SWPointer::output: print loop before create_reserve_version_of_loop"); print_loop(true);})
|
||||||
|
|
||||||
|
CountedLoopReserveKit make_reversable(_phase, _lpt, DoReserveCopyInSuperWord);
|
||||||
|
|
||||||
|
NOT_PRODUCT(if(_CountedLoopReserveKit_debug > 0) {tty->print_cr("SWPointer::output: print loop after create_reserve_version_of_loop"); print_loop(true);})
|
||||||
|
|
||||||
|
if (DoReserveCopyInSuperWord && !make_reversable.has_reserved()) {
|
||||||
|
NOT_PRODUCT({tty->print_cr("SWPointer::output: loop was not reserved correctly, exiting SuperWord");})
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
for (int i = 0; i < _block.length(); i++) {
|
for (int i = 0; i < _block.length(); i++) {
|
||||||
Node* n = _block.at(i);
|
Node* n = _block.at(i);
|
||||||
Node_List* p = my_pack(n);
|
Node_List* p = my_pack(n);
|
||||||
@ -1888,6 +1920,7 @@ void SuperWord::output() {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
C->set_max_vector_size(max_vlen_in_bytes);
|
C->set_max_vector_size(max_vlen_in_bytes);
|
||||||
|
|
||||||
if (SuperWordLoopUnrollAnalysis) {
|
if (SuperWordLoopUnrollAnalysis) {
|
||||||
if (cl->has_passed_slp()) {
|
if (cl->has_passed_slp()) {
|
||||||
uint slp_max_unroll_factor = cl->slp_max_unroll();
|
uint slp_max_unroll_factor = cl->slp_max_unroll();
|
||||||
@ -1900,6 +1933,12 @@ void SuperWord::output() {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if (DoReserveCopyInSuperWord) {
|
||||||
|
make_reversable.use_new();
|
||||||
|
}
|
||||||
|
NOT_PRODUCT(if(_CountedLoopReserveKit_debug > 0) {tty->print_cr("\n Final loop after SuperWord"); print_loop(true);})
|
||||||
|
return;
|
||||||
}
|
}
|
||||||
|
|
||||||
//------------------------------vector_opd---------------------------
|
//------------------------------vector_opd---------------------------
|
||||||
|
@ -299,6 +299,7 @@ class SuperWord : public ResourceObj {
|
|||||||
GrowableArray<int> _ii_order;
|
GrowableArray<int> _ii_order;
|
||||||
#ifndef PRODUCT
|
#ifndef PRODUCT
|
||||||
uintx _vector_loop_debug; // provide more printing in debug mode
|
uintx _vector_loop_debug; // provide more printing in debug mode
|
||||||
|
uintx _CountedLoopReserveKit_debug; // for debugging CountedLoopReserveKit
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
// Accessors
|
// Accessors
|
||||||
@ -375,6 +376,7 @@ class SuperWord : public ResourceObj {
|
|||||||
// Tracing support
|
// Tracing support
|
||||||
#ifndef PRODUCT
|
#ifndef PRODUCT
|
||||||
void find_adjacent_refs_trace_1(Node* best_align_to_mem_ref, int best_iv_adjustment);
|
void find_adjacent_refs_trace_1(Node* best_align_to_mem_ref, int best_iv_adjustment);
|
||||||
|
void print_loop(bool whole);
|
||||||
#endif
|
#endif
|
||||||
// Find a memory reference to align the loop induction variable to.
|
// Find a memory reference to align the loop induction variable to.
|
||||||
MemNode* find_align_to_ref(Node_List &memops);
|
MemNode* find_align_to_ref(Node_List &memops);
|
||||||
|
Loading…
Reference in New Issue
Block a user