/* * Copyright (c) 2020, Oracle and/or its affiliates. All rights reserved. * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. * * This code is free software; you can redistribute it and/or modify it * under the terms of the GNU General Public License version 2 only, as * published by the Free Software Foundation. * * This code is distributed in the hope that it will be useful, but WITHOUT * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License * version 2 for more details (a copy is included in the LICENSE file that * accompanied this code). * * You should have received a copy of the GNU General Public License version * 2 along with this work; if not, write to the Free Software Foundation, * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. * * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA * or visit www.oracle.com if you need additional information or have any * questions. * */ #include "precompiled.hpp" #include "opto/castnode.hpp" #include "opto/graphKit.hpp" #include "opto/phaseX.hpp" #include "opto/rootnode.hpp" #include "opto/vector.hpp" #include "utilities/macros.hpp" void PhaseVector::optimize_vector_boxes() { Compile::TracePhase tp("vector_elimination", &timers[_t_vector_elimination]); // Signal GraphKit it's post-parse phase. assert(C->inlining_incrementally() == false, "sanity"); C->set_inlining_incrementally(true); C->for_igvn()->clear(); C->initial_gvn()->replace_with(&_igvn); expand_vunbox_nodes(); scalarize_vbox_nodes(); C->inline_vector_reboxing_calls(); expand_vbox_nodes(); eliminate_vbox_alloc_nodes(); C->set_inlining_incrementally(false); do_cleanup(); } void PhaseVector::do_cleanup() { if (C->failing()) return; { Compile::TracePhase tp("vector_pru", &timers[_t_vector_pru]); ResourceMark rm; PhaseRemoveUseless pru(C->initial_gvn(), C->for_igvn()); if (C->failing()) return; } { Compile::TracePhase tp("incrementalInline_igvn", &timers[_t_vector_igvn]); _igvn = PhaseIterGVN(C->initial_gvn()); _igvn.optimize(); if (C->failing()) return; } C->print_method(PHASE_ITER_GVN_BEFORE_EA, 3); } void PhaseVector::scalarize_vbox_nodes() { if (C->failing()) return; if (!EnableVectorReboxing) { return; // don't scalarize vector boxes } int macro_idx = C->macro_count() - 1; while (macro_idx >= 0) { Node * n = C->macro_node(macro_idx); assert(n->is_macro(), "only macro nodes expected here"); if (n->Opcode() == Op_VectorBox) { VectorBoxNode* vbox = static_cast(n); scalarize_vbox_node(vbox); if (C->failing()) return; C->print_method(PHASE_SCALARIZE_VBOX, vbox, 3); } if (C->failing()) return; macro_idx = MIN2(macro_idx - 1, C->macro_count() - 1); } } void PhaseVector::expand_vbox_nodes() { if (C->failing()) return; int macro_idx = C->macro_count() - 1; while (macro_idx >= 0) { Node * n = C->macro_node(macro_idx); assert(n->is_macro(), "only macro nodes expected here"); if (n->Opcode() == Op_VectorBox) { VectorBoxNode* vbox = static_cast(n); expand_vbox_node(vbox); if (C->failing()) return; } if (C->failing()) return; macro_idx = MIN2(macro_idx - 1, C->macro_count() - 1); } } void PhaseVector::expand_vunbox_nodes() { if (C->failing()) return; int macro_idx = C->macro_count() - 1; while (macro_idx >= 0) { Node * n = C->macro_node(macro_idx); assert(n->is_macro(), "only macro nodes expected here"); if (n->Opcode() == Op_VectorUnbox) { VectorUnboxNode* vec_unbox = static_cast(n); expand_vunbox_node(vec_unbox); if (C->failing()) return; C->print_method(PHASE_EXPAND_VUNBOX, vec_unbox, 3); } if (C->failing()) return; macro_idx = MIN2(macro_idx - 1, C->macro_count() - 1); } } void PhaseVector::eliminate_vbox_alloc_nodes() { if (C->failing()) return; int macro_idx = C->macro_count() - 1; while (macro_idx >= 0) { Node * n = C->macro_node(macro_idx); assert(n->is_macro(), "only macro nodes expected here"); if (n->Opcode() == Op_VectorBoxAllocate) { VectorBoxAllocateNode* vbox_alloc = static_cast(n); eliminate_vbox_alloc_node(vbox_alloc); if (C->failing()) return; C->print_method(PHASE_ELIMINATE_VBOX_ALLOC, vbox_alloc, 3); } if (C->failing()) return; macro_idx = MIN2(macro_idx - 1, C->macro_count() - 1); } } static JVMState* clone_jvms(Compile* C, SafePointNode* sfpt) { JVMState* new_jvms = sfpt->jvms()->clone_shallow(C); uint size = sfpt->req(); SafePointNode* map = new SafePointNode(size, new_jvms); for (uint i = 0; i < size; i++) { map->init_req(i, sfpt->in(i)); } new_jvms->set_map(map); return new_jvms; } void PhaseVector::scalarize_vbox_node(VectorBoxNode* vec_box) { Node* vec_value = vec_box->in(VectorBoxNode::Value); PhaseGVN& gvn = *C->initial_gvn(); // Process merged VBAs if (EnableVectorAggressiveReboxing) { Unique_Node_List calls(C->comp_arena()); for (DUIterator_Fast imax, i = vec_box->fast_outs(imax); i < imax; i++) { Node* use = vec_box->fast_out(i); if (use->is_CallJava()) { CallJavaNode* call = use->as_CallJava(); if (call->has_non_debug_use(vec_box) && vec_box->in(VectorBoxNode::Box)->is_Phi()) { calls.push(call); } } } while (calls.size() > 0) { CallJavaNode* call = calls.pop()->as_CallJava(); // Attach new VBA to the call and use it instead of Phi (VBA ... VBA). JVMState* jvms = clone_jvms(C, call); GraphKit kit(jvms); PhaseGVN& gvn = kit.gvn(); // Adjust JVMS from post-call to pre-call state: put args on stack uint nargs = call->method()->arg_size(); kit.ensure_stack(kit.sp() + nargs); for (uint i = TypeFunc::Parms; i < call->tf()->domain()->cnt(); i++) { kit.push(call->in(i)); } jvms = kit.sync_jvms(); Node* new_vbox = NULL; { PreserveReexecuteState prs(&kit); kit.jvms()->set_should_reexecute(true); const TypeInstPtr* vbox_type = vec_box->box_type(); const TypeVect* vect_type = vec_box->vec_type(); Node* vect = vec_box->in(VectorBoxNode::Value); VectorBoxAllocateNode* alloc = new VectorBoxAllocateNode(C, vbox_type); kit.set_edges_for_java_call(alloc, /*must_throw=*/false, /*separate_io_proj=*/true); kit.make_slow_call_ex(alloc, C->env()->Throwable_klass(), /*separate_io_proj=*/true, /*deoptimize=*/true); kit.set_i_o(gvn.transform( new ProjNode(alloc, TypeFunc::I_O) )); kit.set_all_memory(gvn.transform( new ProjNode(alloc, TypeFunc::Memory) )); Node* ret = gvn.transform(new ProjNode(alloc, TypeFunc::Parms)); new_vbox = gvn.transform(new VectorBoxNode(C, ret, vect, vbox_type, vect_type)); kit.replace_in_map(vec_box, new_vbox); } kit.dec_sp(nargs); jvms = kit.sync_jvms(); call->set_req(TypeFunc::Control , kit.control()); call->set_req(TypeFunc::I_O , kit.i_o()); call->set_req(TypeFunc::Memory , kit.reset_memory()); call->set_req(TypeFunc::FramePtr, kit.frameptr()); call->replace_edge(vec_box, new_vbox); C->record_for_igvn(call); } } // Process debug uses at safepoints Unique_Node_List safepoints(C->comp_arena()); for (DUIterator_Fast imax, i = vec_box->fast_outs(imax); i < imax; i++) { Node* use = vec_box->fast_out(i); if (use->is_SafePoint()) { SafePointNode* sfpt = use->as_SafePoint(); if (!sfpt->is_Call() || !sfpt->as_Call()->has_non_debug_use(vec_box)) { safepoints.push(sfpt); } } } while (safepoints.size() > 0) { SafePointNode* sfpt = safepoints.pop()->as_SafePoint(); ciInstanceKlass* iklass = vec_box->box_type()->klass()->as_instance_klass(); int n_fields = iklass->nof_nonstatic_fields(); assert(n_fields == 1, "sanity"); uint first_ind = (sfpt->req() - sfpt->jvms()->scloff()); Node* sobj = new SafePointScalarObjectNode(vec_box->box_type(), #ifdef ASSERT NULL, #endif // ASSERT first_ind, n_fields); sobj->init_req(0, C->root()); sfpt->add_req(vec_value); sobj = gvn.transform(sobj); JVMState *jvms = sfpt->jvms(); jvms->set_endoff(sfpt->req()); // Now make a pass over the debug information replacing any references // to the allocated object with "sobj" int start = jvms->debug_start(); int end = jvms->debug_end(); sfpt->replace_edges_in_range(vec_box, sobj, start, end); C->record_for_igvn(sfpt); } } void PhaseVector::expand_vbox_node(VectorBoxNode* vec_box) { if (vec_box->outcnt() > 0) { Node* vbox = vec_box->in(VectorBoxNode::Box); Node* vect = vec_box->in(VectorBoxNode::Value); Node* result = expand_vbox_node_helper(vbox, vect, vec_box->box_type(), vec_box->vec_type()); C->gvn_replace_by(vec_box, result); C->print_method(PHASE_EXPAND_VBOX, vec_box, 3); } C->remove_macro_node(vec_box); } Node* PhaseVector::expand_vbox_node_helper(Node* vbox, Node* vect, const TypeInstPtr* box_type, const TypeVect* vect_type) { if (vbox->is_Phi() && vect->is_Phi()) { assert(vbox->as_Phi()->region() == vect->as_Phi()->region(), ""); Node* new_phi = new PhiNode(vbox->as_Phi()->region(), box_type); for (uint i = 1; i < vbox->req(); i++) { Node* new_box = expand_vbox_node_helper(vbox->in(i), vect->in(i), box_type, vect_type); new_phi->set_req(i, new_box); } new_phi = C->initial_gvn()->transform(new_phi); return new_phi; } else if (vbox->is_Proj() && vbox->in(0)->Opcode() == Op_VectorBoxAllocate) { VectorBoxAllocateNode* vbox_alloc = static_cast(vbox->in(0)); return expand_vbox_alloc_node(vbox_alloc, vect, box_type, vect_type); } else { assert(!vbox->is_Phi(), ""); // TODO: assert that expanded vbox is initialized with the same value (vect). return vbox; // already expanded } } static bool is_vector_mask(ciKlass* klass) { return klass->is_subclass_of(ciEnv::current()->vector_VectorMask_klass()); } static bool is_vector_shuffle(ciKlass* klass) { return klass->is_subclass_of(ciEnv::current()->vector_VectorShuffle_klass()); } Node* PhaseVector::expand_vbox_alloc_node(VectorBoxAllocateNode* vbox_alloc, Node* value, const TypeInstPtr* box_type, const TypeVect* vect_type) { JVMState* jvms = clone_jvms(C, vbox_alloc); GraphKit kit(jvms); PhaseGVN& gvn = kit.gvn(); ciInstanceKlass* box_klass = box_type->klass()->as_instance_klass(); BasicType bt = vect_type->element_basic_type(); int num_elem = vect_type->length(); bool is_mask = is_vector_mask(box_klass); if (is_mask && bt != T_BOOLEAN) { value = gvn.transform(VectorStoreMaskNode::make(gvn, value, bt, num_elem)); // Although type of mask depends on its definition, in terms of storage everything is stored in boolean array. bt = T_BOOLEAN; assert(value->as_Vector()->bottom_type()->is_vect()->element_basic_type() == bt, "must be consistent with mask representation"); } // Generate array allocation for the field which holds the values. const TypeKlassPtr* array_klass = TypeKlassPtr::make(ciTypeArrayKlass::make(bt)); Node* arr = kit.new_array(kit.makecon(array_klass), kit.intcon(num_elem), 1); // Store the vector value into the array. // (The store should be captured by InitializeNode and turned into initialized store later.) Node* arr_adr = kit.array_element_address(arr, kit.intcon(0), bt); const TypePtr* arr_adr_type = arr_adr->bottom_type()->is_ptr(); Node* arr_mem = kit.memory(arr_adr); Node* vstore = gvn.transform(StoreVectorNode::make(0, kit.control(), arr_mem, arr_adr, arr_adr_type, value, num_elem)); kit.set_memory(vstore, arr_adr_type); C->set_max_vector_size(MAX2(C->max_vector_size(), vect_type->length_in_bytes())); // Generate the allocate for the Vector object. const TypeKlassPtr* klass_type = box_type->as_klass_type(); Node* klass_node = kit.makecon(klass_type); Node* vec_obj = kit.new_instance(klass_node); // Store the allocated array into object. ciField* field = ciEnv::current()->vector_VectorPayload_klass()->get_field_by_name(ciSymbol::payload_name(), ciSymbol::object_signature(), false); assert(field != NULL, ""); Node* vec_field = kit.basic_plus_adr(vec_obj, field->offset_in_bytes()); const TypePtr* vec_adr_type = vec_field->bottom_type()->is_ptr(); // The store should be captured by InitializeNode and turned into initialized store later. Node* field_store = gvn.transform(kit.access_store_at(vec_obj, vec_field, vec_adr_type, arr, TypeOopPtr::make_from_klass(field->type()->as_klass()), T_OBJECT, IN_HEAP)); kit.set_memory(field_store, vec_adr_type); kit.replace_call(vbox_alloc, vec_obj, true); C->remove_macro_node(vbox_alloc); return vec_obj; } void PhaseVector::expand_vunbox_node(VectorUnboxNode* vec_unbox) { if (vec_unbox->outcnt() > 0) { GraphKit kit; PhaseGVN& gvn = kit.gvn(); Node* obj = vec_unbox->obj(); const TypeInstPtr* tinst = gvn.type(obj)->isa_instptr(); ciInstanceKlass* from_kls = tinst->klass()->as_instance_klass(); BasicType bt = vec_unbox->vect_type()->element_basic_type(); BasicType masktype = bt; BasicType elem_bt; if (is_vector_mask(from_kls)) { bt = T_BOOLEAN; } else if (is_vector_shuffle(from_kls)) { if (vec_unbox->is_shuffle_to_vector() == true) { elem_bt = bt; } bt = T_BYTE; } ciField* field = ciEnv::current()->vector_VectorPayload_klass()->get_field_by_name(ciSymbol::payload_name(), ciSymbol::object_signature(), false); assert(field != NULL, ""); int offset = field->offset_in_bytes(); Node* vec_adr = kit.basic_plus_adr(obj, offset); Node* mem = vec_unbox->mem(); Node* ctrl = vec_unbox->in(0); Node* vec_field_ld = LoadNode::make(gvn, ctrl, mem, vec_adr, vec_adr->bottom_type()->is_ptr(), TypeOopPtr::make_from_klass(field->type()->as_klass()), T_OBJECT, MemNode::unordered); vec_field_ld = gvn.transform(vec_field_ld); // For proper aliasing, attach concrete payload type. ciKlass* payload_klass = ciTypeArrayKlass::make(bt); const Type* payload_type = TypeAryPtr::make_from_klass(payload_klass)->cast_to_ptr_type(TypePtr::NotNull); vec_field_ld = gvn.transform(new CastPPNode(vec_field_ld, payload_type)); Node* adr = kit.array_element_address(vec_field_ld, gvn.intcon(0), bt); const TypePtr* adr_type = adr->bottom_type()->is_ptr(); const TypeVect* vt = vec_unbox->bottom_type()->is_vect(); int num_elem = vt->length(); Node* vec_val_load = LoadVectorNode::make(0, ctrl, mem, adr, adr_type, num_elem, bt); vec_val_load = gvn.transform(vec_val_load); C->set_max_vector_size(MAX2(C->max_vector_size(), vt->length_in_bytes())); if (is_vector_mask(from_kls) && masktype != T_BOOLEAN) { assert(vec_unbox->bottom_type()->is_vect()->element_basic_type() == masktype, "expect mask type consistency"); vec_val_load = gvn.transform(new VectorLoadMaskNode(vec_val_load, TypeVect::make(masktype, num_elem))); } else if (is_vector_shuffle(from_kls)) { if (vec_unbox->is_shuffle_to_vector() == false) { assert(vec_unbox->bottom_type()->is_vect()->element_basic_type() == masktype, "expect shuffle type consistency"); vec_val_load = gvn.transform(new VectorLoadShuffleNode(vec_val_load, TypeVect::make(masktype, num_elem))); } else if (elem_bt != T_BYTE) { vec_val_load = gvn.transform(VectorCastNode::make(Op_VectorCastB2X, vec_val_load, elem_bt, num_elem)); } } gvn.hash_delete(vec_unbox); vec_unbox->disconnect_inputs(C); C->gvn_replace_by(vec_unbox, vec_val_load); } C->remove_macro_node(vec_unbox); } void PhaseVector::eliminate_vbox_alloc_node(VectorBoxAllocateNode* vbox_alloc) { JVMState* jvms = clone_jvms(C, vbox_alloc); GraphKit kit(jvms); // Remove VBA, but leave a safepoint behind. // Otherwise, it may end up with a loop without any safepoint polls. kit.replace_call(vbox_alloc, kit.map(), true); C->remove_macro_node(vbox_alloc); }