aoqi@0: /* aoqi@0: * Copyright (c) 2007, 2012, Oracle and/or its affiliates. All rights reserved. aoqi@0: * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. aoqi@0: * aoqi@0: * This code is free software; you can redistribute it and/or modify it aoqi@0: * under the terms of the GNU General Public License version 2 only, as aoqi@0: * published by the Free Software Foundation. aoqi@0: * aoqi@0: * This code is distributed in the hope that it will be useful, but WITHOUT aoqi@0: * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or aoqi@0: * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License aoqi@0: * version 2 for more details (a copy is included in the LICENSE file that aoqi@0: * accompanied this code). aoqi@0: * aoqi@0: * You should have received a copy of the GNU General Public License version aoqi@0: * 2 along with this work; if not, write to the Free Software Foundation, aoqi@0: * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. aoqi@0: * aoqi@0: * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA aoqi@0: * or visit www.oracle.com if you need additional information or have any aoqi@0: * questions. aoqi@0: */ aoqi@0: aoqi@0: #include "precompiled.hpp" aoqi@0: #include "memory/allocation.inline.hpp" aoqi@0: #include "opto/connode.hpp" aoqi@0: #include "opto/vectornode.hpp" aoqi@0: aoqi@0: //------------------------------VectorNode-------------------------------------- aoqi@0: aoqi@0: // Return the vector operator for the specified scalar operation aoqi@0: // and vector length. aoqi@0: int VectorNode::opcode(int sopc, BasicType bt) { aoqi@0: switch (sopc) { aoqi@0: case Op_AddI: aoqi@0: switch (bt) { aoqi@0: case T_BOOLEAN: aoqi@0: case T_BYTE: return Op_AddVB; aoqi@0: case T_CHAR: aoqi@0: case T_SHORT: return Op_AddVS; aoqi@0: case T_INT: return Op_AddVI; aoqi@0: } aoqi@0: ShouldNotReachHere(); aoqi@0: case Op_AddL: aoqi@0: assert(bt == T_LONG, "must be"); aoqi@0: return Op_AddVL; aoqi@0: case Op_AddF: aoqi@0: assert(bt == T_FLOAT, "must be"); aoqi@0: return Op_AddVF; aoqi@0: case Op_AddD: aoqi@0: assert(bt == T_DOUBLE, "must be"); aoqi@0: return Op_AddVD; aoqi@0: case Op_SubI: aoqi@0: switch (bt) { aoqi@0: case T_BOOLEAN: aoqi@0: case T_BYTE: return Op_SubVB; aoqi@0: case T_CHAR: aoqi@0: case T_SHORT: return Op_SubVS; aoqi@0: case T_INT: return Op_SubVI; aoqi@0: } aoqi@0: ShouldNotReachHere(); aoqi@0: case Op_SubL: aoqi@0: assert(bt == T_LONG, "must be"); aoqi@0: return Op_SubVL; aoqi@0: case Op_SubF: aoqi@0: assert(bt == T_FLOAT, "must be"); aoqi@0: return Op_SubVF; aoqi@0: case Op_SubD: aoqi@0: assert(bt == T_DOUBLE, "must be"); aoqi@0: return Op_SubVD; aoqi@0: case Op_MulI: aoqi@0: switch (bt) { aoqi@0: case T_BOOLEAN: aoqi@0: case T_BYTE: return 0; // Unimplemented aoqi@0: case T_CHAR: aoqi@0: case T_SHORT: return Op_MulVS; aoqi@0: case T_INT: return Op_MulVI; aoqi@0: } aoqi@0: ShouldNotReachHere(); aoqi@0: case Op_MulF: aoqi@0: assert(bt == T_FLOAT, "must be"); aoqi@0: return Op_MulVF; aoqi@0: case Op_MulD: aoqi@0: assert(bt == T_DOUBLE, "must be"); aoqi@0: return Op_MulVD; aoqi@0: case Op_DivF: aoqi@0: assert(bt == T_FLOAT, "must be"); aoqi@0: return Op_DivVF; aoqi@0: case Op_DivD: aoqi@0: assert(bt == T_DOUBLE, "must be"); aoqi@0: return Op_DivVD; aoqi@0: case Op_LShiftI: aoqi@0: switch (bt) { aoqi@0: case T_BOOLEAN: aoqi@0: case T_BYTE: return Op_LShiftVB; aoqi@0: case T_CHAR: aoqi@0: case T_SHORT: return Op_LShiftVS; aoqi@0: case T_INT: return Op_LShiftVI; aoqi@0: } aoqi@0: ShouldNotReachHere(); aoqi@0: case Op_LShiftL: aoqi@0: assert(bt == T_LONG, "must be"); aoqi@0: return Op_LShiftVL; aoqi@0: case Op_RShiftI: aoqi@0: switch (bt) { aoqi@0: case T_BOOLEAN:return Op_URShiftVB; // boolean is unsigned value aoqi@0: case T_CHAR: return Op_URShiftVS; // char is unsigned value aoqi@0: case T_BYTE: return Op_RShiftVB; aoqi@0: case T_SHORT: return Op_RShiftVS; aoqi@0: case T_INT: return Op_RShiftVI; aoqi@0: } aoqi@0: ShouldNotReachHere(); aoqi@0: case Op_RShiftL: aoqi@0: assert(bt == T_LONG, "must be"); aoqi@0: return Op_RShiftVL; aoqi@0: case Op_URShiftI: aoqi@0: switch (bt) { aoqi@0: case T_BOOLEAN:return Op_URShiftVB; aoqi@0: case T_CHAR: return Op_URShiftVS; aoqi@0: case T_BYTE: aoqi@0: case T_SHORT: return 0; // Vector logical right shift for signed short aoqi@0: // values produces incorrect Java result for aoqi@0: // negative data because java code should convert aoqi@0: // a short value into int value with sign aoqi@0: // extension before a shift. aoqi@0: case T_INT: return Op_URShiftVI; aoqi@0: } aoqi@0: ShouldNotReachHere(); aoqi@0: case Op_URShiftL: aoqi@0: assert(bt == T_LONG, "must be"); aoqi@0: return Op_URShiftVL; aoqi@0: case Op_AndI: aoqi@0: case Op_AndL: aoqi@0: return Op_AndV; aoqi@0: case Op_OrI: aoqi@0: case Op_OrL: aoqi@0: return Op_OrV; aoqi@0: case Op_XorI: aoqi@0: case Op_XorL: aoqi@0: return Op_XorV; aoqi@0: aoqi@0: case Op_LoadB: aoqi@0: case Op_LoadUB: aoqi@0: case Op_LoadUS: aoqi@0: case Op_LoadS: aoqi@0: case Op_LoadI: aoqi@0: case Op_LoadL: aoqi@0: case Op_LoadF: aoqi@0: case Op_LoadD: aoqi@0: return Op_LoadVector; aoqi@0: aoqi@0: case Op_StoreB: aoqi@0: case Op_StoreC: aoqi@0: case Op_StoreI: aoqi@0: case Op_StoreL: aoqi@0: case Op_StoreF: aoqi@0: case Op_StoreD: aoqi@0: return Op_StoreVector; aoqi@0: } aoqi@0: return 0; // Unimplemented aoqi@0: } aoqi@0: aoqi@0: // Also used to check if the code generator aoqi@0: // supports the vector operation. aoqi@0: bool VectorNode::implemented(int opc, uint vlen, BasicType bt) { aoqi@0: if (is_java_primitive(bt) && aoqi@0: (vlen > 1) && is_power_of_2(vlen) && aoqi@0: Matcher::vector_size_supported(bt, vlen)) { aoqi@0: int vopc = VectorNode::opcode(opc, bt); aoqi@0: return vopc > 0 && Matcher::match_rule_supported(vopc); aoqi@0: } aoqi@0: return false; aoqi@0: } aoqi@0: aoqi@0: bool VectorNode::is_shift(Node* n) { aoqi@0: switch (n->Opcode()) { aoqi@0: case Op_LShiftI: aoqi@0: case Op_LShiftL: aoqi@0: case Op_RShiftI: aoqi@0: case Op_RShiftL: aoqi@0: case Op_URShiftI: aoqi@0: case Op_URShiftL: aoqi@0: return true; aoqi@0: } aoqi@0: return false; aoqi@0: } aoqi@0: aoqi@0: // Check if input is loop invariant vector. aoqi@0: bool VectorNode::is_invariant_vector(Node* n) { aoqi@0: // Only Replicate vector nodes are loop invariant for now. aoqi@0: switch (n->Opcode()) { aoqi@0: case Op_ReplicateB: aoqi@0: case Op_ReplicateS: aoqi@0: case Op_ReplicateI: aoqi@0: case Op_ReplicateL: aoqi@0: case Op_ReplicateF: aoqi@0: case Op_ReplicateD: aoqi@0: return true; aoqi@0: } aoqi@0: return false; aoqi@0: } aoqi@0: aoqi@0: // [Start, end) half-open range defining which operands are vectors aoqi@0: void VectorNode::vector_operands(Node* n, uint* start, uint* end) { aoqi@0: switch (n->Opcode()) { aoqi@0: case Op_LoadB: case Op_LoadUB: aoqi@0: case Op_LoadS: case Op_LoadUS: aoqi@0: case Op_LoadI: case Op_LoadL: aoqi@0: case Op_LoadF: case Op_LoadD: aoqi@0: case Op_LoadP: case Op_LoadN: aoqi@0: *start = 0; aoqi@0: *end = 0; // no vector operands aoqi@0: break; aoqi@0: case Op_StoreB: case Op_StoreC: aoqi@0: case Op_StoreI: case Op_StoreL: aoqi@0: case Op_StoreF: case Op_StoreD: aoqi@0: case Op_StoreP: case Op_StoreN: aoqi@0: *start = MemNode::ValueIn; aoqi@0: *end = MemNode::ValueIn + 1; // 1 vector operand aoqi@0: break; aoqi@0: case Op_LShiftI: case Op_LShiftL: aoqi@0: case Op_RShiftI: case Op_RShiftL: aoqi@0: case Op_URShiftI: case Op_URShiftL: aoqi@0: *start = 1; aoqi@0: *end = 2; // 1 vector operand aoqi@0: break; aoqi@0: case Op_AddI: case Op_AddL: case Op_AddF: case Op_AddD: aoqi@0: case Op_SubI: case Op_SubL: case Op_SubF: case Op_SubD: aoqi@0: case Op_MulI: case Op_MulL: case Op_MulF: case Op_MulD: aoqi@0: case Op_DivF: case Op_DivD: aoqi@0: case Op_AndI: case Op_AndL: aoqi@0: case Op_OrI: case Op_OrL: aoqi@0: case Op_XorI: case Op_XorL: aoqi@0: *start = 1; aoqi@0: *end = 3; // 2 vector operands aoqi@0: break; aoqi@0: case Op_CMoveI: case Op_CMoveL: case Op_CMoveF: case Op_CMoveD: aoqi@0: *start = 2; aoqi@0: *end = n->req(); aoqi@0: break; aoqi@0: default: aoqi@0: *start = 1; aoqi@0: *end = n->req(); // default is all operands aoqi@0: } aoqi@0: } aoqi@0: aoqi@0: // Return the vector version of a scalar operation node. aoqi@0: VectorNode* VectorNode::make(Compile* C, int opc, Node* n1, Node* n2, uint vlen, BasicType bt) { aoqi@0: const TypeVect* vt = TypeVect::make(bt, vlen); aoqi@0: int vopc = VectorNode::opcode(opc, bt); aoqi@0: // This method should not be called for unimplemented vectors. aoqi@0: guarantee(vopc > 0, err_msg_res("Vector for '%s' is not implemented", NodeClassNames[opc])); aoqi@0: aoqi@0: switch (vopc) { aoqi@0: case Op_AddVB: return new (C) AddVBNode(n1, n2, vt); aoqi@0: case Op_AddVS: return new (C) AddVSNode(n1, n2, vt); aoqi@0: case Op_AddVI: return new (C) AddVINode(n1, n2, vt); aoqi@0: case Op_AddVL: return new (C) AddVLNode(n1, n2, vt); aoqi@0: case Op_AddVF: return new (C) AddVFNode(n1, n2, vt); aoqi@0: case Op_AddVD: return new (C) AddVDNode(n1, n2, vt); aoqi@0: aoqi@0: case Op_SubVB: return new (C) SubVBNode(n1, n2, vt); aoqi@0: case Op_SubVS: return new (C) SubVSNode(n1, n2, vt); aoqi@0: case Op_SubVI: return new (C) SubVINode(n1, n2, vt); aoqi@0: case Op_SubVL: return new (C) SubVLNode(n1, n2, vt); aoqi@0: case Op_SubVF: return new (C) SubVFNode(n1, n2, vt); aoqi@0: case Op_SubVD: return new (C) SubVDNode(n1, n2, vt); aoqi@0: aoqi@0: case Op_MulVS: return new (C) MulVSNode(n1, n2, vt); aoqi@0: case Op_MulVI: return new (C) MulVINode(n1, n2, vt); aoqi@0: case Op_MulVF: return new (C) MulVFNode(n1, n2, vt); aoqi@0: case Op_MulVD: return new (C) MulVDNode(n1, n2, vt); aoqi@0: aoqi@0: case Op_DivVF: return new (C) DivVFNode(n1, n2, vt); aoqi@0: case Op_DivVD: return new (C) DivVDNode(n1, n2, vt); aoqi@0: aoqi@0: case Op_LShiftVB: return new (C) LShiftVBNode(n1, n2, vt); aoqi@0: case Op_LShiftVS: return new (C) LShiftVSNode(n1, n2, vt); aoqi@0: case Op_LShiftVI: return new (C) LShiftVINode(n1, n2, vt); aoqi@0: case Op_LShiftVL: return new (C) LShiftVLNode(n1, n2, vt); aoqi@0: aoqi@0: case Op_RShiftVB: return new (C) RShiftVBNode(n1, n2, vt); aoqi@0: case Op_RShiftVS: return new (C) RShiftVSNode(n1, n2, vt); aoqi@0: case Op_RShiftVI: return new (C) RShiftVINode(n1, n2, vt); aoqi@0: case Op_RShiftVL: return new (C) RShiftVLNode(n1, n2, vt); aoqi@0: aoqi@0: case Op_URShiftVB: return new (C) URShiftVBNode(n1, n2, vt); aoqi@0: case Op_URShiftVS: return new (C) URShiftVSNode(n1, n2, vt); aoqi@0: case Op_URShiftVI: return new (C) URShiftVINode(n1, n2, vt); aoqi@0: case Op_URShiftVL: return new (C) URShiftVLNode(n1, n2, vt); aoqi@0: aoqi@0: case Op_AndV: return new (C) AndVNode(n1, n2, vt); aoqi@0: case Op_OrV: return new (C) OrVNode (n1, n2, vt); aoqi@0: case Op_XorV: return new (C) XorVNode(n1, n2, vt); aoqi@0: } aoqi@0: fatal(err_msg_res("Missed vector creation for '%s'", NodeClassNames[vopc])); aoqi@0: return NULL; aoqi@0: aoqi@0: } aoqi@0: aoqi@0: // Scalar promotion aoqi@0: VectorNode* VectorNode::scalar2vector(Compile* C, Node* s, uint vlen, const Type* opd_t) { aoqi@0: BasicType bt = opd_t->array_element_basic_type(); aoqi@0: const TypeVect* vt = opd_t->singleton() ? TypeVect::make(opd_t, vlen) aoqi@0: : TypeVect::make(bt, vlen); aoqi@0: switch (bt) { aoqi@0: case T_BOOLEAN: aoqi@0: case T_BYTE: aoqi@0: return new (C) ReplicateBNode(s, vt); aoqi@0: case T_CHAR: aoqi@0: case T_SHORT: aoqi@0: return new (C) ReplicateSNode(s, vt); aoqi@0: case T_INT: aoqi@0: return new (C) ReplicateINode(s, vt); aoqi@0: case T_LONG: aoqi@0: return new (C) ReplicateLNode(s, vt); aoqi@0: case T_FLOAT: aoqi@0: return new (C) ReplicateFNode(s, vt); aoqi@0: case T_DOUBLE: aoqi@0: return new (C) ReplicateDNode(s, vt); aoqi@0: } aoqi@0: fatal(err_msg_res("Type '%s' is not supported for vectors", type2name(bt))); aoqi@0: return NULL; aoqi@0: } aoqi@0: aoqi@0: VectorNode* VectorNode::shift_count(Compile* C, Node* shift, Node* cnt, uint vlen, BasicType bt) { aoqi@0: assert(VectorNode::is_shift(shift) && !cnt->is_Con(), "only variable shift count"); aoqi@0: // Match shift count type with shift vector type. aoqi@0: const TypeVect* vt = TypeVect::make(bt, vlen); aoqi@0: switch (shift->Opcode()) { aoqi@0: case Op_LShiftI: aoqi@0: case Op_LShiftL: aoqi@0: return new (C) LShiftCntVNode(cnt, vt); aoqi@0: case Op_RShiftI: aoqi@0: case Op_RShiftL: aoqi@0: case Op_URShiftI: aoqi@0: case Op_URShiftL: aoqi@0: return new (C) RShiftCntVNode(cnt, vt); aoqi@0: } aoqi@0: fatal(err_msg_res("Missed vector creation for '%s'", NodeClassNames[shift->Opcode()])); aoqi@0: return NULL; aoqi@0: } aoqi@0: aoqi@0: // Return initial Pack node. Additional operands added with add_opd() calls. aoqi@0: PackNode* PackNode::make(Compile* C, Node* s, uint vlen, BasicType bt) { aoqi@0: const TypeVect* vt = TypeVect::make(bt, vlen); aoqi@0: switch (bt) { aoqi@0: case T_BOOLEAN: aoqi@0: case T_BYTE: aoqi@0: return new (C) PackBNode(s, vt); aoqi@0: case T_CHAR: aoqi@0: case T_SHORT: aoqi@0: return new (C) PackSNode(s, vt); aoqi@0: case T_INT: aoqi@0: return new (C) PackINode(s, vt); aoqi@0: case T_LONG: aoqi@0: return new (C) PackLNode(s, vt); aoqi@0: case T_FLOAT: aoqi@0: return new (C) PackFNode(s, vt); aoqi@0: case T_DOUBLE: aoqi@0: return new (C) PackDNode(s, vt); aoqi@0: } aoqi@0: fatal(err_msg_res("Type '%s' is not supported for vectors", type2name(bt))); aoqi@0: return NULL; aoqi@0: } aoqi@0: aoqi@0: // Create a binary tree form for Packs. [lo, hi) (half-open) range aoqi@0: PackNode* PackNode::binary_tree_pack(Compile* C, int lo, int hi) { aoqi@0: int ct = hi - lo; aoqi@0: assert(is_power_of_2(ct), "power of 2"); aoqi@0: if (ct == 2) { aoqi@0: PackNode* pk = PackNode::make(C, in(lo), 2, vect_type()->element_basic_type()); aoqi@0: pk->add_opd(in(lo+1)); aoqi@0: return pk; aoqi@0: aoqi@0: } else { aoqi@0: int mid = lo + ct/2; aoqi@0: PackNode* n1 = binary_tree_pack(C, lo, mid); aoqi@0: PackNode* n2 = binary_tree_pack(C, mid, hi ); aoqi@0: aoqi@0: BasicType bt = n1->vect_type()->element_basic_type(); aoqi@0: assert(bt == n2->vect_type()->element_basic_type(), "should be the same"); aoqi@0: switch (bt) { aoqi@0: case T_BOOLEAN: aoqi@0: case T_BYTE: aoqi@0: return new (C) PackSNode(n1, n2, TypeVect::make(T_SHORT, 2)); aoqi@0: case T_CHAR: aoqi@0: case T_SHORT: aoqi@0: return new (C) PackINode(n1, n2, TypeVect::make(T_INT, 2)); aoqi@0: case T_INT: aoqi@0: return new (C) PackLNode(n1, n2, TypeVect::make(T_LONG, 2)); aoqi@0: case T_LONG: aoqi@0: return new (C) Pack2LNode(n1, n2, TypeVect::make(T_LONG, 2)); aoqi@0: case T_FLOAT: aoqi@0: return new (C) PackDNode(n1, n2, TypeVect::make(T_DOUBLE, 2)); aoqi@0: case T_DOUBLE: aoqi@0: return new (C) Pack2DNode(n1, n2, TypeVect::make(T_DOUBLE, 2)); aoqi@0: } aoqi@0: fatal(err_msg_res("Type '%s' is not supported for vectors", type2name(bt))); aoqi@0: } aoqi@0: return NULL; aoqi@0: } aoqi@0: aoqi@0: // Return the vector version of a scalar load node. aoqi@0: LoadVectorNode* LoadVectorNode::make(Compile* C, int opc, Node* ctl, Node* mem, aoqi@0: Node* adr, const TypePtr* atyp, uint vlen, BasicType bt) { aoqi@0: const TypeVect* vt = TypeVect::make(bt, vlen); aoqi@0: return new (C) LoadVectorNode(ctl, mem, adr, atyp, vt); aoqi@0: } aoqi@0: aoqi@0: // Return the vector version of a scalar store node. aoqi@0: StoreVectorNode* StoreVectorNode::make(Compile* C, int opc, Node* ctl, Node* mem, aoqi@0: Node* adr, const TypePtr* atyp, Node* val, aoqi@0: uint vlen) { aoqi@0: return new (C) StoreVectorNode(ctl, mem, adr, atyp, val); aoqi@0: } aoqi@0: aoqi@0: // Extract a scalar element of vector. aoqi@0: Node* ExtractNode::make(Compile* C, Node* v, uint position, BasicType bt) { aoqi@0: assert((int)position < Matcher::max_vector_size(bt), "pos in range"); aoqi@0: ConINode* pos = ConINode::make(C, (int)position); aoqi@0: switch (bt) { aoqi@0: case T_BOOLEAN: aoqi@0: return new (C) ExtractUBNode(v, pos); aoqi@0: case T_BYTE: aoqi@0: return new (C) ExtractBNode(v, pos); aoqi@0: case T_CHAR: aoqi@0: return new (C) ExtractCNode(v, pos); aoqi@0: case T_SHORT: aoqi@0: return new (C) ExtractSNode(v, pos); aoqi@0: case T_INT: aoqi@0: return new (C) ExtractINode(v, pos); aoqi@0: case T_LONG: aoqi@0: return new (C) ExtractLNode(v, pos); aoqi@0: case T_FLOAT: aoqi@0: return new (C) ExtractFNode(v, pos); aoqi@0: case T_DOUBLE: aoqi@0: return new (C) ExtractDNode(v, pos); aoqi@0: } aoqi@0: fatal(err_msg_res("Type '%s' is not supported for vectors", type2name(bt))); aoqi@0: return NULL; aoqi@0: } aoqi@0: