Path: blob/master/src/hotspot/cpu/x86/c2_MacroAssembler_x86.hpp
41144 views
/*1* Copyright (c) 2020, 2021, Oracle and/or its affiliates. All rights reserved.2* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.3*4* This code is free software; you can redistribute it and/or modify it5* under the terms of the GNU General Public License version 2 only, as6* published by the Free Software Foundation.7*8* This code is distributed in the hope that it will be useful, but WITHOUT9* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or10* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License11* version 2 for more details (a copy is included in the LICENSE file that12* accompanied this code).13*14* You should have received a copy of the GNU General Public License version15* 2 along with this work; if not, write to the Free Software Foundation,16* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.17*18* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA19* or visit www.oracle.com if you need additional information or have any20* questions.21*22*/2324#ifndef CPU_X86_C2_MACROASSEMBLER_X86_HPP25#define CPU_X86_C2_MACROASSEMBLER_X86_HPP2627// C2_MacroAssembler contains high-level macros for C22829public:30Assembler::AvxVectorLen vector_length_encoding(int vlen_in_bytes);3132// special instructions for EVEX33void setvectmask(Register dst, Register src, KRegister mask);34void restorevectmask(KRegister mask);3536// Code used by cmpFastLock and cmpFastUnlock mach instructions in .ad file.37// See full desription in macroAssembler_x86.cpp.38void fast_lock(Register obj, Register box, Register tmp,39Register scr, Register cx1, Register cx2,40BiasedLockingCounters* counters,41RTMLockingCounters* rtm_counters,42RTMLockingCounters* stack_rtm_counters,43Metadata* method_data,44bool use_rtm, bool profile_rtm);45void fast_unlock(Register obj, Register box, Register tmp, bool use_rtm);4647#if INCLUDE_RTM_OPT48void rtm_counters_update(Register abort_status, Register rtm_counters);49void branch_on_random_using_rdtsc(Register tmp, Register scr, int count, Label& brLabel);50void rtm_abort_ratio_calculation(Register tmp, Register rtm_counters_reg,51RTMLockingCounters* rtm_counters,52Metadata* method_data);53void rtm_profiling(Register abort_status_Reg, Register rtm_counters_Reg,54RTMLockingCounters* rtm_counters, Metadata* method_data, bool profile_rtm);55void rtm_retry_lock_on_abort(Register retry_count, Register abort_status, Label& retryLabel);56void rtm_retry_lock_on_busy(Register retry_count, Register box, Register tmp, Register scr, Label& retryLabel);57void rtm_stack_locking(Register obj, Register tmp, Register scr,58Register retry_on_abort_count,59RTMLockingCounters* stack_rtm_counters,60Metadata* method_data, bool profile_rtm,61Label& DONE_LABEL, Label& IsInflated);62void rtm_inflated_locking(Register obj, Register box, Register tmp,63Register scr, Register retry_on_busy_count,64Register retry_on_abort_count,65RTMLockingCounters* rtm_counters,66Metadata* method_data, bool profile_rtm,67Label& DONE_LABEL);68#endif6970// Generic instructions support for use in .ad files C2 code generation71void vabsnegd(int opcode, XMMRegister dst, XMMRegister src, Register scr);72void vabsnegd(int opcode, XMMRegister dst, XMMRegister src, int vector_len, Register scr);73void vabsnegf(int opcode, XMMRegister dst, XMMRegister src, Register scr);74void vabsnegf(int opcode, XMMRegister dst, XMMRegister src, int vector_len, Register scr);7576void pminmax(int opcode, BasicType elem_bt, XMMRegister dst, XMMRegister src,77XMMRegister tmp = xnoreg);78void vpminmax(int opcode, BasicType elem_bt,79XMMRegister dst, XMMRegister src1, XMMRegister src2,80int vlen_enc);8182void vminmax_fp(int opcode, BasicType elem_bt,83XMMRegister dst, XMMRegister a, XMMRegister b,84XMMRegister tmp, XMMRegister atmp, XMMRegister btmp,85int vlen_enc);86void evminmax_fp(int opcode, BasicType elem_bt,87XMMRegister dst, XMMRegister a, XMMRegister b,88KRegister ktmp, XMMRegister atmp, XMMRegister btmp,89int vlen_enc);9091void signum_fp(int opcode, XMMRegister dst,92XMMRegister zero, XMMRegister one,93Register scratch);9495void vextendbw(bool sign, XMMRegister dst, XMMRegister src, int vector_len);96void vextendbw(bool sign, XMMRegister dst, XMMRegister src);97void vextendbd(bool sign, XMMRegister dst, XMMRegister src, int vector_len);98void vextendwd(bool sign, XMMRegister dst, XMMRegister src, int vector_len);99100void vshiftd(int opcode, XMMRegister dst, XMMRegister shift);101void vshiftd_imm(int opcode, XMMRegister dst, int shift);102void vshiftd(int opcode, XMMRegister dst, XMMRegister src, XMMRegister shift, int vlen_enc);103void vshiftd_imm(int opcode, XMMRegister dst, XMMRegister nds, int shift, int vector_len);104void vshiftw(int opcode, XMMRegister dst, XMMRegister shift);105void vshiftw(int opcode, XMMRegister dst, XMMRegister src, XMMRegister shift, int vlen_enc);106void vshiftq(int opcode, XMMRegister dst, XMMRegister shift);107void vshiftq_imm(int opcode, XMMRegister dst, int shift);108void vshiftq(int opcode, XMMRegister dst, XMMRegister src, XMMRegister shift, int vlen_enc);109void vshiftq_imm(int opcode, XMMRegister dst, XMMRegister nds, int shift, int vector_len);110111void vprotate_imm(int opcode, BasicType etype, XMMRegister dst, XMMRegister src, int shift, int vector_len);112void vprotate_var(int opcode, BasicType etype, XMMRegister dst, XMMRegister src, XMMRegister shift, int vector_len);113114void varshiftd(int opcode, XMMRegister dst, XMMRegister src, XMMRegister shift, int vlen_enc);115void varshiftw(int opcode, XMMRegister dst, XMMRegister src, XMMRegister shift, int vlen_enc);116void varshiftq(int opcode, XMMRegister dst, XMMRegister src, XMMRegister shift, int vlen_enc, XMMRegister vtmp = xnoreg);117void varshiftbw(int opcode, XMMRegister dst, XMMRegister src, XMMRegister shift, int vector_len, XMMRegister vtmp, Register scratch);118void evarshiftb(int opcode, XMMRegister dst, XMMRegister src, XMMRegister shift, int vector_len, XMMRegister vtmp, Register scratch);119120void insert(BasicType typ, XMMRegister dst, Register val, int idx);121void vinsert(BasicType typ, XMMRegister dst, XMMRegister src, Register val, int idx);122void vgather(BasicType typ, XMMRegister dst, Register base, XMMRegister idx, XMMRegister mask, int vector_len);123void evgather(BasicType typ, XMMRegister dst, KRegister mask, Register base, XMMRegister idx, int vector_len);124void evscatter(BasicType typ, Register base, XMMRegister idx, KRegister mask, XMMRegister src, int vector_len);125126void evmovdqu(BasicType type, KRegister kmask, XMMRegister dst, Address src, int vector_len);127void evmovdqu(BasicType type, KRegister kmask, Address dst, XMMRegister src, int vector_len);128129// extract130void extract(BasicType typ, Register dst, XMMRegister src, int idx);131XMMRegister get_lane(BasicType typ, XMMRegister dst, XMMRegister src, int elemindex);132void get_elem(BasicType typ, Register dst, XMMRegister src, int elemindex);133void get_elem(BasicType typ, XMMRegister dst, XMMRegister src, int elemindex, Register tmp = noreg, XMMRegister vtmp = xnoreg);134135// vector test136void vectortest(int bt, int vlen, XMMRegister src1, XMMRegister src2,137XMMRegister vtmp1 = xnoreg, XMMRegister vtmp2 = xnoreg, KRegister mask = knoreg);138139// blend140void evpcmp(BasicType typ, KRegister kdmask, KRegister ksmask, XMMRegister src1, AddressLiteral adr, int comparison, int vector_len, Register scratch = rscratch1);141void evpblend(BasicType typ, XMMRegister dst, KRegister kmask, XMMRegister src1, XMMRegister src2, bool merge, int vector_len);142143void load_vector_mask(XMMRegister dst, XMMRegister src, int vlen_in_bytes, BasicType elem_bt);144void load_iota_indices(XMMRegister dst, Register scratch, int vlen_in_bytes);145146// vector compare147void vpcmpu(BasicType typ, XMMRegister dst, XMMRegister src1, XMMRegister src2, ComparisonPredicate comparison, int vlen_in_bytes,148XMMRegister vtmp1, XMMRegister vtmp2, Register scratch);149void vpcmpu32(BasicType typ, XMMRegister dst, XMMRegister src1, XMMRegister src2, ComparisonPredicate comparison, int vlen_in_bytes,150XMMRegister vtmp1, XMMRegister vtmp2, XMMRegister vtmp3, Register scratch);151152// Reductions for vectors of bytes, shorts, ints, longs, floats, and doubles.153154// dst = src1 reduce(op, src2) using vtmp as temps155void reduceI(int opcode, int vlen, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);156#ifdef _LP64157void reduceL(int opcode, int vlen, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);158void genmask(KRegister dst, Register len, Register temp);159#endif // _LP64160161// dst = reduce(op, src2) using vtmp as temps162void reduce_fp(int opcode, int vlen,163XMMRegister dst, XMMRegister src,164XMMRegister vtmp1, XMMRegister vtmp2 = xnoreg);165void reduceB(int opcode, int vlen, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);166void mulreduceB(int opcode, int vlen, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);167void reduceS(int opcode, int vlen, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);168void reduceFloatMinMax(int opcode, int vlen, bool is_dst_valid,169XMMRegister dst, XMMRegister src,170XMMRegister tmp, XMMRegister atmp, XMMRegister btmp, XMMRegister xmm_0, XMMRegister xmm_1 = xnoreg);171void reduceDoubleMinMax(int opcode, int vlen, bool is_dst_valid,172XMMRegister dst, XMMRegister src,173XMMRegister tmp, XMMRegister atmp, XMMRegister btmp, XMMRegister xmm_0, XMMRegister xmm_1 = xnoreg);174private:175void reduceF(int opcode, int vlen, XMMRegister dst, XMMRegister src, XMMRegister vtmp1, XMMRegister vtmp2);176void reduceD(int opcode, int vlen, XMMRegister dst, XMMRegister src, XMMRegister vtmp1, XMMRegister vtmp2);177178// Int Reduction179void reduce2I (int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);180void reduce4I (int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);181void reduce8I (int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);182void reduce16I(int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);183184// Byte Reduction185void reduce8B (int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);186void reduce16B(int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);187void reduce32B(int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);188void reduce64B(int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);189void mulreduce8B (int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);190void mulreduce16B(int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);191void mulreduce32B(int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);192void mulreduce64B(int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);193194// Short Reduction195void reduce4S (int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);196void reduce8S (int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);197void reduce16S(int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);198void reduce32S(int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);199200// Long Reduction201#ifdef _LP64202void reduce2L(int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);203void reduce4L(int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);204void reduce8L(int opcode, Register dst, Register src1, XMMRegister src2, XMMRegister vtmp1, XMMRegister vtmp2);205#endif // _LP64206207// Float Reduction208void reduce2F (int opcode, XMMRegister dst, XMMRegister src, XMMRegister vtmp);209void reduce4F (int opcode, XMMRegister dst, XMMRegister src, XMMRegister vtmp);210void reduce8F (int opcode, XMMRegister dst, XMMRegister src, XMMRegister vtmp1, XMMRegister vtmp2);211void reduce16F(int opcode, XMMRegister dst, XMMRegister src, XMMRegister vtmp1, XMMRegister vtmp2);212213// Double Reduction214void reduce2D(int opcode, XMMRegister dst, XMMRegister src, XMMRegister vtmp);215void reduce4D(int opcode, XMMRegister dst, XMMRegister src, XMMRegister vtmp1, XMMRegister vtmp2);216void reduce8D(int opcode, XMMRegister dst, XMMRegister src, XMMRegister vtmp1, XMMRegister vtmp2);217218// Base reduction instruction219void reduce_operation_128(BasicType typ, int opcode, XMMRegister dst, XMMRegister src);220void reduce_operation_256(BasicType typ, int opcode, XMMRegister dst, XMMRegister src1, XMMRegister src2);221222public:223#ifdef _LP64224void vector_mask_operation(int opc, Register dst, XMMRegister mask, XMMRegister xtmp, Register tmp,225KRegister ktmp, int masklen, int vec_enc);226227void vector_mask_operation(int opc, Register dst, XMMRegister mask, XMMRegister xtmp, XMMRegister xtmp1,228Register tmp, int masklen, int vec_enc);229#endif230void string_indexof_char(Register str1, Register cnt1, Register ch, Register result,231XMMRegister vec1, XMMRegister vec2, XMMRegister vec3, Register tmp);232233void stringL_indexof_char(Register str1, Register cnt1, Register ch, Register result,234XMMRegister vec1, XMMRegister vec2, XMMRegister vec3, Register tmp);235236// IndexOf strings.237// Small strings are loaded through stack if they cross page boundary.238void string_indexof(Register str1, Register str2,239Register cnt1, Register cnt2,240int int_cnt2, Register result,241XMMRegister vec, Register tmp,242int ae);243244// IndexOf for constant substrings with size >= 8 elements245// which don't need to be loaded through stack.246void string_indexofC8(Register str1, Register str2,247Register cnt1, Register cnt2,248int int_cnt2, Register result,249XMMRegister vec, Register tmp,250int ae);251252// Smallest code: we don't need to load through stack,253// check string tail.254255// helper function for string_compare256void load_next_elements(Register elem1, Register elem2, Register str1, Register str2,257Address::ScaleFactor scale, Address::ScaleFactor scale1,258Address::ScaleFactor scale2, Register index, int ae);259// Compare strings.260void string_compare(Register str1, Register str2,261Register cnt1, Register cnt2, Register result,262XMMRegister vec1, int ae, KRegister mask = knoreg);263264// Search for Non-ASCII character (Negative byte value) in a byte array,265// return true if it has any and false otherwise.266void has_negatives(Register ary1, Register len,267Register result, Register tmp1,268XMMRegister vec1, XMMRegister vec2, KRegister mask1 = knoreg, KRegister mask2 = knoreg);269270// Compare char[] or byte[] arrays.271void arrays_equals(bool is_array_equ, Register ary1, Register ary2,272Register limit, Register result, Register chr,273XMMRegister vec1, XMMRegister vec2, bool is_char, KRegister mask = knoreg);274275#endif // CPU_X86_C2_MACROASSEMBLER_X86_HPP276277278