/* * Copyright(c) 2019-2021 Qualcomm Innovation Center, Inc. All Rights Reserved. * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, see . */ /* * S-type Instructions */ /**********************************************/ /* SHIFTS */ /**********************************************/ /* NOTE: Rdd = Rs *right* shifts don't make sense */ /* NOTE: Rd[d] = Rs[s] *right* shifts with saturation don't make sense */ #define RSHIFTTYPES(TAGEND,REGD,REGS,REGSTYPE,ACC,ACCSRC,SAT,SATOPT,ATTRS) \ Q6INSN(S2_asr_r_##TAGEND,#REGD "32" #ACC "=asr(" #REGS "32,Rt32)" #SATOPT,ATTRIBS(ATTRS), \ "Arithmetic Shift Right by Register", \ { \ fHIDE(size4s_t) shamt=fSXTN(7,32,RtV);\ REGD##V = SAT(ACCSRC ACC fBIDIR_ASHIFTR(REGS##V,shamt,REGSTYPE)); \ })\ \ Q6INSN(S2_asl_r_##TAGEND,#REGD "32" #ACC "=asl(" #REGS "32,Rt32)" #SATOPT,ATTRIBS(ATTRS), \ "Arithmetic Shift Left by Register", \ { \ fHIDE(size4s_t) shamt=fSXTN(7,32,RtV);\ REGD##V = SAT(ACCSRC ACC fBIDIR_ASHIFTL(REGS##V,shamt,REGSTYPE)); \ })\ \ Q6INSN(S2_lsr_r_##TAGEND,#REGD "32" #ACC "=lsr(" #REGS "32,Rt32)" #SATOPT,ATTRIBS(ATTRS), \ "Logical Shift Right by Register", \ { \ fHIDE(size4s_t) shamt=fSXTN(7,32,RtV);\ REGD##V = SAT(ACCSRC ACC fBIDIR_LSHIFTR(REGS##V,shamt,REGSTYPE)); \ })\ \ Q6INSN(S2_lsl_r_##TAGEND,#REGD "32" #ACC "=lsl(" #REGS "32,Rt32)" #SATOPT,ATTRIBS(ATTRS), \ "Logical Shift Left by Register", \ { \ fHIDE(size4s_t) shamt=fSXTN(7,32,RtV);\ REGD##V = SAT(ACCSRC ACC fBIDIR_LSHIFTL(REGS##V,shamt,REGSTYPE)); \ }) RSHIFTTYPES(r,Rd,Rs,4_8,,,fECHO,,) RSHIFTTYPES(p,Rdd,Rss,8_8,,,fECHO,,) RSHIFTTYPES(r_acc,Rx,Rs,4_8,+,RxV,fECHO,,) RSHIFTTYPES(p_acc,Rxx,Rss,8_8,+,RxxV,fECHO,,) RSHIFTTYPES(r_nac,Rx,Rs,4_8,-,RxV,fECHO,,) RSHIFTTYPES(p_nac,Rxx,Rss,8_8,-,RxxV,fECHO,,) RSHIFTTYPES(r_and,Rx,Rs,4_8,&,RxV,fECHO,,) RSHIFTTYPES(r_or,Rx,Rs,4_8,|,RxV,fECHO,,) RSHIFTTYPES(p_and,Rxx,Rss,8_8,&,RxxV,fECHO,,) RSHIFTTYPES(p_or,Rxx,Rss,8_8,|,RxxV,fECHO,,) RSHIFTTYPES(p_xor,Rxx,Rss,8_8,^,RxxV,fECHO,,) #undef RSHIFTTYPES /* Register shift with saturation */ #define RSATSHIFTTYPES(TAGEND,REGD,REGS,REGSTYPE) \ Q6INSN(S2_asr_r_##TAGEND,#REGD "32" "=asr(" #REGS "32,Rt32):sat",ATTRIBS(), \ "Arithmetic Shift Right by Register", \ { \ fHIDE(size4s_t) shamt=fSXTN(7,32,RtV);\ REGD##V = fBIDIR_ASHIFTR_SAT(REGS##V,shamt,REGSTYPE); \ })\ \ Q6INSN(S2_asl_r_##TAGEND,#REGD "32" "=asl(" #REGS "32,Rt32):sat",ATTRIBS(), \ "Arithmetic Shift Left by Register", \ { \ fHIDE(size4s_t) shamt=fSXTN(7,32,RtV);\ REGD##V = fBIDIR_ASHIFTL_SAT(REGS##V,shamt,REGSTYPE); \ }) RSATSHIFTTYPES(r_sat,Rd,Rs,4_8) #define ISHIFTTYPES(TAGEND,SIZE,REGD,REGS,REGSTYPE,ACC,ACCSRC,SAT,SATOPT,ATTRS) \ Q6INSN(S2_asr_i_##TAGEND,#REGD "32" #ACC "=asr(" #REGS "32,#u" #SIZE ")" #SATOPT,ATTRIBS(ATTRS), \ "Arithmetic Shift Right by Immediate", \ { REGD##V = SAT(ACCSRC ACC fASHIFTR(REGS##V,uiV,REGSTYPE)); }) \ \ Q6INSN(S2_lsr_i_##TAGEND,#REGD "32" #ACC "=lsr(" #REGS "32,#u" #SIZE ")" #SATOPT,ATTRIBS(ATTRS), \ "Logical Shift Right by Immediate", \ { REGD##V = SAT(ACCSRC ACC fLSHIFTR(REGS##V,uiV,REGSTYPE)); }) \ \ Q6INSN(S2_asl_i_##TAGEND,#REGD "32" #ACC "=asl(" #REGS "32,#u" #SIZE ")" #SATOPT,ATTRIBS(ATTRS), \ "Shift Left by Immediate", \ { REGD##V = SAT(ACCSRC ACC fASHIFTL(REGS##V,uiV,REGSTYPE)); }) \ Q6INSN(S6_rol_i_##TAGEND,#REGD "32" #ACC "=rol(" #REGS "32,#u" #SIZE ")" #SATOPT,ATTRIBS(ATTRS), \ "Rotate Left by Immediate", \ { REGD##V = SAT(ACCSRC ACC fROTL(REGS##V,uiV,REGSTYPE)); }) #define ISHIFTTYPES_ONLY_ASL(TAGEND,SIZE,REGD,REGS,REGSTYPE,ACC,ACCSRC,SAT,SATOPT) \ Q6INSN(S2_asl_i_##TAGEND,#REGD "32" #ACC "=asl(" #REGS "32,#u" #SIZE ")" #SATOPT,ATTRIBS(), \ "", \ { REGD##V = SAT(ACCSRC ACC fASHIFTL(REGS##V,uiV,REGSTYPE)); }) #define ISHIFTTYPES_ONLY_ASR(TAGEND,SIZE,REGD,REGS,REGSTYPE,ACC,ACCSRC,SAT,SATOPT) \ Q6INSN(S2_asr_i_##TAGEND,#REGD "32" #ACC "=asr(" #REGS "32,#u" #SIZE ")" #SATOPT,ATTRIBS(), \ "", \ { REGD##V = SAT(ACCSRC ACC fASHIFTR(REGS##V,uiV,REGSTYPE)); }) #define ISHIFTTYPES_NOASR(TAGEND,SIZE,REGD,REGS,REGSTYPE,ACC,ACCSRC,SAT,SATOPT) \ Q6INSN(S2_lsr_i_##TAGEND,#REGD "32" #ACC "=lsr(" #REGS "32,#u" #SIZE ")" #SATOPT,ATTRIBS(), \ "Logical Shift Right by Register", \ { REGD##V = SAT(ACCSRC ACC fLSHIFTR(REGS##V,uiV,REGSTYPE)); }) \ Q6INSN(S2_asl_i_##TAGEND,#REGD "32" #ACC "=asl(" #REGS "32,#u" #SIZE ")" #SATOPT,ATTRIBS(), \ "Shift Left by Register", \ { REGD##V = SAT(ACCSRC ACC fASHIFTL(REGS##V,uiV,REGSTYPE)); }) \ Q6INSN(S6_rol_i_##TAGEND,#REGD "32" #ACC "=rol(" #REGS "32,#u" #SIZE ")" #SATOPT,ATTRIBS(), \ "Rotate Left by Immediate", \ { REGD##V = SAT(ACCSRC ACC fROTL(REGS##V,uiV,REGSTYPE)); }) ISHIFTTYPES(r,5,Rd,Rs,4_4,,,fECHO,,) ISHIFTTYPES(p,6,Rdd,Rss,8_8,,,fECHO,,) ISHIFTTYPES(r_acc,5,Rx,Rs,4_4,+,RxV,fECHO,,) ISHIFTTYPES(p_acc,6,Rxx,Rss,8_8,+,RxxV,fECHO,,) ISHIFTTYPES(r_nac,5,Rx,Rs,4_4,-,RxV,fECHO,,) ISHIFTTYPES(p_nac,6,Rxx,Rss,8_8,-,RxxV,fECHO,,) ISHIFTTYPES_NOASR(r_xacc,5,Rx,Rs,4_4,^, RxV,fECHO,) ISHIFTTYPES_NOASR(p_xacc,6,Rxx,Rss,8_8,^, RxxV,fECHO,) ISHIFTTYPES(r_and,5,Rx,Rs,4_4,&,RxV,fECHO,,) ISHIFTTYPES(r_or,5,Rx,Rs,4_4,|,RxV,fECHO,,) ISHIFTTYPES(p_and,6,Rxx,Rss,8_8,&,RxxV,fECHO,,) ISHIFTTYPES(p_or,6,Rxx,Rss,8_8,|,RxxV,fECHO,,) ISHIFTTYPES_ONLY_ASL(r_sat,5,Rd,Rs,4_8,,,fSAT,:sat) Q6INSN(S2_asr_i_r_rnd,"Rd32=asr(Rs32,#u5):rnd",ATTRIBS(), "Shift right with round", { RdV = fASHIFTR(((fASHIFTR(RsV,uiV,4_8))+1),1,8_8); }) Q6INSN(S2_asr_i_p_rnd,"Rdd32=asr(Rss32,#u6):rnd",ATTRIBS(), "Shift right with round", { fHIDE(size8u_t tmp;) fHIDE(size8u_t rnd;) tmp = fASHIFTR(RssV,uiV,8_8); rnd = tmp & 1; RddV = fASHIFTR(tmp,1,8_8) + rnd; }) Q6INSN(S4_lsli,"Rd32=lsl(#s6,Rt32)",ATTRIBS(), "Shift an immediate left by register amount", { fHIDE(size4s_t) shamt = fSXTN(7,32,RtV); RdV = fBIDIR_LSHIFTL(siV,shamt,4_8); }) Q6INSN(S2_addasl_rrri,"Rd32=addasl(Rt32,Rs32,#u3)",ATTRIBS(), "Shift left by small amount and add", { RdV = RtV + fASHIFTL(RsV,uiV,4_4); }) #define SHIFTOPI(TAGEND,INNEROP,INNERSEM)\ Q6INSN(S4_andi_##TAGEND,"Rx32=and(#u8,"INNEROP")",,"Shift-op",{RxV=fIMMEXT(uiV)&INNERSEM;})\ Q6INSN(S4_ori_##TAGEND, "Rx32=or(#u8,"INNEROP")",,"Shift-op",{RxV=fIMMEXT(uiV)|INNERSEM;})\ Q6INSN(S4_addi_##TAGEND,"Rx32=add(#u8,"INNEROP")",,"Shift-op",{RxV=fIMMEXT(uiV)+INNERSEM;})\ Q6INSN(S4_subi_##TAGEND,"Rx32=sub(#u8,"INNEROP")",,"Shift-op",{RxV=fIMMEXT(uiV)-INNERSEM;}) SHIFTOPI(asl_ri,"asl(Rx32,#U5)",(RxV<>UiV)) /**********************************************/ /* PERMUTES */ /**********************************************/ Q6INSN(S2_valignib,"Rdd32=valignb(Rtt32,Rss32,#u3)", ATTRIBS(), "Vector align bytes", { RddV = (fLSHIFTR(RssV,uiV*8,8_8))|(fASHIFTL(RttV,((8-uiV)*8),8_8)); }) Q6INSN(S2_valignrb,"Rdd32=valignb(Rtt32,Rss32,Pu4)", ATTRIBS(), "Align with register", { RddV = fLSHIFTR(RssV,(PuV&0x7)*8,8_8)|(fASHIFTL(RttV,(8-(PuV&0x7))*8,8_8));}) Q6INSN(S2_vspliceib,"Rdd32=vspliceb(Rss32,Rtt32,#u3)", ATTRIBS(), "Vector splice bytes", { RddV = fASHIFTL(RttV,uiV*8,8_8) | fZXTN(uiV*8,64,RssV); }) Q6INSN(S2_vsplicerb,"Rdd32=vspliceb(Rss32,Rtt32,Pu4)", ATTRIBS(), "Splice with register", { RddV = fASHIFTL(RttV,(PuV&7)*8,8_8) | fZXTN((PuV&7)*8,64,RssV); }) Q6INSN(S2_vsplatrh,"Rdd32=vsplath(Rs32)", ATTRIBS(), "Vector splat halfwords from register", { fHIDE(int i;) for (i=0;i<4;i++) { fSETHALF(i,RddV, fGETHALF(0,RsV)); } }) Q6INSN(S2_vsplatrb,"Rd32=vsplatb(Rs32)", ATTRIBS(), "Vector splat bytes from register", { fHIDE(int i;) for (i=0;i<4;i++) { fSETBYTE(i,RdV, fGETBYTE(0,RsV)); } }) Q6INSN(S6_vsplatrbp,"Rdd32=vsplatb(Rs32)", ATTRIBS(), "Vector splat bytes from register", { fHIDE(int i;) for (i=0;i<8;i++) { fSETBYTE(i,RddV, fGETBYTE(0,RsV)); } }) /**********************************************/ /* Insert/Extract[u] */ /**********************************************/ Q6INSN(S2_insert,"Rx32=insert(Rs32,#u5,#U5)", ATTRIBS(), "Insert bits", { fHIDE(int) width=uiV; fHIDE(int) offset=UiV; /* clear bits in Rxx where new bits go */ RxV &= ~(((fCONSTLL(1)<>uiV)); fSETWORD(0,RddV,fZXTN(uiV,32,RsV)); }) Q6INSN(A4_bitsplit,"Rdd32=bitsplit(Rs32,Rt32)", ATTRIBS(), "Split a bitfield into two registers", { fHIDE(size4u_t) shamt = fZXTN(5,32,RtV); fSETWORD(1,RddV,(fCAST4_4u(RsV)>>shamt)); fSETWORD(0,RddV,fZXTN(shamt,32,RsV)); }) Q6INSN(S4_extract,"Rd32=extract(Rs32,#u5,#U5)", ATTRIBS(), "Extract signed bitfield", { fHIDE(int) width=uiV; fHIDE(int) offset=UiV; RdV = fSXTN(width,32,(fCAST4_4u(RsV) >> offset)); }) Q6INSN(S2_extractu,"Rd32=extractu(Rs32,#u5,#U5)", ATTRIBS(), "Extract unsigned bitfield", { fHIDE(int) width=uiV; fHIDE(int) offset=UiV; RdV = fZXTN(width,32,(fCAST4_4u(RsV) >> offset)); }) Q6INSN(S2_insertp,"Rxx32=insert(Rss32,#u6,#U6)", ATTRIBS(), "Insert bits", { fHIDE(int) width=uiV; fHIDE(int) offset=UiV; /* clear bits in Rxx where new bits go */ RxxV &= ~(((fCONSTLL(1)<> offset)); }) Q6INSN(S2_extractup,"Rdd32=extractu(Rss32,#u6,#U6)", ATTRIBS(), "Extract unsigned bitfield", { fHIDE(int) width=uiV; fHIDE(int) offset=UiV; RddV = fZXTN(width,64,(fCAST8_8u(RssV) >> offset)); }) Q6INSN(S2_mask,"Rd32=mask(#u5,#U5)", ATTRIBS(), "Form mask from immediate", { RdV = ((1<>uiV)); } }) Q6INSN(S2_lsr_i_vh,"Rdd32=vlsrh(Rss32,#u4)",ATTRIBS(), "Vector Logical Shift Right by Immediate", { fHIDE(int i;) for (i=0;i<4;i++) { fSETHALF(i,RddV, (fGETUHALF(i,RssV)>>uiV)); } }) Q6INSN(S2_asl_i_vh,"Rdd32=vaslh(Rss32,#u4)",ATTRIBS(), "Vector Arithmetic Shift Left by Immediate", { fHIDE(int i;) for (i=0;i<4;i++) { fSETHALF(i,RddV, (fGETHALF(i,RssV)<> uiV )+1)>>1 )); } }) Q6INSN(S5_asrhub_sat,"Rd32=vasrhub(Rss32,#u4):sat",, "Vector Arithmetic Shift Right by Immediate with Saturate and Pack", { fHIDE(int i;) for (i=0;i<4;i++) { fSETBYTE(i,RdV, fSATUB( fGETHALF(i,RssV) >> uiV )); } }) Q6INSN(S5_vasrhrnd,"Rdd32=vasrh(Rss32,#u4):raw",, "Vector Arithmetic Shift Right by Immediate with Round", { fHIDE(int i;) for (i=0;i<4;i++) { fSETHALF(i,RddV, ( ((fGETHALF(i,RssV) >> uiV)+1)>>1 )); } }) Q6INSN(S2_asl_r_vh,"Rdd32=vaslh(Rss32,Rt32)",ATTRIBS(), "Vector Arithmetic Shift Left by Register", { fHIDE(int i;) for (i=0;i<4;i++) { fSETHALF(i,RddV, fBIDIR_ASHIFTL(fGETHALF(i,RssV),fSXTN(7,32,RtV),2_8)); } }) Q6INSN(S2_lsr_r_vh,"Rdd32=vlsrh(Rss32,Rt32)",ATTRIBS(), "Vector Logical Shift Right by Register", { fHIDE(int i;) for (i=0;i<4;i++) { fSETHALF(i,RddV, fBIDIR_LSHIFTR(fGETUHALF(i,RssV),fSXTN(7,32,RtV),2_8)); } }) Q6INSN(S2_lsl_r_vh,"Rdd32=vlslh(Rss32,Rt32)",ATTRIBS(), "Vector Logical Shift Left by Register", { fHIDE(int i;) for (i=0;i<4;i++) { fSETHALF(i,RddV, fBIDIR_LSHIFTL(fGETUHALF(i,RssV),fSXTN(7,32,RtV),2_8)); } }) /* Word Vector Immediate Shifts */ Q6INSN(S2_asr_i_vw,"Rdd32=vasrw(Rss32,#u5)",ATTRIBS(), "Vector Arithmetic Shift Right by Immediate", { fHIDE(int i;) for (i=0;i<2;i++) { fSETWORD(i,RddV,(fGETWORD(i,RssV)>>uiV)); } }) Q6INSN(S2_asr_i_svw_trun,"Rd32=vasrw(Rss32,#u5)",ATTRIBS(A_ARCHV2), "Vector Arithmetic Shift Right by Immediate with Truncate and Pack", { fHIDE(int i;) for (i=0;i<2;i++) { fSETHALF(i,RdV,fGETHALF(0,(fGETWORD(i,RssV)>>uiV))); } }) Q6INSN(S2_asr_r_svw_trun,"Rd32=vasrw(Rss32,Rt32)",ATTRIBS(A_ARCHV2), "Vector Arithmetic Shift Right truncate and Pack", { fHIDE(int i;) for (i=0;i<2;i++) { fSETHALF(i,RdV,fGETHALF(0,fBIDIR_ASHIFTR(fGETWORD(i,RssV),fSXTN(7,32,RtV),4_8))); } }) Q6INSN(S2_lsr_i_vw,"Rdd32=vlsrw(Rss32,#u5)",ATTRIBS(), "Vector Logical Shift Right by Immediate", { fHIDE(int i;) for (i=0;i<2;i++) { fSETWORD(i,RddV,(fGETUWORD(i,RssV)>>uiV)); } }) Q6INSN(S2_asl_i_vw,"Rdd32=vaslw(Rss32,#u5)",ATTRIBS(), "Vector Arithmetic Shift Left by Immediate", { fHIDE(int i;) for (i=0;i<2;i++) { fSETWORD(i,RddV,(fGETWORD(i,RssV)<> 1) | (fCAST8u((1&fCOUNTONES_8(RssV & RttV)))<<63) ; }) Q6INSN(S2_clbnorm,"Rd32=normamt(Rs32)",ATTRIBS(A_ARCHV2), "Count leading sign bits - 1", { if (RsV == 0) { RdV = 0; } else { RdV = (fMAX(fCL1_4(RsV),fCL1_4(~RsV)))-1;} }) Q6INSN(S4_clbaddi,"Rd32=add(clb(Rs32),#s6)",ATTRIBS(A_ARCHV2), "Count leading sign bits then add signed number", { RdV = (fMAX(fCL1_4(RsV),fCL1_4(~RsV)))+siV;} ) Q6INSN(S4_clbpnorm,"Rd32=normamt(Rss32)",ATTRIBS(A_ARCHV2), "Count leading sign bits - 1", { if (RssV == 0) { RdV = 0; } else { RdV = (fMAX(fCL1_8(RssV),fCL1_8(~RssV)))-1;}}) Q6INSN(S4_clbpaddi,"Rd32=add(clb(Rss32),#s6)",ATTRIBS(A_ARCHV2), "Count leading sign bits then add signed number", { RdV = (fMAX(fCL1_8(RssV),fCL1_8(~RssV)))+siV;}) Q6INSN(S2_clb,"Rd32=clb(Rs32)",ATTRIBS(), "Count leading bits", {RdV = fMAX(fCL1_4(RsV),fCL1_4(~RsV));}) Q6INSN(S2_cl0,"Rd32=cl0(Rs32)",ATTRIBS(), "Count leading bits", {RdV = fCL1_4(~RsV);}) Q6INSN(S2_cl1,"Rd32=cl1(Rs32)",ATTRIBS(), "Count leading bits", {RdV = fCL1_4(RsV);}) Q6INSN(S2_clbp,"Rd32=clb(Rss32)",ATTRIBS(), "Count leading bits", {RdV = fMAX(fCL1_8(RssV),fCL1_8(~RssV));}) Q6INSN(S2_cl0p,"Rd32=cl0(Rss32)",ATTRIBS(), "Count leading bits", {RdV = fCL1_8(~RssV);}) Q6INSN(S2_cl1p,"Rd32=cl1(Rss32)",ATTRIBS(), "Count leading bits", {RdV = fCL1_8(RssV);}) Q6INSN(S2_brev, "Rd32=brev(Rs32)", ATTRIBS(A_ARCHV2), "Bit Reverse",{RdV = fBREV_4(RsV);}) Q6INSN(S2_brevp,"Rdd32=brev(Rss32)", ATTRIBS(), "Bit Reverse",{RddV = fBREV_8(RssV);}) Q6INSN(S2_ct0, "Rd32=ct0(Rs32)", ATTRIBS(A_ARCHV2), "Count Trailing",{RdV = fCL1_4(~fBREV_4(RsV));}) Q6INSN(S2_ct1, "Rd32=ct1(Rs32)", ATTRIBS(A_ARCHV2), "Count Trailing",{RdV = fCL1_4(fBREV_4(RsV));}) Q6INSN(S2_ct0p, "Rd32=ct0(Rss32)", ATTRIBS(), "Count Trailing",{RdV = fCL1_8(~fBREV_8(RssV));}) Q6INSN(S2_ct1p, "Rd32=ct1(Rss32)", ATTRIBS(), "Count Trailing",{RdV = fCL1_8(fBREV_8(RssV));}) Q6INSN(S2_interleave,"Rdd32=interleave(Rss32)",ATTRIBS(A_ARCHV2),"Interleave bits", {RddV = fINTERLEAVE(fGETWORD(1,RssV),fGETWORD(0,RssV));}) Q6INSN(S2_deinterleave,"Rdd32=deinterleave(Rss32)",ATTRIBS(A_ARCHV2),"Interleave bits", {RddV = fDEINTERLEAVE(RssV);})