Changeset 103850 in vbox
- Timestamp:
- Mar 14, 2024 12:38:51 PM (13 months ago)
- svn:sync-xref-src-repo-rev:
- 162221
- Location:
- trunk/src/VBox/VMM
- Files:
-
- 3 edited
Legend:
- Unmodified
- Added
- Removed
-
trunk/src/VBox/VMM/VMMAll/IEMAllInstPython.py
r103849 r103850 2962 2962 'IEM_MC_BROADCAST_XREG_U32_ZX_VLMAX': (McBlock.parseMcGeneric, True, True, g_fNativeSimd), 2963 2963 'IEM_MC_BROADCAST_XREG_U64_ZX_VLMAX': (McBlock.parseMcGeneric, True, True, g_fNativeSimd), 2964 'IEM_MC_BROADCAST_XREG_U8_ZX_VLMAX': (McBlock.parseMcGeneric, True, True, False,),2964 'IEM_MC_BROADCAST_XREG_U8_ZX_VLMAX': (McBlock.parseMcGeneric, True, True, g_fNativeSimd), 2965 2965 'IEM_MC_BROADCAST_YREG_U128_ZX_VLMAX': (McBlock.parseMcGeneric, True, True, False, ), 2966 2966 'IEM_MC_BROADCAST_YREG_U16_ZX_VLMAX': (McBlock.parseMcGeneric, True, True, False, ), -
trunk/src/VBox/VMM/VMMAll/IEMAllN8veRecompFuncs.h
r103849 r103850 7077 7077 7078 7078 7079 #define IEM_MC_BROADCAST_XREG_U8_ZX_VLMAX(a_iXRegDst, a_u8Src) \ 7080 off = iemNativeEmitSimdBroadcastXregU8ZxVlmax(pReNative, off, a_iXRegDst, a_u8Src) 7081 7082 /** Emits code for IEM_MC_BROADCAST_XREG_U8_ZX_VLMAX. */ 7083 DECL_INLINE_THROW(uint32_t) 7084 iemNativeEmitSimdBroadcastXregU8ZxVlmax(PIEMRECOMPILERSTATE pReNative, uint32_t off, uint8_t iXReg, uint8_t idxSrcVar) 7085 { 7086 IEMNATIVE_ASSERT_VAR_IDX(pReNative, idxSrcVar); 7087 IEMNATIVE_ASSERT_VAR_SIZE(pReNative, idxSrcVar, sizeof(uint8_t)); 7088 7089 uint8_t const idxSimdRegDst = iemNativeSimdRegAllocTmpForGuestSimdReg(pReNative, &off, IEMNATIVEGSTSIMDREG_SIMD(iXReg), 7090 kIemNativeGstSimdRegLdStSz_256, kIemNativeGstRegUse_ForFullWrite); 7091 7092 uint8_t const idxVarReg = iemNativeVarRegisterAcquire(pReNative, idxSrcVar, &off); 7093 7094 off = iemNativeEmitSimdBroadcastGprToVecRegU8(pReNative, off, idxSimdRegDst, idxVarReg, false /*f256Bit*/); 7095 off = iemNativeEmitSimdZeroVecRegHighU128(pReNative, off, idxSimdRegDst); 7096 IEMNATIVE_SIMD_REG_STATE_SET_DIRTY_LO_U128(pReNative, iXReg); 7097 IEMNATIVE_SIMD_REG_STATE_SET_DIRTY_HI_U128(pReNative, iXReg); 7098 7099 iemNativeSimdRegFreeTmp(pReNative, idxSimdRegDst); 7100 iemNativeVarRegisterRelease(pReNative, idxSrcVar); 7101 7102 return off; 7103 } 7104 7105 7079 7106 #define IEM_MC_BROADCAST_XREG_U16_ZX_VLMAX(a_iXRegDst, a_u16Src) \ 7080 7107 off = iemNativeEmitSimdBroadcastXregU16ZxVlmax(pReNative, off, a_iXRegDst, a_u16Src) -
trunk/src/VBox/VMM/include/IEMN8veRecompilerEmit.h
r103849 r103850 7907 7907 7908 7908 /** 7909 * Emits a vecdst = gprsrc broadcast, 8-bit. 7910 */ 7911 DECL_FORCE_INLINE(uint32_t) 7912 iemNativeEmitSimdBroadcastGprToVecRegU8Ex(PIEMNATIVEINSTR pCodeBuf, uint32_t off, uint8_t iVecRegDst, uint8_t iGprSrc, bool f256Bit = false) 7913 { 7914 #ifdef RT_ARCH_AMD64 7915 /* pinsrb vecdst, gpr, #0 (ASSUMES SSE 4.1) */ 7916 pCodeBuf[off++] = X86_OP_PRF_SIZE_OP; 7917 if (iVecRegDst >= 8 || iGprSrc >= 8) 7918 pCodeBuf[off++] = (iVecRegDst < 8 ? 0 : X86_OP_REX_R) 7919 | (iGprSrc < 8 ? 0 : X86_OP_REX_B); 7920 pCodeBuf[off++] = 0x0f; 7921 pCodeBuf[off++] = 0x3a; 7922 pCodeBuf[off++] = 0x20; 7923 pCodeBuf[off++] = X86_MODRM_MAKE(X86_MOD_REG, iVecRegDst & 7, iGprSrc & 7); 7924 pCodeBuf[off++] = 0x00; 7925 7926 /* vpbroadcastb {y,x}mm, xmm (ASSUMES AVX2). */ 7927 pCodeBuf[off++] = X86_OP_VEX3; 7928 pCodeBuf[off++] = X86_OP_VEX3_BYTE1_X 7929 | 0x02 /* opcode map. */ 7930 | ( iVecRegDst >= 8 7931 ? 0 7932 : X86_OP_VEX3_BYTE1_B | X86_OP_VEX3_BYTE1_R); 7933 pCodeBuf[off++] = X86_OP_VEX3_BYTE2_MAKE_NO_VVVV(false, f256Bit, X86_OP_VEX3_BYTE2_P_066H); 7934 pCodeBuf[off++] = 0x78; 7935 pCodeBuf[off++] = X86_MODRM_MAKE(X86_MOD_REG, iVecRegDst & 7, iVecRegDst & 7); 7936 #elif defined(RT_ARCH_ARM64) 7937 /* ASSUMES that there are two adjacent 128-bit registers available for the 256-bit value. */ 7938 Assert(!(iVecRegDst & 0x1) || !f256Bit); 7939 7940 /* dup vecsrc, gpr */ 7941 pCodeBuf[off++] = Armv8A64MkVecInstrDup(iVecRegDst, iGprSrc, kArmv8InstrUmovInsSz_U8); 7942 if (f256Bit) 7943 pCodeBuf[off++] = Armv8A64MkVecInstrDup(iVecRegDst + 1, iGprSrc, kArmv8InstrUmovInsSz_U8); 7944 #else 7945 # error "port me" 7946 #endif 7947 return off; 7948 } 7949 7950 7951 /** 7952 * Emits a vecdst[x] = gprsrc broadcast, 8-bit. 7953 */ 7954 DECL_INLINE_THROW(uint32_t) 7955 iemNativeEmitSimdBroadcastGprToVecRegU8(PIEMRECOMPILERSTATE pReNative, uint32_t off, uint8_t iVecRegDst, uint8_t iGprSrc, bool f256Bit = false) 7956 { 7957 #ifdef RT_ARCH_AMD64 7958 off = iemNativeEmitSimdBroadcastGprToVecRegU8Ex(iemNativeInstrBufEnsure(pReNative, off, 12), off, iVecRegDst, iGprSrc, f256Bit); 7959 #elif defined(RT_ARCH_ARM64) 7960 off = iemNativeEmitSimdBroadcastGprToVecRegU8Ex(iemNativeInstrBufEnsure(pReNative, off, f256Bit ? 2 : 1), off, iVecRegDst, iGprSrc, f256Bit); 7961 #else 7962 # error "port me" 7963 #endif 7964 IEMNATIVE_ASSERT_INSTR_BUF_ENSURE(pReNative, off); 7965 return off; 7966 } 7967 7968 7969 /** 7909 7970 * Emits a vecdst = gprsrc broadcast, 16-bit. 7910 7971 */
Note:
See TracChangeset
for help on using the changeset viewer.