sse4-common.h: make changes to make test_PMAXSD usable for 32bit

Modify DO_imm_r_r macro called by test_PMAXSD to use xmm7 register
when testing on 32bit.
This commit is contained in:
Alexandra Hájková
2025-11-11 04:17:36 -05:00
parent 5e584556a9
commit 83a3116dbb
3 changed files with 37 additions and 27 deletions

View File

@@ -1503,17 +1503,6 @@ void test_PMAXSB ( void )
}
}
void test_PMAXSD ( void )
{
V128 src, dst;
Int i;
for (i = 0; i < 10; i++) {
randV128(&src);
randV128(&dst);
DO_mandr_r("pmaxsd", src, dst);
}
}
void test_PMAXUD ( void )
{
V128 src, dst;

View File

@@ -159,16 +159,23 @@ static inline double mkNegNan ( void ) { return -mkPosNan(); }
/* Macros for testing XMM register to register and memory to register operations */
/* Use xmm7 for 32-bit x86, xmm11 for amd64 (xmm8-15 don't exist in 32-bit mode) */
#ifdef __x86_64__
#define XMMREG_DST "xmm11"
#else
#define XMMREG_DST "xmm7"
#endif
#define DO_imm_r_r(_opname, _imm, _src, _dst) \
{ \
V128 _tmp; \
__asm__ __volatile__( \
"movupd (%0), %%xmm2" "\n\t" \
"movupd (%1), %%xmm11" "\n\t" \
_opname " $" #_imm ", %%xmm2, %%xmm11" "\n\t" \
"movupd %%xmm11, (%2)" "\n" \
"movupd (%1), %%" XMMREG_DST "\n\t" \
_opname " $" #_imm ", %%xmm2, %%" XMMREG_DST "\n\t" \
"movupd %%" XMMREG_DST ", (%2)" "\n" \
: /*out*/ : /*in*/ "r"(&(_src)), "r"(&(_dst)), "r"(&(_tmp)) \
: "cc", "memory", "xmm2", "xmm11" \
: "cc", "memory", "xmm2", XMMREG_DST \
); \
RRArgs rra; \
memcpy(&rra.arg1, &(_src), sizeof(V128)); \
@@ -183,11 +190,11 @@ static inline double mkNegNan ( void ) { return -mkPosNan(); }
V128* _srcM = memalign16(sizeof(V128)); \
memcpy(_srcM, &(_src), sizeof(V128)); \
__asm__ __volatile__( \
"movupd (%1), %%xmm11" "\n\t" \
_opname " $" #_imm ", (%0), %%xmm11" "\n\t" \
"movupd %%xmm11, (%2)" "\n" \
"movupd (%1), %%" XMMREG_DST "\n\t" \
_opname " $" #_imm ", (%0), %%" XMMREG_DST "\n\t" \
"movupd %%" XMMREG_DST ", (%2)" "\n" \
: /*out*/ : /*in*/ "r"(_srcM), "r"(&(_dst)), "r"(&(_tmp)) \
: "cc", "memory", "xmm11" \
: "cc", "memory", XMMREG_DST \
); \
RRArgs rra; \
memcpy(&rra.arg1, &(_src), sizeof(V128)); \
@@ -206,11 +213,11 @@ static inline double mkNegNan ( void ) { return -mkPosNan(); }
V128 _tmp; \
__asm__ __volatile__( \
"movupd (%0), %%xmm2" "\n\t" \
"movupd (%1), %%xmm11" "\n\t" \
_opname " %%xmm2, %%xmm11" "\n\t" \
"movupd %%xmm11, (%2)" "\n" \
"movupd (%1), %%" XMMREG_DST "\n\t" \
_opname " %%xmm2, %%" XMMREG_DST "\n\t" \
"movupd %%" XMMREG_DST ", (%2)" "\n" \
: /*out*/ : /*in*/ "r"(&(_src)), "r"(&(_dst)), "r"(&(_tmp)) \
: "cc", "memory", "xmm2", "xmm11" \
: "cc", "memory", "xmm2", XMMREG_DST \
); \
RRArgs rra; \
memcpy(&rra.arg1, &(_src), sizeof(V128)); \
@@ -225,11 +232,11 @@ static inline double mkNegNan ( void ) { return -mkPosNan(); }
V128* _srcM = memalign16(sizeof(V128)); \
memcpy(_srcM, &(_src), sizeof(V128)); \
__asm__ __volatile__( \
"movupd (%1), %%xmm11" "\n\t" \
_opname " (%0), %%xmm11" "\n\t" \
"movupd %%xmm11, (%2)" "\n" \
"movupd (%1), %%" XMMREG_DST "\n\t" \
_opname " (%0), %%" XMMREG_DST "\n\t" \
"movupd %%" XMMREG_DST ", (%2)" "\n" \
: /*out*/ : /*in*/ "r"(_srcM), "r"(&(_dst)), "r"(&(_tmp)) \
: "cc", "memory", "xmm11" \
: "cc", "memory", XMMREG_DST \
); \
RRArgs rra; \
memcpy(&rra.arg1, &(_src), sizeof(V128)); \
@@ -243,4 +250,17 @@ static inline double mkNegNan ( void ) { return -mkPosNan(); }
DO_r_r(_opname, _src, _dst) \
DO_m_r(_opname, _src, _dst)
/* Common test functions */
static inline void test_PMAXSD ( void )
{
V128 src, dst;
Int i;
for (i = 0; i < 10; i++) {
randV128(&src);
randV128(&dst);
DO_mandr_r("pmaxsd", src, dst);
}
}
#endif /* __SSE4_COMMON_H */

View File

@@ -104,6 +104,7 @@ int main(void)
{
// ------ SSE 4.1 ------
test_PINSRD();
test_PMAXSD();
return 0;
}