/* ------------------------------------------------------------------------- */ int test_sign16s_func(void) { INT16 ALIGN(src[65535]), ALIGN(d1[65535]); #ifdef WITH_SSE2 INT16 ALIGN(d2[65535]); int i; #endif int failed = 0; char testStr[256]; /* Test when we can reach 16-byte alignment */ testStr[0] = '\0'; get_random_data(src, sizeof(src)); general_sign_16s(src+1, d1+1, 65535); #ifdef WITH_SSE2 if (IsProcessorFeaturePresentEx(PF_EX_SSSE3)) { strcat(testStr, " SSSE3"); ssse3_sign_16s(src+1, d2+1, 65535); for (i=1; i<65535; ++i) { if (d1[i] != d2[i]) { printf("SIGN16s-SSE-aligned FAIL[%d] of %d: want %d, got %d\n", i, src[i], d1[i], d2[i]); ++failed; } } } #endif /* i386 */ /* Test when we cannot reach 16-byte alignment */ get_random_data(src, sizeof(src)); general_sign_16s(src+1, d1+2, 65535); #ifdef WITH_SSE2 if (IsProcessorFeaturePresentEx(PF_EX_SSSE3)) { ssse3_sign_16s(src+1, d2+2, 65535); for (i=2; i<65535; ++i) { if (d1[i] != d2[i]) { printf("SIGN16s-SSE-unaligned FAIL[%d] of %d: want %d, got %d\n", i, src[i-1], d1[i], d2[i]); ++failed; } } } #endif /* i386 */ if (!failed) printf("All sign16s tests passed (%s).\n", testStr); return (failed > 0) ? FAILURE : SUCCESS; }
/* ------------------------------------------------------------------------- */ int test_sign16s_func(void) { INT16 ALIGN(src[65535]), ALIGN(d1[65535]), ALIGN(d2[65535]); int failed = 0; int i; UINT32 pflags = primitives_get_flags(primitives_get()); char testStr[256]; /* Test when we can reach 16-byte alignment */ testStr[0] = '\0'; get_random_data(src, sizeof(src)); general_sign_16s(src+1, d1+1, 65535); #ifdef _M_IX86_AMD64 if (pflags & PRIM_X86_SSSE3_AVAILABLE) { strcat(testStr, " SSSE3"); ssse3_sign_16s(src+1, d2+1, 65535); for (i=1; i<65535; ++i) { if (d1[i] != d2[i]) { printf("SIGN16s-SSE-aligned FAIL[%d] of %d: want %d, got %d\n", i, src[i], d1[i], d2[i]); ++failed; } } } #endif /* i386 */ /* Test when we cannot reach 16-byte alignment */ get_random_data(src, sizeof(src)); general_sign_16s(src+1, d1+2, 65535); #ifdef _M_IX86_AMD64 if (pflags & PRIM_X86_SSSE3_AVAILABLE) { ssse3_sign_16s(src+1, d2+2, 65535); for (i=2; i<65535; ++i) { if (d1[i] != d2[i]) { printf("SIGN16s-SSE-unaligned FAIL[%d] of %d: want %d, got %d\n", i, src[i-1], d1[i], d2[i]); ++failed; } } } #endif /* i386 */ if (!failed) printf("All sign16s tests passed (%s).\n", testStr); return (failed > 0) ? FAILURE : SUCCESS; }
if (d1[i] != d2[i]) { printf("SIGN16s-SSE-unaligned FAIL[%d] of %d: want %d, got %d\n", i, src[i-1], d1[i], d2[i]); ++failed; } } } #endif /* i386 */ if (!failed) printf("All sign16s tests passed (%s).\n", testStr); return (failed > 0) ? FAILURE : SUCCESS; } /* ------------------------------------------------------------------------- */ STD_SPEED_TEST(sign16s_speed_test, INT16, INT16, dst=dst, TRUE, general_sign_16s(src1, dst, size), TRUE, ssse3_sign_16s(src1, dst, size), PRIM_X86_SSSE3_AVAILABLE, FALSE, dst=dst, 0, FALSE, dst=dst); int test_sign16s_speed(void) { INT16 ALIGN(src[MAX_TEST_SIZE+3]), ALIGN(dst[MAX_TEST_SIZE+3]); get_random_data(src, sizeof(src)); sign16s_speed_test("sign16s", "aligned", src, NULL, 0, dst, test_sizes, NUM_TEST_SIZES, SIGN_PRETEST_ITERATIONS, TEST_TIME); sign16s_speed_test("sign16s", "unaligned", src+1, NULL, 0, dst, test_sizes, NUM_TEST_SIZES, SIGN_PRETEST_ITERATIONS, TEST_TIME); return SUCCESS; }
printf("SIGN16s-SSE-unaligned FAIL[%d] of %d: want %d, got %d\n", i, src[i-1], d1[i], d2[i]); ++failed; } } } #endif /* i386 */ if (!failed) printf("All sign16s tests passed (%s).\n", testStr); return (failed > 0) ? FAILURE : SUCCESS; } /* ------------------------------------------------------------------------- */ STD_SPEED_TEST(sign16s_speed_test, INT16, INT16, dst=dst, TRUE, general_sign_16s(src1, dst, size), #ifdef WITH_SSE2 TRUE, ssse3_sign_16s(src1, dst, size), PF_EX_SSSE3, TRUE, #else FALSE, PRIM_NOP, 0, FALSE, #endif FALSE, dst=dst); int test_sign16s_speed(void) { INT16 ALIGN(src[MAX_TEST_SIZE+3]), ALIGN(dst[MAX_TEST_SIZE+3]); get_random_data(src, sizeof(src)); sign16s_speed_test("sign16s", "aligned", src, NULL, 0, dst, test_sizes, NUM_TEST_SIZES, SIGN_PRETEST_ITERATIONS, TEST_TIME); sign16s_speed_test("sign16s", "unaligned", src+1, NULL, 0, dst, test_sizes, NUM_TEST_SIZES, SIGN_PRETEST_ITERATIONS, TEST_TIME); return SUCCESS; }