comparison test/test_arith.h @ 45:7955bed1d169 default tip

*: add preliminary floating point support. No x86 intrinsics just yet, but I did add AltiVec since it's (arguably) the simplest :)
author Paper <paper@tflc.us>
date Wed, 30 Apr 2025 18:36:38 -0400
parents c6e0df09b86f
children
comparison
equal deleted inserted replaced
44:b0a3f0248ecc 45:7955bed1d169
1 #define CREATE_TEST_EX(sign, psign, csign, bits, size, op, equiv, secondsign, secondcsign) \ 1 #define CREATE_TEST_EX(type, ctype, print, bits, size, op, equiv, secondtype, secondctype) \
2 static int test_arith_v##sign##int##bits##x##size##_##op(v##sign##int##bits##x##size a, v##secondsign##int##bits##x##size b) \ 2 static int test_arith_v##type##bits##x##size##_##op(v##type##bits##x##size a, v##secondtype##bits##x##size b) \
3 { \ 3 { \
4 V##csign##INT##bits##x##size##_ALIGNED_ARRAY(orig_a); \ 4 V##ctype##bits##x##size##_ALIGNED_ARRAY(orig_a); \
5 V##secondcsign##INT##bits##x##size##_ALIGNED_ARRAY(orig_b); \ 5 V##secondctype##bits##x##size##_ALIGNED_ARRAY(orig_b); \
6 V##csign##INT##bits##x##size##_ALIGNED_ARRAY(orig_c); \ 6 V##ctype##bits##x##size##_ALIGNED_ARRAY(orig_c); \
7 \ 7 \
8 v##sign##int##bits##x##size c = v##sign##int##bits##x##size##_##op(a, b); \ 8 v##type##bits##x##size c = v##type##bits##x##size##_##op(a, b); \
9 \ 9 \
10 v##sign##int##bits##x##size##_store_aligned(a, orig_a); \ 10 v##type##bits##x##size##_store_aligned(a, orig_a); \
11 v##secondsign##int##bits##x##size##_store_aligned(b, orig_b); \ 11 v##secondtype##bits##x##size##_store_aligned(b, orig_b); \
12 v##sign##int##bits##x##size##_store_aligned(c, orig_c); \ 12 v##type##bits##x##size##_store_aligned(c, orig_c); \
13 \ 13 \
14 for (int i = 0; i < size; i++) { \ 14 for (int i = 0; i < size; i++) { \
15 if ((sign##int##bits##_t)(equiv) != orig_c[i]) { \ 15 if ((vec_##type##bits)(equiv) != orig_c[i]) { \
16 fprintf(stderr, "v" #sign "int" #bits "x" #size "_" #op " test FAILED at index %d: (%s) [%" PRI ## psign ## bits "] does not equal result [%" PRI ## psign ## bits "]!\n", i, #equiv, (vec_##sign##int##bits)(equiv), orig_c[i]); \ 16 fprintf(stderr, "v" #type #bits "x" #size "_" #op " test FAILED at index %d: (%s) [%" print "] does not equal result [%" print "]!\n", i, #equiv, (vec_##type##bits)(equiv), orig_c[i]); \
17 print_v##sign##int##bits##x##size(stderr,a); \ 17 print_v##type##bits##x##size(stderr,a); \
18 print_v##secondsign##int##bits##x##size(stderr,b); \ 18 print_v##secondtype##bits##x##size(stderr,b); \
19 print_v##sign##int##bits##x##size(stderr,c); \ 19 print_v##type##bits##x##size(stderr,c); \
20 fprintf(stderr, "\n"); \ 20 fprintf(stderr, "\n"); \
21 return 1; \ 21 return 1; \
22 } \ 22 } \
23 } \ 23 } \
24 \ 24 \
25 return 0; \ 25 return 0; \
26 } 26 }
27 27
28 #define CREATE_TEST(sign, psign, csign, bits, size, op, equiv) \ 28 #define CREATE_TEST(type, ctype, print, bits, size, op, equiv) \
29 CREATE_TEST_EX(sign, psign, csign, bits, size, op, equiv, sign, csign) 29 CREATE_TEST_EX(type, ctype, print, bits, size, op, equiv, type, ctype)
30 30
31 #define CREATE_TEST_SHIFT(sign, psign, csign, bits, size, op, equiv) \ 31 #define CREATE_TEST_SHIFT(type, ctype, print, bits, size, op, equiv) \
32 CREATE_TEST_EX(sign, psign, csign, bits, size, op, equiv, u, U) 32 CREATE_TEST_EX(type, ctype, print, bits, size, op, equiv, uint, UINT)
33 33
34 #define CREATE_TESTS_SIGN(sign, psign, csign, bits, size) \ 34 #define CREATE_TESTS_INT(type, ctype, sign, print, bits, size) \
35 CREATE_TEST(sign, psign, csign, bits, size, add, orig_a[i] + orig_b[i]) \ 35 CREATE_TEST(type, ctype, print, bits, size, add, orig_a[i] + orig_b[i]) \
36 CREATE_TEST(sign, psign, csign, bits, size, sub, orig_a[i] - orig_b[i]) \ 36 CREATE_TEST(type, ctype, print, bits, size, sub, orig_a[i] - orig_b[i]) \
37 CREATE_TEST(sign, psign, csign, bits, size, mul, orig_a[i] * orig_b[i]) \ 37 CREATE_TEST(type, ctype, print, bits, size, mul, orig_a[i] * orig_b[i]) \
38 CREATE_TEST(sign, psign, csign, bits, size, div, (orig_b[i]) ? (orig_a[i] / orig_b[i]) : 0) \ 38 CREATE_TEST(type, ctype, print, bits, size, div, (orig_b[i]) ? (orig_a[i] / orig_b[i]) : 0) \
39 CREATE_TEST(sign, psign, csign, bits, size, mod, (orig_b[i]) ? (orig_a[i] % orig_b[i]) : 0) \ 39 CREATE_TEST(type, ctype, print, bits, size, mod, (orig_b[i]) ? (orig_a[i] % orig_b[i]) : 0) \
40 CREATE_TEST(sign, psign, csign, bits, size, and, orig_a[i] & orig_b[i]) \ 40 CREATE_TEST(type, ctype, print, bits, size, and, orig_a[i] & orig_b[i]) \
41 CREATE_TEST(sign, psign, csign, bits, size, or, orig_a[i] | orig_b[i]) \ 41 CREATE_TEST(type, ctype, print, bits, size, or, orig_a[i] | orig_b[i]) \
42 CREATE_TEST(sign, psign, csign, bits, size, xor, orig_a[i] ^ orig_b[i]) \ 42 CREATE_TEST(type, ctype, print, bits, size, xor, orig_a[i] ^ orig_b[i]) \
43 CREATE_TEST(sign, psign, csign, bits, size, avg, (vec_##sign##int##bits)vec_im##sign##avg(orig_a[i], orig_b[i])) \ 43 CREATE_TEST(type, ctype, print, bits, size, avg, (vec_##type##bits)vec_im##sign##avg(orig_a[i], orig_b[i])) \
44 CREATE_TEST_SHIFT(sign, psign, csign, bits, size, rshift, vec_##sign##rshift(orig_a[i], orig_b[i])) \ 44 CREATE_TEST_SHIFT(type, ctype, print, bits, size, rshift, vec_##sign##rshift(orig_a[i], orig_b[i])) \
45 CREATE_TEST_SHIFT(sign, psign, csign, bits, size, lshift, vec_##sign##lshift(orig_a[i], orig_b[i])) \ 45 CREATE_TEST_SHIFT(type, ctype, print, bits, size, lshift, vec_##sign##lshift(orig_a[i], orig_b[i])) \
46 CREATE_TEST_SHIFT(sign, psign, csign, bits, size, lrshift, vec_urshift((vec_uint##bits)orig_a[i], orig_b[i])) \ 46 CREATE_TEST_SHIFT(type, ctype, print, bits, size, lrshift, vec_urshift((vec_uint##bits)orig_a[i], orig_b[i])) \
47 CREATE_TEST(sign, psign, csign, bits, size, min, (orig_a[i] < orig_b[i]) ? orig_a[i] : orig_b[i]) \ 47 CREATE_TEST(type, ctype, print, bits, size, min, (orig_a[i] < orig_b[i]) ? orig_a[i] : orig_b[i]) \
48 CREATE_TEST(sign, psign, csign, bits, size, max, (orig_a[i] > orig_b[i]) ? orig_a[i] : orig_b[i]) 48 CREATE_TEST(type, ctype, print, bits, size, max, (orig_a[i] > orig_b[i]) ? orig_a[i] : orig_b[i])
49
50 #define CREATE_TESTS_FLOAT(bits, size) \
51 CREATE_TEST(f, F, "f", bits, size, add, orig_a[i] + orig_b[i]) \
52 CREATE_TEST(f, F, "f", bits, size, sub, orig_a[i] - orig_b[i]) \
53 CREATE_TEST(f, F, "f", bits, size, mul, orig_a[i] * orig_b[i]) \
54 CREATE_TEST(f, F, "f", bits, size, div, (orig_b[i]) ? (orig_a[i] / orig_b[i]) : 0) \
55 CREATE_TEST(f, F, "f", bits, size, mod, (orig_b[i]) ? (fmod(orig_a[i], orig_b[i])) : 0) \
56 CREATE_TEST(f, F, "f", bits, size, avg, (orig_a[i] + orig_b[i]) / 2) \
57 CREATE_TEST(f, F, "f", bits, size, min, (orig_a[i] < orig_b[i]) ? orig_a[i] : orig_b[i]) \
58 CREATE_TEST(f, F, "f", bits, size, max, (orig_a[i] > orig_b[i]) ? orig_a[i] : orig_b[i])
49 59
50 #define CREATE_TESTS(bits, size) \ 60 #define CREATE_TESTS(bits, size) \
51 CREATE_TESTS_SIGN(, d, , bits, size) \ 61 CREATE_TESTS_INT(int, INT, /* nothing */, PRI##d##bits, bits, size) \
52 CREATE_TESTS_SIGN(u, u, U, bits, size) 62 CREATE_TESTS_INT(uint, UINT, u, PRI##u##bits, bits, size)
53 63
54 CREATE_TESTS(8, 2) 64 CREATE_TESTS(8, 2)
55 65
56 CREATE_TESTS(8, 4) 66 CREATE_TESTS(8, 4)
57 CREATE_TESTS(16, 2) 67 CREATE_TESTS(16, 2)
73 CREATE_TESTS(8, 64) 83 CREATE_TESTS(8, 64)
74 CREATE_TESTS(16, 32) 84 CREATE_TESTS(16, 32)
75 CREATE_TESTS(32, 16) 85 CREATE_TESTS(32, 16)
76 CREATE_TESTS(64, 8) 86 CREATE_TESTS(64, 8)
77 87
78 #undef CREATE_TESTS_SIGN 88 CREATE_TESTS_FLOAT(32, 2)
89 CREATE_TESTS_FLOAT(32, 4)
90 CREATE_TESTS_FLOAT(32, 8)
91 CREATE_TESTS_FLOAT(32, 16)
92
93 CREATE_TESTS_FLOAT(64, 2)
94 CREATE_TESTS_FLOAT(64, 4)
95 CREATE_TESTS_FLOAT(64, 8)
96
97 #undef CREATE_TESTS_INT
98 #undef CREATE_TESTS_FLOAT
79 #undef CREATE_TESTS 99 #undef CREATE_TESTS
80 #undef CREATE_TEST 100 #undef CREATE_TEST
81 #undef CREATE_TEST_SHIFT 101 #undef CREATE_TEST_SHIFT
82 102
83 static int test_arith(void) 103 static int test_arith(void)
84 { 104 {
85 int ret = 0; 105 int ret = 0;
86 106
87 #define RUN_TESTS_SIGN(sign, bits, size) \ 107 #define RUN_TESTS_SIGN(shorttype, type, bits, size) \
88 for (size_t i = 0U; i < ARRAY_SIZE(testval##sign##bits); i++) { \ 108 for (size_t i = 0U; i < ARRAY_SIZE(testval##shorttype##bits); i++) { \
89 const v##sign##int##bits##x##size a = vtest##sign##bits##x##size(i); \ 109 const v##type##bits##x##size a = vtest##shorttype##bits##x##size(i); \
90 for (size_t j = 0U; j < ARRAY_SIZE(testval##sign##bits); j++) { \ 110 for (size_t j = 0U; j < ARRAY_SIZE(testval##shorttype##bits); j++) { \
91 const v##sign##int##bits##x##size b = vtest##sign##bits##x##size(j); \ 111 const v##type##bits##x##size b = vtest##shorttype##bits##x##size(j); \
92 ret |= test_arith_v##sign##int##bits##x##size##_add(a, b); \ 112 ret |= test_arith_v##type##bits##x##size##_add(a, b); \
93 ret |= test_arith_v##sign##int##bits##x##size##_sub(a, b); \ 113 ret |= test_arith_v##type##bits##x##size##_sub(a, b); \
94 ret |= test_arith_v##sign##int##bits##x##size##_mul(a, b); \ 114 ret |= test_arith_v##type##bits##x##size##_mul(a, b); \
95 ret |= test_arith_v##sign##int##bits##x##size##_div(a, b); \ 115 ret |= test_arith_v##type##bits##x##size##_div(a, b); \
96 ret |= test_arith_v##sign##int##bits##x##size##_mod(a, b); \ 116 ret |= test_arith_v##type##bits##x##size##_mod(a, b); \
97 ret |= test_arith_v##sign##int##bits##x##size##_and(a, b); \ 117 ret |= test_arith_v##type##bits##x##size##_and(a, b); \
98 ret |= test_arith_v##sign##int##bits##x##size##_or(a, b); \ 118 ret |= test_arith_v##type##bits##x##size##_or(a, b); \
99 ret |= test_arith_v##sign##int##bits##x##size##_xor(a, b); \ 119 ret |= test_arith_v##type##bits##x##size##_xor(a, b); \
100 ret |= test_arith_v##sign##int##bits##x##size##_avg(a, b); \ 120 ret |= test_arith_v##type##bits##x##size##_avg(a, b); \
101 ret |= test_arith_v##sign##int##bits##x##size##_min(a, b); \ 121 ret |= test_arith_v##type##bits##x##size##_min(a, b); \
102 ret |= test_arith_v##sign##int##bits##x##size##_max(a, b); \ 122 ret |= test_arith_v##type##bits##x##size##_max(a, b); \
103 } \ 123 } \
104 } \ 124 } \
105 \ 125 \
106 for (size_t i = 0U; i < ARRAY_SIZE(testval##sign##bits); i++) { \ 126 for (size_t i = 0U; i < ARRAY_SIZE(testval##shorttype##bits); i++) { \
107 const v##sign##int##bits##x##size a = vtest##sign##bits##x##size(i); \ 127 const v##type##bits##x##size a = vtest##shorttype##bits##x##size(i); \
108 for (uint32_t j = 0U; j < bits; j++) { \ 128 for (uint32_t j = 0U; j < bits; j++) { \
109 const vuint##bits##x##size b = vuint##bits##x##size##_splat(j); \ 129 const vuint##bits##x##size b = vuint##bits##x##size##_splat(j); \
110 ret |= test_arith_v##sign##int##bits##x##size##_rshift(a, b); \ 130 ret |= test_arith_v##type##bits##x##size##_rshift(a, b); \
111 ret |= test_arith_v##sign##int##bits##x##size##_lshift(a, b); \ 131 ret |= test_arith_v##type##bits##x##size##_lshift(a, b); \
112 ret |= test_arith_v##sign##int##bits##x##size##_lrshift(a, b); \ 132 ret |= test_arith_v##type##bits##x##size##_lrshift(a, b); \
113 } \ 133 } \
114 } 134 }
115 135
116 #define RUN_TESTS(bits, size) \ 136 #define RUN_TESTS(bits, size) \
117 RUN_TESTS_SIGN( , bits, size) \ 137 RUN_TESTS_SIGN( , int, bits, size) \
118 RUN_TESTS_SIGN(u, bits, size) 138 RUN_TESTS_SIGN(u, uint, bits, size)
139
140 #define RUN_TESTS_FLOAT(shorttype, type, bits, size) \
141 for (size_t i = 0U; i < ARRAY_SIZE(testval##shorttype##bits); i++) { \
142 const v##type##bits##x##size a = vtest##shorttype##bits##x##size(i); \
143 for (size_t j = 0U; j < ARRAY_SIZE(testval##shorttype##bits); j++) { \
144 const v##type##bits##x##size b = vtest##shorttype##bits##x##size(j); \
145 ret |= test_arith_v##type##bits##x##size##_add(a, b); \
146 ret |= test_arith_v##type##bits##x##size##_sub(a, b); \
147 ret |= test_arith_v##type##bits##x##size##_mul(a, b); \
148 ret |= test_arith_v##type##bits##x##size##_div(a, b); \
149 ret |= test_arith_v##type##bits##x##size##_mod(a, b); \
150 ret |= test_arith_v##type##bits##x##size##_avg(a, b); \
151 ret |= test_arith_v##type##bits##x##size##_min(a, b); \
152 ret |= test_arith_v##type##bits##x##size##_max(a, b); \
153 } \
154 }
119 155
120 RUN_TESTS(8, 2) 156 RUN_TESTS(8, 2)
121 157
122 RUN_TESTS(8, 4) 158 RUN_TESTS(8, 4)
123 RUN_TESTS(16, 2) 159 RUN_TESTS(16, 2)
139 RUN_TESTS(8, 64) 175 RUN_TESTS(8, 64)
140 RUN_TESTS(16, 32) 176 RUN_TESTS(16, 32)
141 RUN_TESTS(32, 16) 177 RUN_TESTS(32, 16)
142 RUN_TESTS(64, 8) 178 RUN_TESTS(64, 8)
143 179
180 RUN_TESTS_FLOAT(f, f, 32, 2)
181 RUN_TESTS_FLOAT(f, f, 32, 4)
182 RUN_TESTS_FLOAT(f, f, 32, 8)
183 RUN_TESTS_FLOAT(f, f, 32, 16)
184
185 RUN_TESTS_FLOAT(f, f, 64, 2)
186 RUN_TESTS_FLOAT(f, f, 64, 4)
187 RUN_TESTS_FLOAT(f, f, 64, 8)
188
189 #undef RUN_TESTS_FLOAT
144 #undef RUN_TESTS_SIGN 190 #undef RUN_TESTS_SIGN
145 #undef RUN_TESTS 191 #undef RUN_TESTS
146 192
147 return ret; 193 return ret;
148 } 194 }