Mercurial > vec
comparison test/test_arith.h @ 45:7955bed1d169 default tip
*: add preliminary floating point support
No x86 intrinsics just yet, but I did add AltiVec since it's
(arguably) the simplest :)
author | Paper <paper@tflc.us> |
---|---|
date | Wed, 30 Apr 2025 18:36:38 -0400 |
parents | c6e0df09b86f |
children |
comparison
equal
deleted
inserted
replaced
44:b0a3f0248ecc | 45:7955bed1d169 |
---|---|
1 #define CREATE_TEST_EX(sign, psign, csign, bits, size, op, equiv, secondsign, secondcsign) \ | 1 #define CREATE_TEST_EX(type, ctype, print, bits, size, op, equiv, secondtype, secondctype) \ |
2 static int test_arith_v##sign##int##bits##x##size##_##op(v##sign##int##bits##x##size a, v##secondsign##int##bits##x##size b) \ | 2 static int test_arith_v##type##bits##x##size##_##op(v##type##bits##x##size a, v##secondtype##bits##x##size b) \ |
3 { \ | 3 { \ |
4 V##csign##INT##bits##x##size##_ALIGNED_ARRAY(orig_a); \ | 4 V##ctype##bits##x##size##_ALIGNED_ARRAY(orig_a); \ |
5 V##secondcsign##INT##bits##x##size##_ALIGNED_ARRAY(orig_b); \ | 5 V##secondctype##bits##x##size##_ALIGNED_ARRAY(orig_b); \ |
6 V##csign##INT##bits##x##size##_ALIGNED_ARRAY(orig_c); \ | 6 V##ctype##bits##x##size##_ALIGNED_ARRAY(orig_c); \ |
7 \ | 7 \ |
8 v##sign##int##bits##x##size c = v##sign##int##bits##x##size##_##op(a, b); \ | 8 v##type##bits##x##size c = v##type##bits##x##size##_##op(a, b); \ |
9 \ | 9 \ |
10 v##sign##int##bits##x##size##_store_aligned(a, orig_a); \ | 10 v##type##bits##x##size##_store_aligned(a, orig_a); \ |
11 v##secondsign##int##bits##x##size##_store_aligned(b, orig_b); \ | 11 v##secondtype##bits##x##size##_store_aligned(b, orig_b); \ |
12 v##sign##int##bits##x##size##_store_aligned(c, orig_c); \ | 12 v##type##bits##x##size##_store_aligned(c, orig_c); \ |
13 \ | 13 \ |
14 for (int i = 0; i < size; i++) { \ | 14 for (int i = 0; i < size; i++) { \ |
15 if ((sign##int##bits##_t)(equiv) != orig_c[i]) { \ | 15 if ((vec_##type##bits)(equiv) != orig_c[i]) { \ |
16 fprintf(stderr, "v" #sign "int" #bits "x" #size "_" #op " test FAILED at index %d: (%s) [%" PRI ## psign ## bits "] does not equal result [%" PRI ## psign ## bits "]!\n", i, #equiv, (vec_##sign##int##bits)(equiv), orig_c[i]); \ | 16 fprintf(stderr, "v" #type #bits "x" #size "_" #op " test FAILED at index %d: (%s) [%" print "] does not equal result [%" print "]!\n", i, #equiv, (vec_##type##bits)(equiv), orig_c[i]); \ |
17 print_v##sign##int##bits##x##size(stderr,a); \ | 17 print_v##type##bits##x##size(stderr,a); \ |
18 print_v##secondsign##int##bits##x##size(stderr,b); \ | 18 print_v##secondtype##bits##x##size(stderr,b); \ |
19 print_v##sign##int##bits##x##size(stderr,c); \ | 19 print_v##type##bits##x##size(stderr,c); \ |
20 fprintf(stderr, "\n"); \ | 20 fprintf(stderr, "\n"); \ |
21 return 1; \ | 21 return 1; \ |
22 } \ | 22 } \ |
23 } \ | 23 } \ |
24 \ | 24 \ |
25 return 0; \ | 25 return 0; \ |
26 } | 26 } |
27 | 27 |
28 #define CREATE_TEST(sign, psign, csign, bits, size, op, equiv) \ | 28 #define CREATE_TEST(type, ctype, print, bits, size, op, equiv) \ |
29 CREATE_TEST_EX(sign, psign, csign, bits, size, op, equiv, sign, csign) | 29 CREATE_TEST_EX(type, ctype, print, bits, size, op, equiv, type, ctype) |
30 | 30 |
31 #define CREATE_TEST_SHIFT(sign, psign, csign, bits, size, op, equiv) \ | 31 #define CREATE_TEST_SHIFT(type, ctype, print, bits, size, op, equiv) \ |
32 CREATE_TEST_EX(sign, psign, csign, bits, size, op, equiv, u, U) | 32 CREATE_TEST_EX(type, ctype, print, bits, size, op, equiv, uint, UINT) |
33 | 33 |
34 #define CREATE_TESTS_SIGN(sign, psign, csign, bits, size) \ | 34 #define CREATE_TESTS_INT(type, ctype, sign, print, bits, size) \ |
35 CREATE_TEST(sign, psign, csign, bits, size, add, orig_a[i] + orig_b[i]) \ | 35 CREATE_TEST(type, ctype, print, bits, size, add, orig_a[i] + orig_b[i]) \ |
36 CREATE_TEST(sign, psign, csign, bits, size, sub, orig_a[i] - orig_b[i]) \ | 36 CREATE_TEST(type, ctype, print, bits, size, sub, orig_a[i] - orig_b[i]) \ |
37 CREATE_TEST(sign, psign, csign, bits, size, mul, orig_a[i] * orig_b[i]) \ | 37 CREATE_TEST(type, ctype, print, bits, size, mul, orig_a[i] * orig_b[i]) \ |
38 CREATE_TEST(sign, psign, csign, bits, size, div, (orig_b[i]) ? (orig_a[i] / orig_b[i]) : 0) \ | 38 CREATE_TEST(type, ctype, print, bits, size, div, (orig_b[i]) ? (orig_a[i] / orig_b[i]) : 0) \ |
39 CREATE_TEST(sign, psign, csign, bits, size, mod, (orig_b[i]) ? (orig_a[i] % orig_b[i]) : 0) \ | 39 CREATE_TEST(type, ctype, print, bits, size, mod, (orig_b[i]) ? (orig_a[i] % orig_b[i]) : 0) \ |
40 CREATE_TEST(sign, psign, csign, bits, size, and, orig_a[i] & orig_b[i]) \ | 40 CREATE_TEST(type, ctype, print, bits, size, and, orig_a[i] & orig_b[i]) \ |
41 CREATE_TEST(sign, psign, csign, bits, size, or, orig_a[i] | orig_b[i]) \ | 41 CREATE_TEST(type, ctype, print, bits, size, or, orig_a[i] | orig_b[i]) \ |
42 CREATE_TEST(sign, psign, csign, bits, size, xor, orig_a[i] ^ orig_b[i]) \ | 42 CREATE_TEST(type, ctype, print, bits, size, xor, orig_a[i] ^ orig_b[i]) \ |
43 CREATE_TEST(sign, psign, csign, bits, size, avg, (vec_##sign##int##bits)vec_im##sign##avg(orig_a[i], orig_b[i])) \ | 43 CREATE_TEST(type, ctype, print, bits, size, avg, (vec_##type##bits)vec_im##sign##avg(orig_a[i], orig_b[i])) \ |
44 CREATE_TEST_SHIFT(sign, psign, csign, bits, size, rshift, vec_##sign##rshift(orig_a[i], orig_b[i])) \ | 44 CREATE_TEST_SHIFT(type, ctype, print, bits, size, rshift, vec_##sign##rshift(orig_a[i], orig_b[i])) \ |
45 CREATE_TEST_SHIFT(sign, psign, csign, bits, size, lshift, vec_##sign##lshift(orig_a[i], orig_b[i])) \ | 45 CREATE_TEST_SHIFT(type, ctype, print, bits, size, lshift, vec_##sign##lshift(orig_a[i], orig_b[i])) \ |
46 CREATE_TEST_SHIFT(sign, psign, csign, bits, size, lrshift, vec_urshift((vec_uint##bits)orig_a[i], orig_b[i])) \ | 46 CREATE_TEST_SHIFT(type, ctype, print, bits, size, lrshift, vec_urshift((vec_uint##bits)orig_a[i], orig_b[i])) \ |
47 CREATE_TEST(sign, psign, csign, bits, size, min, (orig_a[i] < orig_b[i]) ? orig_a[i] : orig_b[i]) \ | 47 CREATE_TEST(type, ctype, print, bits, size, min, (orig_a[i] < orig_b[i]) ? orig_a[i] : orig_b[i]) \ |
48 CREATE_TEST(sign, psign, csign, bits, size, max, (orig_a[i] > orig_b[i]) ? orig_a[i] : orig_b[i]) | 48 CREATE_TEST(type, ctype, print, bits, size, max, (orig_a[i] > orig_b[i]) ? orig_a[i] : orig_b[i]) |
49 | |
50 #define CREATE_TESTS_FLOAT(bits, size) \ | |
51 CREATE_TEST(f, F, "f", bits, size, add, orig_a[i] + orig_b[i]) \ | |
52 CREATE_TEST(f, F, "f", bits, size, sub, orig_a[i] - orig_b[i]) \ | |
53 CREATE_TEST(f, F, "f", bits, size, mul, orig_a[i] * orig_b[i]) \ | |
54 CREATE_TEST(f, F, "f", bits, size, div, (orig_b[i]) ? (orig_a[i] / orig_b[i]) : 0) \ | |
55 CREATE_TEST(f, F, "f", bits, size, mod, (orig_b[i]) ? (fmod(orig_a[i], orig_b[i])) : 0) \ | |
56 CREATE_TEST(f, F, "f", bits, size, avg, (orig_a[i] + orig_b[i]) / 2) \ | |
57 CREATE_TEST(f, F, "f", bits, size, min, (orig_a[i] < orig_b[i]) ? orig_a[i] : orig_b[i]) \ | |
58 CREATE_TEST(f, F, "f", bits, size, max, (orig_a[i] > orig_b[i]) ? orig_a[i] : orig_b[i]) | |
49 | 59 |
50 #define CREATE_TESTS(bits, size) \ | 60 #define CREATE_TESTS(bits, size) \ |
51 CREATE_TESTS_SIGN(, d, , bits, size) \ | 61 CREATE_TESTS_INT(int, INT, /* nothing */, PRI##d##bits, bits, size) \ |
52 CREATE_TESTS_SIGN(u, u, U, bits, size) | 62 CREATE_TESTS_INT(uint, UINT, u, PRI##u##bits, bits, size) |
53 | 63 |
54 CREATE_TESTS(8, 2) | 64 CREATE_TESTS(8, 2) |
55 | 65 |
56 CREATE_TESTS(8, 4) | 66 CREATE_TESTS(8, 4) |
57 CREATE_TESTS(16, 2) | 67 CREATE_TESTS(16, 2) |
73 CREATE_TESTS(8, 64) | 83 CREATE_TESTS(8, 64) |
74 CREATE_TESTS(16, 32) | 84 CREATE_TESTS(16, 32) |
75 CREATE_TESTS(32, 16) | 85 CREATE_TESTS(32, 16) |
76 CREATE_TESTS(64, 8) | 86 CREATE_TESTS(64, 8) |
77 | 87 |
78 #undef CREATE_TESTS_SIGN | 88 CREATE_TESTS_FLOAT(32, 2) |
89 CREATE_TESTS_FLOAT(32, 4) | |
90 CREATE_TESTS_FLOAT(32, 8) | |
91 CREATE_TESTS_FLOAT(32, 16) | |
92 | |
93 CREATE_TESTS_FLOAT(64, 2) | |
94 CREATE_TESTS_FLOAT(64, 4) | |
95 CREATE_TESTS_FLOAT(64, 8) | |
96 | |
97 #undef CREATE_TESTS_INT | |
98 #undef CREATE_TESTS_FLOAT | |
79 #undef CREATE_TESTS | 99 #undef CREATE_TESTS |
80 #undef CREATE_TEST | 100 #undef CREATE_TEST |
81 #undef CREATE_TEST_SHIFT | 101 #undef CREATE_TEST_SHIFT |
82 | 102 |
83 static int test_arith(void) | 103 static int test_arith(void) |
84 { | 104 { |
85 int ret = 0; | 105 int ret = 0; |
86 | 106 |
87 #define RUN_TESTS_SIGN(sign, bits, size) \ | 107 #define RUN_TESTS_SIGN(shorttype, type, bits, size) \ |
88 for (size_t i = 0U; i < ARRAY_SIZE(testval##sign##bits); i++) { \ | 108 for (size_t i = 0U; i < ARRAY_SIZE(testval##shorttype##bits); i++) { \ |
89 const v##sign##int##bits##x##size a = vtest##sign##bits##x##size(i); \ | 109 const v##type##bits##x##size a = vtest##shorttype##bits##x##size(i); \ |
90 for (size_t j = 0U; j < ARRAY_SIZE(testval##sign##bits); j++) { \ | 110 for (size_t j = 0U; j < ARRAY_SIZE(testval##shorttype##bits); j++) { \ |
91 const v##sign##int##bits##x##size b = vtest##sign##bits##x##size(j); \ | 111 const v##type##bits##x##size b = vtest##shorttype##bits##x##size(j); \ |
92 ret |= test_arith_v##sign##int##bits##x##size##_add(a, b); \ | 112 ret |= test_arith_v##type##bits##x##size##_add(a, b); \ |
93 ret |= test_arith_v##sign##int##bits##x##size##_sub(a, b); \ | 113 ret |= test_arith_v##type##bits##x##size##_sub(a, b); \ |
94 ret |= test_arith_v##sign##int##bits##x##size##_mul(a, b); \ | 114 ret |= test_arith_v##type##bits##x##size##_mul(a, b); \ |
95 ret |= test_arith_v##sign##int##bits##x##size##_div(a, b); \ | 115 ret |= test_arith_v##type##bits##x##size##_div(a, b); \ |
96 ret |= test_arith_v##sign##int##bits##x##size##_mod(a, b); \ | 116 ret |= test_arith_v##type##bits##x##size##_mod(a, b); \ |
97 ret |= test_arith_v##sign##int##bits##x##size##_and(a, b); \ | 117 ret |= test_arith_v##type##bits##x##size##_and(a, b); \ |
98 ret |= test_arith_v##sign##int##bits##x##size##_or(a, b); \ | 118 ret |= test_arith_v##type##bits##x##size##_or(a, b); \ |
99 ret |= test_arith_v##sign##int##bits##x##size##_xor(a, b); \ | 119 ret |= test_arith_v##type##bits##x##size##_xor(a, b); \ |
100 ret |= test_arith_v##sign##int##bits##x##size##_avg(a, b); \ | 120 ret |= test_arith_v##type##bits##x##size##_avg(a, b); \ |
101 ret |= test_arith_v##sign##int##bits##x##size##_min(a, b); \ | 121 ret |= test_arith_v##type##bits##x##size##_min(a, b); \ |
102 ret |= test_arith_v##sign##int##bits##x##size##_max(a, b); \ | 122 ret |= test_arith_v##type##bits##x##size##_max(a, b); \ |
103 } \ | 123 } \ |
104 } \ | 124 } \ |
105 \ | 125 \ |
106 for (size_t i = 0U; i < ARRAY_SIZE(testval##sign##bits); i++) { \ | 126 for (size_t i = 0U; i < ARRAY_SIZE(testval##shorttype##bits); i++) { \ |
107 const v##sign##int##bits##x##size a = vtest##sign##bits##x##size(i); \ | 127 const v##type##bits##x##size a = vtest##shorttype##bits##x##size(i); \ |
108 for (uint32_t j = 0U; j < bits; j++) { \ | 128 for (uint32_t j = 0U; j < bits; j++) { \ |
109 const vuint##bits##x##size b = vuint##bits##x##size##_splat(j); \ | 129 const vuint##bits##x##size b = vuint##bits##x##size##_splat(j); \ |
110 ret |= test_arith_v##sign##int##bits##x##size##_rshift(a, b); \ | 130 ret |= test_arith_v##type##bits##x##size##_rshift(a, b); \ |
111 ret |= test_arith_v##sign##int##bits##x##size##_lshift(a, b); \ | 131 ret |= test_arith_v##type##bits##x##size##_lshift(a, b); \ |
112 ret |= test_arith_v##sign##int##bits##x##size##_lrshift(a, b); \ | 132 ret |= test_arith_v##type##bits##x##size##_lrshift(a, b); \ |
113 } \ | 133 } \ |
114 } | 134 } |
115 | 135 |
116 #define RUN_TESTS(bits, size) \ | 136 #define RUN_TESTS(bits, size) \ |
117 RUN_TESTS_SIGN( , bits, size) \ | 137 RUN_TESTS_SIGN( , int, bits, size) \ |
118 RUN_TESTS_SIGN(u, bits, size) | 138 RUN_TESTS_SIGN(u, uint, bits, size) |
139 | |
140 #define RUN_TESTS_FLOAT(shorttype, type, bits, size) \ | |
141 for (size_t i = 0U; i < ARRAY_SIZE(testval##shorttype##bits); i++) { \ | |
142 const v##type##bits##x##size a = vtest##shorttype##bits##x##size(i); \ | |
143 for (size_t j = 0U; j < ARRAY_SIZE(testval##shorttype##bits); j++) { \ | |
144 const v##type##bits##x##size b = vtest##shorttype##bits##x##size(j); \ | |
145 ret |= test_arith_v##type##bits##x##size##_add(a, b); \ | |
146 ret |= test_arith_v##type##bits##x##size##_sub(a, b); \ | |
147 ret |= test_arith_v##type##bits##x##size##_mul(a, b); \ | |
148 ret |= test_arith_v##type##bits##x##size##_div(a, b); \ | |
149 ret |= test_arith_v##type##bits##x##size##_mod(a, b); \ | |
150 ret |= test_arith_v##type##bits##x##size##_avg(a, b); \ | |
151 ret |= test_arith_v##type##bits##x##size##_min(a, b); \ | |
152 ret |= test_arith_v##type##bits##x##size##_max(a, b); \ | |
153 } \ | |
154 } | |
119 | 155 |
120 RUN_TESTS(8, 2) | 156 RUN_TESTS(8, 2) |
121 | 157 |
122 RUN_TESTS(8, 4) | 158 RUN_TESTS(8, 4) |
123 RUN_TESTS(16, 2) | 159 RUN_TESTS(16, 2) |
139 RUN_TESTS(8, 64) | 175 RUN_TESTS(8, 64) |
140 RUN_TESTS(16, 32) | 176 RUN_TESTS(16, 32) |
141 RUN_TESTS(32, 16) | 177 RUN_TESTS(32, 16) |
142 RUN_TESTS(64, 8) | 178 RUN_TESTS(64, 8) |
143 | 179 |
180 RUN_TESTS_FLOAT(f, f, 32, 2) | |
181 RUN_TESTS_FLOAT(f, f, 32, 4) | |
182 RUN_TESTS_FLOAT(f, f, 32, 8) | |
183 RUN_TESTS_FLOAT(f, f, 32, 16) | |
184 | |
185 RUN_TESTS_FLOAT(f, f, 64, 2) | |
186 RUN_TESTS_FLOAT(f, f, 64, 4) | |
187 RUN_TESTS_FLOAT(f, f, 64, 8) | |
188 | |
189 #undef RUN_TESTS_FLOAT | |
144 #undef RUN_TESTS_SIGN | 190 #undef RUN_TESTS_SIGN |
145 #undef RUN_TESTS | 191 #undef RUN_TESTS |
146 | 192 |
147 return ret; | 193 return ret; |
148 } | 194 } |