Mercurial > vec
comparison test/test_arith.h @ 45:7955bed1d169
*: add preliminary floating point support
no x86 intrinsics just yet, but I did add altivec since it's
(arguably) the simplest :)
| author | Paper <paper@tflc.us> |
|---|---|
| date | Wed, 30 Apr 2025 18:36:38 -0400 |
| parents | c6e0df09b86f |
| children | 31cee67540b5 |
comparison
equal
deleted
inserted
replaced
| 44:b0a3f0248ecc | 45:7955bed1d169 |
|---|---|
| 1 #define CREATE_TEST_EX(sign, psign, csign, bits, size, op, equiv, secondsign, secondcsign) \ | 1 #define CREATE_TEST_EX(type, ctype, print, bits, size, op, equiv, secondtype, secondctype) \ |
| 2 static int test_arith_v##sign##int##bits##x##size##_##op(v##sign##int##bits##x##size a, v##secondsign##int##bits##x##size b) \ | 2 static int test_arith_v##type##bits##x##size##_##op(v##type##bits##x##size a, v##secondtype##bits##x##size b) \ |
| 3 { \ | 3 { \ |
| 4 V##csign##INT##bits##x##size##_ALIGNED_ARRAY(orig_a); \ | 4 V##ctype##bits##x##size##_ALIGNED_ARRAY(orig_a); \ |
| 5 V##secondcsign##INT##bits##x##size##_ALIGNED_ARRAY(orig_b); \ | 5 V##secondctype##bits##x##size##_ALIGNED_ARRAY(orig_b); \ |
| 6 V##csign##INT##bits##x##size##_ALIGNED_ARRAY(orig_c); \ | 6 V##ctype##bits##x##size##_ALIGNED_ARRAY(orig_c); \ |
| 7 \ | 7 \ |
| 8 v##sign##int##bits##x##size c = v##sign##int##bits##x##size##_##op(a, b); \ | 8 v##type##bits##x##size c = v##type##bits##x##size##_##op(a, b); \ |
| 9 \ | 9 \ |
| 10 v##sign##int##bits##x##size##_store_aligned(a, orig_a); \ | 10 v##type##bits##x##size##_store_aligned(a, orig_a); \ |
| 11 v##secondsign##int##bits##x##size##_store_aligned(b, orig_b); \ | 11 v##secondtype##bits##x##size##_store_aligned(b, orig_b); \ |
| 12 v##sign##int##bits##x##size##_store_aligned(c, orig_c); \ | 12 v##type##bits##x##size##_store_aligned(c, orig_c); \ |
| 13 \ | 13 \ |
| 14 for (int i = 0; i < size; i++) { \ | 14 for (int i = 0; i < size; i++) { \ |
| 15 if ((sign##int##bits##_t)(equiv) != orig_c[i]) { \ | 15 if ((vec_##type##bits)(equiv) != orig_c[i]) { \ |
| 16 fprintf(stderr, "v" #sign "int" #bits "x" #size "_" #op " test FAILED at index %d: (%s) [%" PRI ## psign ## bits "] does not equal result [%" PRI ## psign ## bits "]!\n", i, #equiv, (vec_##sign##int##bits)(equiv), orig_c[i]); \ | 16 fprintf(stderr, "v" #type #bits "x" #size "_" #op " test FAILED at index %d: (%s) [%" print "] does not equal result [%" print "]!\n", i, #equiv, (vec_##type##bits)(equiv), orig_c[i]); \ |
| 17 print_v##sign##int##bits##x##size(stderr,a); \ | 17 print_v##type##bits##x##size(stderr,a); \ |
| 18 print_v##secondsign##int##bits##x##size(stderr,b); \ | 18 print_v##secondtype##bits##x##size(stderr,b); \ |
| 19 print_v##sign##int##bits##x##size(stderr,c); \ | 19 print_v##type##bits##x##size(stderr,c); \ |
| 20 fprintf(stderr, "\n"); \ | 20 fprintf(stderr, "\n"); \ |
| 21 return 1; \ | 21 return 1; \ |
| 22 } \ | 22 } \ |
| 23 } \ | 23 } \ |
| 24 \ | 24 \ |
| 25 return 0; \ | 25 return 0; \ |
| 26 } | 26 } |
| 27 | 27 |
| 28 #define CREATE_TEST(sign, psign, csign, bits, size, op, equiv) \ | 28 #define CREATE_TEST(type, ctype, print, bits, size, op, equiv) \ |
| 29 CREATE_TEST_EX(sign, psign, csign, bits, size, op, equiv, sign, csign) | 29 CREATE_TEST_EX(type, ctype, print, bits, size, op, equiv, type, ctype) |
| 30 | 30 |
| 31 #define CREATE_TEST_SHIFT(sign, psign, csign, bits, size, op, equiv) \ | 31 #define CREATE_TEST_SHIFT(type, ctype, print, bits, size, op, equiv) \ |
| 32 CREATE_TEST_EX(sign, psign, csign, bits, size, op, equiv, u, U) | 32 CREATE_TEST_EX(type, ctype, print, bits, size, op, equiv, uint, UINT) |
| 33 | 33 |
| 34 #define CREATE_TESTS_SIGN(sign, psign, csign, bits, size) \ | 34 #define CREATE_TESTS_INT(type, ctype, sign, print, bits, size) \ |
| 35 CREATE_TEST(sign, psign, csign, bits, size, add, orig_a[i] + orig_b[i]) \ | 35 CREATE_TEST(type, ctype, print, bits, size, add, orig_a[i] + orig_b[i]) \ |
| 36 CREATE_TEST(sign, psign, csign, bits, size, sub, orig_a[i] - orig_b[i]) \ | 36 CREATE_TEST(type, ctype, print, bits, size, sub, orig_a[i] - orig_b[i]) \ |
| 37 CREATE_TEST(sign, psign, csign, bits, size, mul, orig_a[i] * orig_b[i]) \ | 37 CREATE_TEST(type, ctype, print, bits, size, mul, orig_a[i] * orig_b[i]) \ |
| 38 CREATE_TEST(sign, psign, csign, bits, size, div, (orig_b[i]) ? (orig_a[i] / orig_b[i]) : 0) \ | 38 CREATE_TEST(type, ctype, print, bits, size, div, (orig_b[i]) ? (orig_a[i] / orig_b[i]) : 0) \ |
| 39 CREATE_TEST(sign, psign, csign, bits, size, mod, (orig_b[i]) ? (orig_a[i] % orig_b[i]) : 0) \ | 39 CREATE_TEST(type, ctype, print, bits, size, mod, (orig_b[i]) ? (orig_a[i] % orig_b[i]) : 0) \ |
| 40 CREATE_TEST(sign, psign, csign, bits, size, and, orig_a[i] & orig_b[i]) \ | 40 CREATE_TEST(type, ctype, print, bits, size, and, orig_a[i] & orig_b[i]) \ |
| 41 CREATE_TEST(sign, psign, csign, bits, size, or, orig_a[i] | orig_b[i]) \ | 41 CREATE_TEST(type, ctype, print, bits, size, or, orig_a[i] | orig_b[i]) \ |
| 42 CREATE_TEST(sign, psign, csign, bits, size, xor, orig_a[i] ^ orig_b[i]) \ | 42 CREATE_TEST(type, ctype, print, bits, size, xor, orig_a[i] ^ orig_b[i]) \ |
| 43 CREATE_TEST(sign, psign, csign, bits, size, avg, (vec_##sign##int##bits)vec_im##sign##avg(orig_a[i], orig_b[i])) \ | 43 CREATE_TEST(type, ctype, print, bits, size, avg, (vec_##type##bits)vec_im##sign##avg(orig_a[i], orig_b[i])) \ |
| 44 CREATE_TEST_SHIFT(sign, psign, csign, bits, size, rshift, vec_##sign##rshift(orig_a[i], orig_b[i])) \ | 44 CREATE_TEST_SHIFT(type, ctype, print, bits, size, rshift, vec_##sign##rshift(orig_a[i], orig_b[i])) \ |
| 45 CREATE_TEST_SHIFT(sign, psign, csign, bits, size, lshift, vec_##sign##lshift(orig_a[i], orig_b[i])) \ | 45 CREATE_TEST_SHIFT(type, ctype, print, bits, size, lshift, vec_##sign##lshift(orig_a[i], orig_b[i])) \ |
| 46 CREATE_TEST_SHIFT(sign, psign, csign, bits, size, lrshift, vec_urshift((vec_uint##bits)orig_a[i], orig_b[i])) \ | 46 CREATE_TEST_SHIFT(type, ctype, print, bits, size, lrshift, vec_urshift((vec_uint##bits)orig_a[i], orig_b[i])) \ |
| 47 CREATE_TEST(sign, psign, csign, bits, size, min, (orig_a[i] < orig_b[i]) ? orig_a[i] : orig_b[i]) \ | 47 CREATE_TEST(type, ctype, print, bits, size, min, (orig_a[i] < orig_b[i]) ? orig_a[i] : orig_b[i]) \ |
| 48 CREATE_TEST(sign, psign, csign, bits, size, max, (orig_a[i] > orig_b[i]) ? orig_a[i] : orig_b[i]) | 48 CREATE_TEST(type, ctype, print, bits, size, max, (orig_a[i] > orig_b[i]) ? orig_a[i] : orig_b[i]) |
| | 49 |
| | 50 #define CREATE_TESTS_FLOAT(bits, size) \ |
| | 51 CREATE_TEST(f, F, "f", bits, size, add, orig_a[i] + orig_b[i]) \ |
| | 52 CREATE_TEST(f, F, "f", bits, size, sub, orig_a[i] - orig_b[i]) \ |
| | 53 CREATE_TEST(f, F, "f", bits, size, mul, orig_a[i] * orig_b[i]) \ |
| | 54 CREATE_TEST(f, F, "f", bits, size, div, (orig_b[i]) ? (orig_a[i] / orig_b[i]) : 0) \ |
| | 55 CREATE_TEST(f, F, "f", bits, size, mod, (orig_b[i]) ? (fmod(orig_a[i], orig_b[i])) : 0) \ |
| | 56 CREATE_TEST(f, F, "f", bits, size, avg, (orig_a[i] + orig_b[i]) / 2) \ |
| | 57 CREATE_TEST(f, F, "f", bits, size, min, (orig_a[i] < orig_b[i]) ? orig_a[i] : orig_b[i]) \ |
| | 58 CREATE_TEST(f, F, "f", bits, size, max, (orig_a[i] > orig_b[i]) ? orig_a[i] : orig_b[i]) |
| 49 | 59 |
| 50 #define CREATE_TESTS(bits, size) \ | 60 #define CREATE_TESTS(bits, size) \ |
| 51 CREATE_TESTS_SIGN(, d, , bits, size) \ | 61 CREATE_TESTS_INT(int, INT, /* nothing */, PRI##d##bits, bits, size) \ |
| 52 CREATE_TESTS_SIGN(u, u, U, bits, size) | 62 CREATE_TESTS_INT(uint, UINT, u, PRI##u##bits, bits, size) |
| 53 | 63 |
| 54 CREATE_TESTS(8, 2) | 64 CREATE_TESTS(8, 2) |
| 55 | 65 |
| 56 CREATE_TESTS(8, 4) | 66 CREATE_TESTS(8, 4) |
| 57 CREATE_TESTS(16, 2) | 67 CREATE_TESTS(16, 2) |
| 73 CREATE_TESTS(8, 64) | 83 CREATE_TESTS(8, 64) |
| 74 CREATE_TESTS(16, 32) | 84 CREATE_TESTS(16, 32) |
| 75 CREATE_TESTS(32, 16) | 85 CREATE_TESTS(32, 16) |
| 76 CREATE_TESTS(64, 8) | 86 CREATE_TESTS(64, 8) |
| 77 | 87 |
| 78 #undef CREATE_TESTS_SIGN | 88 CREATE_TESTS_FLOAT(32, 2) |
| | 89 CREATE_TESTS_FLOAT(32, 4) |
| | 90 CREATE_TESTS_FLOAT(32, 8) |
| | 91 CREATE_TESTS_FLOAT(32, 16) |
| | 92 |
| | 93 CREATE_TESTS_FLOAT(64, 2) |
| | 94 CREATE_TESTS_FLOAT(64, 4) |
| | 95 CREATE_TESTS_FLOAT(64, 8) |
| | 96 |
| | 97 #undef CREATE_TESTS_INT |
| | 98 #undef CREATE_TESTS_FLOAT |
| 79 #undef CREATE_TESTS | 99 #undef CREATE_TESTS |
| 80 #undef CREATE_TEST | 100 #undef CREATE_TEST |
| 81 #undef CREATE_TEST_SHIFT | 101 #undef CREATE_TEST_SHIFT |
| 82 | 102 |
| 83 static int test_arith(void) | 103 static int test_arith(void) |
| 84 { | 104 { |
| 85 int ret = 0; | 105 int ret = 0; |
| 86 | 106 |
| 87 #define RUN_TESTS_SIGN(sign, bits, size) \ | 107 #define RUN_TESTS_SIGN(shorttype, type, bits, size) \ |
| 88 for (size_t i = 0U; i < ARRAY_SIZE(testval##sign##bits); i++) { \ | 108 for (size_t i = 0U; i < ARRAY_SIZE(testval##shorttype##bits); i++) { \ |
| 89 const v##sign##int##bits##x##size a = vtest##sign##bits##x##size(i); \ | 109 const v##type##bits##x##size a = vtest##shorttype##bits##x##size(i); \ |
| 90 for (size_t j = 0U; j < ARRAY_SIZE(testval##sign##bits); j++) { \ | 110 for (size_t j = 0U; j < ARRAY_SIZE(testval##shorttype##bits); j++) { \ |
| 91 const v##sign##int##bits##x##size b = vtest##sign##bits##x##size(j); \ | 111 const v##type##bits##x##size b = vtest##shorttype##bits##x##size(j); \ |
| 92 ret |= test_arith_v##sign##int##bits##x##size##_add(a, b); \ | 112 ret |= test_arith_v##type##bits##x##size##_add(a, b); \ |
| 93 ret |= test_arith_v##sign##int##bits##x##size##_sub(a, b); \ | 113 ret |= test_arith_v##type##bits##x##size##_sub(a, b); \ |
| 94 ret |= test_arith_v##sign##int##bits##x##size##_mul(a, b); \ | 114 ret |= test_arith_v##type##bits##x##size##_mul(a, b); \ |
| 95 ret |= test_arith_v##sign##int##bits##x##size##_div(a, b); \ | 115 ret |= test_arith_v##type##bits##x##size##_div(a, b); \ |
| 96 ret |= test_arith_v##sign##int##bits##x##size##_mod(a, b); \ | 116 ret |= test_arith_v##type##bits##x##size##_mod(a, b); \ |
| 97 ret |= test_arith_v##sign##int##bits##x##size##_and(a, b); \ | 117 ret |= test_arith_v##type##bits##x##size##_and(a, b); \ |
| 98 ret |= test_arith_v##sign##int##bits##x##size##_or(a, b); \ | 118 ret |= test_arith_v##type##bits##x##size##_or(a, b); \ |
| 99 ret |= test_arith_v##sign##int##bits##x##size##_xor(a, b); \ | 119 ret |= test_arith_v##type##bits##x##size##_xor(a, b); \ |
| 100 ret |= test_arith_v##sign##int##bits##x##size##_avg(a, b); \ | 120 ret |= test_arith_v##type##bits##x##size##_avg(a, b); \ |
| 101 ret |= test_arith_v##sign##int##bits##x##size##_min(a, b); \ | 121 ret |= test_arith_v##type##bits##x##size##_min(a, b); \ |
| 102 ret |= test_arith_v##sign##int##bits##x##size##_max(a, b); \ | 122 ret |= test_arith_v##type##bits##x##size##_max(a, b); \ |
| 103 } \ | 123 } \ |
| 104 } \ | 124 } \ |
| 105 \ | 125 \ |
| 106 for (size_t i = 0U; i < ARRAY_SIZE(testval##sign##bits); i++) { \ | 126 for (size_t i = 0U; i < ARRAY_SIZE(testval##shorttype##bits); i++) { \ |
| 107 const v##sign##int##bits##x##size a = vtest##sign##bits##x##size(i); \ | 127 const v##type##bits##x##size a = vtest##shorttype##bits##x##size(i); \ |
| 108 for (uint32_t j = 0U; j < bits; j++) { \ | 128 for (uint32_t j = 0U; j < bits; j++) { \ |
| 109 const vuint##bits##x##size b = vuint##bits##x##size##_splat(j); \ | 129 const vuint##bits##x##size b = vuint##bits##x##size##_splat(j); \ |
| 110 ret |= test_arith_v##sign##int##bits##x##size##_rshift(a, b); \ | 130 ret |= test_arith_v##type##bits##x##size##_rshift(a, b); \ |
| 111 ret |= test_arith_v##sign##int##bits##x##size##_lshift(a, b); \ | 131 ret |= test_arith_v##type##bits##x##size##_lshift(a, b); \ |
| 112 ret |= test_arith_v##sign##int##bits##x##size##_lrshift(a, b); \ | 132 ret |= test_arith_v##type##bits##x##size##_lrshift(a, b); \ |
| 113 } \ | 133 } \ |
| 114 } | 134 } |
| 115 | 135 |
| 116 #define RUN_TESTS(bits, size) \ | 136 #define RUN_TESTS(bits, size) \ |
| 117 RUN_TESTS_SIGN( , bits, size) \ | 137 RUN_TESTS_SIGN( , int, bits, size) \ |
| 118 RUN_TESTS_SIGN(u, bits, size) | 138 RUN_TESTS_SIGN(u, uint, bits, size) |
| | 139 |
| | 140 #define RUN_TESTS_FLOAT(shorttype, type, bits, size) \ |
| | 141 for (size_t i = 0U; i < ARRAY_SIZE(testval##shorttype##bits); i++) { \ |
| | 142 const v##type##bits##x##size a = vtest##shorttype##bits##x##size(i); \ |
| | 143 for (size_t j = 0U; j < ARRAY_SIZE(testval##shorttype##bits); j++) { \ |
| | 144 const v##type##bits##x##size b = vtest##shorttype##bits##x##size(j); \ |
| | 145 ret |= test_arith_v##type##bits##x##size##_add(a, b); \ |
| | 146 ret |= test_arith_v##type##bits##x##size##_sub(a, b); \ |
| | 147 ret |= test_arith_v##type##bits##x##size##_mul(a, b); \ |
| | 148 ret |= test_arith_v##type##bits##x##size##_div(a, b); \ |
| | 149 ret |= test_arith_v##type##bits##x##size##_mod(a, b); \ |
| | 150 ret |= test_arith_v##type##bits##x##size##_avg(a, b); \ |
| | 151 ret |= test_arith_v##type##bits##x##size##_min(a, b); \ |
| | 152 ret |= test_arith_v##type##bits##x##size##_max(a, b); \ |
| | 153 } \ |
| | 154 } |
| 119 | 155 |
| 120 RUN_TESTS(8, 2) | 156 RUN_TESTS(8, 2) |
| 121 | 157 |
| 122 RUN_TESTS(8, 4) | 158 RUN_TESTS(8, 4) |
| 123 RUN_TESTS(16, 2) | 159 RUN_TESTS(16, 2) |
| 139 RUN_TESTS(8, 64) | 175 RUN_TESTS(8, 64) |
| 140 RUN_TESTS(16, 32) | 176 RUN_TESTS(16, 32) |
| 141 RUN_TESTS(32, 16) | 177 RUN_TESTS(32, 16) |
| 142 RUN_TESTS(64, 8) | 178 RUN_TESTS(64, 8) |
| 143 | 179 |
| | 180 RUN_TESTS_FLOAT(f, f, 32, 2) |
| | 181 RUN_TESTS_FLOAT(f, f, 32, 4) |
| | 182 RUN_TESTS_FLOAT(f, f, 32, 8) |
| | 183 RUN_TESTS_FLOAT(f, f, 32, 16) |
| | 184 |
| | 185 RUN_TESTS_FLOAT(f, f, 64, 2) |
| | 186 RUN_TESTS_FLOAT(f, f, 64, 4) |
| | 187 RUN_TESTS_FLOAT(f, f, 64, 8) |
| | 188 |
| | 189 #undef RUN_TESTS_FLOAT |
| 144 #undef RUN_TESTS_SIGN | 190 #undef RUN_TESTS_SIGN |
| 145 #undef RUN_TESTS | 191 #undef RUN_TESTS |
| 146 | 192 |
| 147 return ret; | 193 return ret; |
| 148 } | 194 } |
