1*750541c4SAleksandar Markovic /* 2*750541c4SAleksandar Markovic * Test program for MSA instruction HSUB_U.H 3*750541c4SAleksandar Markovic * 4*750541c4SAleksandar Markovic * Copyright (C) 2019 Wave Computing, Inc. 5*750541c4SAleksandar Markovic * Copyright (C) 2019 Aleksandar Markovic <amarkovic@wavecomp.com> 6*750541c4SAleksandar Markovic * Copyright (C) 2019 RT-RK Computer Based Systems LLC 7*750541c4SAleksandar Markovic * Copyright (C) 2019 Mateja Marjanovic <mateja.marjanovic@rt-rk.com> 8*750541c4SAleksandar Markovic * 9*750541c4SAleksandar Markovic * This program is free software: you can redistribute it and/or modify 10*750541c4SAleksandar Markovic * it under the terms of the GNU General Public License as published by 11*750541c4SAleksandar Markovic * the Free Software Foundation, either version 2 of the License, or 12*750541c4SAleksandar Markovic * (at your option) any later version. 13*750541c4SAleksandar Markovic * 14*750541c4SAleksandar Markovic * This program is distributed in the hope that it will be useful, 15*750541c4SAleksandar Markovic * but WITHOUT ANY WARRANTY; without even the implied warranty of 16*750541c4SAleksandar Markovic * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 17*750541c4SAleksandar Markovic * GNU General Public License for more details. 18*750541c4SAleksandar Markovic * 19*750541c4SAleksandar Markovic * You should have received a copy of the GNU General Public License 20*750541c4SAleksandar Markovic * along with this program. If not, see <https://www.gnu.org/licenses/>. 21*750541c4SAleksandar Markovic * 22*750541c4SAleksandar Markovic */ 23*750541c4SAleksandar Markovic 24*750541c4SAleksandar Markovic #include <sys/time.h> 25*750541c4SAleksandar Markovic #include <stdint.h> 26*750541c4SAleksandar Markovic 27*750541c4SAleksandar Markovic #include "../../../../include/wrappers_msa.h" 28*750541c4SAleksandar Markovic #include "../../../../include/test_inputs_128.h" 29*750541c4SAleksandar Markovic #include "../../../../include/test_utils_128.h" 30*750541c4SAleksandar Markovic 31*750541c4SAleksandar Markovic #define TEST_COUNT_TOTAL ( \ 32*750541c4SAleksandar Markovic (PATTERN_INPUTS_SHORT_COUNT) * (PATTERN_INPUTS_SHORT_COUNT) + \ 33*750541c4SAleksandar Markovic (RANDOM_INPUTS_SHORT_COUNT) * (RANDOM_INPUTS_SHORT_COUNT)) 34*750541c4SAleksandar Markovic 35*750541c4SAleksandar Markovic 36*750541c4SAleksandar Markovic int32_t main(void) 37*750541c4SAleksandar Markovic { 38*750541c4SAleksandar Markovic char *instruction_name = "HSUB_U.H"; 39*750541c4SAleksandar Markovic int32_t ret; 40*750541c4SAleksandar Markovic uint32_t i, j; 41*750541c4SAleksandar Markovic struct timeval start, end; 42*750541c4SAleksandar Markovic double elapsed_time; 43*750541c4SAleksandar Markovic 44*750541c4SAleksandar Markovic uint64_t b128_result[TEST_COUNT_TOTAL][2]; 45*750541c4SAleksandar Markovic uint64_t b128_expect[TEST_COUNT_TOTAL][2] = { 46*750541c4SAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, /* 0 */ 47*750541c4SAleksandar Markovic { 0x00ff00ff00ff00ffULL, 0x00ff00ff00ff00ffULL, }, 48*750541c4SAleksandar Markovic { 0x0055005500550055ULL, 0x0055005500550055ULL, }, 49*750541c4SAleksandar Markovic { 0x00aa00aa00aa00aaULL, 0x00aa00aa00aa00aaULL, }, 50*750541c4SAleksandar Markovic { 0x0033003300330033ULL, 0x0033003300330033ULL, }, 51*750541c4SAleksandar Markovic { 0x00cc00cc00cc00ccULL, 0x00cc00cc00cc00ccULL, }, 52*750541c4SAleksandar Markovic { 0x0071001c00c70071ULL, 0x001c00c70071001cULL, }, 53*750541c4SAleksandar Markovic { 0x008e00e30038008eULL, 0x00e30038008e00e3ULL, }, 54*750541c4SAleksandar Markovic { 0xff01ff01ff01ff01ULL, 0xff01ff01ff01ff01ULL, }, /* 8 */ 55*750541c4SAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 56*750541c4SAleksandar Markovic { 0xff56ff56ff56ff56ULL, 0xff56ff56ff56ff56ULL, }, 57*750541c4SAleksandar Markovic { 0xffabffabffabffabULL, 0xffabffabffabffabULL, }, 58*750541c4SAleksandar Markovic { 0xff34ff34ff34ff34ULL, 0xff34ff34ff34ff34ULL, }, 59*750541c4SAleksandar Markovic { 0xffcdffcdffcdffcdULL, 0xffcdffcdffcdffcdULL, }, 60*750541c4SAleksandar Markovic { 0xff72ff1dffc8ff72ULL, 0xff1dffc8ff72ff1dULL, }, 61*750541c4SAleksandar Markovic { 0xff8fffe4ff39ff8fULL, 0xffe4ff39ff8fffe4ULL, }, 62*750541c4SAleksandar Markovic { 0xffabffabffabffabULL, 0xffabffabffabffabULL, }, /* 16 */ 63*750541c4SAleksandar Markovic { 0x00aa00aa00aa00aaULL, 0x00aa00aa00aa00aaULL, }, 64*750541c4SAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 65*750541c4SAleksandar Markovic { 0x0055005500550055ULL, 0x0055005500550055ULL, }, 66*750541c4SAleksandar Markovic { 0xffdeffdeffdeffdeULL, 0xffdeffdeffdeffdeULL, }, 67*750541c4SAleksandar Markovic { 0x0077007700770077ULL, 0x0077007700770077ULL, }, 68*750541c4SAleksandar Markovic { 0x001cffc70072001cULL, 0xffc70072001cffc7ULL, }, 69*750541c4SAleksandar Markovic { 0x0039008effe30039ULL, 0x008effe30039008eULL, }, 70*750541c4SAleksandar Markovic { 0xff56ff56ff56ff56ULL, 0xff56ff56ff56ff56ULL, }, /* 24 */ 71*750541c4SAleksandar Markovic { 0x0055005500550055ULL, 0x0055005500550055ULL, }, 72*750541c4SAleksandar Markovic { 0xffabffabffabffabULL, 0xffabffabffabffabULL, }, 73*750541c4SAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 74*750541c4SAleksandar Markovic { 0xff89ff89ff89ff89ULL, 0xff89ff89ff89ff89ULL, }, 75*750541c4SAleksandar Markovic { 0x0022002200220022ULL, 0x0022002200220022ULL, }, 76*750541c4SAleksandar Markovic { 0xffc7ff72001dffc7ULL, 0xff72001dffc7ff72ULL, }, 77*750541c4SAleksandar Markovic { 0xffe40039ff8effe4ULL, 0x0039ff8effe40039ULL, }, 78*750541c4SAleksandar Markovic { 0xffcdffcdffcdffcdULL, 0xffcdffcdffcdffcdULL, }, /* 32 */ 79*750541c4SAleksandar Markovic { 0x00cc00cc00cc00ccULL, 0x00cc00cc00cc00ccULL, }, 80*750541c4SAleksandar Markovic { 0x0022002200220022ULL, 0x0022002200220022ULL, }, 81*750541c4SAleksandar Markovic { 0x0077007700770077ULL, 0x0077007700770077ULL, }, 82*750541c4SAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 83*750541c4SAleksandar Markovic { 0x0099009900990099ULL, 0x0099009900990099ULL, }, 84*750541c4SAleksandar Markovic { 0x003effe90094003eULL, 0xffe90094003effe9ULL, }, 85*750541c4SAleksandar Markovic { 0x005b00b00005005bULL, 0x00b00005005b00b0ULL, }, 86*750541c4SAleksandar Markovic { 0xff34ff34ff34ff34ULL, 0xff34ff34ff34ff34ULL, }, /* 40 */ 87*750541c4SAleksandar Markovic { 0x0033003300330033ULL, 0x0033003300330033ULL, }, 88*750541c4SAleksandar Markovic { 0xff89ff89ff89ff89ULL, 0xff89ff89ff89ff89ULL, }, 89*750541c4SAleksandar Markovic { 0xffdeffdeffdeffdeULL, 0xffdeffdeffdeffdeULL, }, 90*750541c4SAleksandar Markovic { 0xff67ff67ff67ff67ULL, 0xff67ff67ff67ff67ULL, }, 91*750541c4SAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 92*750541c4SAleksandar Markovic { 0xffa5ff50fffbffa5ULL, 0xff50fffbffa5ff50ULL, }, 93*750541c4SAleksandar Markovic { 0xffc20017ff6cffc2ULL, 0x0017ff6cffc20017ULL, }, 94*750541c4SAleksandar Markovic { 0xffe4ff39ff8fffe4ULL, 0xff39ff8fffe4ff39ULL, }, /* 48 */ 95*750541c4SAleksandar Markovic { 0x00e30038008e00e3ULL, 0x0038008e00e30038ULL, }, 96*750541c4SAleksandar Markovic { 0x0039ff8effe40039ULL, 0xff8effe40039ff8eULL, }, 97*750541c4SAleksandar Markovic { 0x008effe30039008eULL, 0xffe30039008effe3ULL, }, 98*750541c4SAleksandar Markovic { 0x0017ff6cffc20017ULL, 0xff6cffc20017ff6cULL, }, 99*750541c4SAleksandar Markovic { 0x00b00005005b00b0ULL, 0x0005005b00b00005ULL, }, 100*750541c4SAleksandar Markovic { 0x0055ff5500560055ULL, 0xff5500560055ff55ULL, }, 101*750541c4SAleksandar Markovic { 0x0072001cffc70072ULL, 0x001cffc70072001cULL, }, 102*750541c4SAleksandar Markovic { 0xff1dffc8ff72ff1dULL, 0xffc8ff72ff1dffc8ULL, }, /* 56 */ 103*750541c4SAleksandar Markovic { 0x001c00c70071001cULL, 0x00c70071001c00c7ULL, }, 104*750541c4SAleksandar Markovic { 0xff72001dffc7ff72ULL, 0x001dffc7ff72001dULL, }, 105*750541c4SAleksandar Markovic { 0xffc70072001cffc7ULL, 0x0072001cffc70072ULL, }, 106*750541c4SAleksandar Markovic { 0xff50fffbffa5ff50ULL, 0xfffbffa5ff50fffbULL, }, 107*750541c4SAleksandar Markovic { 0xffe90094003effe9ULL, 0x0094003effe90094ULL, }, 108*750541c4SAleksandar Markovic { 0xff8effe40039ff8eULL, 0xffe40039ff8effe4ULL, }, 109*750541c4SAleksandar Markovic { 0xffab00abffaaffabULL, 0x00abffaaffab00abULL, }, 110*750541c4SAleksandar Markovic { 0x001e001affc60015ULL, 0xffe4ffad008300a4ULL, }, /* 64 */ 111*750541c4SAleksandar Markovic { 0xffca0083ff95004dULL, 0xff54fff100bfffb4ULL, }, 112*750541c4SAleksandar Markovic { 0x002e003cff59ffd5ULL, 0xff73ff0c00d3009cULL, }, 113*750541c4SAleksandar Markovic { 0x00390099fff70007ULL, 0xff5aff3300bc0010ULL, }, 114*750541c4SAleksandar Markovic { 0x0091ff34ffeb0087ULL, 0xffab005dff9a0046ULL, }, 115*750541c4SAleksandar Markovic { 0x003dff9dffba00bfULL, 0xff1b00a1ffd6ff56ULL, }, 116*750541c4SAleksandar Markovic { 0x00a1ff56ff7e0047ULL, 0xff3affbcffea003eULL, }, 117*750541c4SAleksandar Markovic { 0x00acffb3001c0079ULL, 0xff21ffe3ffd3ffb2ULL, }, 118*750541c4SAleksandar Markovic { 0x0042ffe20057004bULL, 0xffc0006800300019ULL, }, /* 72 */ 119*750541c4SAleksandar Markovic { 0xffee004b00260083ULL, 0xff3000ac006cff29ULL, }, 120*750541c4SAleksandar Markovic { 0x00520004ffea000bULL, 0xff4fffc700800011ULL, }, 121*750541c4SAleksandar Markovic { 0x005d00610088003dULL, 0xff36ffee0069ff85ULL, }, 122*750541c4SAleksandar Markovic { 0x0006ff4afffc00a2ULL, 0x0026002a002e00d6ULL, }, 123*750541c4SAleksandar Markovic { 0xffb2ffb3ffcb00daULL, 0xff96006e006affe6ULL, }, 124*750541c4SAleksandar Markovic { 0x0016ff6cff8f0062ULL, 0xffb5ff89007e00ceULL, }, 125*750541c4SAleksandar Markovic { 0x0021ffc9002d0094ULL, 0xff9cffb000670042ULL, }, 126*750541c4SAleksandar Markovic }; 127*750541c4SAleksandar Markovic 128*750541c4SAleksandar Markovic gettimeofday(&start, NULL); 129*750541c4SAleksandar Markovic 130*750541c4SAleksandar Markovic for (i = 0; i < PATTERN_INPUTS_SHORT_COUNT; i++) { 131*750541c4SAleksandar Markovic for (j = 0; j < PATTERN_INPUTS_SHORT_COUNT; j++) { 132*750541c4SAleksandar Markovic do_msa_HSUB_U_H(b128_pattern[i], b128_pattern[j], 133*750541c4SAleksandar Markovic b128_result[PATTERN_INPUTS_SHORT_COUNT * i + j]); 134*750541c4SAleksandar Markovic } 135*750541c4SAleksandar Markovic } 136*750541c4SAleksandar Markovic 137*750541c4SAleksandar Markovic for (i = 0; i < RANDOM_INPUTS_SHORT_COUNT; i++) { 138*750541c4SAleksandar Markovic for (j = 0; j < RANDOM_INPUTS_SHORT_COUNT; j++) { 139*750541c4SAleksandar Markovic do_msa_HSUB_U_H(b128_random[i], b128_random[j], 140*750541c4SAleksandar Markovic b128_result[((PATTERN_INPUTS_SHORT_COUNT) * 141*750541c4SAleksandar Markovic (PATTERN_INPUTS_SHORT_COUNT)) + 142*750541c4SAleksandar Markovic RANDOM_INPUTS_SHORT_COUNT * i + j]); 143*750541c4SAleksandar Markovic } 144*750541c4SAleksandar Markovic } 145*750541c4SAleksandar Markovic 146*750541c4SAleksandar Markovic gettimeofday(&end, NULL); 147*750541c4SAleksandar Markovic 148*750541c4SAleksandar Markovic elapsed_time = (end.tv_sec - start.tv_sec) * 1000.0; 149*750541c4SAleksandar Markovic elapsed_time += (end.tv_usec - start.tv_usec) / 1000.0; 150*750541c4SAleksandar Markovic 151*750541c4SAleksandar Markovic ret = check_results(instruction_name, TEST_COUNT_TOTAL, elapsed_time, 152*750541c4SAleksandar Markovic &b128_result[0][0], &b128_expect[0][0]); 153*750541c4SAleksandar Markovic 154*750541c4SAleksandar Markovic return ret; 155*750541c4SAleksandar Markovic } 156