1*8598f5faSAleksandar Markovic /* 2*8598f5faSAleksandar Markovic * Test program for MSA instruction FMIN.W 3*8598f5faSAleksandar Markovic * 4*8598f5faSAleksandar Markovic * Copyright (C) 2019 Wave Computing, Inc. 5*8598f5faSAleksandar Markovic * Copyright (C) 2019 Aleksandar Markovic <amarkovic@wavecomp.com> 6*8598f5faSAleksandar Markovic * 7*8598f5faSAleksandar Markovic * This program is free software: you can redistribute it and/or modify 8*8598f5faSAleksandar Markovic * it under the terms of the GNU General Public License as published by 9*8598f5faSAleksandar Markovic * the Free Software Foundation, either version 2 of the License, or 10*8598f5faSAleksandar Markovic * (at your option) any later version. 11*8598f5faSAleksandar Markovic * 12*8598f5faSAleksandar Markovic * This program is distributed in the hope that it will be useful, 13*8598f5faSAleksandar Markovic * but WITHOUT ANY WARRANTY; without even the implied warranty of 14*8598f5faSAleksandar Markovic * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 15*8598f5faSAleksandar Markovic * GNU General Public License for more details. 16*8598f5faSAleksandar Markovic * 17*8598f5faSAleksandar Markovic * You should have received a copy of the GNU General Public License 18*8598f5faSAleksandar Markovic * along with this program. If not, see <https://www.gnu.org/licenses/>. 19*8598f5faSAleksandar Markovic * 20*8598f5faSAleksandar Markovic */ 21*8598f5faSAleksandar Markovic 22*8598f5faSAleksandar Markovic #include <sys/time.h> 23*8598f5faSAleksandar Markovic #include <stdint.h> 24*8598f5faSAleksandar Markovic 25*8598f5faSAleksandar Markovic #include "../../../../include/wrappers_msa.h" 26*8598f5faSAleksandar Markovic #include "../../../../include/test_inputs_128.h" 27*8598f5faSAleksandar Markovic #include "../../../../include/test_utils_128.h" 28*8598f5faSAleksandar Markovic 29*8598f5faSAleksandar Markovic #define TEST_COUNT_TOTAL ( \ 30*8598f5faSAleksandar Markovic (PATTERN_INPUTS_SHORT_COUNT) * (PATTERN_INPUTS_SHORT_COUNT) + \ 31*8598f5faSAleksandar Markovic (RANDOM_INPUTS_SHORT_COUNT) * (RANDOM_INPUTS_SHORT_COUNT)) 32*8598f5faSAleksandar Markovic 33*8598f5faSAleksandar Markovic 34*8598f5faSAleksandar Markovic int32_t main(void) 35*8598f5faSAleksandar Markovic { 36*8598f5faSAleksandar Markovic char *instruction_name = "FMIN.W"; 37*8598f5faSAleksandar Markovic int32_t ret; 38*8598f5faSAleksandar Markovic uint32_t i, j; 39*8598f5faSAleksandar Markovic struct timeval start, end; 40*8598f5faSAleksandar Markovic double elapsed_time; 41*8598f5faSAleksandar Markovic 42*8598f5faSAleksandar Markovic uint64_t b128_result[TEST_COUNT_TOTAL][2]; 43*8598f5faSAleksandar Markovic uint64_t b128_expect[TEST_COUNT_TOTAL][2] = { 44*8598f5faSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, /* 0 */ 45*8598f5faSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 46*8598f5faSAleksandar Markovic { 0xaaaaaaaaaaaaaaaaULL, 0xaaaaaaaaaaaaaaaaULL, }, 47*8598f5faSAleksandar Markovic { 0x5555555555555555ULL, 0x5555555555555555ULL, }, 48*8598f5faSAleksandar Markovic { 0xccccccccccccccccULL, 0xccccccccccccccccULL, }, 49*8598f5faSAleksandar Markovic { 0x3333333333333333ULL, 0x3333333333333333ULL, }, 50*8598f5faSAleksandar Markovic { 0xe38e38e38e38e38eULL, 0x38e38e38e38e38e3ULL, }, 51*8598f5faSAleksandar Markovic { 0x1c71c71c71c71c71ULL, 0xc71c71c71c71c71cULL, }, 52*8598f5faSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, /* 8 */ 53*8598f5faSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 54*8598f5faSAleksandar Markovic { 0xaaaaaaaaaaaaaaaaULL, 0xaaaaaaaaaaaaaaaaULL, }, 55*8598f5faSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 56*8598f5faSAleksandar Markovic { 0xccccccccccccccccULL, 0xccccccccccccccccULL, }, 57*8598f5faSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 58*8598f5faSAleksandar Markovic { 0xe38e38e38e38e38eULL, 0x00000000e38e38e3ULL, }, 59*8598f5faSAleksandar Markovic { 0x0000000000000000ULL, 0xc71c71c700000000ULL, }, 60*8598f5faSAleksandar Markovic { 0xaaaaaaaaaaaaaaaaULL, 0xaaaaaaaaaaaaaaaaULL, }, /* 16 */ 61*8598f5faSAleksandar Markovic { 0xaaaaaaaaaaaaaaaaULL, 0xaaaaaaaaaaaaaaaaULL, }, 62*8598f5faSAleksandar Markovic { 0xaaaaaaaaaaaaaaaaULL, 0xaaaaaaaaaaaaaaaaULL, }, 63*8598f5faSAleksandar Markovic { 0xaaaaaaaaaaaaaaaaULL, 0xaaaaaaaaaaaaaaaaULL, }, 64*8598f5faSAleksandar Markovic { 0xccccccccccccccccULL, 0xccccccccccccccccULL, }, 65*8598f5faSAleksandar Markovic { 0xaaaaaaaaaaaaaaaaULL, 0xaaaaaaaaaaaaaaaaULL, }, 66*8598f5faSAleksandar Markovic { 0xe38e38e3aaaaaaaaULL, 0xaaaaaaaae38e38e3ULL, }, 67*8598f5faSAleksandar Markovic { 0xaaaaaaaaaaaaaaaaULL, 0xc71c71c7aaaaaaaaULL, }, 68*8598f5faSAleksandar Markovic { 0x5555555555555555ULL, 0x5555555555555555ULL, }, /* 24 */ 69*8598f5faSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 70*8598f5faSAleksandar Markovic { 0xaaaaaaaaaaaaaaaaULL, 0xaaaaaaaaaaaaaaaaULL, }, 71*8598f5faSAleksandar Markovic { 0x5555555555555555ULL, 0x5555555555555555ULL, }, 72*8598f5faSAleksandar Markovic { 0xccccccccccccccccULL, 0xccccccccccccccccULL, }, 73*8598f5faSAleksandar Markovic { 0x3333333333333333ULL, 0x3333333333333333ULL, }, 74*8598f5faSAleksandar Markovic { 0xe38e38e38e38e38eULL, 0x38e38e38e38e38e3ULL, }, 75*8598f5faSAleksandar Markovic { 0x1c71c71c55555555ULL, 0xc71c71c71c71c71cULL, }, 76*8598f5faSAleksandar Markovic { 0xccccccccccccccccULL, 0xccccccccccccccccULL, }, /* 32 */ 77*8598f5faSAleksandar Markovic { 0xccccccccccccccccULL, 0xccccccccccccccccULL, }, 78*8598f5faSAleksandar Markovic { 0xccccccccccccccccULL, 0xccccccccccccccccULL, }, 79*8598f5faSAleksandar Markovic { 0xccccccccccccccccULL, 0xccccccccccccccccULL, }, 80*8598f5faSAleksandar Markovic { 0xccccccccccccccccULL, 0xccccccccccccccccULL, }, 81*8598f5faSAleksandar Markovic { 0xccccccccccccccccULL, 0xccccccccccccccccULL, }, 82*8598f5faSAleksandar Markovic { 0xe38e38e3ccccccccULL, 0xcccccccce38e38e3ULL, }, 83*8598f5faSAleksandar Markovic { 0xccccccccccccccccULL, 0xccccccccccccccccULL, }, 84*8598f5faSAleksandar Markovic { 0x3333333333333333ULL, 0x3333333333333333ULL, }, /* 40 */ 85*8598f5faSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 86*8598f5faSAleksandar Markovic { 0xaaaaaaaaaaaaaaaaULL, 0xaaaaaaaaaaaaaaaaULL, }, 87*8598f5faSAleksandar Markovic { 0x3333333333333333ULL, 0x3333333333333333ULL, }, 88*8598f5faSAleksandar Markovic { 0xccccccccccccccccULL, 0xccccccccccccccccULL, }, 89*8598f5faSAleksandar Markovic { 0x3333333333333333ULL, 0x3333333333333333ULL, }, 90*8598f5faSAleksandar Markovic { 0xe38e38e38e38e38eULL, 0x33333333e38e38e3ULL, }, 91*8598f5faSAleksandar Markovic { 0x1c71c71c33333333ULL, 0xc71c71c71c71c71cULL, }, 92*8598f5faSAleksandar Markovic { 0xe38e38e38e38e38eULL, 0x38e38e38e38e38e3ULL, }, /* 48 */ 93*8598f5faSAleksandar Markovic { 0xe38e38e38e38e38eULL, 0x00000000e38e38e3ULL, }, 94*8598f5faSAleksandar Markovic { 0xe38e38e3aaaaaaaaULL, 0xaaaaaaaae38e38e3ULL, }, 95*8598f5faSAleksandar Markovic { 0xe38e38e38e38e38eULL, 0x38e38e38e38e38e3ULL, }, 96*8598f5faSAleksandar Markovic { 0xe38e38e3ccccccccULL, 0xcccccccce38e38e3ULL, }, 97*8598f5faSAleksandar Markovic { 0xe38e38e38e38e38eULL, 0x33333333e38e38e3ULL, }, 98*8598f5faSAleksandar Markovic { 0xe38e38e38e38e38eULL, 0x38e38e38e38e38e3ULL, }, 99*8598f5faSAleksandar Markovic { 0xe38e38e38e38e38eULL, 0xc71c71c7e38e38e3ULL, }, 100*8598f5faSAleksandar Markovic { 0x1c71c71c71c71c71ULL, 0xc71c71c71c71c71cULL, }, /* 56 */ 101*8598f5faSAleksandar Markovic { 0x0000000000000000ULL, 0xc71c71c700000000ULL, }, 102*8598f5faSAleksandar Markovic { 0xaaaaaaaaaaaaaaaaULL, 0xc71c71c7aaaaaaaaULL, }, 103*8598f5faSAleksandar Markovic { 0x1c71c71c55555555ULL, 0xc71c71c71c71c71cULL, }, 104*8598f5faSAleksandar Markovic { 0xccccccccccccccccULL, 0xccccccccccccccccULL, }, 105*8598f5faSAleksandar Markovic { 0x1c71c71c33333333ULL, 0xc71c71c71c71c71cULL, }, 106*8598f5faSAleksandar Markovic { 0xe38e38e38e38e38eULL, 0xc71c71c7e38e38e3ULL, }, 107*8598f5faSAleksandar Markovic { 0x1c71c71c71c71c71ULL, 0xc71c71c71c71c71cULL, }, 108*8598f5faSAleksandar Markovic { 0x886ae6cc28625540ULL, 0x4b670b5efe7bb00cULL, }, /* 64 */ 109*8598f5faSAleksandar Markovic { 0xfbbe006328625540ULL, 0x12f7bb1afe7bb00cULL, }, 110*8598f5faSAleksandar Markovic { 0xac5aaeaab9cf8b80ULL, 0x27d8c6fffe7bb00cULL, }, 111*8598f5faSAleksandar Markovic { 0x886ae6cc28625540ULL, 0x8df188d8fe7bb00cULL, }, 112*8598f5faSAleksandar Markovic { 0xfbbe006328625540ULL, 0x12f7bb1afe7bb00cULL, }, 113*8598f5faSAleksandar Markovic { 0xfbbe00634d93c708ULL, 0x12f7bb1a153f52fcULL, }, 114*8598f5faSAleksandar Markovic { 0xfbbe0063b9cf8b80ULL, 0x12f7bb1aab2b2514ULL, }, 115*8598f5faSAleksandar Markovic { 0xfbbe00634d93c708ULL, 0x8df188d8a942e2a0ULL, }, 116*8598f5faSAleksandar Markovic { 0xac5aaeaab9cf8b80ULL, 0x27d8c6fffe7bb00cULL, }, /* 72 */ 117*8598f5faSAleksandar Markovic { 0xfbbe0063b9cf8b80ULL, 0x12f7bb1aab2b2514ULL, }, 118*8598f5faSAleksandar Markovic { 0xac5aaeaab9cf8b80ULL, 0x27d8c6ffab2b2514ULL, }, 119*8598f5faSAleksandar Markovic { 0xac5aaeaab9cf8b80ULL, 0x8df188d8ab2b2514ULL, }, 120*8598f5faSAleksandar Markovic { 0x886ae6cc28625540ULL, 0x8df188d8fe7bb00cULL, }, 121*8598f5faSAleksandar Markovic { 0xfbbe00634d93c708ULL, 0x8df188d8a942e2a0ULL, }, 122*8598f5faSAleksandar Markovic { 0xac5aaeaab9cf8b80ULL, 0x8df188d8ab2b2514ULL, }, 123*8598f5faSAleksandar Markovic { 0x704f164d5e31e24eULL, 0x8df188d8a942e2a0ULL, }, 124*8598f5faSAleksandar Markovic }; 125*8598f5faSAleksandar Markovic 126*8598f5faSAleksandar Markovic reset_msa_registers(); 127*8598f5faSAleksandar Markovic 128*8598f5faSAleksandar Markovic gettimeofday(&start, NULL); 129*8598f5faSAleksandar Markovic 130*8598f5faSAleksandar Markovic for (i = 0; i < PATTERN_INPUTS_SHORT_COUNT; i++) { 131*8598f5faSAleksandar Markovic for (j = 0; j < PATTERN_INPUTS_SHORT_COUNT; j++) { 132*8598f5faSAleksandar Markovic do_msa_FMIN_W(b128_pattern[i], b128_pattern[j], 133*8598f5faSAleksandar Markovic b128_result[PATTERN_INPUTS_SHORT_COUNT * i + j]); 134*8598f5faSAleksandar Markovic } 135*8598f5faSAleksandar Markovic } 136*8598f5faSAleksandar Markovic 137*8598f5faSAleksandar Markovic for (i = 0; i < RANDOM_INPUTS_SHORT_COUNT; i++) { 138*8598f5faSAleksandar Markovic for (j = 0; j < RANDOM_INPUTS_SHORT_COUNT; j++) { 139*8598f5faSAleksandar Markovic do_msa_FMIN_W(b128_random[i], b128_random[j], 140*8598f5faSAleksandar Markovic b128_result[((PATTERN_INPUTS_SHORT_COUNT) * 141*8598f5faSAleksandar Markovic (PATTERN_INPUTS_SHORT_COUNT)) + 142*8598f5faSAleksandar Markovic RANDOM_INPUTS_SHORT_COUNT * i + j]); 143*8598f5faSAleksandar Markovic } 144*8598f5faSAleksandar Markovic } 145*8598f5faSAleksandar Markovic 146*8598f5faSAleksandar Markovic gettimeofday(&end, NULL); 147*8598f5faSAleksandar Markovic 148*8598f5faSAleksandar Markovic elapsed_time = (end.tv_sec - start.tv_sec) * 1000.0; 149*8598f5faSAleksandar Markovic elapsed_time += (end.tv_usec - start.tv_usec) / 1000.0; 150*8598f5faSAleksandar Markovic 151*8598f5faSAleksandar Markovic ret = check_results(instruction_name, TEST_COUNT_TOTAL, elapsed_time, 152*8598f5faSAleksandar Markovic &b128_result[0][0], &b128_expect[0][0]); 153*8598f5faSAleksandar Markovic 154*8598f5faSAleksandar Markovic return ret; 155*8598f5faSAleksandar Markovic } 156