1520e210cSAleksandar Markovic /* 2520e210cSAleksandar Markovic * Test program for MSA instruction CLT_S.D 3520e210cSAleksandar Markovic * 4*dd8d6a2dSAleksandar Markovic * Copyright (C) 2019 Wave Computing, Inc. 5*dd8d6a2dSAleksandar Markovic * Copyright (C) 2019 Aleksandar Markovic <amarkovic@wavecomp.com> 6520e210cSAleksandar Markovic * 7520e210cSAleksandar Markovic * This program is free software: you can redistribute it and/or modify 8520e210cSAleksandar Markovic * it under the terms of the GNU General Public License as published by 9520e210cSAleksandar Markovic * the Free Software Foundation, either version 2 of the License, or 10520e210cSAleksandar Markovic * (at your option) any later version. 11520e210cSAleksandar Markovic * 12520e210cSAleksandar Markovic * This program is distributed in the hope that it will be useful, 13520e210cSAleksandar Markovic * but WITHOUT ANY WARRANTY; without even the implied warranty of 14520e210cSAleksandar Markovic * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 15520e210cSAleksandar Markovic * GNU General Public License for more details. 16520e210cSAleksandar Markovic * 17520e210cSAleksandar Markovic * You should have received a copy of the GNU General Public License 18520e210cSAleksandar Markovic * along with this program. If not, see <https://www.gnu.org/licenses/>. 19520e210cSAleksandar Markovic * 20520e210cSAleksandar Markovic */ 21520e210cSAleksandar Markovic 22520e210cSAleksandar Markovic #include <sys/time.h> 23520e210cSAleksandar Markovic #include <stdint.h> 24520e210cSAleksandar Markovic 25520e210cSAleksandar Markovic #include "../../../../include/wrappers_msa.h" 26520e210cSAleksandar Markovic #include "../../../../include/test_inputs.h" 27520e210cSAleksandar Markovic #include "../../../../include/test_utils.h" 28520e210cSAleksandar Markovic 29520e210cSAleksandar Markovic #define TEST_COUNT_TOTAL ( \ 30520e210cSAleksandar Markovic (PATTERN_INPUTS_SHORT_COUNT) * (PATTERN_INPUTS_SHORT_COUNT) + \ 31520e210cSAleksandar Markovic (RANDOM_INPUTS_SHORT_COUNT) * (RANDOM_INPUTS_SHORT_COUNT)) 32520e210cSAleksandar Markovic 33520e210cSAleksandar Markovic 34520e210cSAleksandar Markovic int32_t main(void) 35520e210cSAleksandar Markovic { 36520e210cSAleksandar Markovic char *instruction_name = "CLT_S.D"; 37520e210cSAleksandar Markovic int32_t ret; 38520e210cSAleksandar Markovic uint32_t i, j; 39520e210cSAleksandar Markovic struct timeval start, end; 40520e210cSAleksandar Markovic double elapsed_time; 41520e210cSAleksandar Markovic 42520e210cSAleksandar Markovic uint64_t b128_result[TEST_COUNT_TOTAL][2]; 43520e210cSAleksandar Markovic uint64_t b128_expect[TEST_COUNT_TOTAL][2] = { 44520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, /* 0 */ 45520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 46520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 47520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 48520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 49520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 50520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0xffffffffffffffffULL, }, 51520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0x0000000000000000ULL, }, 52520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, /* 8 */ 53520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 54520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 55520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 56520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 57520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 58520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0xffffffffffffffffULL, }, 59520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0x0000000000000000ULL, }, 60520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, /* 16 */ 61520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 62520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 63520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 64520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 65520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 66520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 67520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 68520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, /* 24 */ 69520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 70520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 71520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 72520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 73520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 74520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 75520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 76520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, /* 32 */ 77520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 78520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 79520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 80520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 81520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 82520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 83520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0x0000000000000000ULL, }, 84520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, /* 40 */ 85520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 86520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 87520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 88520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 89520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 90520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0xffffffffffffffffULL, }, 91520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 92520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0x0000000000000000ULL, }, /* 48 */ 93520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0x0000000000000000ULL, }, 94520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 95520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 96520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 97520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0x0000000000000000ULL, }, 98520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 99520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0x0000000000000000ULL, }, 100520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0xffffffffffffffffULL, }, /* 56 */ 101520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0xffffffffffffffffULL, }, 102520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 103520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 104520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0xffffffffffffffffULL, }, 105520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0xffffffffffffffffULL, }, 106520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0xffffffffffffffffULL, }, 107520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 108520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, /* 64 */ 109520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0x0000000000000000ULL, }, 110520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0x0000000000000000ULL, }, 111520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0x0000000000000000ULL, }, 112520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0xffffffffffffffffULL, }, 113520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 114520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0xffffffffffffffffULL, }, 115520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0x0000000000000000ULL, }, 116520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0xffffffffffffffffULL, }, /* 72 */ 117520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0x0000000000000000ULL, }, 118520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 119520e210cSAleksandar Markovic { 0xffffffffffffffffULL, 0x0000000000000000ULL, }, 120520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0xffffffffffffffffULL, }, 121520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0xffffffffffffffffULL, }, 122520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0xffffffffffffffffULL, }, 123520e210cSAleksandar Markovic { 0x0000000000000000ULL, 0x0000000000000000ULL, }, 124520e210cSAleksandar Markovic }; 125520e210cSAleksandar Markovic 126520e210cSAleksandar Markovic gettimeofday(&start, NULL); 127520e210cSAleksandar Markovic 128520e210cSAleksandar Markovic for (i = 0; i < PATTERN_INPUTS_SHORT_COUNT; i++) { 129520e210cSAleksandar Markovic for (j = 0; j < PATTERN_INPUTS_SHORT_COUNT; j++) { 130520e210cSAleksandar Markovic do_msa_CLT_S_D(b128_pattern[i], b128_pattern[j], 131520e210cSAleksandar Markovic b128_result[PATTERN_INPUTS_SHORT_COUNT * i + j]); 132520e210cSAleksandar Markovic } 133520e210cSAleksandar Markovic } 134520e210cSAleksandar Markovic 135520e210cSAleksandar Markovic for (i = 0; i < RANDOM_INPUTS_SHORT_COUNT; i++) { 136520e210cSAleksandar Markovic for (j = 0; j < RANDOM_INPUTS_SHORT_COUNT; j++) { 137520e210cSAleksandar Markovic do_msa_CLT_S_D(b128_random[i], b128_random[j], 138520e210cSAleksandar Markovic b128_result[((PATTERN_INPUTS_SHORT_COUNT) * 139520e210cSAleksandar Markovic (PATTERN_INPUTS_SHORT_COUNT)) + 140520e210cSAleksandar Markovic RANDOM_INPUTS_SHORT_COUNT * i + j]); 141520e210cSAleksandar Markovic } 142520e210cSAleksandar Markovic } 143520e210cSAleksandar Markovic 144520e210cSAleksandar Markovic gettimeofday(&end, NULL); 145520e210cSAleksandar Markovic 146520e210cSAleksandar Markovic elapsed_time = (end.tv_sec - start.tv_sec) * 1000.0; 147520e210cSAleksandar Markovic elapsed_time += (end.tv_usec - start.tv_usec) / 1000.0; 148520e210cSAleksandar Markovic 149520e210cSAleksandar Markovic ret = check_results(instruction_name, TEST_COUNT_TOTAL, elapsed_time, 150520e210cSAleksandar Markovic &b128_result[0][0], &b128_expect[0][0]); 151520e210cSAleksandar Markovic 152520e210cSAleksandar Markovic return ret; 153520e210cSAleksandar Markovic } 154