1520e210cSAleksandar Markovic /*
2520e210cSAleksandar Markovic  *  Test program for MSA instruction CLT_S.D
3520e210cSAleksandar Markovic  *
4*dd8d6a2dSAleksandar Markovic  *  Copyright (C) 2019  Wave Computing, Inc.
5*dd8d6a2dSAleksandar Markovic  *  Copyright (C) 2019  Aleksandar Markovic <amarkovic@wavecomp.com>
6520e210cSAleksandar Markovic  *
7520e210cSAleksandar Markovic  *  This program is free software: you can redistribute it and/or modify
8520e210cSAleksandar Markovic  *  it under the terms of the GNU General Public License as published by
9520e210cSAleksandar Markovic  *  the Free Software Foundation, either version 2 of the License, or
10520e210cSAleksandar Markovic  *  (at your option) any later version.
11520e210cSAleksandar Markovic  *
12520e210cSAleksandar Markovic  *  This program is distributed in the hope that it will be useful,
13520e210cSAleksandar Markovic  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
14520e210cSAleksandar Markovic  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15520e210cSAleksandar Markovic  *  GNU General Public License for more details.
16520e210cSAleksandar Markovic  *
17520e210cSAleksandar Markovic  *  You should have received a copy of the GNU General Public License
18520e210cSAleksandar Markovic  *  along with this program.  If not, see <https://www.gnu.org/licenses/>.
19520e210cSAleksandar Markovic  *
20520e210cSAleksandar Markovic  */
21520e210cSAleksandar Markovic 
22520e210cSAleksandar Markovic #include <sys/time.h>
23520e210cSAleksandar Markovic #include <stdint.h>
24520e210cSAleksandar Markovic 
25520e210cSAleksandar Markovic #include "../../../../include/wrappers_msa.h"
26520e210cSAleksandar Markovic #include "../../../../include/test_inputs.h"
27520e210cSAleksandar Markovic #include "../../../../include/test_utils.h"
28520e210cSAleksandar Markovic 
29520e210cSAleksandar Markovic #define TEST_COUNT_TOTAL (                                                \
30520e210cSAleksandar Markovic             (PATTERN_INPUTS_SHORT_COUNT) * (PATTERN_INPUTS_SHORT_COUNT) + \
31520e210cSAleksandar Markovic             (RANDOM_INPUTS_SHORT_COUNT) * (RANDOM_INPUTS_SHORT_COUNT))
32520e210cSAleksandar Markovic 
33520e210cSAleksandar Markovic 
34520e210cSAleksandar Markovic int32_t main(void)
35520e210cSAleksandar Markovic {
36520e210cSAleksandar Markovic     char *instruction_name = "CLT_S.D";
37520e210cSAleksandar Markovic     int32_t ret;
38520e210cSAleksandar Markovic     uint32_t i, j;
39520e210cSAleksandar Markovic     struct timeval start, end;
40520e210cSAleksandar Markovic     double elapsed_time;
41520e210cSAleksandar Markovic 
42520e210cSAleksandar Markovic     uint64_t b128_result[TEST_COUNT_TOTAL][2];
43520e210cSAleksandar Markovic     uint64_t b128_expect[TEST_COUNT_TOTAL][2] = {
44520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },    /*   0  */
45520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
46520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
47520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
48520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
49520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
50520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0xffffffffffffffffULL, },
51520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0x0000000000000000ULL, },
52520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },    /*   8  */
53520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
54520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
55520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
56520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
57520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
58520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0xffffffffffffffffULL, },
59520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0x0000000000000000ULL, },
60520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },    /*  16  */
61520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
62520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
63520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
64520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
65520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
66520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
67520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
68520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },    /*  24  */
69520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
70520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
71520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
72520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
73520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
74520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
75520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
76520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },    /*  32  */
77520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
78520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
79520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
80520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
81520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
82520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
83520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0x0000000000000000ULL, },
84520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },    /*  40  */
85520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
86520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
87520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
88520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
89520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
90520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0xffffffffffffffffULL, },
91520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
92520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0x0000000000000000ULL, },    /*  48  */
93520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0x0000000000000000ULL, },
94520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
95520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
96520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
97520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0x0000000000000000ULL, },
98520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
99520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0x0000000000000000ULL, },
100520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0xffffffffffffffffULL, },    /*  56  */
101520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0xffffffffffffffffULL, },
102520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
103520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
104520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0xffffffffffffffffULL, },
105520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0xffffffffffffffffULL, },
106520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0xffffffffffffffffULL, },
107520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
108520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },    /*  64  */
109520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0x0000000000000000ULL, },
110520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0x0000000000000000ULL, },
111520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0x0000000000000000ULL, },
112520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0xffffffffffffffffULL, },
113520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
114520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0xffffffffffffffffULL, },
115520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0x0000000000000000ULL, },
116520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0xffffffffffffffffULL, },    /*  72  */
117520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0x0000000000000000ULL, },
118520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
119520e210cSAleksandar Markovic         { 0xffffffffffffffffULL, 0x0000000000000000ULL, },
120520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0xffffffffffffffffULL, },
121520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0xffffffffffffffffULL, },
122520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0xffffffffffffffffULL, },
123520e210cSAleksandar Markovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
124520e210cSAleksandar Markovic     };
125520e210cSAleksandar Markovic 
126520e210cSAleksandar Markovic     gettimeofday(&start, NULL);
127520e210cSAleksandar Markovic 
128520e210cSAleksandar Markovic     for (i = 0; i < PATTERN_INPUTS_SHORT_COUNT; i++) {
129520e210cSAleksandar Markovic         for (j = 0; j < PATTERN_INPUTS_SHORT_COUNT; j++) {
130520e210cSAleksandar Markovic             do_msa_CLT_S_D(b128_pattern[i], b128_pattern[j],
131520e210cSAleksandar Markovic                           b128_result[PATTERN_INPUTS_SHORT_COUNT * i + j]);
132520e210cSAleksandar Markovic         }
133520e210cSAleksandar Markovic     }
134520e210cSAleksandar Markovic 
135520e210cSAleksandar Markovic     for (i = 0; i < RANDOM_INPUTS_SHORT_COUNT; i++) {
136520e210cSAleksandar Markovic         for (j = 0; j < RANDOM_INPUTS_SHORT_COUNT; j++) {
137520e210cSAleksandar Markovic             do_msa_CLT_S_D(b128_random[i], b128_random[j],
138520e210cSAleksandar Markovic                            b128_result[((PATTERN_INPUTS_SHORT_COUNT) *
139520e210cSAleksandar Markovic                                         (PATTERN_INPUTS_SHORT_COUNT)) +
140520e210cSAleksandar Markovic                                        RANDOM_INPUTS_SHORT_COUNT * i + j]);
141520e210cSAleksandar Markovic         }
142520e210cSAleksandar Markovic     }
143520e210cSAleksandar Markovic 
144520e210cSAleksandar Markovic     gettimeofday(&end, NULL);
145520e210cSAleksandar Markovic 
146520e210cSAleksandar Markovic     elapsed_time = (end.tv_sec - start.tv_sec) * 1000.0;
147520e210cSAleksandar Markovic     elapsed_time += (end.tv_usec - start.tv_usec) / 1000.0;
148520e210cSAleksandar Markovic 
149520e210cSAleksandar Markovic     ret = check_results(instruction_name, TEST_COUNT_TOTAL, elapsed_time,
150520e210cSAleksandar Markovic                         &b128_result[0][0], &b128_expect[0][0]);
151520e210cSAleksandar Markovic 
152520e210cSAleksandar Markovic     return ret;
153520e210cSAleksandar Markovic }
154