/*
 *  Test program for MSA instruction MULV.W
 *
 *  Copyright (C) 2018  Wave Computing, Inc.
 *  Copyright (C) 2018  Mateja Marjanovic <mateja.marjanovic@rt-rk.com>
 *
 *  This program is free software: you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License as published by
 *  the Free Software Foundation, either version 2 of the License, or
 *  (at your option) any later version.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
 *  along with this program.  If not, see <https://www.gnu.org/licenses/>.
 *
 */

#include <stddef.h>
#include <stdint.h>
#include <sys/time.h>

#include "../../../../include/wrappers_msa.h"
#include "../../../../include/test_inputs.h"
#include "../../../../include/test_utils.h"

/*
 * Number of 128-bit results this test produces: one for every ordered
 * pair of short pattern inputs plus one for every ordered pair of short
 * random inputs.  Used to size both the result and the expected tables.
 */
#define TEST_COUNT_TOTAL (                                                \
            (PATTERN_INPUTS_SHORT_COUNT) * (PATTERN_INPUTS_SHORT_COUNT) + \
            (RANDOM_INPUTS_SHORT_COUNT) * (RANDOM_INPUTS_SHORT_COUNT))


34*4b302ce9SMateja Marjanovic int32_t main(void)
35*4b302ce9SMateja Marjanovic {
36*4b302ce9SMateja Marjanovic     char *instruction_name = "MULV.W";
37*4b302ce9SMateja Marjanovic     int32_t ret;
38*4b302ce9SMateja Marjanovic     uint32_t i, j;
39*4b302ce9SMateja Marjanovic     struct timeval start, end;
40*4b302ce9SMateja Marjanovic     double elapsed_time;
41*4b302ce9SMateja Marjanovic 
42*4b302ce9SMateja Marjanovic     uint64_t b128_result[TEST_COUNT_TOTAL][2];
43*4b302ce9SMateja Marjanovic     uint64_t b128_expect[TEST_COUNT_TOTAL][2] = {
44*4b302ce9SMateja Marjanovic         { 0x0000000100000001ULL, 0x0000000100000001ULL, },    /*   0  */
45*4b302ce9SMateja Marjanovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
46*4b302ce9SMateja Marjanovic         { 0x5555555655555556ULL, 0x5555555655555556ULL, },
47*4b302ce9SMateja Marjanovic         { 0xaaaaaaabaaaaaaabULL, 0xaaaaaaabaaaaaaabULL, },
48*4b302ce9SMateja Marjanovic         { 0x3333333433333334ULL, 0x3333333433333334ULL, },
49*4b302ce9SMateja Marjanovic         { 0xcccccccdcccccccdULL, 0xcccccccdcccccccdULL, },
50*4b302ce9SMateja Marjanovic         { 0x1c71c71d71c71c72ULL, 0xc71c71c81c71c71dULL, },
51*4b302ce9SMateja Marjanovic         { 0xe38e38e48e38e38fULL, 0x38e38e39e38e38e4ULL, },
52*4b302ce9SMateja Marjanovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },    /*   8  */
53*4b302ce9SMateja Marjanovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
54*4b302ce9SMateja Marjanovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
55*4b302ce9SMateja Marjanovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
56*4b302ce9SMateja Marjanovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
57*4b302ce9SMateja Marjanovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
58*4b302ce9SMateja Marjanovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
59*4b302ce9SMateja Marjanovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
60*4b302ce9SMateja Marjanovic         { 0x5555555655555556ULL, 0x5555555655555556ULL, },    /*  16  */
61*4b302ce9SMateja Marjanovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
62*4b302ce9SMateja Marjanovic         { 0xe38e38e4e38e38e4ULL, 0xe38e38e4e38e38e4ULL, },
63*4b302ce9SMateja Marjanovic         { 0x71c71c7271c71c72ULL, 0x71c71c7271c71c72ULL, },
64*4b302ce9SMateja Marjanovic         { 0x7777777877777778ULL, 0x7777777877777778ULL, },
65*4b302ce9SMateja Marjanovic         { 0xdddddddedddddddeULL, 0xdddddddedddddddeULL, },
66*4b302ce9SMateja Marjanovic         { 0x12f684bea12f684cULL, 0x84bda13012f684beULL, },
67*4b302ce9SMateja Marjanovic         { 0x425ed098b425ed0aULL, 0xd097b426425ed098ULL, },
68*4b302ce9SMateja Marjanovic         { 0xaaaaaaabaaaaaaabULL, 0xaaaaaaabaaaaaaabULL, },    /*  24  */
69*4b302ce9SMateja Marjanovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
70*4b302ce9SMateja Marjanovic         { 0x71c71c7271c71c72ULL, 0x71c71c7271c71c72ULL, },
71*4b302ce9SMateja Marjanovic         { 0x38e38e3938e38e39ULL, 0x38e38e3938e38e39ULL, },
72*4b302ce9SMateja Marjanovic         { 0xbbbbbbbcbbbbbbbcULL, 0xbbbbbbbcbbbbbbbcULL, },
73*4b302ce9SMateja Marjanovic         { 0xeeeeeeefeeeeeeefULL, 0xeeeeeeefeeeeeeefULL, },
74*4b302ce9SMateja Marjanovic         { 0x097b425fd097b426ULL, 0x425ed098097b425fULL, },
75*4b302ce9SMateja Marjanovic         { 0xa12f684cda12f685ULL, 0x684bda13a12f684cULL, },
76*4b302ce9SMateja Marjanovic         { 0x3333333433333334ULL, 0x3333333433333334ULL, },    /*  32  */
77*4b302ce9SMateja Marjanovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
78*4b302ce9SMateja Marjanovic         { 0x7777777877777778ULL, 0x7777777877777778ULL, },
79*4b302ce9SMateja Marjanovic         { 0xbbbbbbbcbbbbbbbcULL, 0xbbbbbbbcbbbbbbbcULL, },
80*4b302ce9SMateja Marjanovic         { 0x28f5c29028f5c290ULL, 0x28f5c29028f5c290ULL, },
81*4b302ce9SMateja Marjanovic         { 0x0a3d70a40a3d70a4ULL, 0x0a3d70a40a3d70a4ULL, },
82*4b302ce9SMateja Marjanovic         { 0xe38e38e427d27d28ULL, 0x9f49f4a0e38e38e4ULL, },
83*4b302ce9SMateja Marjanovic         { 0x4fa4fa500b60b60cULL, 0x93e93e944fa4fa50ULL, },
84*4b302ce9SMateja Marjanovic         { 0xcccccccdcccccccdULL, 0xcccccccdcccccccdULL, },    /*  40  */
85*4b302ce9SMateja Marjanovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
86*4b302ce9SMateja Marjanovic         { 0xdddddddedddddddeULL, 0xdddddddedddddddeULL, },
87*4b302ce9SMateja Marjanovic         { 0xeeeeeeefeeeeeeefULL, 0xeeeeeeefeeeeeeefULL, },
88*4b302ce9SMateja Marjanovic         { 0x0a3d70a40a3d70a4ULL, 0x0a3d70a40a3d70a4ULL, },
89*4b302ce9SMateja Marjanovic         { 0xc28f5c29c28f5c29ULL, 0xc28f5c29c28f5c29ULL, },
90*4b302ce9SMateja Marjanovic         { 0x38e38e3949f49f4aULL, 0x27d27d2838e38e39ULL, },
91*4b302ce9SMateja Marjanovic         { 0x93e93e9482d82d83ULL, 0xa4fa4fa593e93e94ULL, },
92*4b302ce9SMateja Marjanovic         { 0x1c71c71d71c71c72ULL, 0xc71c71c81c71c71dULL, },    /*  48  */
93*4b302ce9SMateja Marjanovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
94*4b302ce9SMateja Marjanovic         { 0x12f684bea12f684cULL, 0x84bda13012f684beULL, },
95*4b302ce9SMateja Marjanovic         { 0x097b425fd097b426ULL, 0x425ed098097b425fULL, },
96*4b302ce9SMateja Marjanovic         { 0xe38e38e427d27d28ULL, 0x9f49f4a0e38e38e4ULL, },
97*4b302ce9SMateja Marjanovic         { 0x38e38e3949f49f4aULL, 0x27d27d2838e38e39ULL, },
98*4b302ce9SMateja Marjanovic         { 0xba781949e06522c4ULL, 0x06522c40ba781949ULL, },
99*4b302ce9SMateja Marjanovic         { 0x61f9add49161f9aeULL, 0xc0ca458861f9add4ULL, },
100*4b302ce9SMateja Marjanovic         { 0xe38e38e48e38e38fULL, 0x38e38e39e38e38e4ULL, },    /*  56  */
101*4b302ce9SMateja Marjanovic         { 0x0000000000000000ULL, 0x0000000000000000ULL, },
102*4b302ce9SMateja Marjanovic         { 0x425ed098b425ed0aULL, 0xd097b426425ed098ULL, },
103*4b302ce9SMateja Marjanovic         { 0xa12f684cda12f685ULL, 0x684bda13a12f684cULL, },
104*4b302ce9SMateja Marjanovic         { 0x4fa4fa500b60b60cULL, 0x93e93e944fa4fa50ULL, },
105*4b302ce9SMateja Marjanovic         { 0x93e93e9482d82d83ULL, 0xa4fa4fa593e93e94ULL, },
106*4b302ce9SMateja Marjanovic         { 0x61f9add49161f9aeULL, 0xc0ca458861f9add4ULL, },
107*4b302ce9SMateja Marjanovic         { 0x81948b10fcd6e9e1ULL, 0x781948b181948b10ULL, },
108*4b302ce9SMateja Marjanovic         { 0xb103329061639000ULL, 0x3a25368474988090ULL, },    /*  64  */
109*4b302ce9SMateja Marjanovic         { 0x10bf40e4e7176a00ULL, 0x8176d18c6f1923d0ULL, },
110*4b302ce9SMateja Marjanovic         { 0x7393eb78c4346000ULL, 0xb7bf06a2581f7cf0ULL, },
111*4b302ce9SMateja Marjanovic         { 0xb0f0f35cee787980ULL, 0xd67987508dd09f80ULL, },
112*4b302ce9SMateja Marjanovic         { 0x10bf40e4e7176a00ULL, 0x8176d18c6f1923d0ULL, },
113*4b302ce9SMateja Marjanovic         { 0xb4f42649fded7040ULL, 0x3ceafea44aee6810ULL, },
114*4b302ce9SMateja Marjanovic         { 0xf73d8bbebe6cdc00ULL, 0x53697ae61444e7b0ULL, },
115*4b302ce9SMateja Marjanovic         { 0x7abb9fc72143b470ULL, 0x11e5adf0efce5580ULL, },
116*4b302ce9SMateja Marjanovic         { 0x7393eb78c4346000ULL, 0xb7bf06a2581f7cf0ULL, },    /*  72  */
117*4b302ce9SMateja Marjanovic         { 0xf73d8bbebe6cdc00ULL, 0x53697ae61444e7b0ULL, },
118*4b302ce9SMateja Marjanovic         { 0xb6b388e4e5044000ULL, 0x1aff72013216c990ULL, },
119*4b302ce9SMateja Marjanovic         { 0xe8bf252289e38100ULL, 0x91ae5f28d4dad480ULL, },
120*4b302ce9SMateja Marjanovic         { 0xb0f0f35cee787980ULL, 0xd67987508dd09f80ULL, },
121*4b302ce9SMateja Marjanovic         { 0x7abb9fc72143b470ULL, 0x11e5adf0efce5580ULL, },
122*4b302ce9SMateja Marjanovic };
123*4b302ce9SMateja Marjanovic 
124*4b302ce9SMateja Marjanovic     gettimeofday(&start, NULL);
125*4b302ce9SMateja Marjanovic 
126*4b302ce9SMateja Marjanovic     for (i = 0; i < PATTERN_INPUTS_SHORT_COUNT; i++) {
127*4b302ce9SMateja Marjanovic         for (j = 0; j < PATTERN_INPUTS_SHORT_COUNT; j++) {
128*4b302ce9SMateja Marjanovic             do_msa_MULV_W(b128_pattern[i], b128_pattern[j],
129*4b302ce9SMateja Marjanovic                            b128_result[PATTERN_INPUTS_SHORT_COUNT * i + j]);
130*4b302ce9SMateja Marjanovic         }
131*4b302ce9SMateja Marjanovic     }
132*4b302ce9SMateja Marjanovic 
133*4b302ce9SMateja Marjanovic     for (i = 0; i < RANDOM_INPUTS_SHORT_COUNT; i++) {
134*4b302ce9SMateja Marjanovic         for (j = 0; j < RANDOM_INPUTS_SHORT_COUNT; j++) {
135*4b302ce9SMateja Marjanovic             do_msa_MULV_W(b128_random[i], b128_random[j],
136*4b302ce9SMateja Marjanovic                            b128_result[((PATTERN_INPUTS_SHORT_COUNT) *
137*4b302ce9SMateja Marjanovic                                         (PATTERN_INPUTS_SHORT_COUNT)) +
138*4b302ce9SMateja Marjanovic                                        RANDOM_INPUTS_SHORT_COUNT * i + j]);
139*4b302ce9SMateja Marjanovic         }
140*4b302ce9SMateja Marjanovic     }
141*4b302ce9SMateja Marjanovic 
142*4b302ce9SMateja Marjanovic     gettimeofday(&end, NULL);
143*4b302ce9SMateja Marjanovic 
144*4b302ce9SMateja Marjanovic     elapsed_time = (end.tv_sec - start.tv_sec) * 1000.0;
145*4b302ce9SMateja Marjanovic     elapsed_time += (end.tv_usec - start.tv_usec) / 1000.0;
146*4b302ce9SMateja Marjanovic 
147*4b302ce9SMateja Marjanovic     ret = check_results(instruction_name, TEST_COUNT_TOTAL, elapsed_time,
148*4b302ce9SMateja Marjanovic                         &b128_result[0][0], &b128_expect[0][0]);
149*4b302ce9SMateja Marjanovic 
150*4b302ce9SMateja Marjanovic     return ret;
151*4b302ce9SMateja Marjanovic }
152