/*
 * Test program for MSA instruction PCNT.D
 *
 * Copyright (C) 2019 Wave Computing, Inc.
 * Copyright (C) 2019 Aleksandar Markovic <amarkovic@wavecomp.com>
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <https://www.gnu.org/licenses/>.
 *
 */
21
22 #include <sys/time.h>
23 #include <stdint.h>
24
25 #include "../../../../include/wrappers_msa.h"
26 #include "../../../../include/test_inputs_128.h"
27 #include "../../../../include/test_utils_128.h"
28
/* Total number of test cases: every pattern input followed by every random input. */
#define TEST_COUNT_TOTAL (PATTERN_INPUTS_COUNT + RANDOM_INPUTS_COUNT)
30
31
main(void)32 int32_t main(void)
33 {
34 char *isa_ase_name = "MSA";
35 char *group_name = "Bit Count";
36 char *instruction_name = "PCNT.D";
37 int32_t ret;
38 uint32_t i;
39 struct timeval start, end;
40 double elapsed_time;
41
42 uint64_t b128_result[TEST_COUNT_TOTAL][2];
43 uint64_t b128_expect[TEST_COUNT_TOTAL][2] = {
44 { 0x0000000000000040ULL, 0x0000000000000040ULL, }, /* 0 */
45 { 0x0000000000000000ULL, 0x0000000000000000ULL, },
46 { 0x0000000000000020ULL, 0x0000000000000020ULL, },
47 { 0x0000000000000020ULL, 0x0000000000000020ULL, },
48 { 0x0000000000000020ULL, 0x0000000000000020ULL, },
49 { 0x0000000000000020ULL, 0x0000000000000020ULL, },
50 { 0x0000000000000021ULL, 0x0000000000000020ULL, },
51 { 0x000000000000001fULL, 0x0000000000000020ULL, },
52 { 0x0000000000000020ULL, 0x0000000000000020ULL, }, /* 8 */
53 { 0x0000000000000020ULL, 0x0000000000000020ULL, },
54 { 0x0000000000000022ULL, 0x000000000000001fULL, },
55 { 0x000000000000001eULL, 0x0000000000000021ULL, },
56 { 0x0000000000000022ULL, 0x0000000000000020ULL, },
57 { 0x000000000000001eULL, 0x0000000000000020ULL, },
58 { 0x0000000000000023ULL, 0x000000000000001eULL, },
59 { 0x000000000000001dULL, 0x0000000000000022ULL, },
60 { 0x0000000000000020ULL, 0x0000000000000020ULL, }, /* 16 */
61 { 0x0000000000000020ULL, 0x0000000000000020ULL, },
62 { 0x0000000000000024ULL, 0x000000000000001dULL, },
63 { 0x000000000000001cULL, 0x0000000000000023ULL, },
64 { 0x0000000000000022ULL, 0x0000000000000022ULL, },
65 { 0x000000000000001eULL, 0x000000000000001eULL, },
66 { 0x0000000000000021ULL, 0x0000000000000021ULL, },
67 { 0x000000000000001fULL, 0x000000000000001fULL, },
68 { 0x0000000000000024ULL, 0x0000000000000020ULL, }, /* 24 */
69 { 0x000000000000001cULL, 0x0000000000000020ULL, },
70 { 0x0000000000000026ULL, 0x000000000000001bULL, },
71 { 0x000000000000001aULL, 0x0000000000000025ULL, },
72 { 0x0000000000000024ULL, 0x0000000000000022ULL, },
73 { 0x000000000000001cULL, 0x000000000000001eULL, },
74 { 0x0000000000000022ULL, 0x0000000000000022ULL, },
75 { 0x000000000000001eULL, 0x000000000000001eULL, },
76 { 0x0000000000000020ULL, 0x0000000000000020ULL, }, /* 32 */
77 { 0x0000000000000020ULL, 0x0000000000000020ULL, },
78 { 0x0000000000000022ULL, 0x0000000000000022ULL, },
79 { 0x000000000000001eULL, 0x000000000000001eULL, },
80 { 0x0000000000000024ULL, 0x0000000000000024ULL, },
81 { 0x000000000000001cULL, 0x000000000000001cULL, },
82 { 0x0000000000000026ULL, 0x0000000000000021ULL, },
83 { 0x000000000000001aULL, 0x000000000000001fULL, },
84 { 0x0000000000000028ULL, 0x000000000000001cULL, }, /* 40 */
85 { 0x0000000000000018ULL, 0x0000000000000024ULL, },
86 { 0x000000000000002aULL, 0x0000000000000017ULL, },
87 { 0x0000000000000016ULL, 0x0000000000000029ULL, },
88 { 0x000000000000002aULL, 0x0000000000000018ULL, },
89 { 0x0000000000000016ULL, 0x0000000000000028ULL, },
90 { 0x0000000000000029ULL, 0x000000000000001cULL, },
91 { 0x0000000000000017ULL, 0x0000000000000024ULL, },
92 { 0x0000000000000028ULL, 0x0000000000000020ULL, }, /* 48 */
93 { 0x0000000000000018ULL, 0x0000000000000020ULL, },
94 { 0x0000000000000027ULL, 0x0000000000000024ULL, },
95 { 0x0000000000000019ULL, 0x000000000000001cULL, },
96 { 0x0000000000000026ULL, 0x0000000000000026ULL, },
97 { 0x000000000000001aULL, 0x000000000000001aULL, },
98 { 0x0000000000000025ULL, 0x0000000000000025ULL, },
99 { 0x000000000000001bULL, 0x000000000000001bULL, },
100 { 0x0000000000000024ULL, 0x0000000000000024ULL, }, /* 56 */
101 { 0x000000000000001cULL, 0x000000000000001cULL, },
102 { 0x0000000000000023ULL, 0x0000000000000023ULL, },
103 { 0x000000000000001dULL, 0x000000000000001dULL, },
104 { 0x0000000000000022ULL, 0x0000000000000022ULL, },
105 { 0x000000000000001eULL, 0x000000000000001eULL, },
106 { 0x0000000000000021ULL, 0x0000000000000021ULL, },
107 { 0x000000000000001fULL, 0x000000000000001fULL, },
108 { 0x0000000000000019ULL, 0x0000000000000023ULL, }, /* 64 */
109 { 0x000000000000001fULL, 0x0000000000000024ULL, },
110 { 0x0000000000000021ULL, 0x0000000000000022ULL, },
111 { 0x000000000000001fULL, 0x000000000000001bULL, },
112 { 0x0000000000000023ULL, 0x0000000000000022ULL, },
113 { 0x0000000000000024ULL, 0x000000000000001cULL, },
114 { 0x000000000000001eULL, 0x000000000000001cULL, },
115 { 0x0000000000000022ULL, 0x0000000000000022ULL, },
116 { 0x000000000000001dULL, 0x0000000000000022ULL, }, /* 72 */
117 { 0x0000000000000025ULL, 0x000000000000001eULL, },
118 { 0x0000000000000024ULL, 0x000000000000001dULL, },
119 { 0x000000000000001fULL, 0x0000000000000024ULL, },
120 { 0x000000000000001dULL, 0x000000000000001eULL, },
121 { 0x000000000000001dULL, 0x0000000000000021ULL, },
122 { 0x000000000000001eULL, 0x0000000000000022ULL, },
123 { 0x0000000000000024ULL, 0x0000000000000022ULL, },
124 };
125
126 reset_msa_registers();
127
128 gettimeofday(&start, NULL);
129
130 for (i = 0; i < TEST_COUNT_TOTAL; i++) {
131 if (i < PATTERN_INPUTS_COUNT) {
132 do_msa_PCNT_D(b128_pattern[i], b128_result[i]);
133 } else {
134 do_msa_PCNT_D(b128_random[i - PATTERN_INPUTS_COUNT],
135 b128_result[i]);
136 }
137 }
138
139 gettimeofday(&end, NULL);
140
141 elapsed_time = (end.tv_sec - start.tv_sec) * 1000.0;
142 elapsed_time += (end.tv_usec - start.tv_usec) / 1000.0;
143
144 ret = check_results_128(isa_ase_name, group_name, instruction_name,
145 TEST_COUNT_TOTAL, elapsed_time,
146 &b128_result[0][0], &b128_expect[0][0]);
147
148 return ret;
149 }
150