// SPDX-License-Identifier: GPL-2.0-or-later
/* -*- linux-c -*- ------------------------------------------------------- *
 *
 *   Copyright 2002 H. Peter Anvin - All Rights Reserved
 *
 * ----------------------------------------------------------------------- */

/*
 * raid6/algos.c
 *
 * Algorithm list and algorithm selection for RAID-6
 */
13cc4589ebSDavid Woodhouse
14cc4589ebSDavid Woodhouse #include <linux/raid/pq.h>
15cc4589ebSDavid Woodhouse #ifndef __KERNEL__
16cc4589ebSDavid Woodhouse #include <sys/mman.h>
17cc4589ebSDavid Woodhouse #include <stdio.h>
18cc4589ebSDavid Woodhouse #else
19f674ef7bSJim Kukunas #include <linux/module.h>
20d5302fe4SNeilBrown #include <linux/gfp.h>
21cc4589ebSDavid Woodhouse /* In .bss so it's zeroed */
22cc4589ebSDavid Woodhouse const char raid6_empty_zero_page[PAGE_SIZE] __attribute__((aligned(256)));
23cc4589ebSDavid Woodhouse EXPORT_SYMBOL(raid6_empty_zero_page);
24cc4589ebSDavid Woodhouse #endif
25cc4589ebSDavid Woodhouse
26cc4589ebSDavid Woodhouse struct raid6_calls raid6_call;
27cc4589ebSDavid Woodhouse EXPORT_SYMBOL_GPL(raid6_call);
28cc4589ebSDavid Woodhouse
29cc4589ebSDavid Woodhouse const struct raid6_calls * const raid6_algos[] = {
30cc4589ebSDavid Woodhouse #if defined(__i386__) && !defined(__arch_um__)
31e0a491c1SGayatri Kammela #ifdef CONFIG_AS_AVX512
32e0a491c1SGayatri Kammela &raid6_avx512x2,
330437de4fSDaniel Verkamp &raid6_avx512x1,
34e0a491c1SGayatri Kammela #endif
350437de4fSDaniel Verkamp &raid6_avx2x2,
360437de4fSDaniel Verkamp &raid6_avx2x1,
370437de4fSDaniel Verkamp &raid6_sse2x2,
380437de4fSDaniel Verkamp &raid6_sse2x1,
390437de4fSDaniel Verkamp &raid6_sse1x2,
400437de4fSDaniel Verkamp &raid6_sse1x1,
410437de4fSDaniel Verkamp &raid6_mmxx2,
420437de4fSDaniel Verkamp &raid6_mmxx1,
43cc4589ebSDavid Woodhouse #endif
44cc4589ebSDavid Woodhouse #if defined(__x86_64__) && !defined(__arch_um__)
45e0a491c1SGayatri Kammela #ifdef CONFIG_AS_AVX512
46e0a491c1SGayatri Kammela &raid6_avx512x4,
470437de4fSDaniel Verkamp &raid6_avx512x2,
480437de4fSDaniel Verkamp &raid6_avx512x1,
49e0a491c1SGayatri Kammela #endif
500437de4fSDaniel Verkamp &raid6_avx2x4,
510437de4fSDaniel Verkamp &raid6_avx2x2,
520437de4fSDaniel Verkamp &raid6_avx2x1,
530437de4fSDaniel Verkamp &raid6_sse2x4,
540437de4fSDaniel Verkamp &raid6_sse2x2,
550437de4fSDaniel Verkamp &raid6_sse2x1,
56cc4589ebSDavid Woodhouse #endif
57cc4589ebSDavid Woodhouse #ifdef CONFIG_ALTIVEC
58751ba79cSMatt Brown &raid6_vpermxor8,
590437de4fSDaniel Verkamp &raid6_vpermxor4,
600437de4fSDaniel Verkamp &raid6_vpermxor2,
610437de4fSDaniel Verkamp &raid6_vpermxor1,
620437de4fSDaniel Verkamp &raid6_altivec8,
630437de4fSDaniel Verkamp &raid6_altivec4,
640437de4fSDaniel Verkamp &raid6_altivec2,
650437de4fSDaniel Verkamp &raid6_altivec1,
66cc4589ebSDavid Woodhouse #endif
67474fd6e8SMartin Schwidefsky #if defined(CONFIG_S390)
68474fd6e8SMartin Schwidefsky &raid6_s390vx8,
69474fd6e8SMartin Schwidefsky #endif
707d11965dSArd Biesheuvel #ifdef CONFIG_KERNEL_MODE_NEON
717d11965dSArd Biesheuvel &raid6_neonx8,
720437de4fSDaniel Verkamp &raid6_neonx4,
730437de4fSDaniel Verkamp &raid6_neonx2,
740437de4fSDaniel Verkamp &raid6_neonx1,
757d11965dSArd Biesheuvel #endif
768f3f06dfSWANG Xuerui #ifdef CONFIG_LOONGARCH
778f3f06dfSWANG Xuerui #ifdef CONFIG_CPU_HAS_LASX
788f3f06dfSWANG Xuerui &raid6_lasx,
798f3f06dfSWANG Xuerui #endif
808f3f06dfSWANG Xuerui #ifdef CONFIG_CPU_HAS_LSX
818f3f06dfSWANG Xuerui &raid6_lsx,
828f3f06dfSWANG Xuerui #endif
838f3f06dfSWANG Xuerui #endif
840437de4fSDaniel Verkamp #if defined(__ia64__)
850437de4fSDaniel Verkamp &raid6_intx32,
860437de4fSDaniel Verkamp &raid6_intx16,
870437de4fSDaniel Verkamp #endif
880437de4fSDaniel Verkamp &raid6_intx8,
890437de4fSDaniel Verkamp &raid6_intx4,
900437de4fSDaniel Verkamp &raid6_intx2,
910437de4fSDaniel Verkamp &raid6_intx1,
92cc4589ebSDavid Woodhouse NULL
93cc4589ebSDavid Woodhouse };
94cc4589ebSDavid Woodhouse
/*
 * Recovery entry points, exported for use by other modules.
 * Both pointers are filled in by raid6_choose_recov() from the selected
 * entry of raid6_recov_algos[] (its data2 and datap members respectively).
 */
void (*raid6_2data_recov)(int, size_t, int, int, void **);
EXPORT_SYMBOL_GPL(raid6_2data_recov);

void (*raid6_datap_recov)(int, size_t, int, void **);
EXPORT_SYMBOL_GPL(raid6_datap_recov);
100048a8b8cSJim Kukunas
101048a8b8cSJim Kukunas const struct raid6_recov_calls *const raid6_recov_algos[] = {
10292203b02SMasahiro Yamada #ifdef CONFIG_X86
10313c520b2SGayatri Kammela #ifdef CONFIG_AS_AVX512
10413c520b2SGayatri Kammela &raid6_recov_avx512,
10513c520b2SGayatri Kammela #endif
1067056741fSJim Kukunas &raid6_recov_avx2,
107048a8b8cSJim Kukunas &raid6_recov_ssse3,
108048a8b8cSJim Kukunas #endif
109f5b55fa1SMartin Schwidefsky #ifdef CONFIG_S390
110f5b55fa1SMartin Schwidefsky &raid6_recov_s390xc,
111f5b55fa1SMartin Schwidefsky #endif
1126ec4e251SArd Biesheuvel #if defined(CONFIG_KERNEL_MODE_NEON)
1136ec4e251SArd Biesheuvel &raid6_recov_neon,
1146ec4e251SArd Biesheuvel #endif
115*f2091321SWANG Xuerui #ifdef CONFIG_LOONGARCH
116*f2091321SWANG Xuerui #ifdef CONFIG_CPU_HAS_LASX
117*f2091321SWANG Xuerui &raid6_recov_lasx,
118*f2091321SWANG Xuerui #endif
119*f2091321SWANG Xuerui #ifdef CONFIG_CPU_HAS_LSX
120*f2091321SWANG Xuerui &raid6_recov_lsx,
121*f2091321SWANG Xuerui #endif
122*f2091321SWANG Xuerui #endif
123048a8b8cSJim Kukunas &raid6_recov_intx1,
124048a8b8cSJim Kukunas NULL
125048a8b8cSJim Kukunas };
126048a8b8cSJim Kukunas
/*
 * Each benchmark run lasts 2^RAID6_TIME_JIFFIES_LG2 jiffies.
 */
#ifndef __KERNEL__
/* Need more time to be stable in userspace */
#define RAID6_TIME_JIFFIES_LG2	9
/* Userspace stand-in for time_before(): a plain comparison */
#define time_before(x, y)	((x) < (y))
#else
#define RAID6_TIME_JIFFIES_LG2	4
#endif

/*
 * Size of the benchmark data set: number of page-sized buffers handed to
 * the algorithms, and the page-allocation order used to obtain them
 * (2^3 = 8 pages).
 */
#define RAID6_TEST_DISKS	8
#define RAID6_TEST_DISKS_ORDER	3
137f591df3cSZhengyuan Liu
raid6_choose_recov(void)13896e67703SJim Kukunas static inline const struct raid6_recov_calls *raid6_choose_recov(void)
139048a8b8cSJim Kukunas {
140048a8b8cSJim Kukunas const struct raid6_recov_calls *const *algo;
141048a8b8cSJim Kukunas const struct raid6_recov_calls *best;
142048a8b8cSJim Kukunas
143048a8b8cSJim Kukunas for (best = NULL, algo = raid6_recov_algos; *algo; algo++)
144048a8b8cSJim Kukunas if (!best || (*algo)->priority > best->priority)
145048a8b8cSJim Kukunas if (!(*algo)->valid || (*algo)->valid())
146048a8b8cSJim Kukunas best = *algo;
147048a8b8cSJim Kukunas
148048a8b8cSJim Kukunas if (best) {
149048a8b8cSJim Kukunas raid6_2data_recov = best->data2;
150048a8b8cSJim Kukunas raid6_datap_recov = best->datap;
151048a8b8cSJim Kukunas
152b395f75eSAnton Blanchard pr_info("raid6: using %s recovery algorithm\n", best->name);
153048a8b8cSJim Kukunas } else
154b395f75eSAnton Blanchard pr_err("raid6: Yikes! No recovery algorithm found!\n");
15596e67703SJim Kukunas
15696e67703SJim Kukunas return best;
157048a8b8cSJim Kukunas }
158048a8b8cSJim Kukunas
raid6_choose_gen(void * (* const dptrs)[RAID6_TEST_DISKS],const int disks)15996e67703SJim Kukunas static inline const struct raid6_calls *raid6_choose_gen(
160f591df3cSZhengyuan Liu void *(*const dptrs)[RAID6_TEST_DISKS], const int disks)
161cc4589ebSDavid Woodhouse {
16238640c48SDirk Müller unsigned long perf, bestgenperf, j0, j1;
163fe5cbc6eSMarkus Stockhausen int start = (disks>>1)-1, stop = disks-3; /* work on the second half of the disks */
164cc4589ebSDavid Woodhouse const struct raid6_calls *const *algo;
165cc4589ebSDavid Woodhouse const struct raid6_calls *best;
166cc4589ebSDavid Woodhouse
16738640c48SDirk Müller for (bestgenperf = 0, best = NULL, algo = raid6_algos; *algo; algo++) {
16836dacddbSDirk Müller if (!best || (*algo)->priority >= best->priority) {
16996e67703SJim Kukunas if ((*algo)->valid && !(*algo)->valid())
17096e67703SJim Kukunas continue;
171cc4589ebSDavid Woodhouse
172be85f93aSDaniel Verkamp if (!IS_ENABLED(CONFIG_RAID6_PQ_BENCHMARK)) {
173be85f93aSDaniel Verkamp best = *algo;
174be85f93aSDaniel Verkamp break;
175be85f93aSDaniel Verkamp }
176be85f93aSDaniel Verkamp
177cc4589ebSDavid Woodhouse perf = 0;
178cc4589ebSDavid Woodhouse
179cc4589ebSDavid Woodhouse preempt_disable();
180cc4589ebSDavid Woodhouse j0 = jiffies;
181cc4589ebSDavid Woodhouse while ((j1 = jiffies) == j0)
182cc4589ebSDavid Woodhouse cpu_relax();
183cc4589ebSDavid Woodhouse while (time_before(jiffies,
184cc4589ebSDavid Woodhouse j1 + (1<<RAID6_TIME_JIFFIES_LG2))) {
18596e67703SJim Kukunas (*algo)->gen_syndrome(disks, PAGE_SIZE, *dptrs);
186cc4589ebSDavid Woodhouse perf++;
187cc4589ebSDavid Woodhouse }
188cc4589ebSDavid Woodhouse preempt_enable();
189cc4589ebSDavid Woodhouse
190fe5cbc6eSMarkus Stockhausen if (perf > bestgenperf) {
191fe5cbc6eSMarkus Stockhausen bestgenperf = perf;
19296e67703SJim Kukunas best = *algo;
193cc4589ebSDavid Woodhouse }
194fe5cbc6eSMarkus Stockhausen pr_info("raid6: %-8s gen() %5ld MB/s\n", (*algo)->name,
195f591df3cSZhengyuan Liu (perf * HZ * (disks-2)) >>
196f591df3cSZhengyuan Liu (20 - PAGE_SHIFT + RAID6_TIME_JIFFIES_LG2));
19738640c48SDirk Müller }
19838640c48SDirk Müller }
199fe5cbc6eSMarkus Stockhausen
20038640c48SDirk Müller if (!best) {
20138640c48SDirk Müller pr_err("raid6: Yikes! No algorithm found!\n");
20238640c48SDirk Müller goto out;
20338640c48SDirk Müller }
204fe5cbc6eSMarkus Stockhausen
20538640c48SDirk Müller raid6_call = *best;
20638640c48SDirk Müller
20738640c48SDirk Müller if (!IS_ENABLED(CONFIG_RAID6_PQ_BENCHMARK)) {
20838640c48SDirk Müller pr_info("raid6: skipped pq benchmark and selected %s\n",
20938640c48SDirk Müller best->name);
21038640c48SDirk Müller goto out;
21138640c48SDirk Müller }
21238640c48SDirk Müller
21338640c48SDirk Müller pr_info("raid6: using algorithm %s gen() %ld MB/s\n",
21438640c48SDirk Müller best->name,
21538640c48SDirk Müller (bestgenperf * HZ * (disks - 2)) >>
21638640c48SDirk Müller (20 - PAGE_SHIFT + RAID6_TIME_JIFFIES_LG2));
21738640c48SDirk Müller
21838640c48SDirk Müller if (best->xor_syndrome) {
219fe5cbc6eSMarkus Stockhausen perf = 0;
220fe5cbc6eSMarkus Stockhausen
221fe5cbc6eSMarkus Stockhausen preempt_disable();
222fe5cbc6eSMarkus Stockhausen j0 = jiffies;
223fe5cbc6eSMarkus Stockhausen while ((j1 = jiffies) == j0)
224fe5cbc6eSMarkus Stockhausen cpu_relax();
225fe5cbc6eSMarkus Stockhausen while (time_before(jiffies,
226fe5cbc6eSMarkus Stockhausen j1 + (1 << RAID6_TIME_JIFFIES_LG2))) {
22738640c48SDirk Müller best->xor_syndrome(disks, start, stop,
228fe5cbc6eSMarkus Stockhausen PAGE_SIZE, *dptrs);
229fe5cbc6eSMarkus Stockhausen perf++;
230fe5cbc6eSMarkus Stockhausen }
231fe5cbc6eSMarkus Stockhausen preempt_enable();
232fe5cbc6eSMarkus Stockhausen
23338640c48SDirk Müller pr_info("raid6: .... xor() %ld MB/s, rmw enabled\n",
234f591df3cSZhengyuan Liu (perf * HZ * (disks - 2)) >>
235f591df3cSZhengyuan Liu (20 - PAGE_SHIFT + RAID6_TIME_JIFFIES_LG2 + 1));
236cc4589ebSDavid Woodhouse }
237cc4589ebSDavid Woodhouse
23838640c48SDirk Müller out:
23996e67703SJim Kukunas return best;
24096e67703SJim Kukunas }
24196e67703SJim Kukunas
24296e67703SJim Kukunas
24396e67703SJim Kukunas /* Try to pick the best algorithm */
24496e67703SJim Kukunas /* This code uses the gfmul table as convenient data set to abuse */
24596e67703SJim Kukunas
raid6_select_algo(void)24696e67703SJim Kukunas int __init raid6_select_algo(void)
24796e67703SJim Kukunas {
248f591df3cSZhengyuan Liu const int disks = RAID6_TEST_DISKS;
24996e67703SJim Kukunas
25096e67703SJim Kukunas const struct raid6_calls *gen_best;
25196e67703SJim Kukunas const struct raid6_recov_calls *rec_best;
252f591df3cSZhengyuan Liu char *disk_ptr, *p;
253f591df3cSZhengyuan Liu void *dptrs[RAID6_TEST_DISKS];
254f591df3cSZhengyuan Liu int i, cycle;
25596e67703SJim Kukunas
256f591df3cSZhengyuan Liu /* prepare the buffer and fill it circularly with gfmul table */
257f591df3cSZhengyuan Liu disk_ptr = (char *)__get_free_pages(GFP_KERNEL, RAID6_TEST_DISKS_ORDER);
258f591df3cSZhengyuan Liu if (!disk_ptr) {
259b395f75eSAnton Blanchard pr_err("raid6: Yikes! No memory available.\n");
26096e67703SJim Kukunas return -ENOMEM;
26196e67703SJim Kukunas }
26296e67703SJim Kukunas
263f591df3cSZhengyuan Liu p = disk_ptr;
264f591df3cSZhengyuan Liu for (i = 0; i < disks; i++)
265f591df3cSZhengyuan Liu dptrs[i] = p + PAGE_SIZE * i;
266f591df3cSZhengyuan Liu
267f591df3cSZhengyuan Liu cycle = ((disks - 2) * PAGE_SIZE) / 65536;
268f591df3cSZhengyuan Liu for (i = 0; i < cycle; i++) {
269f591df3cSZhengyuan Liu memcpy(p, raid6_gfmul, 65536);
270f591df3cSZhengyuan Liu p += 65536;
271f591df3cSZhengyuan Liu }
272f591df3cSZhengyuan Liu
273f591df3cSZhengyuan Liu if ((disks - 2) * PAGE_SIZE % 65536)
274f591df3cSZhengyuan Liu memcpy(p, raid6_gfmul, (disks - 2) * PAGE_SIZE % 65536);
27596e67703SJim Kukunas
27696e67703SJim Kukunas /* select raid gen_syndrome function */
27796e67703SJim Kukunas gen_best = raid6_choose_gen(&dptrs, disks);
278cc4589ebSDavid Woodhouse
279048a8b8cSJim Kukunas /* select raid recover functions */
28096e67703SJim Kukunas rec_best = raid6_choose_recov();
281048a8b8cSJim Kukunas
282f591df3cSZhengyuan Liu free_pages((unsigned long)disk_ptr, RAID6_TEST_DISKS_ORDER);
28396e67703SJim Kukunas
28496e67703SJim Kukunas return gen_best && rec_best ? 0 : -EINVAL;
285cc4589ebSDavid Woodhouse }
286cc4589ebSDavid Woodhouse
/* Module exit hook; there is nothing to tear down. */
static void raid6_exit(void)
{
}
291cc4589ebSDavid Woodhouse
292cc4589ebSDavid Woodhouse subsys_initcall(raid6_select_algo);
293cc4589ebSDavid Woodhouse module_exit(raid6_exit);
294cc4589ebSDavid Woodhouse MODULE_LICENSE("GPL");
295cc4589ebSDavid Woodhouse MODULE_DESCRIPTION("RAID6 Q-syndrome calculations");
296