// SPDX-License-Identifier: GPL-2.0-or-later
/* -*- linux-c -*- ------------------------------------------------------- *
 *
 *   Copyright 2002 H. Peter Anvin - All Rights Reserved
 *
 * ----------------------------------------------------------------------- */

/*
 * raid6/algos.c
 *
 * Algorithm list and algorithm selection for RAID-6
 */
13cc4589ebSDavid Woodhouse
14cc4589ebSDavid Woodhouse #include <linux/raid/pq.h>
15cc4589ebSDavid Woodhouse #ifndef __KERNEL__
16cc4589ebSDavid Woodhouse #include <sys/mman.h>
17cc4589ebSDavid Woodhouse #include <stdio.h>
18cc4589ebSDavid Woodhouse #else
19f674ef7bSJim Kukunas #include <linux/module.h>
20d5302fe4SNeilBrown #include <linux/gfp.h>
21cc4589ebSDavid Woodhouse /* In .bss so it's zeroed */
22cc4589ebSDavid Woodhouse const char raid6_empty_zero_page[PAGE_SIZE] __attribute__((aligned(256)));
23cc4589ebSDavid Woodhouse EXPORT_SYMBOL(raid6_empty_zero_page);
24cc4589ebSDavid Woodhouse #endif
25cc4589ebSDavid Woodhouse
26cc4589ebSDavid Woodhouse struct raid6_calls raid6_call;
27cc4589ebSDavid Woodhouse EXPORT_SYMBOL_GPL(raid6_call);
28cc4589ebSDavid Woodhouse
29cc4589ebSDavid Woodhouse const struct raid6_calls * const raid6_algos[] = {
30cc4589ebSDavid Woodhouse #if defined(__i386__) && !defined(__arch_um__)
31e0a491c1SGayatri Kammela #ifdef CONFIG_AS_AVX512
32e0a491c1SGayatri Kammela &raid6_avx512x2,
330437de4fSDaniel Verkamp &raid6_avx512x1,
34e0a491c1SGayatri Kammela #endif
350437de4fSDaniel Verkamp &raid6_avx2x2,
360437de4fSDaniel Verkamp &raid6_avx2x1,
370437de4fSDaniel Verkamp &raid6_sse2x2,
380437de4fSDaniel Verkamp &raid6_sse2x1,
390437de4fSDaniel Verkamp &raid6_sse1x2,
400437de4fSDaniel Verkamp &raid6_sse1x1,
410437de4fSDaniel Verkamp &raid6_mmxx2,
420437de4fSDaniel Verkamp &raid6_mmxx1,
43cc4589ebSDavid Woodhouse #endif
44cc4589ebSDavid Woodhouse #if defined(__x86_64__) && !defined(__arch_um__)
45e0a491c1SGayatri Kammela #ifdef CONFIG_AS_AVX512
46e0a491c1SGayatri Kammela &raid6_avx512x4,
470437de4fSDaniel Verkamp &raid6_avx512x2,
480437de4fSDaniel Verkamp &raid6_avx512x1,
49e0a491c1SGayatri Kammela #endif
500437de4fSDaniel Verkamp &raid6_avx2x4,
510437de4fSDaniel Verkamp &raid6_avx2x2,
520437de4fSDaniel Verkamp &raid6_avx2x1,
530437de4fSDaniel Verkamp &raid6_sse2x4,
540437de4fSDaniel Verkamp &raid6_sse2x2,
550437de4fSDaniel Verkamp &raid6_sse2x1,
56cc4589ebSDavid Woodhouse #endif
57cc4589ebSDavid Woodhouse #ifdef CONFIG_ALTIVEC
58751ba79cSMatt Brown &raid6_vpermxor8,
590437de4fSDaniel Verkamp &raid6_vpermxor4,
600437de4fSDaniel Verkamp &raid6_vpermxor2,
610437de4fSDaniel Verkamp &raid6_vpermxor1,
620437de4fSDaniel Verkamp &raid6_altivec8,
630437de4fSDaniel Verkamp &raid6_altivec4,
640437de4fSDaniel Verkamp &raid6_altivec2,
650437de4fSDaniel Verkamp &raid6_altivec1,
66cc4589ebSDavid Woodhouse #endif
67474fd6e8SMartin Schwidefsky #if defined(CONFIG_S390)
68474fd6e8SMartin Schwidefsky &raid6_s390vx8,
69474fd6e8SMartin Schwidefsky #endif
707d11965dSArd Biesheuvel #ifdef CONFIG_KERNEL_MODE_NEON
717d11965dSArd Biesheuvel &raid6_neonx8,
720437de4fSDaniel Verkamp &raid6_neonx4,
730437de4fSDaniel Verkamp &raid6_neonx2,
740437de4fSDaniel Verkamp &raid6_neonx1,
757d11965dSArd Biesheuvel #endif
768f3f06dfSWANG Xuerui #ifdef CONFIG_LOONGARCH
778f3f06dfSWANG Xuerui #ifdef CONFIG_CPU_HAS_LASX
788f3f06dfSWANG Xuerui &raid6_lasx,
798f3f06dfSWANG Xuerui #endif
808f3f06dfSWANG Xuerui #ifdef CONFIG_CPU_HAS_LSX
818f3f06dfSWANG Xuerui &raid6_lsx,
828f3f06dfSWANG Xuerui #endif
838f3f06dfSWANG Xuerui #endif
840437de4fSDaniel Verkamp &raid6_intx8,
850437de4fSDaniel Verkamp &raid6_intx4,
860437de4fSDaniel Verkamp &raid6_intx2,
870437de4fSDaniel Verkamp &raid6_intx1,
88cc4589ebSDavid Woodhouse NULL
89cc4589ebSDavid Woodhouse };
90cc4589ebSDavid Woodhouse
/*
 * Recovery entry points.  Both start out NULL and are filled in by
 * raid6_choose_recov() from the data2 / datap members of the selected
 * raid6_recov_algos[] entry.
 */
void (*raid6_2data_recov)(int, size_t, int, int, void **);
EXPORT_SYMBOL_GPL(raid6_2data_recov);

void (*raid6_datap_recov)(int, size_t, int, void **);
EXPORT_SYMBOL_GPL(raid6_datap_recov);
96048a8b8cSJim Kukunas
97048a8b8cSJim Kukunas const struct raid6_recov_calls *const raid6_recov_algos[] = {
9892203b02SMasahiro Yamada #ifdef CONFIG_X86
9913c520b2SGayatri Kammela #ifdef CONFIG_AS_AVX512
10013c520b2SGayatri Kammela &raid6_recov_avx512,
10113c520b2SGayatri Kammela #endif
1027056741fSJim Kukunas &raid6_recov_avx2,
103048a8b8cSJim Kukunas &raid6_recov_ssse3,
104048a8b8cSJim Kukunas #endif
105f5b55fa1SMartin Schwidefsky #ifdef CONFIG_S390
106f5b55fa1SMartin Schwidefsky &raid6_recov_s390xc,
107f5b55fa1SMartin Schwidefsky #endif
1086ec4e251SArd Biesheuvel #if defined(CONFIG_KERNEL_MODE_NEON)
1096ec4e251SArd Biesheuvel &raid6_recov_neon,
1106ec4e251SArd Biesheuvel #endif
111*f2091321SWANG Xuerui #ifdef CONFIG_LOONGARCH
112*f2091321SWANG Xuerui #ifdef CONFIG_CPU_HAS_LASX
113*f2091321SWANG Xuerui &raid6_recov_lasx,
114*f2091321SWANG Xuerui #endif
115*f2091321SWANG Xuerui #ifdef CONFIG_CPU_HAS_LSX
116*f2091321SWANG Xuerui &raid6_recov_lsx,
117*f2091321SWANG Xuerui #endif
118*f2091321SWANG Xuerui #endif
119048a8b8cSJim Kukunas &raid6_recov_intx1,
120048a8b8cSJim Kukunas NULL
121048a8b8cSJim Kukunas };
122048a8b8cSJim Kukunas
/*
 * RAID6_TIME_JIFFIES_LG2 is the base-2 logarithm of the number of jiffies
 * each benchmark loop in raid6_choose_gen() is allowed to run.
 */
#ifdef __KERNEL__
#define RAID6_TIME_JIFFIES_LG2	4
#else
/* Need more time to be stable in userspace */
#define RAID6_TIME_JIFFIES_LG2	9
#define time_before(x, y)	((x) < (y))
#endif

/*
 * Benchmark buffer geometry: RAID6_TEST_DISKS page-sized blocks carved out
 * of a single allocation of 2^RAID6_TEST_DISKS_ORDER pages.  Keep
 * 2^RAID6_TEST_DISKS_ORDER >= RAID6_TEST_DISKS when changing either value.
 */
#define RAID6_TEST_DISKS	8
#define RAID6_TEST_DISKS_ORDER	3
133f591df3cSZhengyuan Liu
raid6_choose_recov(void)13496e67703SJim Kukunas static inline const struct raid6_recov_calls *raid6_choose_recov(void)
135048a8b8cSJim Kukunas {
136048a8b8cSJim Kukunas const struct raid6_recov_calls *const *algo;
137048a8b8cSJim Kukunas const struct raid6_recov_calls *best;
138048a8b8cSJim Kukunas
139048a8b8cSJim Kukunas for (best = NULL, algo = raid6_recov_algos; *algo; algo++)
140048a8b8cSJim Kukunas if (!best || (*algo)->priority > best->priority)
141048a8b8cSJim Kukunas if (!(*algo)->valid || (*algo)->valid())
142048a8b8cSJim Kukunas best = *algo;
143048a8b8cSJim Kukunas
144048a8b8cSJim Kukunas if (best) {
145048a8b8cSJim Kukunas raid6_2data_recov = best->data2;
146048a8b8cSJim Kukunas raid6_datap_recov = best->datap;
147048a8b8cSJim Kukunas
148b395f75eSAnton Blanchard pr_info("raid6: using %s recovery algorithm\n", best->name);
149048a8b8cSJim Kukunas } else
150b395f75eSAnton Blanchard pr_err("raid6: Yikes! No recovery algorithm found!\n");
15196e67703SJim Kukunas
15296e67703SJim Kukunas return best;
153048a8b8cSJim Kukunas }
154048a8b8cSJim Kukunas
raid6_choose_gen(void * (* const dptrs)[RAID6_TEST_DISKS],const int disks)15596e67703SJim Kukunas static inline const struct raid6_calls *raid6_choose_gen(
156f591df3cSZhengyuan Liu void *(*const dptrs)[RAID6_TEST_DISKS], const int disks)
157cc4589ebSDavid Woodhouse {
15838640c48SDirk Müller unsigned long perf, bestgenperf, j0, j1;
159fe5cbc6eSMarkus Stockhausen int start = (disks>>1)-1, stop = disks-3; /* work on the second half of the disks */
160cc4589ebSDavid Woodhouse const struct raid6_calls *const *algo;
161cc4589ebSDavid Woodhouse const struct raid6_calls *best;
162cc4589ebSDavid Woodhouse
16338640c48SDirk Müller for (bestgenperf = 0, best = NULL, algo = raid6_algos; *algo; algo++) {
16436dacddbSDirk Müller if (!best || (*algo)->priority >= best->priority) {
16596e67703SJim Kukunas if ((*algo)->valid && !(*algo)->valid())
16696e67703SJim Kukunas continue;
167cc4589ebSDavid Woodhouse
168be85f93aSDaniel Verkamp if (!IS_ENABLED(CONFIG_RAID6_PQ_BENCHMARK)) {
169be85f93aSDaniel Verkamp best = *algo;
170be85f93aSDaniel Verkamp break;
171be85f93aSDaniel Verkamp }
172be85f93aSDaniel Verkamp
173cc4589ebSDavid Woodhouse perf = 0;
174cc4589ebSDavid Woodhouse
175cc4589ebSDavid Woodhouse preempt_disable();
176cc4589ebSDavid Woodhouse j0 = jiffies;
177cc4589ebSDavid Woodhouse while ((j1 = jiffies) == j0)
178cc4589ebSDavid Woodhouse cpu_relax();
179cc4589ebSDavid Woodhouse while (time_before(jiffies,
180cc4589ebSDavid Woodhouse j1 + (1<<RAID6_TIME_JIFFIES_LG2))) {
18196e67703SJim Kukunas (*algo)->gen_syndrome(disks, PAGE_SIZE, *dptrs);
182cc4589ebSDavid Woodhouse perf++;
183cc4589ebSDavid Woodhouse }
184cc4589ebSDavid Woodhouse preempt_enable();
185cc4589ebSDavid Woodhouse
186fe5cbc6eSMarkus Stockhausen if (perf > bestgenperf) {
187fe5cbc6eSMarkus Stockhausen bestgenperf = perf;
18896e67703SJim Kukunas best = *algo;
189cc4589ebSDavid Woodhouse }
190fe5cbc6eSMarkus Stockhausen pr_info("raid6: %-8s gen() %5ld MB/s\n", (*algo)->name,
191f591df3cSZhengyuan Liu (perf * HZ * (disks-2)) >>
192f591df3cSZhengyuan Liu (20 - PAGE_SHIFT + RAID6_TIME_JIFFIES_LG2));
19338640c48SDirk Müller }
19438640c48SDirk Müller }
195fe5cbc6eSMarkus Stockhausen
19638640c48SDirk Müller if (!best) {
19738640c48SDirk Müller pr_err("raid6: Yikes! No algorithm found!\n");
19838640c48SDirk Müller goto out;
19938640c48SDirk Müller }
200fe5cbc6eSMarkus Stockhausen
20138640c48SDirk Müller raid6_call = *best;
20238640c48SDirk Müller
20338640c48SDirk Müller if (!IS_ENABLED(CONFIG_RAID6_PQ_BENCHMARK)) {
20438640c48SDirk Müller pr_info("raid6: skipped pq benchmark and selected %s\n",
20538640c48SDirk Müller best->name);
20638640c48SDirk Müller goto out;
20738640c48SDirk Müller }
20838640c48SDirk Müller
20938640c48SDirk Müller pr_info("raid6: using algorithm %s gen() %ld MB/s\n",
21038640c48SDirk Müller best->name,
21138640c48SDirk Müller (bestgenperf * HZ * (disks - 2)) >>
21238640c48SDirk Müller (20 - PAGE_SHIFT + RAID6_TIME_JIFFIES_LG2));
21338640c48SDirk Müller
21438640c48SDirk Müller if (best->xor_syndrome) {
215fe5cbc6eSMarkus Stockhausen perf = 0;
216fe5cbc6eSMarkus Stockhausen
217fe5cbc6eSMarkus Stockhausen preempt_disable();
218fe5cbc6eSMarkus Stockhausen j0 = jiffies;
219fe5cbc6eSMarkus Stockhausen while ((j1 = jiffies) == j0)
220fe5cbc6eSMarkus Stockhausen cpu_relax();
221fe5cbc6eSMarkus Stockhausen while (time_before(jiffies,
222fe5cbc6eSMarkus Stockhausen j1 + (1 << RAID6_TIME_JIFFIES_LG2))) {
22338640c48SDirk Müller best->xor_syndrome(disks, start, stop,
224fe5cbc6eSMarkus Stockhausen PAGE_SIZE, *dptrs);
225fe5cbc6eSMarkus Stockhausen perf++;
226fe5cbc6eSMarkus Stockhausen }
227fe5cbc6eSMarkus Stockhausen preempt_enable();
228fe5cbc6eSMarkus Stockhausen
22938640c48SDirk Müller pr_info("raid6: .... xor() %ld MB/s, rmw enabled\n",
230f591df3cSZhengyuan Liu (perf * HZ * (disks - 2)) >>
231f591df3cSZhengyuan Liu (20 - PAGE_SHIFT + RAID6_TIME_JIFFIES_LG2 + 1));
232cc4589ebSDavid Woodhouse }
233cc4589ebSDavid Woodhouse
23438640c48SDirk Müller out:
23596e67703SJim Kukunas return best;
23696e67703SJim Kukunas }
23796e67703SJim Kukunas
23896e67703SJim Kukunas
23996e67703SJim Kukunas /* Try to pick the best algorithm */
24096e67703SJim Kukunas /* This code uses the gfmul table as convenient data set to abuse */
24196e67703SJim Kukunas
raid6_select_algo(void)24296e67703SJim Kukunas int __init raid6_select_algo(void)
24396e67703SJim Kukunas {
244f591df3cSZhengyuan Liu const int disks = RAID6_TEST_DISKS;
24596e67703SJim Kukunas
24696e67703SJim Kukunas const struct raid6_calls *gen_best;
24796e67703SJim Kukunas const struct raid6_recov_calls *rec_best;
248f591df3cSZhengyuan Liu char *disk_ptr, *p;
249f591df3cSZhengyuan Liu void *dptrs[RAID6_TEST_DISKS];
250f591df3cSZhengyuan Liu int i, cycle;
25196e67703SJim Kukunas
252f591df3cSZhengyuan Liu /* prepare the buffer and fill it circularly with gfmul table */
253f591df3cSZhengyuan Liu disk_ptr = (char *)__get_free_pages(GFP_KERNEL, RAID6_TEST_DISKS_ORDER);
254f591df3cSZhengyuan Liu if (!disk_ptr) {
255b395f75eSAnton Blanchard pr_err("raid6: Yikes! No memory available.\n");
25696e67703SJim Kukunas return -ENOMEM;
25796e67703SJim Kukunas }
25896e67703SJim Kukunas
259f591df3cSZhengyuan Liu p = disk_ptr;
260f591df3cSZhengyuan Liu for (i = 0; i < disks; i++)
261f591df3cSZhengyuan Liu dptrs[i] = p + PAGE_SIZE * i;
262f591df3cSZhengyuan Liu
263f591df3cSZhengyuan Liu cycle = ((disks - 2) * PAGE_SIZE) / 65536;
264f591df3cSZhengyuan Liu for (i = 0; i < cycle; i++) {
265f591df3cSZhengyuan Liu memcpy(p, raid6_gfmul, 65536);
266f591df3cSZhengyuan Liu p += 65536;
267f591df3cSZhengyuan Liu }
268f591df3cSZhengyuan Liu
269f591df3cSZhengyuan Liu if ((disks - 2) * PAGE_SIZE % 65536)
270f591df3cSZhengyuan Liu memcpy(p, raid6_gfmul, (disks - 2) * PAGE_SIZE % 65536);
27196e67703SJim Kukunas
27296e67703SJim Kukunas /* select raid gen_syndrome function */
27396e67703SJim Kukunas gen_best = raid6_choose_gen(&dptrs, disks);
274cc4589ebSDavid Woodhouse
275048a8b8cSJim Kukunas /* select raid recover functions */
27696e67703SJim Kukunas rec_best = raid6_choose_recov();
277048a8b8cSJim Kukunas
278f591df3cSZhengyuan Liu free_pages((unsigned long)disk_ptr, RAID6_TEST_DISKS_ORDER);
27996e67703SJim Kukunas
28096e67703SJim Kukunas return gen_best && rec_best ? 0 : -EINVAL;
281cc4589ebSDavid Woodhouse }
282cc4589ebSDavid Woodhouse
/* Module exit hook: intentionally does nothing. */
static void raid6_exit(void)
{
}
287cc4589ebSDavid Woodhouse
288cc4589ebSDavid Woodhouse subsys_initcall(raid6_select_algo);
289cc4589ebSDavid Woodhouse module_exit(raid6_exit);
290cc4589ebSDavid Woodhouse MODULE_LICENSE("GPL");
291cc4589ebSDavid Woodhouse MODULE_DESCRIPTION("RAID6 Q-syndrome calculations");
292