Linux Audio

Check our new training course

Loading...
v5.4
/* SPDX-License-Identifier: GPL-2.0-or-later */
/*
 * include/asm-generic/xor.h
 *
 * Generic optimized RAID-5 checksumming functions.
 */
  7
  8#include <linux/prefetch.h>
  9
 10static void
 11xor_8regs_2(unsigned long bytes, unsigned long *p1, unsigned long *p2)
 12{
 13	long lines = bytes / (sizeof (long)) / 8;
 14
 15	do {
 16		p1[0] ^= p2[0];
 17		p1[1] ^= p2[1];
 18		p1[2] ^= p2[2];
 19		p1[3] ^= p2[3];
 20		p1[4] ^= p2[4];
 21		p1[5] ^= p2[5];
 22		p1[6] ^= p2[6];
 23		p1[7] ^= p2[7];
 24		p1 += 8;
 25		p2 += 8;
 26	} while (--lines > 0);
 27}
 28
 29static void
 30xor_8regs_3(unsigned long bytes, unsigned long *p1, unsigned long *p2,
 31	    unsigned long *p3)
 32{
 33	long lines = bytes / (sizeof (long)) / 8;
 34
 35	do {
 36		p1[0] ^= p2[0] ^ p3[0];
 37		p1[1] ^= p2[1] ^ p3[1];
 38		p1[2] ^= p2[2] ^ p3[2];
 39		p1[3] ^= p2[3] ^ p3[3];
 40		p1[4] ^= p2[4] ^ p3[4];
 41		p1[5] ^= p2[5] ^ p3[5];
 42		p1[6] ^= p2[6] ^ p3[6];
 43		p1[7] ^= p2[7] ^ p3[7];
 44		p1 += 8;
 45		p2 += 8;
 46		p3 += 8;
 47	} while (--lines > 0);
 48}
 49
 50static void
 51xor_8regs_4(unsigned long bytes, unsigned long *p1, unsigned long *p2,
 52	    unsigned long *p3, unsigned long *p4)
 53{
 54	long lines = bytes / (sizeof (long)) / 8;
 55
 56	do {
 57		p1[0] ^= p2[0] ^ p3[0] ^ p4[0];
 58		p1[1] ^= p2[1] ^ p3[1] ^ p4[1];
 59		p1[2] ^= p2[2] ^ p3[2] ^ p4[2];
 60		p1[3] ^= p2[3] ^ p3[3] ^ p4[3];
 61		p1[4] ^= p2[4] ^ p3[4] ^ p4[4];
 62		p1[5] ^= p2[5] ^ p3[5] ^ p4[5];
 63		p1[6] ^= p2[6] ^ p3[6] ^ p4[6];
 64		p1[7] ^= p2[7] ^ p3[7] ^ p4[7];
 65		p1 += 8;
 66		p2 += 8;
 67		p3 += 8;
 68		p4 += 8;
 69	} while (--lines > 0);
 70}
 71
 72static void
 73xor_8regs_5(unsigned long bytes, unsigned long *p1, unsigned long *p2,
 74	    unsigned long *p3, unsigned long *p4, unsigned long *p5)
 75{
 76	long lines = bytes / (sizeof (long)) / 8;
 77
 78	do {
 79		p1[0] ^= p2[0] ^ p3[0] ^ p4[0] ^ p5[0];
 80		p1[1] ^= p2[1] ^ p3[1] ^ p4[1] ^ p5[1];
 81		p1[2] ^= p2[2] ^ p3[2] ^ p4[2] ^ p5[2];
 82		p1[3] ^= p2[3] ^ p3[3] ^ p4[3] ^ p5[3];
 83		p1[4] ^= p2[4] ^ p3[4] ^ p4[4] ^ p5[4];
 84		p1[5] ^= p2[5] ^ p3[5] ^ p4[5] ^ p5[5];
 85		p1[6] ^= p2[6] ^ p3[6] ^ p4[6] ^ p5[6];
 86		p1[7] ^= p2[7] ^ p3[7] ^ p4[7] ^ p5[7];
 87		p1 += 8;
 88		p2 += 8;
 89		p3 += 8;
 90		p4 += 8;
 91		p5 += 8;
 92	} while (--lines > 0);
 93}
 94
 95static void
 96xor_32regs_2(unsigned long bytes, unsigned long *p1, unsigned long *p2)
 97{
 98	long lines = bytes / (sizeof (long)) / 8;
 99
100	do {
101		register long d0, d1, d2, d3, d4, d5, d6, d7;
102		d0 = p1[0];	/* Pull the stuff into registers	*/
103		d1 = p1[1];	/*  ... in bursts, if possible.		*/
104		d2 = p1[2];
105		d3 = p1[3];
106		d4 = p1[4];
107		d5 = p1[5];
108		d6 = p1[6];
109		d7 = p1[7];
110		d0 ^= p2[0];
111		d1 ^= p2[1];
112		d2 ^= p2[2];
113		d3 ^= p2[3];
114		d4 ^= p2[4];
115		d5 ^= p2[5];
116		d6 ^= p2[6];
117		d7 ^= p2[7];
118		p1[0] = d0;	/* Store the result (in bursts)		*/
119		p1[1] = d1;
120		p1[2] = d2;
121		p1[3] = d3;
122		p1[4] = d4;
123		p1[5] = d5;
124		p1[6] = d6;
125		p1[7] = d7;
126		p1 += 8;
127		p2 += 8;
128	} while (--lines > 0);
129}
130
/*
 * xor_32regs_3 - XOR the words of p2 and p3 into p1 through eight local
 *                temporaries.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes p1 ^ p2 ^ p3.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 *
 * Each pass loads eight words of p1, folds in the source words, and only
 * then writes the eight results back.
 */
static void
xor_32regs_3(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	do {
		register long d0, d1, d2, d3, d4, d5, d6, d7;
		d0 = p1[0];	/* Pull the stuff into registers	*/
		d1 = p1[1];	/*  ... in bursts, if possible.		*/
		d2 = p1[2];
		d3 = p1[3];
		d4 = p1[4];
		d5 = p1[5];
		d6 = p1[6];
		d7 = p1[7];
		d0 ^= p2[0];
		d1 ^= p2[1];
		d2 ^= p2[2];
		d3 ^= p2[3];
		d4 ^= p2[4];
		d5 ^= p2[5];
		d6 ^= p2[6];
		d7 ^= p2[7];
		d0 ^= p3[0];
		d1 ^= p3[1];
		d2 ^= p3[2];
		d3 ^= p3[3];
		d4 ^= p3[4];
		d5 ^= p3[5];
		d6 ^= p3[6];
		d7 ^= p3[7];
		p1[0] = d0;	/* Store the result (in bursts)		*/
		p1[1] = d1;
		p1[2] = d2;
		p1[3] = d3;
		p1[4] = d4;
		p1[5] = d5;
		p1[6] = d6;
		p1[7] = d7;
		p1 += 8;
		p2 += 8;
		p3 += 8;
	} while (--lines > 0);
}
176
/*
 * xor_32regs_4 - XOR the words of p2, p3 and p4 into p1 through eight local
 *                temporaries.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes
 *         p1 ^ p2 ^ p3 ^ p4.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 * @p4:    source buffer, only read.
 *
 * Each pass loads eight words of p1, folds in the source words, and only
 * then writes the eight results back.
 */
static void
xor_32regs_4(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3, unsigned long *p4)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	do {
		register long d0, d1, d2, d3, d4, d5, d6, d7;
		d0 = p1[0];	/* Pull the stuff into registers	*/
		d1 = p1[1];	/*  ... in bursts, if possible.		*/
		d2 = p1[2];
		d3 = p1[3];
		d4 = p1[4];
		d5 = p1[5];
		d6 = p1[6];
		d7 = p1[7];
		d0 ^= p2[0];
		d1 ^= p2[1];
		d2 ^= p2[2];
		d3 ^= p2[3];
		d4 ^= p2[4];
		d5 ^= p2[5];
		d6 ^= p2[6];
		d7 ^= p2[7];
		d0 ^= p3[0];
		d1 ^= p3[1];
		d2 ^= p3[2];
		d3 ^= p3[3];
		d4 ^= p3[4];
		d5 ^= p3[5];
		d6 ^= p3[6];
		d7 ^= p3[7];
		d0 ^= p4[0];
		d1 ^= p4[1];
		d2 ^= p4[2];
		d3 ^= p4[3];
		d4 ^= p4[4];
		d5 ^= p4[5];
		d6 ^= p4[6];
		d7 ^= p4[7];
		p1[0] = d0;	/* Store the result (in bursts)		*/
		p1[1] = d1;
		p1[2] = d2;
		p1[3] = d3;
		p1[4] = d4;
		p1[5] = d5;
		p1[6] = d6;
		p1[7] = d7;
		p1 += 8;
		p2 += 8;
		p3 += 8;
		p4 += 8;
	} while (--lines > 0);
}
231
/*
 * xor_32regs_5 - XOR the words of p2..p5 into p1 through eight local
 *                temporaries.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes
 *         p1 ^ p2 ^ p3 ^ p4 ^ p5.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 * @p4:    source buffer, only read.
 * @p5:    source buffer, only read.
 *
 * Each pass loads eight words of p1, folds in the source words, and only
 * then writes the eight results back.
 */
static void
xor_32regs_5(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3, unsigned long *p4, unsigned long *p5)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	do {
		register long d0, d1, d2, d3, d4, d5, d6, d7;
		d0 = p1[0];	/* Pull the stuff into registers	*/
		d1 = p1[1];	/*  ... in bursts, if possible.		*/
		d2 = p1[2];
		d3 = p1[3];
		d4 = p1[4];
		d5 = p1[5];
		d6 = p1[6];
		d7 = p1[7];
		d0 ^= p2[0];
		d1 ^= p2[1];
		d2 ^= p2[2];
		d3 ^= p2[3];
		d4 ^= p2[4];
		d5 ^= p2[5];
		d6 ^= p2[6];
		d7 ^= p2[7];
		d0 ^= p3[0];
		d1 ^= p3[1];
		d2 ^= p3[2];
		d3 ^= p3[3];
		d4 ^= p3[4];
		d5 ^= p3[5];
		d6 ^= p3[6];
		d7 ^= p3[7];
		d0 ^= p4[0];
		d1 ^= p4[1];
		d2 ^= p4[2];
		d3 ^= p4[3];
		d4 ^= p4[4];
		d5 ^= p4[5];
		d6 ^= p4[6];
		d7 ^= p4[7];
		d0 ^= p5[0];
		d1 ^= p5[1];
		d2 ^= p5[2];
		d3 ^= p5[3];
		d4 ^= p5[4];
		d5 ^= p5[5];
		d6 ^= p5[6];
		d7 ^= p5[7];
		p1[0] = d0;	/* Store the result (in bursts)		*/
		p1[1] = d1;
		p1[2] = d2;
		p1[3] = d3;
		p1[4] = d4;
		p1[5] = d5;
		p1[6] = d6;
		p1[7] = d7;
		p1 += 8;
		p2 += 8;
		p3 += 8;
		p4 += 8;
		p5 += 8;
	} while (--lines > 0);
}
295
/*
 * xor_8regs_p_2 - XOR the words of p2 into p1, eight words per pass, with
 *                 look-ahead prefetching.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes p1 ^ p2.
 * @p2:    source buffer, only read.
 *
 * prefetchw() is issued on the destination and prefetch() on the source,
 * first for the current line and then, inside the loop, for the next one.
 */
static void
xor_8regs_p_2(unsigned long bytes, unsigned long *p1, unsigned long *p2)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	/* the loop counts the lines that get a look-ahead prefetch */
	lines--;
	prefetchw(p1);
	prefetch(p2);

	do {
		prefetchw(p1+8);
		prefetch(p2+8);
 once_more:
		p1[0] ^= p2[0];
		p1[1] ^= p2[1];
		p1[2] ^= p2[2];
		p1[3] ^= p2[3];
		p1[4] ^= p2[4];
		p1[5] ^= p2[5];
		p1[6] ^= p2[6];
		p1[7] ^= p2[7];
		p1 += 8;
		p2 += 8;
	} while (--lines > 0);
	/*
	 * With two or more lines the counter stops at exactly 0 once: the
	 * last line is then processed without prefetching past it, after
	 * which the counter is -1 and the function returns.
	 */
	if (lines == 0)
		goto once_more;
}
321
/*
 * xor_8regs_p_3 - XOR the words of p2 and p3 into p1, eight words per pass,
 *                 with look-ahead prefetching.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes p1 ^ p2 ^ p3.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 *
 * prefetchw() is issued on the destination and prefetch() on the sources,
 * first for the current line and then, inside the loop, for the next one.
 */
static void
xor_8regs_p_3(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	/* the loop counts the lines that get a look-ahead prefetch */
	lines--;
	prefetchw(p1);
	prefetch(p2);
	prefetch(p3);

	do {
		prefetchw(p1+8);
		prefetch(p2+8);
		prefetch(p3+8);
 once_more:
		p1[0] ^= p2[0] ^ p3[0];
		p1[1] ^= p2[1] ^ p3[1];
		p1[2] ^= p2[2] ^ p3[2];
		p1[3] ^= p2[3] ^ p3[3];
		p1[4] ^= p2[4] ^ p3[4];
		p1[5] ^= p2[5] ^ p3[5];
		p1[6] ^= p2[6] ^ p3[6];
		p1[7] ^= p2[7] ^ p3[7];
		p1 += 8;
		p2 += 8;
		p3 += 8;
	} while (--lines > 0);
	/*
	 * With two or more lines the counter stops at exactly 0 once: the
	 * last line is then processed without prefetching past it, after
	 * which the counter is -1 and the function returns.
	 */
	if (lines == 0)
		goto once_more;
}
351
/*
 * xor_8regs_p_4 - XOR the words of p2, p3 and p4 into p1, eight words per
 *                 pass, with look-ahead prefetching.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes
 *         p1 ^ p2 ^ p3 ^ p4.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 * @p4:    source buffer, only read.
 *
 * prefetchw() is issued on the destination and prefetch() on the sources,
 * first for the current line and then, inside the loop, for the next one.
 */
static void
xor_8regs_p_4(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3, unsigned long *p4)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	/* the loop counts the lines that get a look-ahead prefetch */
	lines--;

	prefetchw(p1);
	prefetch(p2);
	prefetch(p3);
	prefetch(p4);

	do {
		prefetchw(p1+8);
		prefetch(p2+8);
		prefetch(p3+8);
		prefetch(p4+8);
 once_more:
		p1[0] ^= p2[0] ^ p3[0] ^ p4[0];
		p1[1] ^= p2[1] ^ p3[1] ^ p4[1];
		p1[2] ^= p2[2] ^ p3[2] ^ p4[2];
		p1[3] ^= p2[3] ^ p3[3] ^ p4[3];
		p1[4] ^= p2[4] ^ p3[4] ^ p4[4];
		p1[5] ^= p2[5] ^ p3[5] ^ p4[5];
		p1[6] ^= p2[6] ^ p3[6] ^ p4[6];
		p1[7] ^= p2[7] ^ p3[7] ^ p4[7];
		p1 += 8;
		p2 += 8;
		p3 += 8;
		p4 += 8;
	} while (--lines > 0);
	/*
	 * With two or more lines the counter stops at exactly 0 once: the
	 * last line is then processed without prefetching past it, after
	 * which the counter is -1 and the function returns.
	 */
	if (lines == 0)
		goto once_more;
}
385
/*
 * xor_8regs_p_5 - XOR the words of p2..p5 into p1, eight words per pass,
 *                 with look-ahead prefetching.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes
 *         p1 ^ p2 ^ p3 ^ p4 ^ p5.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 * @p4:    source buffer, only read.
 * @p5:    source buffer, only read.
 *
 * prefetchw() is issued on the destination and prefetch() on the sources,
 * first for the current line and then, inside the loop, for the next one.
 */
static void
xor_8regs_p_5(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3, unsigned long *p4, unsigned long *p5)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	/* the loop counts the lines that get a look-ahead prefetch */
	lines--;

	prefetchw(p1);
	prefetch(p2);
	prefetch(p3);
	prefetch(p4);
	prefetch(p5);

	do {
		prefetchw(p1+8);
		prefetch(p2+8);
		prefetch(p3+8);
		prefetch(p4+8);
		prefetch(p5+8);
 once_more:
		p1[0] ^= p2[0] ^ p3[0] ^ p4[0] ^ p5[0];
		p1[1] ^= p2[1] ^ p3[1] ^ p4[1] ^ p5[1];
		p1[2] ^= p2[2] ^ p3[2] ^ p4[2] ^ p5[2];
		p1[3] ^= p2[3] ^ p3[3] ^ p4[3] ^ p5[3];
		p1[4] ^= p2[4] ^ p3[4] ^ p4[4] ^ p5[4];
		p1[5] ^= p2[5] ^ p3[5] ^ p4[5] ^ p5[5];
		p1[6] ^= p2[6] ^ p3[6] ^ p4[6] ^ p5[6];
		p1[7] ^= p2[7] ^ p3[7] ^ p4[7] ^ p5[7];
		p1 += 8;
		p2 += 8;
		p3 += 8;
		p4 += 8;
		p5 += 8;
	} while (--lines > 0);
	/*
	 * With two or more lines the counter stops at exactly 0 once: the
	 * last line is then processed without prefetching past it, after
	 * which the counter is -1 and the function returns.
	 */
	if (lines == 0)
		goto once_more;
}
422
/*
 * xor_32regs_p_2 - XOR the words of p2 into p1 through eight local
 *                  temporaries, with look-ahead prefetching.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes p1 ^ p2.
 * @p2:    source buffer, only read.
 *
 * Each pass loads eight words of p1, folds in the source words, and only
 * then writes the eight results back. prefetchw() is issued on the
 * destination and prefetch() on the source, first for the current line and
 * then, inside the loop, for the next one.
 */
static void
xor_32regs_p_2(unsigned long bytes, unsigned long *p1, unsigned long *p2)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	/* the loop counts the lines that get a look-ahead prefetch */
	lines--;

	prefetchw(p1);
	prefetch(p2);

	do {
		register long d0, d1, d2, d3, d4, d5, d6, d7;

		prefetchw(p1+8);
		prefetch(p2+8);
 once_more:
		d0 = p1[0];	/* Pull the stuff into registers	*/
		d1 = p1[1];	/*  ... in bursts, if possible.		*/
		d2 = p1[2];
		d3 = p1[3];
		d4 = p1[4];
		d5 = p1[5];
		d6 = p1[6];
		d7 = p1[7];
		d0 ^= p2[0];
		d1 ^= p2[1];
		d2 ^= p2[2];
		d3 ^= p2[3];
		d4 ^= p2[4];
		d5 ^= p2[5];
		d6 ^= p2[6];
		d7 ^= p2[7];
		p1[0] = d0;	/* Store the result (in bursts)		*/
		p1[1] = d1;
		p1[2] = d2;
		p1[3] = d3;
		p1[4] = d4;
		p1[5] = d5;
		p1[6] = d6;
		p1[7] = d7;
		p1 += 8;
		p2 += 8;
	} while (--lines > 0);
	/*
	 * With two or more lines the counter stops at exactly 0 once: the
	 * last line is then processed without prefetching past it, after
	 * which the counter is -1 and the function returns.
	 */
	if (lines == 0)
		goto once_more;
}
467
/*
 * xor_32regs_p_3 - XOR the words of p2 and p3 into p1 through eight local
 *                  temporaries, with look-ahead prefetching.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes p1 ^ p2 ^ p3.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 *
 * Each pass loads eight words of p1, folds in the source words, and only
 * then writes the eight results back. prefetchw() is issued on the
 * destination and prefetch() on the sources, first for the current line
 * and then, inside the loop, for the next one.
 */
static void
xor_32regs_p_3(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	/* the loop counts the lines that get a look-ahead prefetch */
	lines--;

	prefetchw(p1);
	prefetch(p2);
	prefetch(p3);

	do {
		register long d0, d1, d2, d3, d4, d5, d6, d7;

		prefetchw(p1+8);
		prefetch(p2+8);
		prefetch(p3+8);
 once_more:
		d0 = p1[0];	/* Pull the stuff into registers	*/
		d1 = p1[1];	/*  ... in bursts, if possible.		*/
		d2 = p1[2];
		d3 = p1[3];
		d4 = p1[4];
		d5 = p1[5];
		d6 = p1[6];
		d7 = p1[7];
		d0 ^= p2[0];
		d1 ^= p2[1];
		d2 ^= p2[2];
		d3 ^= p2[3];
		d4 ^= p2[4];
		d5 ^= p2[5];
		d6 ^= p2[6];
		d7 ^= p2[7];
		d0 ^= p3[0];
		d1 ^= p3[1];
		d2 ^= p3[2];
		d3 ^= p3[3];
		d4 ^= p3[4];
		d5 ^= p3[5];
		d6 ^= p3[6];
		d7 ^= p3[7];
		p1[0] = d0;	/* Store the result (in bursts)		*/
		p1[1] = d1;
		p1[2] = d2;
		p1[3] = d3;
		p1[4] = d4;
		p1[5] = d5;
		p1[6] = d6;
		p1[7] = d7;
		p1 += 8;
		p2 += 8;
		p3 += 8;
	} while (--lines > 0);
	/*
	 * With two or more lines the counter stops at exactly 0 once: the
	 * last line is then processed without prefetching past it, after
	 * which the counter is -1 and the function returns.
	 */
	if (lines == 0)
		goto once_more;
}
524
/*
 * xor_32regs_p_4 - XOR the words of p2, p3 and p4 into p1 through eight
 *                  local temporaries, with look-ahead prefetching.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes
 *         p1 ^ p2 ^ p3 ^ p4.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 * @p4:    source buffer, only read.
 *
 * Each pass loads eight words of p1, folds in the source words, and only
 * then writes the eight results back. prefetchw() is issued on the
 * destination and prefetch() on the sources, first for the current line
 * and then, inside the loop, for the next one.
 */
static void
xor_32regs_p_4(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3, unsigned long *p4)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	/* the loop counts the lines that get a look-ahead prefetch */
	lines--;

	prefetchw(p1);
	prefetch(p2);
	prefetch(p3);
	prefetch(p4);

	do {
		register long d0, d1, d2, d3, d4, d5, d6, d7;

		prefetchw(p1+8);
		prefetch(p2+8);
		prefetch(p3+8);
		prefetch(p4+8);
 once_more:
		d0 = p1[0];	/* Pull the stuff into registers	*/
		d1 = p1[1];	/*  ... in bursts, if possible.		*/
		d2 = p1[2];
		d3 = p1[3];
		d4 = p1[4];
		d5 = p1[5];
		d6 = p1[6];
		d7 = p1[7];
		d0 ^= p2[0];
		d1 ^= p2[1];
		d2 ^= p2[2];
		d3 ^= p2[3];
		d4 ^= p2[4];
		d5 ^= p2[5];
		d6 ^= p2[6];
		d7 ^= p2[7];
		d0 ^= p3[0];
		d1 ^= p3[1];
		d2 ^= p3[2];
		d3 ^= p3[3];
		d4 ^= p3[4];
		d5 ^= p3[5];
		d6 ^= p3[6];
		d7 ^= p3[7];
		d0 ^= p4[0];
		d1 ^= p4[1];
		d2 ^= p4[2];
		d3 ^= p4[3];
		d4 ^= p4[4];
		d5 ^= p4[5];
		d6 ^= p4[6];
		d7 ^= p4[7];
		p1[0] = d0;	/* Store the result (in bursts)		*/
		p1[1] = d1;
		p1[2] = d2;
		p1[3] = d3;
		p1[4] = d4;
		p1[5] = d5;
		p1[6] = d6;
		p1[7] = d7;
		p1 += 8;
		p2 += 8;
		p3 += 8;
		p4 += 8;
	} while (--lines > 0);
	/*
	 * With two or more lines the counter stops at exactly 0 once: the
	 * last line is then processed without prefetching past it, after
	 * which the counter is -1 and the function returns.
	 */
	if (lines == 0)
		goto once_more;
}
592
/*
 * xor_32regs_p_5 - XOR the words of p2..p5 into p1 through eight local
 *                  temporaries, with look-ahead prefetching.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes
 *         p1 ^ p2 ^ p3 ^ p4 ^ p5.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 * @p4:    source buffer, only read.
 * @p5:    source buffer, only read.
 *
 * Each pass loads eight words of p1, folds in the source words, and only
 * then writes the eight results back. prefetchw() is issued on the
 * destination and prefetch() on the sources, first for the current line
 * and then, inside the loop, for the next one.
 */
static void
xor_32regs_p_5(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3, unsigned long *p4, unsigned long *p5)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	/* the loop counts the lines that get a look-ahead prefetch */
	lines--;

	prefetchw(p1);
	prefetch(p2);
	prefetch(p3);
	prefetch(p4);
	prefetch(p5);

	do {
		register long d0, d1, d2, d3, d4, d5, d6, d7;

		prefetchw(p1+8);
		prefetch(p2+8);
		prefetch(p3+8);
		prefetch(p4+8);
		prefetch(p5+8);
 once_more:
		d0 = p1[0];	/* Pull the stuff into registers	*/
		d1 = p1[1];	/*  ... in bursts, if possible.		*/
		d2 = p1[2];
		d3 = p1[3];
		d4 = p1[4];
		d5 = p1[5];
		d6 = p1[6];
		d7 = p1[7];
		d0 ^= p2[0];
		d1 ^= p2[1];
		d2 ^= p2[2];
		d3 ^= p2[3];
		d4 ^= p2[4];
		d5 ^= p2[5];
		d6 ^= p2[6];
		d7 ^= p2[7];
		d0 ^= p3[0];
		d1 ^= p3[1];
		d2 ^= p3[2];
		d3 ^= p3[3];
		d4 ^= p3[4];
		d5 ^= p3[5];
		d6 ^= p3[6];
		d7 ^= p3[7];
		d0 ^= p4[0];
		d1 ^= p4[1];
		d2 ^= p4[2];
		d3 ^= p4[3];
		d4 ^= p4[4];
		d5 ^= p4[5];
		d6 ^= p4[6];
		d7 ^= p4[7];
		d0 ^= p5[0];
		d1 ^= p5[1];
		d2 ^= p5[2];
		d3 ^= p5[3];
		d4 ^= p5[4];
		d5 ^= p5[5];
		d6 ^= p5[6];
		d7 ^= p5[7];
		p1[0] = d0;	/* Store the result (in bursts)		*/
		p1[1] = d1;
		p1[2] = d2;
		p1[3] = d3;
		p1[4] = d4;
		p1[5] = d5;
		p1[6] = d6;
		p1[7] = d7;
		p1 += 8;
		p2 += 8;
		p3 += 8;
		p4 += 8;
		p5 += 8;
	} while (--lines > 0);
	/*
	 * With two or more lines the counter stops at exactly 0 once: the
	 * last line is then processed without prefetching past it, after
	 * which the counter is -1 and the function returns.
	 */
	if (lines == 0)
		goto once_more;
}
671
672static struct xor_block_template xor_block_8regs = {
673	.name = "8regs",
674	.do_2 = xor_8regs_2,
675	.do_3 = xor_8regs_3,
676	.do_4 = xor_8regs_4,
677	.do_5 = xor_8regs_5,
678};
679
680static struct xor_block_template xor_block_32regs = {
681	.name = "32regs",
682	.do_2 = xor_32regs_2,
683	.do_3 = xor_32regs_3,
684	.do_4 = xor_32regs_4,
685	.do_5 = xor_32regs_5,
686};
687
688static struct xor_block_template xor_block_8regs_p __maybe_unused = {
689	.name = "8regs_prefetch",
690	.do_2 = xor_8regs_p_2,
691	.do_3 = xor_8regs_p_3,
692	.do_4 = xor_8regs_p_4,
693	.do_5 = xor_8regs_p_5,
694};
695
696static struct xor_block_template xor_block_32regs_p __maybe_unused = {
697	.name = "32regs_prefetch",
698	.do_2 = xor_32regs_p_2,
699	.do_3 = xor_32regs_p_3,
700	.do_4 = xor_32regs_p_4,
701	.do_5 = xor_32regs_p_5,
702};
703
/*
 * Hands each of the four templates defined in this file to xor_speed(),
 * each plain variant followed by its prefetching counterpart.
 * NOTE(review): xor_speed() is not defined here; presumably it times each
 * template - confirm against the includer.
 */
#define XOR_TRY_TEMPLATES				\
	do {						\
		xor_speed(&xor_block_8regs);		\
		xor_speed(&xor_block_8regs_p);		\
		xor_speed(&xor_block_32regs);		\
		xor_speed(&xor_block_32regs_p);		\
	} while (0)
v3.5.6
 
  1/*
  2 * include/asm-generic/xor.h
  3 *
  4 * Generic optimized RAID-5 checksumming functions.
  5 *
  6 * This program is free software; you can redistribute it and/or modify
  7 * it under the terms of the GNU General Public License as published by
  8 * the Free Software Foundation; either version 2, or (at your option)
  9 * any later version.
 10 *
 11 * You should have received a copy of the GNU General Public License
 12 * (for example /usr/src/linux/COPYING); if not, write to the Free
 13 * Software Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
 14 */
 15
 16#include <linux/prefetch.h>
 17
 18static void
 19xor_8regs_2(unsigned long bytes, unsigned long *p1, unsigned long *p2)
 20{
 21	long lines = bytes / (sizeof (long)) / 8;
 22
 23	do {
 24		p1[0] ^= p2[0];
 25		p1[1] ^= p2[1];
 26		p1[2] ^= p2[2];
 27		p1[3] ^= p2[3];
 28		p1[4] ^= p2[4];
 29		p1[5] ^= p2[5];
 30		p1[6] ^= p2[6];
 31		p1[7] ^= p2[7];
 32		p1 += 8;
 33		p2 += 8;
 34	} while (--lines > 0);
 35}
 36
 37static void
 38xor_8regs_3(unsigned long bytes, unsigned long *p1, unsigned long *p2,
 39	    unsigned long *p3)
 40{
 41	long lines = bytes / (sizeof (long)) / 8;
 42
 43	do {
 44		p1[0] ^= p2[0] ^ p3[0];
 45		p1[1] ^= p2[1] ^ p3[1];
 46		p1[2] ^= p2[2] ^ p3[2];
 47		p1[3] ^= p2[3] ^ p3[3];
 48		p1[4] ^= p2[4] ^ p3[4];
 49		p1[5] ^= p2[5] ^ p3[5];
 50		p1[6] ^= p2[6] ^ p3[6];
 51		p1[7] ^= p2[7] ^ p3[7];
 52		p1 += 8;
 53		p2 += 8;
 54		p3 += 8;
 55	} while (--lines > 0);
 56}
 57
 58static void
 59xor_8regs_4(unsigned long bytes, unsigned long *p1, unsigned long *p2,
 60	    unsigned long *p3, unsigned long *p4)
 61{
 62	long lines = bytes / (sizeof (long)) / 8;
 63
 64	do {
 65		p1[0] ^= p2[0] ^ p3[0] ^ p4[0];
 66		p1[1] ^= p2[1] ^ p3[1] ^ p4[1];
 67		p1[2] ^= p2[2] ^ p3[2] ^ p4[2];
 68		p1[3] ^= p2[3] ^ p3[3] ^ p4[3];
 69		p1[4] ^= p2[4] ^ p3[4] ^ p4[4];
 70		p1[5] ^= p2[5] ^ p3[5] ^ p4[5];
 71		p1[6] ^= p2[6] ^ p3[6] ^ p4[6];
 72		p1[7] ^= p2[7] ^ p3[7] ^ p4[7];
 73		p1 += 8;
 74		p2 += 8;
 75		p3 += 8;
 76		p4 += 8;
 77	} while (--lines > 0);
 78}
 79
 80static void
 81xor_8regs_5(unsigned long bytes, unsigned long *p1, unsigned long *p2,
 82	    unsigned long *p3, unsigned long *p4, unsigned long *p5)
 83{
 84	long lines = bytes / (sizeof (long)) / 8;
 85
 86	do {
 87		p1[0] ^= p2[0] ^ p3[0] ^ p4[0] ^ p5[0];
 88		p1[1] ^= p2[1] ^ p3[1] ^ p4[1] ^ p5[1];
 89		p1[2] ^= p2[2] ^ p3[2] ^ p4[2] ^ p5[2];
 90		p1[3] ^= p2[3] ^ p3[3] ^ p4[3] ^ p5[3];
 91		p1[4] ^= p2[4] ^ p3[4] ^ p4[4] ^ p5[4];
 92		p1[5] ^= p2[5] ^ p3[5] ^ p4[5] ^ p5[5];
 93		p1[6] ^= p2[6] ^ p3[6] ^ p4[6] ^ p5[6];
 94		p1[7] ^= p2[7] ^ p3[7] ^ p4[7] ^ p5[7];
 95		p1 += 8;
 96		p2 += 8;
 97		p3 += 8;
 98		p4 += 8;
 99		p5 += 8;
100	} while (--lines > 0);
101}
102
/*
 * xor_32regs_2 - XOR the words of p2 into p1 through eight local temporaries.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes p1 ^ p2.
 * @p2:    source buffer, only read.
 *
 * Each pass loads eight words of p1, folds in the source words, and only
 * then writes the eight results back.
 */
static void
xor_32regs_2(unsigned long bytes, unsigned long *p1, unsigned long *p2)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	do {
		register long d0, d1, d2, d3, d4, d5, d6, d7;
		d0 = p1[0];	/* Pull the stuff into registers	*/
		d1 = p1[1];	/*  ... in bursts, if possible.		*/
		d2 = p1[2];
		d3 = p1[3];
		d4 = p1[4];
		d5 = p1[5];
		d6 = p1[6];
		d7 = p1[7];
		d0 ^= p2[0];
		d1 ^= p2[1];
		d2 ^= p2[2];
		d3 ^= p2[3];
		d4 ^= p2[4];
		d5 ^= p2[5];
		d6 ^= p2[6];
		d7 ^= p2[7];
		p1[0] = d0;	/* Store the result (in bursts)		*/
		p1[1] = d1;
		p1[2] = d2;
		p1[3] = d3;
		p1[4] = d4;
		p1[5] = d5;
		p1[6] = d6;
		p1[7] = d7;
		p1 += 8;
		p2 += 8;
	} while (--lines > 0);
}
138
/*
 * xor_32regs_3 - XOR the words of p2 and p3 into p1 through eight local
 *                temporaries.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes p1 ^ p2 ^ p3.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 *
 * Each pass loads eight words of p1, folds in the source words, and only
 * then writes the eight results back.
 */
static void
xor_32regs_3(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	do {
		register long d0, d1, d2, d3, d4, d5, d6, d7;
		d0 = p1[0];	/* Pull the stuff into registers	*/
		d1 = p1[1];	/*  ... in bursts, if possible.		*/
		d2 = p1[2];
		d3 = p1[3];
		d4 = p1[4];
		d5 = p1[5];
		d6 = p1[6];
		d7 = p1[7];
		d0 ^= p2[0];
		d1 ^= p2[1];
		d2 ^= p2[2];
		d3 ^= p2[3];
		d4 ^= p2[4];
		d5 ^= p2[5];
		d6 ^= p2[6];
		d7 ^= p2[7];
		d0 ^= p3[0];
		d1 ^= p3[1];
		d2 ^= p3[2];
		d3 ^= p3[3];
		d4 ^= p3[4];
		d5 ^= p3[5];
		d6 ^= p3[6];
		d7 ^= p3[7];
		p1[0] = d0;	/* Store the result (in bursts)		*/
		p1[1] = d1;
		p1[2] = d2;
		p1[3] = d3;
		p1[4] = d4;
		p1[5] = d5;
		p1[6] = d6;
		p1[7] = d7;
		p1 += 8;
		p2 += 8;
		p3 += 8;
	} while (--lines > 0);
}
184
/*
 * xor_32regs_4 - XOR the words of p2, p3 and p4 into p1 through eight local
 *                temporaries.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes
 *         p1 ^ p2 ^ p3 ^ p4.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 * @p4:    source buffer, only read.
 *
 * Each pass loads eight words of p1, folds in the source words, and only
 * then writes the eight results back.
 */
static void
xor_32regs_4(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3, unsigned long *p4)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	do {
		register long d0, d1, d2, d3, d4, d5, d6, d7;
		d0 = p1[0];	/* Pull the stuff into registers	*/
		d1 = p1[1];	/*  ... in bursts, if possible.		*/
		d2 = p1[2];
		d3 = p1[3];
		d4 = p1[4];
		d5 = p1[5];
		d6 = p1[6];
		d7 = p1[7];
		d0 ^= p2[0];
		d1 ^= p2[1];
		d2 ^= p2[2];
		d3 ^= p2[3];
		d4 ^= p2[4];
		d5 ^= p2[5];
		d6 ^= p2[6];
		d7 ^= p2[7];
		d0 ^= p3[0];
		d1 ^= p3[1];
		d2 ^= p3[2];
		d3 ^= p3[3];
		d4 ^= p3[4];
		d5 ^= p3[5];
		d6 ^= p3[6];
		d7 ^= p3[7];
		d0 ^= p4[0];
		d1 ^= p4[1];
		d2 ^= p4[2];
		d3 ^= p4[3];
		d4 ^= p4[4];
		d5 ^= p4[5];
		d6 ^= p4[6];
		d7 ^= p4[7];
		p1[0] = d0;	/* Store the result (in bursts)		*/
		p1[1] = d1;
		p1[2] = d2;
		p1[3] = d3;
		p1[4] = d4;
		p1[5] = d5;
		p1[6] = d6;
		p1[7] = d7;
		p1 += 8;
		p2 += 8;
		p3 += 8;
		p4 += 8;
	} while (--lines > 0);
}
239
/*
 * xor_32regs_5 - XOR the words of p2..p5 into p1 through eight local
 *                temporaries.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes
 *         p1 ^ p2 ^ p3 ^ p4 ^ p5.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 * @p4:    source buffer, only read.
 * @p5:    source buffer, only read.
 *
 * Each pass loads eight words of p1, folds in the source words, and only
 * then writes the eight results back.
 */
static void
xor_32regs_5(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3, unsigned long *p4, unsigned long *p5)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	do {
		register long d0, d1, d2, d3, d4, d5, d6, d7;
		d0 = p1[0];	/* Pull the stuff into registers	*/
		d1 = p1[1];	/*  ... in bursts, if possible.		*/
		d2 = p1[2];
		d3 = p1[3];
		d4 = p1[4];
		d5 = p1[5];
		d6 = p1[6];
		d7 = p1[7];
		d0 ^= p2[0];
		d1 ^= p2[1];
		d2 ^= p2[2];
		d3 ^= p2[3];
		d4 ^= p2[4];
		d5 ^= p2[5];
		d6 ^= p2[6];
		d7 ^= p2[7];
		d0 ^= p3[0];
		d1 ^= p3[1];
		d2 ^= p3[2];
		d3 ^= p3[3];
		d4 ^= p3[4];
		d5 ^= p3[5];
		d6 ^= p3[6];
		d7 ^= p3[7];
		d0 ^= p4[0];
		d1 ^= p4[1];
		d2 ^= p4[2];
		d3 ^= p4[3];
		d4 ^= p4[4];
		d5 ^= p4[5];
		d6 ^= p4[6];
		d7 ^= p4[7];
		d0 ^= p5[0];
		d1 ^= p5[1];
		d2 ^= p5[2];
		d3 ^= p5[3];
		d4 ^= p5[4];
		d5 ^= p5[5];
		d6 ^= p5[6];
		d7 ^= p5[7];
		p1[0] = d0;	/* Store the result (in bursts)		*/
		p1[1] = d1;
		p1[2] = d2;
		p1[3] = d3;
		p1[4] = d4;
		p1[5] = d5;
		p1[6] = d6;
		p1[7] = d7;
		p1 += 8;
		p2 += 8;
		p3 += 8;
		p4 += 8;
		p5 += 8;
	} while (--lines > 0);
}
303
/*
 * xor_8regs_p_2 - XOR the words of p2 into p1, eight words per pass, with
 *                 look-ahead prefetching.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes p1 ^ p2.
 * @p2:    source buffer, only read.
 *
 * prefetchw() is issued on the destination and prefetch() on the source,
 * first for the current line and then, inside the loop, for the next one.
 */
static void
xor_8regs_p_2(unsigned long bytes, unsigned long *p1, unsigned long *p2)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	/* the loop counts the lines that get a look-ahead prefetch */
	lines--;
	prefetchw(p1);
	prefetch(p2);

	do {
		prefetchw(p1+8);
		prefetch(p2+8);
 once_more:
		p1[0] ^= p2[0];
		p1[1] ^= p2[1];
		p1[2] ^= p2[2];
		p1[3] ^= p2[3];
		p1[4] ^= p2[4];
		p1[5] ^= p2[5];
		p1[6] ^= p2[6];
		p1[7] ^= p2[7];
		p1 += 8;
		p2 += 8;
	} while (--lines > 0);
	/*
	 * With two or more lines the counter stops at exactly 0 once: the
	 * last line is then processed without prefetching past it, after
	 * which the counter is -1 and the function returns.
	 */
	if (lines == 0)
		goto once_more;
}
329
/*
 * xor_8regs_p_3 - XOR the words of p2 and p3 into p1, eight words per pass,
 *                 with look-ahead prefetching.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes p1 ^ p2 ^ p3.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 *
 * prefetchw() is issued on the destination and prefetch() on the sources,
 * first for the current line and then, inside the loop, for the next one.
 */
static void
xor_8regs_p_3(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	/* the loop counts the lines that get a look-ahead prefetch */
	lines--;
	prefetchw(p1);
	prefetch(p2);
	prefetch(p3);

	do {
		prefetchw(p1+8);
		prefetch(p2+8);
		prefetch(p3+8);
 once_more:
		p1[0] ^= p2[0] ^ p3[0];
		p1[1] ^= p2[1] ^ p3[1];
		p1[2] ^= p2[2] ^ p3[2];
		p1[3] ^= p2[3] ^ p3[3];
		p1[4] ^= p2[4] ^ p3[4];
		p1[5] ^= p2[5] ^ p3[5];
		p1[6] ^= p2[6] ^ p3[6];
		p1[7] ^= p2[7] ^ p3[7];
		p1 += 8;
		p2 += 8;
		p3 += 8;
	} while (--lines > 0);
	/*
	 * With two or more lines the counter stops at exactly 0 once: the
	 * last line is then processed without prefetching past it, after
	 * which the counter is -1 and the function returns.
	 */
	if (lines == 0)
		goto once_more;
}
359
/*
 * xor_8regs_p_4 - XOR the words of p2, p3 and p4 into p1, eight words per
 *                 pass, with look-ahead prefetching.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes
 *         p1 ^ p2 ^ p3 ^ p4.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 * @p4:    source buffer, only read.
 *
 * prefetchw() is issued on the destination and prefetch() on the sources,
 * first for the current line and then, inside the loop, for the next one.
 */
static void
xor_8regs_p_4(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3, unsigned long *p4)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	/* the loop counts the lines that get a look-ahead prefetch */
	lines--;

	prefetchw(p1);
	prefetch(p2);
	prefetch(p3);
	prefetch(p4);

	do {
		prefetchw(p1+8);
		prefetch(p2+8);
		prefetch(p3+8);
		prefetch(p4+8);
 once_more:
		p1[0] ^= p2[0] ^ p3[0] ^ p4[0];
		p1[1] ^= p2[1] ^ p3[1] ^ p4[1];
		p1[2] ^= p2[2] ^ p3[2] ^ p4[2];
		p1[3] ^= p2[3] ^ p3[3] ^ p4[3];
		p1[4] ^= p2[4] ^ p3[4] ^ p4[4];
		p1[5] ^= p2[5] ^ p3[5] ^ p4[5];
		p1[6] ^= p2[6] ^ p3[6] ^ p4[6];
		p1[7] ^= p2[7] ^ p3[7] ^ p4[7];
		p1 += 8;
		p2 += 8;
		p3 += 8;
		p4 += 8;
	} while (--lines > 0);
	/*
	 * With two or more lines the counter stops at exactly 0 once: the
	 * last line is then processed without prefetching past it, after
	 * which the counter is -1 and the function returns.
	 */
	if (lines == 0)
		goto once_more;
}
393
/*
 * xor_8regs_p_5 - XOR the words of p2..p5 into p1, eight words per pass,
 *                 with look-ahead prefetching.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes
 *         p1 ^ p2 ^ p3 ^ p4 ^ p5.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 * @p4:    source buffer, only read.
 * @p5:    source buffer, only read.
 *
 * prefetchw() is issued on the destination and prefetch() on the sources,
 * first for the current line and then, inside the loop, for the next one.
 */
static void
xor_8regs_p_5(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3, unsigned long *p4, unsigned long *p5)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	/* the loop counts the lines that get a look-ahead prefetch */
	lines--;

	prefetchw(p1);
	prefetch(p2);
	prefetch(p3);
	prefetch(p4);
	prefetch(p5);

	do {
		prefetchw(p1+8);
		prefetch(p2+8);
		prefetch(p3+8);
		prefetch(p4+8);
		prefetch(p5+8);
 once_more:
		p1[0] ^= p2[0] ^ p3[0] ^ p4[0] ^ p5[0];
		p1[1] ^= p2[1] ^ p3[1] ^ p4[1] ^ p5[1];
		p1[2] ^= p2[2] ^ p3[2] ^ p4[2] ^ p5[2];
		p1[3] ^= p2[3] ^ p3[3] ^ p4[3] ^ p5[3];
		p1[4] ^= p2[4] ^ p3[4] ^ p4[4] ^ p5[4];
		p1[5] ^= p2[5] ^ p3[5] ^ p4[5] ^ p5[5];
		p1[6] ^= p2[6] ^ p3[6] ^ p4[6] ^ p5[6];
		p1[7] ^= p2[7] ^ p3[7] ^ p4[7] ^ p5[7];
		p1 += 8;
		p2 += 8;
		p3 += 8;
		p4 += 8;
		p5 += 8;
	} while (--lines > 0);
	/*
	 * With two or more lines the counter stops at exactly 0 once: the
	 * last line is then processed without prefetching past it, after
	 * which the counter is -1 and the function returns.
	 */
	if (lines == 0)
		goto once_more;
}
430
/*
 * xor_32regs_p_2 - XOR the words of p2 into p1 through eight local
 *                  temporaries, with look-ahead prefetching.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes p1 ^ p2.
 * @p2:    source buffer, only read.
 *
 * Each pass loads eight words of p1, folds in the source words, and only
 * then writes the eight results back. prefetchw() is issued on the
 * destination and prefetch() on the source, first for the current line and
 * then, inside the loop, for the next one.
 */
static void
xor_32regs_p_2(unsigned long bytes, unsigned long *p1, unsigned long *p2)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	/* the loop counts the lines that get a look-ahead prefetch */
	lines--;

	prefetchw(p1);
	prefetch(p2);

	do {
		register long d0, d1, d2, d3, d4, d5, d6, d7;

		prefetchw(p1+8);
		prefetch(p2+8);
 once_more:
		d0 = p1[0];	/* Pull the stuff into registers	*/
		d1 = p1[1];	/*  ... in bursts, if possible.		*/
		d2 = p1[2];
		d3 = p1[3];
		d4 = p1[4];
		d5 = p1[5];
		d6 = p1[6];
		d7 = p1[7];
		d0 ^= p2[0];
		d1 ^= p2[1];
		d2 ^= p2[2];
		d3 ^= p2[3];
		d4 ^= p2[4];
		d5 ^= p2[5];
		d6 ^= p2[6];
		d7 ^= p2[7];
		p1[0] = d0;	/* Store the result (in bursts)		*/
		p1[1] = d1;
		p1[2] = d2;
		p1[3] = d3;
		p1[4] = d4;
		p1[5] = d5;
		p1[6] = d6;
		p1[7] = d7;
		p1 += 8;
		p2 += 8;
	} while (--lines > 0);
	/*
	 * With two or more lines the counter stops at exactly 0 once: the
	 * last line is then processed without prefetching past it, after
	 * which the counter is -1 and the function returns.
	 */
	if (lines == 0)
		goto once_more;
}
475
/*
 * xor_32regs_p_3 - XOR the words of p2 and p3 into p1 through eight local
 *                  temporaries, with look-ahead prefetching.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes p1 ^ p2 ^ p3.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 *
 * Each pass loads eight words of p1, folds in the source words, and only
 * then writes the eight results back. prefetchw() is issued on the
 * destination and prefetch() on the sources, first for the current line
 * and then, inside the loop, for the next one.
 */
static void
xor_32regs_p_3(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	/* the loop counts the lines that get a look-ahead prefetch */
	lines--;

	prefetchw(p1);
	prefetch(p2);
	prefetch(p3);

	do {
		register long d0, d1, d2, d3, d4, d5, d6, d7;

		prefetchw(p1+8);
		prefetch(p2+8);
		prefetch(p3+8);
 once_more:
		d0 = p1[0];	/* Pull the stuff into registers	*/
		d1 = p1[1];	/*  ... in bursts, if possible.		*/
		d2 = p1[2];
		d3 = p1[3];
		d4 = p1[4];
		d5 = p1[5];
		d6 = p1[6];
		d7 = p1[7];
		d0 ^= p2[0];
		d1 ^= p2[1];
		d2 ^= p2[2];
		d3 ^= p2[3];
		d4 ^= p2[4];
		d5 ^= p2[5];
		d6 ^= p2[6];
		d7 ^= p2[7];
		d0 ^= p3[0];
		d1 ^= p3[1];
		d2 ^= p3[2];
		d3 ^= p3[3];
		d4 ^= p3[4];
		d5 ^= p3[5];
		d6 ^= p3[6];
		d7 ^= p3[7];
		p1[0] = d0;	/* Store the result (in bursts)		*/
		p1[1] = d1;
		p1[2] = d2;
		p1[3] = d3;
		p1[4] = d4;
		p1[5] = d5;
		p1[6] = d6;
		p1[7] = d7;
		p1 += 8;
		p2 += 8;
		p3 += 8;
	} while (--lines > 0);
	/*
	 * With two or more lines the counter stops at exactly 0 once: the
	 * last line is then processed without prefetching past it, after
	 * which the counter is -1 and the function returns.
	 */
	if (lines == 0)
		goto once_more;
}
532
/*
 * xor_32regs_p_4 - XOR the words of p2, p3 and p4 into p1 through eight
 *                  local temporaries, with look-ahead prefetching.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes
 *         p1 ^ p2 ^ p3 ^ p4.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 * @p4:    source buffer, only read.
 *
 * Each pass loads eight words of p1, folds in the source words, and only
 * then writes the eight results back. prefetchw() is issued on the
 * destination and prefetch() on the sources, first for the current line
 * and then, inside the loop, for the next one.
 */
static void
xor_32regs_p_4(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3, unsigned long *p4)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	/* the loop counts the lines that get a look-ahead prefetch */
	lines--;

	prefetchw(p1);
	prefetch(p2);
	prefetch(p3);
	prefetch(p4);

	do {
		register long d0, d1, d2, d3, d4, d5, d6, d7;

		prefetchw(p1+8);
		prefetch(p2+8);
		prefetch(p3+8);
		prefetch(p4+8);
 once_more:
		d0 = p1[0];	/* Pull the stuff into registers	*/
		d1 = p1[1];	/*  ... in bursts, if possible.		*/
		d2 = p1[2];
		d3 = p1[3];
		d4 = p1[4];
		d5 = p1[5];
		d6 = p1[6];
		d7 = p1[7];
		d0 ^= p2[0];
		d1 ^= p2[1];
		d2 ^= p2[2];
		d3 ^= p2[3];
		d4 ^= p2[4];
		d5 ^= p2[5];
		d6 ^= p2[6];
		d7 ^= p2[7];
		d0 ^= p3[0];
		d1 ^= p3[1];
		d2 ^= p3[2];
		d3 ^= p3[3];
		d4 ^= p3[4];
		d5 ^= p3[5];
		d6 ^= p3[6];
		d7 ^= p3[7];
		d0 ^= p4[0];
		d1 ^= p4[1];
		d2 ^= p4[2];
		d3 ^= p4[3];
		d4 ^= p4[4];
		d5 ^= p4[5];
		d6 ^= p4[6];
		d7 ^= p4[7];
		p1[0] = d0;	/* Store the result (in bursts)		*/
		p1[1] = d1;
		p1[2] = d2;
		p1[3] = d3;
		p1[4] = d4;
		p1[5] = d5;
		p1[6] = d6;
		p1[7] = d7;
		p1 += 8;
		p2 += 8;
		p3 += 8;
		p4 += 8;
	} while (--lines > 0);
	/*
	 * With two or more lines the counter stops at exactly 0 once: the
	 * last line is then processed without prefetching past it, after
	 * which the counter is -1 and the function returns.
	 */
	if (lines == 0)
		goto once_more;
}
600
/*
 * xor_32regs_p_5 - XOR the words of p2..p5 into p1 through eight local
 *                  temporaries, with look-ahead prefetching.
 * @bytes: buffer length in bytes. Only whole lines of 8 * sizeof(long)
 *         bytes are processed; a trailing partial line is left untouched.
 * @p1:    destination buffer; each processed word becomes
 *         p1 ^ p2 ^ p3 ^ p4 ^ p5.
 * @p2:    source buffer, only read.
 * @p3:    source buffer, only read.
 * @p4:    source buffer, only read.
 * @p5:    source buffer, only read.
 *
 * Each pass loads eight words of p1, folds in the source words, and only
 * then writes the eight results back. prefetchw() is issued on the
 * destination and prefetch() on the sources, first for the current line
 * and then, inside the loop, for the next one.
 */
static void
xor_32regs_p_5(unsigned long bytes, unsigned long *p1, unsigned long *p2,
	    unsigned long *p3, unsigned long *p4, unsigned long *p5)
{
	long lines = bytes / (sizeof (long)) / 8;

	/* do/while runs at least once: skip it when no full line is present */
	if (lines <= 0)
		return;

	/* the loop counts the lines that get a look-ahead prefetch */
	lines--;

	prefetchw(p1);
	prefetch(p2);
	prefetch(p3);
	prefetch(p4);
	prefetch(p5);

	do {
		register long d0, d1, d2, d3, d4, d5, d6, d7;

		prefetchw(p1+8);
		prefetch(p2+8);
		prefetch(p3+8);
		prefetch(p4+8);
		prefetch(p5+8);
 once_more:
		d0 = p1[0];	/* Pull the stuff into registers	*/
		d1 = p1[1];	/*  ... in bursts, if possible.		*/
		d2 = p1[2];
		d3 = p1[3];
		d4 = p1[4];
		d5 = p1[5];
		d6 = p1[6];
		d7 = p1[7];
		d0 ^= p2[0];
		d1 ^= p2[1];
		d2 ^= p2[2];
		d3 ^= p2[3];
		d4 ^= p2[4];
		d5 ^= p2[5];
		d6 ^= p2[6];
		d7 ^= p2[7];
		d0 ^= p3[0];
		d1 ^= p3[1];
		d2 ^= p3[2];
		d3 ^= p3[3];
		d4 ^= p3[4];
		d5 ^= p3[5];
		d6 ^= p3[6];
		d7 ^= p3[7];
		d0 ^= p4[0];
		d1 ^= p4[1];
		d2 ^= p4[2];
		d3 ^= p4[3];
		d4 ^= p4[4];
		d5 ^= p4[5];
		d6 ^= p4[6];
		d7 ^= p4[7];
		d0 ^= p5[0];
		d1 ^= p5[1];
		d2 ^= p5[2];
		d3 ^= p5[3];
		d4 ^= p5[4];
		d5 ^= p5[5];
		d6 ^= p5[6];
		d7 ^= p5[7];
		p1[0] = d0;	/* Store the result (in bursts)		*/
		p1[1] = d1;
		p1[2] = d2;
		p1[3] = d3;
		p1[4] = d4;
		p1[5] = d5;
		p1[6] = d6;
		p1[7] = d7;
		p1 += 8;
		p2 += 8;
		p3 += 8;
		p4 += 8;
		p5 += 8;
	} while (--lines > 0);
	/*
	 * With two or more lines the counter stops at exactly 0 once: the
	 * last line is then processed without prefetching past it, after
	 * which the counter is -1 and the function returns.
	 */
	if (lines == 0)
		goto once_more;
}
679
680static struct xor_block_template xor_block_8regs = {
681	.name = "8regs",
682	.do_2 = xor_8regs_2,
683	.do_3 = xor_8regs_3,
684	.do_4 = xor_8regs_4,
685	.do_5 = xor_8regs_5,
686};
687
688static struct xor_block_template xor_block_32regs = {
689	.name = "32regs",
690	.do_2 = xor_32regs_2,
691	.do_3 = xor_32regs_3,
692	.do_4 = xor_32regs_4,
693	.do_5 = xor_32regs_5,
694};
695
696static struct xor_block_template xor_block_8regs_p = {
697	.name = "8regs_prefetch",
698	.do_2 = xor_8regs_p_2,
699	.do_3 = xor_8regs_p_3,
700	.do_4 = xor_8regs_p_4,
701	.do_5 = xor_8regs_p_5,
702};
703
704static struct xor_block_template xor_block_32regs_p = {
705	.name = "32regs_prefetch",
706	.do_2 = xor_32regs_p_2,
707	.do_3 = xor_32regs_p_3,
708	.do_4 = xor_32regs_p_4,
709	.do_5 = xor_32regs_p_5,
710};
711
/*
 * Hands each of the four templates defined in this file to xor_speed(),
 * each plain variant followed by its prefetching counterpart.
 * NOTE(review): xor_speed() is not defined here; presumably it times each
 * template - confirm against the includer.
 */
#define XOR_TRY_TEMPLATES				\
	do {						\
		xor_speed(&xor_block_8regs);		\
		xor_speed(&xor_block_8regs_p);		\
		xor_speed(&xor_block_32regs);		\
		xor_speed(&xor_block_32regs_p);		\
	} while (0)