summaryrefslogtreecommitdiffstats
path: root/arch/powerpc/crypto/crct10dif-vpmsum_asm.S
blob: 5e3d81a0af1b98bc8d23982217e1d5064de4aaf0 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
/*
 * Calculate a CRC T10DIF with vpmsum acceleration
 *
 * Constants generated by crc32-vpmsum, available at
 * https://github.com/antonblanchard/crc32-vpmsum
 *
 * crc32-vpmsum is
 * Copyright (C) 2015 Anton Blanchard <anton@au.ibm.com>, IBM
 * and is available under the GPL v2 or later.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version
 * 2 of the License, or (at your option) any later version.
 */
	/* Emit the data that follows into the read-only data section. */
	.section	.rodata
/* Start the data on a 16-byte boundary (each .octa below is 16 bytes). */
.balign 16

.byteswap_constant:
	/*
	 * Byte reverse permute constant: read from the most significant
	 * digit of the literal down, the bytes are the indices 15, 14, ..., 0.
	 * NOTE(review): presumably loaded as a vector-permute control to
	 * reverse the byte order of 16-byte values; the user of this label
	 * is not visible here - confirm.
	 */
	.octa 0x0F0E0D0C0B0A09080706050403020100

.constants:

	/* Reduce 262144 bits to 1024 bits */
	/* x^261184 mod p(x), x^261120 mod p(x) */
	.octa 0x0000000056d300000000000052550000

	/* x^260160 mod p(x), x^260096 mod p(x) */
	.octa 0x00000000ee67000000000000a1e40000

	/* x^259136 mod p(x), x^259072 mod p(x) */
	.octa 0x0000000060830000000000004ad10000

	/* x^258112 mod p(x), x^258048 mod p(x) */
	.octa 0x000000008cfe0000000000009ab40000

	/* x^257088 mod p(x), x^257024 mod p(x) */
	.octa 0x000000003e93000000000000fdb50000

	/* x^256064 mod p(x), x^256000 mod p(x) */
	.octa 0x000000003c2000000000000045480000

	/* x^255040 mod p(x), x^254976 mod p(x) */
	.octa 0x00000000b1fc0000000000008d690000

	/* x^254016 mod p(x), x^253952 mod p(x) */
	.octa 0x00000000f82b00000000000024ad0000

	/* x^252992 mod p(x), x^252928 mod p(x) */
	.octa 0x0000000044420000000000009f1a0000

	/* x^251968 mod p(x), x^251904 mod p(x) */
	.octa 0x00000000e88c00000000000066ec0000

	/* x^250944 mod p(x), x^250880 mod p(x) */
	.octa 0x00000000385c000000000000c87d0000

	/* x^249920 mod p(x), x^249856 mod p(x) */
	.octa 0x000000003227000000000000c8ff0000

	/* x^248896 mod p(x), x^248832 mod p(x) */
	.octa 0x00000000a9a900000000000033440000

	/* x^247872 mod p(x), x^247808 mod p(x) */
	.octa 0x00000000abaa00000000000066eb0000

	/* x^246848 mod p(x), x^246784 mod p(x) */
	.octa 0x000000001ac3000000000000c4ef0000

	/* x^245824 mod p(x), x^245760 mod p(x) */
	.octa 0x0000000063f000000000000056f30000

	/* x^244800 mod p(x), x^244736 mod p(x) */
	.octa 0x0000000032cc00000000000002050000

	/* x^243776 mod p(x), x^243712 mod p(x) */
	.octa 0x00000000f8b5000000000000568e0000

	/* x^242752 mod p(x), x^242688 mod p(x) */
	.octa 0x000000008db100000000000064290000

	/* x^241728 mod p(x), x^241664 mod p(x) */
	.octa 0x0000000059ca0000000000006b660000

	/* x^240704 mod p(x), x^240640 mod p(x) */
	.octa 0x000000005f5c00000000000018f80000

	/* x^239680 mod p(x), x^239616 mod p(x) */
	.octa 0x0000000061af000000000000b6090000

	/* x^238656 mod p(x), x^238592 mod p(x) */
	.octa 0x00000000e29e000000000000099a0000

	/* x^237632 mod p(x), x^237568 mod p(x) */
	.octa 0x000000000975000000000000a8360000

	/* x^236608 mod p(x), x^236544 mod p(x) */
	.octa 0x0000000043900000000000004f570000

	/* x^235584 mod p(x), x^235520 mod p(x) */
	.octa 0x00000000f9cd000000000000134c0000

	/* x^234560 mod p(x), x^234496 mod p(x) */
	.octa 0x000000007c29000000000000ec380000

	/* x^233536 mod p(x), x^233472 mod p(x) */
	.octa 0x000000004c6a000000000000b0d10000

	/* x^232512 mod p(x), x^232448 mod p(x) */
	.octa 0x00000000e7290000000000007d3e0000

	/* x^231488 mod p(x), x^231424 mod p(x) */
	.octa 0x00000000f1ab000000000000f0b20000

	/* x^230464 mod p(x), x^230400 mod p(x) */
	.octa 0x0000000039db0000000000009c270000

	/* x^229440 mod p(x), x^229376 mod p(x) */
	.octa 0x000000005e2800000000000092890000

	/* x^228416 mod p(x), x^228352 mod p(x) */
	.octa 0x00000000d44e000000000000d5ee0000

	/* x^227392 mod p(x), x^227328 mod p(x) */
	.octa 0x00000000cd0a00000000000041f50000

	/* x^226368 mod p(x), x^226304 mod p(x) */
	.octa 0x00000000c5b400000000000010520000

	/* x^225344 mod p(x), x^225280 mod p(x) */
	.octa 0x00000000fd2100000000000042170000

	/* x^224320 mod p(x), x^224256 mod p(x) */
	.octa 0x000000002f2500000000000095c20000

	/* x^223296 mod p(x), x^223232 mod p(x) */
	.octa 0x000000001b0100000000000001ce0000

	/* x^222272 mod p(x), x^222208 mod p(x) */
	.octa 0x000000000d430000000000002aca0000

	/* x^221248 mod p(x), x^221184 mod p(x) */
	.octa 0x0000000030a6000000000000385e0000

	/* x^220224 mod p(x), x^220160 mod p(x) */
	.octa 0x00000000e37b0000000000006f7a0000

	/* x^219200 mod p(x), x^219136 mod p(x) */
	.octa 0x00000000873600000000000024320000

	/* x^218176 mod p(x), x^218112 mod p(x) */
	.octa 0x00000000e9fb000000000000bd9c0000

	/* x^217152 mod p(x), x^217088 mod p(x) */
	.octa 0x000000003b9500000000000054bc0000

	/* x^216128 mod p(x), x^216064 mod p(x) */
	.octa 0x00000000133e000000000000a4660000

	/* x^215104 mod p(x), x^215040 mod p(x) */
	.octa 0x00000000784500000000000079930000

	/* x^214080 mod p(x), x^214016 mod p(x) */
	.octa 0x00000000b9800000000000001bb80000

	/* x^213056 mod p(x), x^212992 mod p(x) */
	.octa 0x00000000687600000000000024400000

	/* x^212032 mod p(x), x^211968 mod p(x) */
	.octa 0x00000000aff300000000000029e10000

	/* x^211008 mod p(x), x^210944 mod p(x) */
	.octa 0x0000000024b50000000000005ded0000

	/* x^209984 mod p(x), x^209920 mod p(x) */
	.octa 0x0000000017e8000000000000b12e0000

	/* x^208960 mod p(x), x^208896 mod p(x) */
	.octa 0x00000000128400000000000026d20000

	/* x^207936 mod p(x), x^207872 mod p(x) */
	.octa 0x000000002115000000000000a32a0000

	/* x^206912 mod p(x), x^206848 mod p(x) */
	.octa 0x000000009595000000000000a1210000

	/* x^205888 mod p(x), x^205824 mod p(x) */
	.octa 0x00000000281e000000000000ee8b0000

	/* x^204864 mod p(x), x^204800 mod p(x) */
	.octa 0x0000000006010000000000003d0d0000

	/* x^203840 mod p(x), x^203776 mod p(x) */
	.octa 0x00000000e2b600000000000034e90000

	/* x^202816 mod p(x), x^202752 mod p(x) */
	.octa 0x000000001bd40000000000004cdb0000

	/* x^201792 mod p(x), x^201728 mod p(x) */
	.octa 0x00000000df2800000000000030e90000

	/* x^200768 mod p(x), x^200704 mod p(x) */
	.octa 0x0000000049c200000000000042590000

	/* x^199744 mod p(x), x^199680 mod p(x) */
	.octa 0x000000009b97000000000000df950000

	/* x^198720 mod p(x), x^198656 mod p(x) */
	.octa 0x000000006184000000000000da7b0000

	/* x^197696 mod p(x), x^197632 mod p(x) */
	.octa 0x00000000461700000000000012510000

	/* x^196672 mod p(x), x^196608 mod p(x) */
	.octa 0x000000009b40000000000000f37e0000

	/* x^195648 mod p(x), x^195584 mod p(x) */
	.octa 0x00000000eeb2000000000000ecf10000

	/* x^194624 mod p(x), x^194560 mod p(x) */
	.octa 0x00000000b2e800000000000050f20000

	/* x^193600 mod p(x), x^193536 mod p(x) */
	.octa 0x00000000f59a000000000000e0b30000

	/* x^192576 mod p(x), x^192512 mod p(x) */
	.octa 0x00000000467f0000000000004d5a0000

	/* x^191552 mod p(x), x^191488 mod p(x) */
	.octa 0x00000000da92000000000000bb010000

	/* x^190528 mod p(x), x^190464 mod p(x) */
	.octa 0x000000001e1000000000000022a40000

	/* x^189504 mod p(x), x^189440 mod p(x) */
	.octa 0x0000000058fe000000000000836f0000

	/* x^188480 mod p(x), x^188416 mod p(x) */
	.octa 0x00000000b9ce000000000000d78d0000

	/* x^187456 mod p(x), x^187392 mod p(x) */
	.octa 0x0000000022210000000000004f8d0000

	/* x^186432 mod p(x), x^186368 mod p(x) */
	.octa 0x00000000744600000000000033760000

	/* x^185408 mod p(x), x^185344 mod p(x) */
	.octa 0x000000001c2e000000000000a1e50000

	/* x^184384 mod p(x), x^184320 mod p(x) */
	.octa 0x00000000dcc8000000000000a1a40000

	/* x^183360 mod p(x), x^183296 mod p(x) */
	.octa 0x00000000910f00000000000019a20000

	/* x^182336 mod p(x), x^182272 mod p(x) */
	.octa 0x0000000055d5000000000000f6ae0000

	/* x^181312 mod p(x), x^181248 mod p(x) */
	.octa 0x00000000c8ba000000000000a7ac0000

	/* x^180288 mod p(x), x^180224 mod p(x) */
	.octa 0x0000000031f8000000000000eea20000

	/* x^179264 mod p(x), x^179200 mod p(x) */
	.octa 0x000000001966000000000000c4d90000

	/* x^178240 mod p(x), x^178176 mod p(x) */
	.octa 0x00000000b9810000000000002b470000

	/* x^177216 mod p(x), x^177152 mod p(x) */
	.octa 0x000000008303000000000000f7cf0000

	/* x^176192 mod p(x), x^176128 mod p(x) */
	.octa 0x000000002ce500000000000035b30000

	/* x^175168 mod p(x), x^175104 mod p(x) */
	.octa 0x000000002fae0000000000000c7c0000

	/* x^174144 mod p(x), x^174080 mod p(x) */
	.octa 0x00000000f50c0000000000009edf0000

	/* x^173120 mod p(x), x^173056 mod p(x) */
	.octa 0x00000000714f00000000000004cd0000

	/* x^172096 mod p(x), x^172032 mod p(x) */
	.octa 0x00000000c161000000000000541b0000

	/* x^171072 mod p(x), x^171008 mod p(x) */
	.octa 0x0000000021c8000000000000e2700000

	/* x^170048 mod p(x), x^169984 mod p(x) */
	.octa 0x00000000b93d00000000000009a60000

	/* x^169024 mod p(x), x^168960 mod p(x) */
	.octa 0x00000000fbcf000000000000761c0000

	/* x^168000 mod p(x), x^167936 mod p(x) */
	.octa 0x0000000026350000000000009db30000

	/* x^166976 mod p(x), x^166912 mod p(x) */
	.octa 0x00000000b64f0000000000003e9f0000

	/* x^165952 mod p(x), x^165888 mod p(x) */
	.octa 0x00000000bd0e00000000000078590000

	/* x^164928 mod p(x), x^164864 mod p(x) */
	.octa 0x00000000d9360000000000008bc80000

	/* x^163904 mod p(x), x^163840 mod p(x) */
	.octa 0x000000002f140000000000008c9f0000

	/* x^162880 mod p(x), x^162816 mod p(x) */
	.octa 0x000000006a270000000000006af70000

	/* x^161856 mod p(x), x^161792 mod p(x) */
	.octa 0x000000006685000000000000e5210000

	/* x^160832 mod p(x), x^160768 mod p(x) */
	.octa 0x0000000062da00000000000008290000

	/* x^159808 mod p(x), x^159744 mod p(x) */
	.octa 0x00000000bb4b000000000000e4d00000

	/* x^158784 mod p(x), x^158720 mod p(x) */
	.octa 0x00000000d2490000000000004ae10000

	/* x^157760 mod p(x), x^157696 mod p(x) */
	.octa 0x00000000c85b00000000000000e70000

	/* x^156736 mod p(x), x^156672 mod p(x) */
	.octa 0x00000000c37a00000000000015650000

	/* x^155712 mod p(x), x^155648 mod p(x) */
	.octa 0x0000000018530000000000001c2f0000

	/* x^154688 mod p(x), x^154624 mod p(x) */
	.octa 0x00000000b46600000000000037bd0000

	/* x^153664 mod p(x), x^153600 mod p(x) */
	.octa 0x00000000439b00000000000012190000

	/* x^152640 mod p(x), x^152576 mod p(x) */
	.octa 0x00000000b1260000000000005ece0000

	/* x^151616 mod p(x), x^151552 mod p(x) */
	.octa 0x00000000d8110000000000002a5e0000

	/* x^150592 mod p(x), x^150528 mod p(x) */
	.octa 0x00000000099f00000000000052330000

	/* x^149568 mod p(x), x^149504 mod p(x) */
	.octa 0x00000000f9f9000000000000f9120000

	/* x^148544 mod p(x), x^148480 mod p(x) */
	.octa 0x000000005cc00000000000000ddc0000

	/* x^147520 mod p(x), x^147456 mod p(x) */
	.octa 0x00000000343b00000000000012200000

	/* x^146496 mod p(x), x^146432 mod p(x) */
	.octa 0x000000009222000000000000d12b0000

	/* x^145472 mod p(x), x^145408 mod p(x) */
	.octa 0x00000000d781000000000000eb2d0000

	/* x^144448 mod p(x), x^144384 mod p(x) */
	.octa 0x000000000bf400000000000058970000

	/* x^143424 mod p(x), x^143360 mod p(x) */
	.o