Lines Matching +full:4 +full:b

42 	ld1		{v12.4s}, [x10]
46 add v0.4s, v0.4s, v1.4s
47 eor v3.16b, v3.16b, v0.16b
51 add v2.4s, v2.4s, v3.4s
52 eor v4.16b, v1.16b, v2.16b
53 shl v1.4s, v4.4s, #12
54 sri v1.4s, v4.4s, #20
57 add v0.4s, v0.4s, v1.4s
58 eor v3.16b, v3.16b, v0.16b
59 tbl v3.16b, {v3.16b}, v12.16b
62 add v2.4s, v2.4s, v3.4s
63 eor v4.16b, v1.16b, v2.16b
64 shl v1.4s, v4.4s, #7
65 sri v1.4s, v4.4s, #25
68 ext v1.16b, v1.16b, v1.16b, #4
70 ext v2.16b, v2.16b, v2.16b, #8
72 ext v3.16b, v3.16b, v3.16b, #12
75 add v0.4s, v0.4s, v1.4s
76 eor v3.16b, v3.16b, v0.16b
80 add v2.4s, v2.4s, v3.4s
81 eor v4.16b, v1.16b, v2.16b
82 shl v1.4s, v4.4s, #12
83 sri v1.4s, v4.4s, #20
86 add v0.4s, v0.4s, v1.4s
87 eor v3.16b, v3.16b, v0.16b
88 tbl v3.16b, {v3.16b}, v12.16b
91 add v2.4s, v2.4s, v3.4s
92 eor v4.16b, v1.16b, v2.16b
93 shl v1.4s, v4.4s, #7
94 sri v1.4s, v4.4s, #25
97 ext v1.16b, v1.16b, v1.16b, #12
99 ext v2.16b, v2.16b, v2.16b, #8
101 ext v3.16b, v3.16b, v3.16b, #4
104 b.ne .Ldoubleround
119 ld1 {v0.4s-v3.4s}, [x0]
120 ld1 {v8.4s-v11.4s}, [x0]
124 ld1 {v4.16b-v7.16b}, [x2]
127 add v0.4s, v0.4s, v8.4s
128 eor v0.16b, v0.16b, v4.16b
131 add v1.4s, v1.4s, v9.4s
132 eor v1.16b, v1.16b, v5.16b
135 add v2.4s, v2.4s, v10.4s
136 eor v2.16b, v2.16b, v6.16b
139 add v3.4s, v3.4s, v11.4s
140 eor v3.16b, v3.16b, v7.16b
142 st1 {v0.16b-v3.16b}, [x1]
156 ld1 {v0.4s-v3.4s}, [x0]
161 st1 {v0.4s}, [x1], #16
162 st1 {v3.4s}, [x1]
190 // x1: 4 data blocks output, o
191 // x2: 4 data blocks input, i
212 ld1 {v30.4s-v31.4s}, [x9]
216 ld4r { v0.4s- v3.4s}, [x0]
217 ld4r { v4.4s- v7.4s}, [x8], #16
218 ld4r { v8.4s-v11.4s}, [x8], #16
219 ld4r {v12.4s-v15.4s}, [x8]
238 // x12 += counter values 1-4
239 add v12.4s, v12.4s, v30.4s
246 add v0.4s, v0.4s, v4.4s
248 add v1.4s, v1.4s, v5.4s
250 add v2.4s, v2.4s, v6.4s
252 add v3.4s, v3.4s, v7.4s
255 eor v12.16b, v12.16b, v0.16b
257 eor v13.16b, v13.16b, v1.16b
259 eor v14.16b, v14.16b, v2.16b
261 eor v15.16b, v15.16b, v3.16b
277 add v8.4s, v8.4s, v12.4s
279 add v9.4s, v9.4s, v13.4s
281 add v10.4s, v10.4s, v14.4s
283 add v11.4s, v11.4s, v15.4s
286 eor v16.16b, v4.16b, v8.16b
288 eor v17.16b, v5.16b, v9.16b
290 eor v18.16b, v6.16b, v10.16b
292 eor v19.16b, v7.16b, v11.16b
295 shl v4.4s, v16.4s, #12
296 shl v5.4s, v17.4s, #12
297 shl v6.4s, v18.4s, #12
298 shl v7.4s, v19.4s, #12
300 sri v4.4s, v16.4s, #20
302 sri v5.4s, v17.4s, #20
304 sri v6.4s, v18.4s, #20
306 sri v7.4s, v19.4s, #20
313 add v0.4s, v0.4s, v4.4s
315 add v1.4s, v1.4s, v5.4s
317 add v2.4s, v2.4s, v6.4s
319 add v3.4s, v3.4s, v7.4s
322 eor v12.16b, v12.16b, v0.16b
324 eor v13.16b, v13.16b, v1.16b
326 eor v14.16b, v14.16b, v2.16b
328 eor v15.16b, v15.16b, v3.16b
331 tbl v12.16b, {v12.16b}, v31.16b
333 tbl v13.16b, {v13.16b}, v31.16b
335 tbl v14.16b, {v14.16b}, v31.16b
337 tbl v15.16b, {v15.16b}, v31.16b
344 add v8.4s, v8.4s, v12.4s
346 add v9.4s, v9.4s, v13.4s
348 add v10.4s, v10.4s, v14.4s
350 add v11.4s, v11.4s, v15.4s
353 eor v16.16b, v4.16b, v8.16b
355 eor v17.16b, v5.16b, v9.16b
357 eor v18.16b, v6.16b, v10.16b
359 eor v19.16b, v7.16b, v11.16b
362 shl v4.4s, v16.4s, #7
363 shl v5.4s, v17.4s, #7
364 shl v6.4s, v18.4s, #7
365 shl v7.4s, v19.4s, #7
367 sri v4.4s, v16.4s, #25
369 sri v5.4s, v17.4s, #25
371 sri v6.4s, v18.4s, #25
373 sri v7.4s, v19.4s, #25
380 add v0.4s, v0.4s, v5.4s
382 add v1.4s, v1.4s, v6.4s
384 add v2.4s, v2.4s, v7.4s
386 add v3.4s, v3.4s, v4.4s
389 eor v15.16b, v15.16b, v0.16b
391 eor v12.16b, v12.16b, v1.16b
393 eor v13.16b, v13.16b, v2.16b
395 eor v14.16b, v14.16b, v3.16b
411 add v10.4s, v10.4s, v15.4s
413 add v11.4s, v11.4s, v12.4s
415 add v8.4s, v8.4s, v13.4s
417 add v9.4s, v9.4s, v14.4s
420 eor v16.16b, v5.16b, v10.16b
422 eor v17.16b, v6.16b, v11.16b
424 eor v18.16b, v7.16b, v8.16b
426 eor v19.16b, v4.16b, v9.16b
429 shl v5.4s, v16.4s, #12
430 shl v6.4s, v17.4s, #12
431 shl v7.4s, v18.4s, #12
432 shl v4.4s, v19.4s, #12
434 sri v5.4s, v16.4s, #20
436 sri v6.4s, v17.4s, #20
438 sri v7.4s, v18.4s, #20
440 sri v4.4s, v19.4s, #20
447 add v0.4s, v0.4s, v5.4s
449 add v1.4s, v1.4s, v6.4s
451 add v2.4s, v2.4s, v7.4s
453 add v3.4s, v3.4s, v4.4s
456 eor v15.16b, v15.16b, v0.16b
458 eor v12.16b, v12.16b, v1.16b
460 eor v13.16b, v13.16b, v2.16b
462 eor v14.16b, v14.16b, v3.16b
465 tbl v15.16b, {v15.16b}, v31.16b
467 tbl v12.16b, {v12.16b}, v31.16b
469 tbl v13.16b, {v13.16b}, v31.16b
471 tbl v14.16b, {v14.16b}, v31.16b
478 add v10.4s, v10.4s, v15.4s
480 add v11.4s, v11.4s, v12.4s
482 add v8.4s, v8.4s, v13.4s
484 add v9.4s, v9.4s, v14.4s
487 eor v16.16b, v5.16b, v10.16b
489 eor v17.16b, v6.16b, v11.16b
491 eor v18.16b, v7.16b, v8.16b
493 eor v19.16b, v4.16b, v9.16b
496 shl v5.4s, v16.4s, #7
497 shl v6.4s, v17.4s, #7
498 shl v7.4s, v18.4s, #7
499 shl v4.4s, v19.4s, #7
501 sri v5.4s, v16.4s, #25
503 sri v6.4s, v17.4s, #25
505 sri v7.4s, v18.4s, #25
507 sri v4.4s, v19.4s, #25
511 b.ne .Ldoubleround4
513 ld4r {v16.4s-v19.4s}, [x0], #16
514 ld4r {v20.4s-v23.4s}, [x0], #16
517 add v12.4s, v12.4s, v30.4s
523 add v0.4s, v0.4s, v16.4s
526 add v1.4s, v1.4s, v17.4s
529 add v2.4s, v2.4s, v18.4s
532 add v3.4s, v3.4s, v19.4s
540 ld4r {v24.4s-v27.4s}, [x0], #16
541 ld4r {v28.4s-v31.4s}, [x0]
547 add v4.4s, v4.4s, v20.4s
550 add v5.4s, v5.4s, v21.4s
553 add v6.4s, v6.4s, v22.4s
556 add v7.4s, v7.4s, v23.4s
568 add v8.4s, v8.4s, v24.4s
571 add v9.4s, v9.4s, v25.4s
574 add v10.4s, v10.4s, v26.4s
577 add v11.4s, v11.4s, v27.4s
589 add v12.4s, v12.4s, v28.4s
592 add v13.4s, v13.4s, v29.4s
595 add v14.4s, v14.4s, v30.4s
598 add v15.4s, v15.4s, v31.4s
608 zip1 v16.4s, v0.4s, v1.4s
611 zip2 v17.4s, v0.4s, v1.4s
613 zip1 v18.4s, v2.4s, v3.4s
615 zip2 v19.4s, v2.4s, v3.4s
618 zip1 v20.4s, v4.4s, v5.4s
621 zip2 v21.4s, v4.4s, v5.4s
623 zip1 v22.4s, v6.4s, v7.4s
625 zip2 v23.4s, v6.4s, v7.4s
628 zip1 v24.4s, v8.4s, v9.4s
631 zip2 v25.4s, v8.4s, v9.4s
633 zip1 v26.4s, v10.4s, v11.4s
635 zip2 v27.4s, v10.4s, v11.4s
638 zip1 v28.4s, v12.4s, v13.4s
641 zip2 v29.4s, v12.4s, v13.4s
643 zip1 v30.4s, v14.4s, v15.4s
645 zip2 v31.4s, v14.4s, v15.4s
661 ld1 {v16.16b-v19.16b}, [x2], x3
664 ccmp x3, xzr, #4, lt
675 ld1 {v20.16b-v23.16b}, [x2], x3
678 ccmp x3, xzr, #4, lt
689 ld1 {v24.16b-v27.16b}, [x2], x3
692 ccmp x3, xzr, #4, lt
702 ld1 {v28.16b-v31.16b}, [x2]
706 eor v16.16b, v16.16b, v0.16b
707 eor v17.16b, v17.16b, v1.16b
708 eor v18.16b, v18.16b, v2.16b
709 eor v19.16b, v19.16b, v3.16b
710 st1 {v16.16b-v19.16b}, [x1], #64
714 eor v20.16b, v20.16b, v4.16b
715 eor v21.16b, v21.16b, v5.16b
716 eor v22.16b, v22.16b, v6.16b
717 eor v23.16b, v23.16b, v7.16b
718 st1 {v20.16b-v23.16b}, [x1], #64
722 eor v24.16b, v24.16b, v8.16b
723 eor v25.16b, v25.16b, v9.16b
724 eor v26.16b, v26.16b, v10.16b
725 eor v27.16b, v27.16b, v11.16b
726 st1 {v24.16b-v27.16b}, [x1], #64
730 eor v28.16b, v28.16b, v12.16b
731 eor v29.16b, v29.16b, v13.16b
732 eor v30.16b, v30.16b, v14.16b
733 eor v31.16b, v31.16b, v15.16b
734 st1 {v28.16b-v31.16b}, [x1]
740 0: ld1 {v8.16b}, [x10]
741 ld1 {v9.16b}, [x11]
742 movi v10.16b, #16
745 ld1 {v16.16b-v19.16b}, [x2]
746 tbl v4.16b, {v0.16b-v3.16b}, v8.16b
747 tbx v20.16b, {v16.16b-v19.16b}, v9.16b
748 add v8.16b, v8.16b, v10.16b
749 add v9.16b, v9.16b, v10.16b
750 tbl v5.16b, {v0.16b-v3.16b}, v8.16b
751 tbx v21.16b, {v16.16b-v19.16b}, v9.16b
752 add v8.16b, v8.16b, v10.16b
753 add v9.16b, v9.16b, v10.16b
754 tbl v6.16b, {v0.16b-v3.16b}, v8.16b
755 tbx v22.16b, {v16.16b-v19.16b}, v9.16b
756 add v8.16b, v8.16b, v10.16b
757 add v9.16b, v9.16b, v10.16b
758 tbl v7.16b, {v0.16b-v3.16b}, v8.16b
759 tbx v23.16b, {v16.16b-v19.16b}, v9.16b
761 eor v20.16b, v20.16b, v4.16b
762 eor v21.16b, v21.16b, v5.16b
763 eor v22.16b, v22.16b, v6.16b
764 eor v23.16b, v23.16b, v7.16b
765 st1 {v20.16b-v23.16b}, [x1]
766 b .Lout
769 1: ld1 {v8.16b}, [x10]
770 ld1 {v9.16b}, [x11]
771 movi v10.16b, #16
773 tbl v0.16b, {v4.16b-v7.16b}, v8.16b
774 tbx v20.16b, {v16.16b-v19.16b}, v9.16b
775 add v8.16b, v8.16b, v10.16b
776 add v9.16b, v9.16b, v10.16b
777 tbl v1.16b, {v4.16b-v7.16b}, v8.16b
778 tbx v21.16b, {v16.16b-v19.16b}, v9.16b
779 add v8.16b, v8.16b, v10.16b
780 add v9.16b, v9.16b, v10.16b
781 tbl v2.16b, {v4.16b-v7.16b}, v8.16b
782 tbx v22.16b, {v16.16b-v19.16b}, v9.16b
783 add v8.16b, v8.16b, v10.16b
784 add v9.16b, v9.16b, v10.16b
785 tbl v3.16b, {v4.16b-v7.16b}, v8.16b
786 tbx v23.16b, {v16.16b-v19.16b}, v9.16b
788 eor v20.16b, v20.16b, v0.16b
789 eor v21.16b, v21.16b, v1.16b
790 eor v22.16b, v22.16b, v2.16b
791 eor v23.16b, v23.16b, v3.16b
792 st1 {v20.16b-v23.16b}, [x1]
793 b .Lout
796 2: ld1 {v4.16b}, [x10]
797 ld1 {v5.16b}, [x11]
798 movi v6.16b, #16
800 tbl v0.16b, {v8.16b-v11.16b}, v4.16b
801 tbx v24.16b, {v20.16b-v23.16b}, v5.16b
802 add v4.16b, v4.16b, v6.16b
803 add v5.16b, v5.16b, v6.16b
804 tbl v1.16b, {v8.16b-v11.16b}, v4.16b
805 tbx v25.16b, {v20.16b-v23.16b}, v5.16b
806 add v4.16b, v4.16b, v6.16b
807 add v5.16b, v5.16b, v6.16b
808 tbl v2.16b, {v8.16b-v11.16b}, v4.16b
809 tbx v26.16b, {v20.16b-v23.16b}, v5.16b
810 add v4.16b, v4.16b, v6.16b
811 add v5.16b, v5.16b, v6.16b
812 tbl v3.16b, {v8.16b-v11.16b}, v4.16b
813 tbx v27.16b, {v20.16b-v23.16b}, v5.16b
815 eor v24.16b, v24.16b, v0.16b
816 eor v25.16b, v25.16b, v1.16b
817 eor v26.16b, v26.16b, v2.16b
818 eor v27.16b, v27.16b, v3.16b
819 st1 {v24.16b-v27.16b}, [x1]
820 b .Lout
823 3: ld1 {v4.16b}, [x10]
824 ld1 {v5.16b}, [x11]
825 movi v6.16b, #16
827 tbl v0.16b, {v12.16b-v15.16b}, v4.16b
828 tbx v28.16b, {v24.16b-v27.16b}, v5.16b
829 add v4.16b, v4.16b, v6.16b
830 add v5.16b, v5.16b, v6.16b
831 tbl v1.16b, {v12.16b-v15.16b}, v4.16b
832 tbx v29.16b, {v24.16b-v27.16b}, v5.16b
833 add v4.16b, v4.16b, v6.16b
834 add v5.16b, v5.16b, v6.16b
835 tbl v2.16b, {v12.16b-v15.16b}, v4.16b
836 tbx v30.16b, {v24.16b-v27.16b}, v5.16b
837 add v4.16b, v4.16b, v6.16b
838 add v5.16b, v5.16b, v6.16b
839 tbl v3.16b, {v12.16b-v15.16b}, v4.16b
840 tbx v31.16b, {v24.16b-v27.16b}, v5.16b
842 eor v28.16b, v28.16b, v0.16b
843 eor v29.16b, v29.16b, v1.16b
844 eor v30.16b, v30.16b, v2.16b
845 eor v31.16b, v31.16b, v3.16b
846 st1 {v28.16b-v31.16b}, [x1]
847 b .Lout
859 CTRINC: .word 1, 2, 3, 4