Lines Matching +full:0 +full:x17

5 #define __has_feature(x) 0
29 add x29,sp,#0
34 ldr x9,[x2],#8 // bp[0]
36 ldp x7,x8,[x1],#16 // ap[0..1]
40 ldp x13,x14,[x3],#16 // np[0..1]
42 mul x6,x7,x9 // ap[0]*bp[0]
45 mul x10,x8,x9 // ap[1]*bp[0]
48 mul x15,x6,x4 // "tp[0]"*n0
51 // (*) mul x12,x13,x15 // np[0]*m1
65 umulh x17,x14,x15
77 mul x10,x8,x9 // ap[j]*bp[0]
78 adc x13,x17,xzr
84 umulh x17,x14,x15
95 adc x13,x17,xzr
107 ldr x23,[sp] // tp[0]
110 mul x6,x7,x9 // ap[0]*bp[i]
122 // (*) mul x12,x13,x15 // np[0]*m1
127 umulh x17,x14,x15
140 adc x13,x17,xzr
149 umulh x17,x14,x15
162 adcs x13,x17,x19
179 ldr x23,[sp] // tp[0]
181 ldr x14,[x3],#8 // np[0]
196 ldr x23,[sp] // tp[0]
198 ldr x8,[x0],#8 // rp[0]
232 add x29,sp,#0
240 ldp x6,x7,[x1,#8*0]
254 stp xzr,xzr,[x2,#8*0]
282 // a[1]a[0] (i)
283 // a[2]a[0]
284 // a[3]a[0]
285 // a[4]a[0]
286 // a[5]a[0]
287 // a[6]a[0]
288 // a[7]a[0]
311 mul x14,x7,x6 // lo(a[1..7]*a[0]) (i)
314 mul x17,x10,x6
315 adds x20,x20,x14 // t[1]+lo(a[1]*a[0])
321 adcs x23,x23,x17
322 umulh x17,x7,x6 // hi(a[1..7]*a[0])
329 stp x19,x20,[x2],#8*2 // t[0..1]
331 adds x21,x21,x17 // t[2]+hi(a[1]*a[0])
332 umulh x17,x11,x6
339 adcs x25,x25,x17
340 mul x17,x9,x7
348 adcs x23,x23,x17
349 mul x17,x13,x7
356 adcs x19,x19,x17
357 umulh x17,x11,x7
366 adcs x26,x26,x17
367 mul x17,x10,x8
375 adcs x25,x25,x17
376 umulh x17,x9,x8 // hi(a[3..7]*a[2])
385 adds x25,x25,x17
386 umulh x17,x13,x8
393 adc x21,x21,x17
395 mul x17,x13,x9
402 adcs x21,x21,x17
403 umulh x17,x13,x9
412 adc x22,x22,x17
414 umulh x17,x11,x10 // hi(a[5..7]*a[4])
422 adds x21,x21,x17
423 mul x17,x13,x11
431 adcs x23,x23,x17
432 umulh x17,x13,x12 // hi(a[7]*a[6])
441 add x25,x25,x17
446 ldp x6,x7,[x2,#8*0]
452 ldp x6,x7,[x1,#8*0]
467 // a[8]a[0]
468 // a[9]a[0]
469 // a[a]a[0]
470 // a[b]a[0]
471 // a[c]a[0]
472 // a[d]a[0]
473 // a[e]a[0]
474 // a[f]a[0]
495 mul x17,x9,x4
502 adcs x22,x22,x17
503 mul x17,x13,x4
510 adcs x26,x26,x17
511 umulh x17,x9,x4
520 adcs x22,x23,x17
521 umulh x17,x13,x4
526 adcs x26,x28,x17
534 ldp x6,x7,[x2,#8*0]
541 ldp x6,x7,[x1,#8*0]
558 ldp x6,x7,[x0,#8*0]
567 stp x19,x20,[x2,#8*0]
568 ldp x19,x20,[x15,#8*0]
580 // Now multiply above result by 2 and add a[n-1]*a[n-1]|...|a[0]*a[0]
581 ldp x7,x9,[x14,#8*0] // recall that x14 is &a[0]
585 ldp x17,x14,[sp,#8*3]
587 stp x19,x20,[x2,#8*0]
602 extr x16,x17,x16,#63
611 extr x17,x14,x17,#63
612 stp x19,x20,[x2,#8*0]
613 adcs x23,x10,x17
617 ldp x17,x14,[x2,#8*7]
620 extr x16,x17,x16,#63
629 extr x17,x14,x17,#63
632 adcs x19,x6,x17
635 ldp x17,x14,[x2,#8*3]
641 extr x16,x17,x16,#63
646 stp x19,x20,[x2,#8*0]
650 extr x17,x14,x17,#63
651 adcs x23,x10,x17
653 ldp x19,x20,[sp,#8*0]
656 ldp x6,x7,[x1,#8*0]
664 mul x28,x4,x19 // t[0]*n0
678 // (*) mul x14,x6,x28 // lo(n[0-7])*lo(t[0]*n0)
682 str x28,[x2],#8 // put aside t[0]*n0 for tail processing
683 mul x17,x9,x28
691 adcs x21,x22,x17
692 mul x17,x13,x28
694 umulh x14,x6,x28 // hi(n[0-7])*lo(t[0]*n0)
699 adcs x25,x26,x17
700 umulh x17,x9,x28
708 adcs x22,x22,x17
709 umulh x17,x13,x28
710 mul x28,x4,x19 // next t[0]*n0
714 adc x26,x26,x17
717 ldp x14,x15,[x2,#8*0]
718 ldp x16,x17,[x2,#8*2]
725 adcs x22,x22,x17
726 ldp x16,x17,[x2,#8*6]
730 adcs x26,x26,x17
735 ldp x6,x7,[x1,#8*0]
748 mul x17,x9,x4
755 adcs x22,x22,x17
756 mul x17,x13,x4
763 adcs x26,x26,x17
764 umulh x17,x9,x4
773 adcs x22,x23,x17
774 umulh x17,x13,x4
779 adcs x26,x28,x17
784 ldp x6,x7,[x2,#8*0]
795 ldp x6,x7,[x1,#8*0]
818 ldp x19,x20,[x0,#8*0]
820 ldp x6,x7,[x16,#8*0] // recall that x16 is &n[0]
832 stp x14,x15,[x2,#8*0]
857 ldp x6,x7,[x1,#8*0]
858 sbcs x17,x22,x9
859 stp x14,x15,[x0,#8*0]
863 stp x16,x17,[x0,#8*2]
866 sbcs x17,x26,x13
869 ldp x19,x20,[x2,#8*0]
877 stp x16,x17,[x0,#8*6]
885 ldp x6,x7,[x3,#8*0]
886 sbcs x17,x22,x9
887 stp x14,x15,[x0,#8*0]
891 stp x16,x17,[x0,#8*2]
893 ldp x19,x20,[x1,#8*0]
894 sbcs x17,x26,x13
899 stp x16,x17,[x0,#8*6]
905 stp xzr,xzr,[x2,#8*0]
912 csel x17,x22,x9,lo
916 stp x14,x15,[x3,#8*0]
917 stp x16,x17,[x3,#8*2]
919 stp xzr,xzr,[x1,#8*0]
924 stp xzr,xzr,[x2,#8*0]
928 csel x17,x22,x9,lo
929 stp x14,x15,[x3,#8*0]
930 stp x16,x17,[x3,#8*2]
942 stp xzr,xzr,[sp,#8*0]
963 stp x6,x7,[x1,#8*0]
992 add x29,sp,#0
1008 ldr x24,[x2,#8*0] // b[0]
1009 ldp x6,x7,[x1,#8*0] // a[0..3]
1016 ldp x14,x15,[x3,#8*0] // n[0..3]
1017 ldp x16,x17,[x3,#8*2]
1020 mov x28,#0
1024 mul x10,x6,x24 // lo(a[0..3]*b[0])
1032 umulh x10,x6,x24 // hi(a[0..3]*b[0])
1034 mul x25,x19,x4 // t[0]*n0
1041 ldr x24,[x2,x28] // next b[i] (or b[0])
1043 // (*) mul x10,x14,x25 // lo(n[0..3]*t[0]*n0)
1044 str x25,[x26],#8 // put aside t[0]*n0 for tail processing
1050 mul x13,x17,x25
1053 umulh x10,x14,x25 // hi(n[0..3]*t[0]*n0)
1059 umulh x13,x17,x25
1072 ldp x6,x7,[x1,#8*0] // a[4..7]
1075 ldr x25,[sp] // t[0]*n0
1076 ldp x14,x15,[x3,#8*0] // n[4..7]
1077 ldp x16,x17,[x3,#8*2]
1097 ldr x24,[x2,x28] // next b[i] (or b[0])
1099 mul x10,x14,x25 // lo(n[4..7]*t[0]*n0)
1105 mul x13,x17,x25
1107 umulh x10,x14,x25 // hi(n[4..7]*t[0]*n0)
1114 umulh x13,x17,x25
1116 ldr x25,[sp,x28] // next t[0]*n0
1129 ldp x6,x7,[x1,#8*0]
1132 ldp x14,x15,[x3,#8*0]
1133 ldp x16,x17,[x3,#8*2]
1141 ldp x6,x7,[x11,#8*0] // a[0..3]
1146 stp x19,x20,[x26,#8*0] // result!!!
1147 ldp x19,x20,[sp,#8*4] // t[0..3]
1151 ldp x14,x15,[x3,#8*0] // n[0..3]
1153 ldp x16,x17,[x3,#8*2]
1159 mul x10,x6,x24 // lo(a[0..3]*b[4])
1167 umulh x10,x6,x24 // hi(a[0..3]*b[4])
1169 mul x25,x19,x4 // t[0]*n0
1179 str x25,[x26],#8 // put aside t[0]*n0 for tail processing
1181 mul x11,x15,x25 // lo(n[0..3]*t[0]*n0)
1185 mul x13,x17,x25
1188 umulh x10,x14,x25 // hi(n[0..3]*t[0]*n0)
1194 umulh x13,x17,x25
1207 ldp x6,x7,[x1,#8*0] // a[4..7]
1216 ldr x25,[sp] // t[0]*n0
1217 ldp x14,x15,[x3,#8*0] // n[4..7]
1218 ldp x16,x17,[x3,#8*2]
1241 mul x10,x14,x25 // lo(n[4..7]*t[0]*n0)
1247 mul x13,x17,x25
1249 umulh x10,x14,x25 // hi(n[4..7]*t[0]*n0)
1255 umulh x13,x17,x25
1257 ldr x25,[sp,x28] // next t[0]*n0
1274 ldp x6,x7,[x1,#8*0]
1282 ldp x14,x15,[x3,#8*0]
1283 ldp x16,x17,[x3,#8*2]
1295 stp x19,x20,[x26,#8*0] // result!!!
1297 ldp x19,x20,[sp,#8*4] // t[0..3]
1302 ldp x14,x15,[x11,#8*0] // n[0..3]
1303 ldp x16,x17,[x11,#8*2]
1308 ldp x6,x7,[x1,#8*0] // a[0..3]
1330 ldp x14,x15,[x3,#8*0]
1332 ldp x19,x20,[x26,#8*0]
1333 sbcs x13,x22,x17
1334 ldp x16,x17,[x3,#8*2]
1338 stp x10,x11,[x0,#8*0]
1348 ldp x6,x7,[x27,#8*0]
1349 sbcs x13,x22,x17
1350 stp x10,x11,[x0,#8*0]
1353 ldp x19,x20,[x1,#8*0]
1362 stp xzr,xzr,[x26,#8*0]
1373 stp x10,x11,[x27,#8*0]
1379 stp xzr,xzr,[x26,#8*0]
1386 stp x10,x11,[x27,#8*0]
1399 stp xzr,xzr,[sp,#8*0]
1402 sbcs x9,x22,x17
1412 stp x6,x7,[x1,#8*0]
1428 …9,71,65,77,83,32,98,121,32,60,97,112,112,114,111,64,111,112,101,110,115,115,108,46,111,114,103,62,0