Lines Matching +full:0 +full:x21
5 #define __has_feature(x) 0
32 add x29,sp,#0
34 stp x21,x22,[sp,#32]
37 ldr x9,[x2],#8 // bp[0]
39 ldp x7,x8,[x1],#16 // ap[0..1]
43 ldp x13,x14,[x3],#16 // np[0..1]
45 mul x6,x7,x9 // ap[0]*bp[0]
46 sub x21,x5,#16 // j=num-2
48 mul x10,x8,x9 // ap[1]*bp[0]
51 mul x15,x6,x4 // "tp[0]"*n0
54 // (*) mul x12,x13,x15 // np[0]*m1
70 cbz x21,.L1st_skip
75 sub x21,x21,#8 // j--
80 mul x10,x8,x9 // ap[j]*bp[0]
89 cbnz x21,.L1st
110 ldr x23,[sp] // tp[0]
113 mul x6,x7,x9 // ap[0]*bp[i]
114 sub x21,x5,#16 // j=num-2
125 // (*) mul x12,x13,x15 // np[0]*m1
131 cbz x21,.Linner_skip
138 sub x21,x21,#8 // j--
154 cbnz x21,.Linner
182 ldr x23,[sp] // tp[0]
184 ldr x14,[x3],#8 // np[0]
185 subs x21,x5,#8 // j=num-1 and clear borrow
190 sub x21,x21,#8 // j--
193 cbnz x21,.Lsub
199 ldr x23,[sp] // tp[0]
201 ldr x8,[x0],#8 // rp[0]
219 ldp x21,x22,[x29,#32]
235 add x29,sp,#0
237 stp x21,x22,[sp,#32]
243 ldp x6,x7,[x1,#8*0]
257 stp xzr,xzr,[x2,#8*0]
273 mov x21,xzr
285 // a[1]a[0] (i)
286 // a[2]a[0]
287 // a[3]a[0]
288 // a[4]a[0]
289 // a[5]a[0]
290 // a[6]a[0]
291 // a[7]a[0]
314 mul x14,x7,x6 // lo(a[1..7]*a[0]) (i)
318 adds x20,x20,x14 // t[1]+lo(a[1]*a[0])
320 adcs x21,x21,x15
325 umulh x17,x7,x6 // hi(a[1..7]*a[0])
332 stp x19,x20,[x2],#8*2 // t[0..1]
334 adds x21,x21,x17 // t[2]+lo(a[1]*a[0])
361 stp x21,x22,[x2],#8*2 // t[2..3]
387 adc x21,xzr,xzr // t[10]
396 adc x21,x21,x17
405 adcs x21,x21,x17
413 adcs x21,x21,x16
420 adcs x21,x21,x15
425 adds x21,x21,x17
449 ldp x6,x7,[x2,#8*0]
455 ldp x6,x7,[x1,#8*0]
456 adcs x21,x21,x8
470 // a[8]a[0]
471 // a[9]a[0]
472 // a[a]a[0]
473 // a[b]a[0]
474 // a[c]a[0]
475 // a[d]a[0]
476 // a[e]a[0]
477 // a[f]a[0]
503 adcs x21,x21,x16
519 adcs x20,x21,x15
521 adcs x21,x22,x16
537 ldp x6,x7,[x2,#8*0]
544 ldp x6,x7,[x1,#8*0]
545 adcs x21,x21,x8
561 ldp x6,x7,[x0,#8*0]
570 stp x19,x20,[x2,#8*0]
571 ldp x19,x20,[x15,#8*0]
572 stp x21,x22,[x2,#8*2]
573 ldp x21,x22,[x15,#8*2]
583 // Now multiply above result by 2 and add a[n-1]*a[n-1]|...|a[0]*a[0]
584 ldp x7,x9,[x14,#8*0] // recall that x14 is &a[0]
590 stp x19,x20,[x2,#8*0]
592 stp x21,x22,[x2,#8*2]
604 adcs x21,x8,x15
615 stp x19,x20,[x2,#8*0]
618 stp x21,x22,[x2,#8*2]
643 adcs x21,x8,x15
649 stp x19,x20,[x2,#8*0]
652 stp x21,x22,[x2,#8*2]
656 ldp x19,x20,[sp,#8*0]
659 ldp x6,x7,[x1,#8*0]
667 mul x28,x4,x19 // t[0]*n0
670 ldp x21,x22,[sp,#8*2]
681 // (*) mul x14,x6,x28 // lo(n[0-7])*lo(t[0]*n0)
685 str x28,[x2],#8 // put aside t[0]*n0 for tail processing
692 adcs x20,x21,x16
694 adcs x21,x22,x17
697 umulh x14,x6,x28 // hi(n[0-7])*lo(t[0]*n0)
709 adcs x21,x21,x16
713 mul x28,x4,x19 // next t[0]*n0
720 ldp x14,x15,[x2,#8*0]
727 adcs x21,x21,x16
738 ldp x6,x7,[x1,#8*0]
756 adcs x21,x21,x16
772 adcs x20,x21,x15
774 adcs x21,x22,x16
787 ldp x6,x7,[x2,#8*0]
798 ldp x6,x7,[x1,#8*0]
799 adcs x21,x21,x8
821 ldp x19,x20,[x0,#8*0]
822 adcs x21,x21,x8
823 ldp x6,x7,[x16,#8*0] // recall that x16 is &n[0]
835 stp x14,x15,[x2,#8*0]
836 stp x21,x22,[x2,#8*2]
837 ldp x21,x22,[x0,#8*2]
859 sbcs x16,x21,x8
860 ldp x6,x7,[x1,#8*0]
862 stp x14,x15,[x0,#8*0]
872 ldp x19,x20,[x2,#8*0]
874 ldp x21,x22,[x2,#8*2]
885 sbcs x16,x21,x8
888 ldp x6,x7,[x3,#8*0]
890 stp x14,x15,[x0,#8*0]
896 ldp x19,x20,[x1,#8*0]
898 ldp x21,x22,[x1,#8*2]
908 stp xzr,xzr,[x2,#8*0]
912 csel x16,x21,x8,lo
917 ldp x21,x22,[x1,#8*6]
919 stp x14,x15,[x3,#8*0]
922 stp xzr,xzr,[x1,#8*0]
927 stp xzr,xzr,[x2,#8*0]
930 csel x16,x21,x8,lo
932 stp x14,x15,[x3,#8*0]
945 stp xzr,xzr,[sp,#8*0]
946 sbcs x8,x21,x8
964 csel x8,x21,x8,lo
966 stp x6,x7,[x1,#8*0]
978 ldp x21,x22,[x29,#32]
995 add x29,sp,#0
997 stp x21,x22,[sp,#32]
1011 ldr x24,[x2,#8*0] // b[0]
1012 ldp x6,x7,[x1,#8*0] // a[0..3]
1017 mov x21,xzr
1019 ldp x14,x15,[x3,#8*0] // n[0..3]
1023 mov x28,#0
1027 mul x10,x6,x24 // lo(a[0..3]*b[0])
1035 umulh x10,x6,x24 // hi(a[0..3]*b[0])
1037 mul x25,x19,x4 // t[0]*n0
1038 adcs x21,x21,x12
1044 ldr x24,[x2,x28] // next b[i] (or b[0])
1046 // (*) mul x10,x14,x25 // lo(n[0..3]*t[0]*n0)
1047 str x25,[x26],#8 // put aside t[0]*n0 for tail processing
1048 adcs x21,x21,x11
1056 umulh x10,x14,x25 // hi(n[0..3]*t[0]*n0)
1059 adcs x20,x21,x12
1061 adcs x21,x22,x13
1068 adcs x21,x21,x12
1075 ldp x6,x7,[x1,#8*0] // a[4..7]
1078 ldr x25,[sp] // a[0]*n0
1079 ldp x14,x15,[x3,#8*0] // n[4..7]
1095 adcs x21,x21,x12
1100 ldr x24,[x2,x28] // next b[i] (or b[0])
1102 mul x10,x14,x25 // lo(n[4..7]*a[0]*n0)
1103 adcs x21,x21,x11
1110 umulh x10,x14,x25 // hi(n[4..7]*a[0]*n0)
1113 adcs x21,x21,x12
1119 ldr x25,[sp,x28] // next t[0]*n0
1123 adcs x20,x21,x11
1124 adcs x21,x22,x12
1132 ldp x6,x7,[x1,#8*0]
1135 ldp x14,x15,[x3,#8*0]
1144 ldp x6,x7,[x11,#8*0] // a[0..3]
1149 stp x19,x20,[x26,#8*0] // result!!!
1150 ldp x19,x20,[sp,#8*4] // t[0..3]
1151 stp x21,x22,[x26,#8*2] // result!!!
1152 ldp x21,x22,[sp,#8*6]
1154 ldp x14,x15,[x3,#8*0] // n[0..3]
1162 mul x10,x6,x24 // lo(a[0..3]*b[4])
1170 umulh x10,x6,x24 // hi(a[0..3]*b[4])
1172 mul x25,x19,x4 // t[0]*n0
1173 adcs x21,x21,x12
1182 str x25,[x26],#8 // put aside t[0]*n0 for tail processing
1183 adcs x21,x21,x11
1184 mul x11,x15,x25 // lo(n[0..3]*t[0]*n0
1191 umulh x10,x14,x25 // hi(n[0..3]*t[0]*n0
1194 adcs x20,x21,x12
1196 adcs x21,x22,x13
1202 adcs x21,x21,x12
1210 ldp x6,x7,[x1,#8*0] // a[4..7]
1215 adcs x21,x21,x12
1219 ldr x25,[sp] // t[0]*n0
1220 ldp x14,x15,[x3,#8*0] // n[4..7]
1237 adcs x21,x21,x12
1244 mul x10,x14,x25 // lo(n[4..7]*t[0]*n0)
1245 adcs x21,x21,x11
1252 umulh x10,x14,x25 // hi(n[4..7]*t[0]*n0)
1255 adcs x21,x21,x12
1260 ldr x25,[sp,x28] // next a[0]*n0
1265 adcs x20,x21,x11
1266 adcs x21,x22,x12
1277 ldp x6,x7,[x1,#8*0]
1282 adcs x21,x21,x12
1285 ldp x14,x15,[x3,#8*0]
1297 adcs x21,x21,xzr
1298 stp x19,x20,[x26,#8*0] // result!!!
1300 ldp x19,x20,[sp,#8*4] // t[0..3]
1302 stp x21,x22,[x26,#8*2] // result!!!
1304 ldp x21,x22,[sp,#8*6]
1305 ldp x14,x15,[x11,#8*0] // n[0..3]
1311 ldp x6,x7,[x1,#8*0] // a[0..3]
1332 sbcs x12,x21,x16
1333 ldp x14,x15,[x3,#8*0]
1335 ldp x19,x20,[x26,#8*0]
1339 ldp x21,x22,[x26,#8*2]
1341 stp x10,x11,[x0,#8*0]
1348 sbcs x12,x21,x16
1351 ldp x6,x7,[x27,#8*0]
1353 stp x10,x11,[x0,#8*0]
1356 ldp x19,x20,[x1,#8*0]
1357 ldp x21,x22,[x1,#8*2]
1365 stp xzr,xzr,[x26,#8*0]
1369 csel x12,x21,x8,lo
1374 ldp x21,x22,[x1,#8*6]
1376 stp x10,x11,[x27,#8*0]
1382 stp xzr,xzr,[x26,#8*0]
1385 csel x12,x21,x8,lo
1389 stp x10,x11,[x27,#8*0]
1402 stp xzr,xzr,[sp,#8*0]
1403 sbcs x8,x21,x16
1413 csel x8,x21,x8,lo
1415 stp x6,x7,[x1,#8*0]
1421 ldp x21,x22,[x29,#32]
1431 …9,71,65,77,83,32,98,121,32,60,97,112,112,114,111,64,111,112,101,110,115,115,108,46,111,114,103,62,0