• Home
  • Raw
  • Download

Lines Matching +full:0 +full:x21

5 #define __has_feature(x) 0
29 add x29,sp,#0
31 stp x21,x22,[sp,#32]
34 ldr x9,[x2],#8 // bp[0]
36 ldp x7,x8,[x1],#16 // ap[0..1]
40 ldp x13,x14,[x3],#16 // np[0..1]
42 mul x6,x7,x9 // ap[0]*bp[0]
43 sub x21,x5,#16 // j=num-2
45 mul x10,x8,x9 // ap[1]*bp[0]
48 mul x15,x6,x4 // "tp[0]"*n0
51 // (*) mul x12,x13,x15 // np[0]*m1
67 cbz x21,.L1st_skip
72 sub x21,x21,#8 // j--
77 mul x10,x8,x9 // ap[j]*bp[0]
86 cbnz x21,.L1st
107 ldr x23,[sp] // tp[0]
110 mul x6,x7,x9 // ap[0]*bp[i]
111 sub x21,x5,#16 // j=num-2
122 // (*) mul x12,x13,x15 // np[0]*m1
128 cbz x21,.Linner_skip
135 sub x21,x21,#8 // j--
151 cbnz x21,.Linner
179 ldr x23,[sp] // tp[0]
181 ldr x14,[x3],#8 // np[0]
182 subs x21,x5,#8 // j=num-1 and clear borrow
187 sub x21,x21,#8 // j--
190 cbnz x21,.Lsub
196 ldr x23,[sp] // tp[0]
198 ldr x8,[x0],#8 // rp[0]
216 ldp x21,x22,[x29,#32]
232 add x29,sp,#0
234 stp x21,x22,[sp,#32]
240 ldp x6,x7,[x1,#8*0]
254 stp xzr,xzr,[x2,#8*0]
270 mov x21,xzr
282 // a[1]a[0] (i)
283 // a[2]a[0]
284 // a[3]a[0]
285 // a[4]a[0]
286 // a[5]a[0]
287 // a[6]a[0]
288 // a[7]a[0]
311 mul x14,x7,x6 // lo(a[1..7]*a[0]) (i)
315 adds x20,x20,x14 // t[1]+lo(a[1]*a[0])
317 adcs x21,x21,x15
322 umulh x17,x7,x6 // hi(a[1..7]*a[0])
329 stp x19,x20,[x2],#8*2 // t[0..1]
331 adds x21,x21,x17 // t[2]+hi(a[1]*a[0])
358 stp x21,x22,[x2],#8*2 // t[2..3]
384 adc x21,xzr,xzr // t[10]
393 adc x21,x21,x17
402 adcs x21,x21,x17
410 adcs x21,x21,x16
417 adcs x21,x21,x15
422 adds x21,x21,x17
446 ldp x6,x7,[x2,#8*0]
452 ldp x6,x7,[x1,#8*0]
453 adcs x21,x21,x8
467 // a[8]a[0]
468 // a[9]a[0]
469 // a[a]a[0]
470 // a[b]a[0]
471 // a[c]a[0]
472 // a[d]a[0]
473 // a[e]a[0]
474 // a[f]a[0]
500 adcs x21,x21,x16
516 adcs x20,x21,x15
518 adcs x21,x22,x16
534 ldp x6,x7,[x2,#8*0]
541 ldp x6,x7,[x1,#8*0]
542 adcs x21,x21,x8
558 ldp x6,x7,[x0,#8*0]
567 stp x19,x20,[x2,#8*0]
568 ldp x19,x20,[x15,#8*0]
569 stp x21,x22,[x2,#8*2]
570 ldp x21,x22,[x15,#8*2]
580 // Now multiply above result by 2 and add a[n-1]*a[n-1]|...|a[0]*a[0]
581 ldp x7,x9,[x14,#8*0] // recall that x14 is &a[0]
587 stp x19,x20,[x2,#8*0]
589 stp x21,x22,[x2,#8*2]
601 adcs x21,x8,x15
612 stp x19,x20,[x2,#8*0]
615 stp x21,x22,[x2,#8*2]
640 adcs x21,x8,x15
646 stp x19,x20,[x2,#8*0]
649 stp x21,x22,[x2,#8*2]
653 ldp x19,x20,[sp,#8*0]
656 ldp x6,x7,[x1,#8*0]
664 mul x28,x4,x19 // t[0]*n0
667 ldp x21,x22,[sp,#8*2]
678 // (*) mul x14,x6,x28 // lo(n[0-7])*lo(t[0]*n0)
682 str x28,[x2],#8 // put aside t[0]*n0 for tail processing
689 adcs x20,x21,x16
691 adcs x21,x22,x17
694 umulh x14,x6,x28 // hi(n[0-7])*lo(t[0]*n0)
706 adcs x21,x21,x16
710 mul x28,x4,x19 // next t[0]*n0
717 ldp x14,x15,[x2,#8*0]
724 adcs x21,x21,x16
735 ldp x6,x7,[x1,#8*0]
753 adcs x21,x21,x16
769 adcs x20,x21,x15
771 adcs x21,x22,x16
784 ldp x6,x7,[x2,#8*0]
795 ldp x6,x7,[x1,#8*0]
796 adcs x21,x21,x8
818 ldp x19,x20,[x0,#8*0]
819 adcs x21,x21,x8
820 ldp x6,x7,[x16,#8*0] // recall that x16 is &n[0]
832 stp x14,x15,[x2,#8*0]
833 stp x21,x22,[x2,#8*2]
834 ldp x21,x22,[x0,#8*2]
856 sbcs x16,x21,x8
857 ldp x6,x7,[x1,#8*0]
859 stp x14,x15,[x0,#8*0]
869 ldp x19,x20,[x2,#8*0]
871 ldp x21,x22,[x2,#8*2]
882 sbcs x16,x21,x8
885 ldp x6,x7,[x3,#8*0]
887 stp x14,x15,[x0,#8*0]
893 ldp x19,x20,[x1,#8*0]
895 ldp x21,x22,[x1,#8*2]
905 stp xzr,xzr,[x2,#8*0]
909 csel x16,x21,x8,lo
914 ldp x21,x22,[x1,#8*6]
916 stp x14,x15,[x3,#8*0]
919 stp xzr,xzr,[x1,#8*0]
924 stp xzr,xzr,[x2,#8*0]
927 csel x16,x21,x8,lo
929 stp x14,x15,[x3,#8*0]
942 stp xzr,xzr,[sp,#8*0]
943 sbcs x8,x21,x8
961 csel x8,x21,x8,lo
963 stp x6,x7,[x1,#8*0]
975 ldp x21,x22,[x29,#32]
992 add x29,sp,#0
994 stp x21,x22,[sp,#32]
1008 ldr x24,[x2,#8*0] // b[0]
1009 ldp x6,x7,[x1,#8*0] // a[0..3]
1014 mov x21,xzr
1016 ldp x14,x15,[x3,#8*0] // n[0..3]
1020 mov x28,#0
1024 mul x10,x6,x24 // lo(a[0..3]*b[0])
1032 umulh x10,x6,x24 // hi(a[0..3]*b[0])
1034 mul x25,x19,x4 // t[0]*n0
1035 adcs x21,x21,x12
1041 ldr x24,[x2,x28] // next b[i] (or b[0])
1043 // (*) mul x10,x14,x25 // lo(n[0..3]*t[0]*n0)
1044 str x25,[x26],#8 // put aside t[0]*n0 for tail processing
1045 adcs x21,x21,x11
1053 umulh x10,x14,x25 // hi(n[0..3]*t[0]*n0)
1056 adcs x20,x21,x12
1058 adcs x21,x22,x13
1065 adcs x21,x21,x12
1072 ldp x6,x7,[x1,#8*0] // a[4..7]
1075 ldr x25,[sp] // a[0]*n0
1076 ldp x14,x15,[x3,#8*0] // n[4..7]
1092 adcs x21,x21,x12
1097 ldr x24,[x2,x28] // next b[i] (or b[0])
1099 mul x10,x14,x25 // lo(n[4..7]*a[0]*n0)
1100 adcs x21,x21,x11
1107 umulh x10,x14,x25 // hi(n[4..7]*a[0]*n0)
1110 adcs x21,x21,x12
1116 ldr x25,[sp,x28] // next t[0]*n0
1120 adcs x20,x21,x11
1121 adcs x21,x22,x12
1129 ldp x6,x7,[x1,#8*0]
1132 ldp x14,x15,[x3,#8*0]
1141 ldp x6,x7,[x11,#8*0] // a[0..3]
1146 stp x19,x20,[x26,#8*0] // result!!!
1147 ldp x19,x20,[sp,#8*4] // t[0..3]
1148 stp x21,x22,[x26,#8*2] // result!!!
1149 ldp x21,x22,[sp,#8*6]
1151 ldp x14,x15,[x3,#8*0] // n[0..3]
1159 mul x10,x6,x24 // lo(a[0..3]*b[4])
1167 umulh x10,x6,x24 // hi(a[0..3]*b[4])
1169 mul x25,x19,x4 // t[0]*n0
1170 adcs x21,x21,x12
1179 str x25,[x26],#8 // put aside t[0]*n0 for tail processing
1180 adcs x21,x21,x11
1181 mul x11,x15,x25 // lo(n[0..3]*t[0]*n0)
1188 umulh x10,x14,x25 // hi(n[0..3]*t[0]*n0)
1191 adcs x20,x21,x12
1193 adcs x21,x22,x13
1199 adcs x21,x21,x12
1207 ldp x6,x7,[x1,#8*0] // a[4..7]
1212 adcs x21,x21,x12
1216 ldr x25,[sp] // t[0]*n0
1217 ldp x14,x15,[x3,#8*0] // n[4..7]
1234 adcs x21,x21,x12
1241 mul x10,x14,x25 // lo(n[4..7]*t[0]*n0)
1242 adcs x21,x21,x11
1249 umulh x10,x14,x25 // hi(n[4..7]*t[0]*n0)
1252 adcs x21,x21,x12
1257 ldr x25,[sp,x28] // next a[0]*n0
1262 adcs x20,x21,x11
1263 adcs x21,x22,x12
1274 ldp x6,x7,[x1,#8*0]
1279 adcs x21,x21,x12
1282 ldp x14,x15,[x3,#8*0]
1294 adcs x21,x21,xzr
1295 stp x19,x20,[x26,#8*0] // result!!!
1297 ldp x19,x20,[sp,#8*4] // t[0..3]
1299 stp x21,x22,[x26,#8*2] // result!!!
1301 ldp x21,x22,[sp,#8*6]
1302 ldp x14,x15,[x11,#8*0] // n[0..3]
1308 ldp x6,x7,[x1,#8*0] // a[0..3]
1329 sbcs x12,x21,x16
1330 ldp x14,x15,[x3,#8*0]
1332 ldp x19,x20,[x26,#8*0]
1336 ldp x21,x22,[x26,#8*2]
1338 stp x10,x11,[x0,#8*0]
1345 sbcs x12,x21,x16
1348 ldp x6,x7,[x27,#8*0]
1350 stp x10,x11,[x0,#8*0]
1353 ldp x19,x20,[x1,#8*0]
1354 ldp x21,x22,[x1,#8*2]
1362 stp xzr,xzr,[x26,#8*0]
1366 csel x12,x21,x8,lo
1371 ldp x21,x22,[x1,#8*6]
1373 stp x10,x11,[x27,#8*0]
1379 stp xzr,xzr,[x26,#8*0]
1382 csel x12,x21,x8,lo
1386 stp x10,x11,[x27,#8*0]
1399 stp xzr,xzr,[sp,#8*0]
1400 sbcs x8,x21,x16
1410 csel x8,x21,x8,lo
1412 stp x6,x7,[x1,#8*0]
1418 ldp x21,x22,[x29,#32]
1428 …9,71,65,77,83,32,98,121,32,60,97,112,112,114,111,64,111,112,101,110,115,115,108,46,111,114,103,62,0