/third_party/mindspore/mindspore/ccsrc/backend/kernel_compiler/cpu/nnacl/assembly/avx/ |
D | MatmulAvx.S | 59 pushq %rdx // -80 67 movq %rdx, %rsi 68 movq %r8, %rdx 74 movq %rdx, -80(%rsp) // rdx 118 movq -80(%rsp), %rdx 276 movq %rdx, %rax 279 vmovss %xmm4, (%rdx) 282 addq %r10, %rdx 283 vmovss %xmm6, (%rdx) 286 addq %r10, %rdx [all …]
|
D | ConvDwFp32Avx3x3.S | 54 pushq %rdx // -80 61 movq %rdx, %rsi 62 movq %r8, %rdx 67 mov %rdx, -80(%rsp) 86 movq -80(%rsp), %rdx 106 vmovups (%rdx), %ymm11 107 addq $32, %rdx 108 vmovups (%rdx), %ymm12 109 addq $32, %rdx 110 vmovups (%rdx), %ymm13 [all …]
|
D | ConvDwFp32RowAvx.S | 51 movq %rdx, %rsi // input_ptr 52 movq %r8, %rdx // weight_ptr 61 movq %rdx, %r14 // weight_ptr 68 movq %r14, %rdx // weight_tmp 93 vfmadd231ps (%rdx), %ymm0, %ymm8 94 vfmadd231ps 32(%rdx), %ymm1, %ymm9 95 vfmadd231ps 64(%rdx), %ymm2, %ymm10 96 vfmadd231ps 96(%rdx), %ymm3, %ymm11 103 addq $128, %rdx 123 vfmadd231ps (%rdx), %ymm0, %ymm8 [all …]
|
D | ConvDwFp32BorderAvx.S | 36 pushq %rdx // -80 41 movq %rdi, %rdx 43 movq %rcx, %rdx 45 movq 8(%rdx), %r12 // src 46 movq 16(%rdx), %r13 // weight 47 movq 24(%rdx), %rbp // bias 48 movq 32(%rdx), %r11 // height 49 movq 40(%rdx), %r10 51 movq 48(%rdx), %r10 53 movq 56(%rdx), %r10 // in_kw_step [all …]
|
/third_party/openssl/crypto/bn/asm/ |
D | x86_64-mont.pl | 86 $bp="%rdx"; # const BN_ULONG *bp, 191 mov %rdx,$hi0 196 adc \$0,%rdx 197 mov %rdx,$hi1 206 adc \$0,%rdx 209 adc \$0,%rdx 211 mov %rdx,$hi1 217 adc \$0,%rdx 219 mov %rdx,$lo0 227 adc \$0,%rdx [all …]
|
D | x86_64-mont5.pl | 71 $bp="%rdx"; # const BN_ULONG *bp, 262 mov %rdx,$hi0 267 adc \$0,%rdx 268 mov %rdx,$hi1 277 adc \$0,%rdx 280 adc \$0,%rdx 282 mov %rdx,$hi1 288 adc \$0,%rdx 290 mov %rdx,$lo0 298 adc \$0,%rdx [all …]
|
D | rsaz-x86_64.pl | 91 my ($out,$inp,$mod,$n0,$times) = ("%rdi","%rsi","%rdx","%rcx","%r8d"); 120 movq ($inp), %rdx 137 movq %rdx, %rbx # 0($inp) 139 mulq %rdx 142 movq %rdx, %r9 147 movq %rdx, %r10 153 movq %rdx, %r11 159 movq %rdx, %r12 165 movq %rdx, %r13 171 movq %rdx, %r14 [all …]
|
/third_party/openssl/crypto/whrlpool/asm/x86_64/ |
D | wp-x86_64.s | 29 movq %rdx,16(%r10) 38 xorq %rdx,%rdx 85 leaq (%rdx,%rdx,1),%rdi 92 leaq (%rdx,%rdx,1),%rdi 99 leaq (%rdx,%rdx,1),%rdi 106 leaq (%rdx,%rdx,1),%rdi 113 leaq (%rdx,%rdx,1),%rdi 120 leaq (%rdx,%rdx,1),%rdi 127 leaq (%rdx,%rdx,1),%rdi 134 leaq (%rdx,%rdx,1),%rdi [all …]
|
/third_party/mesa3d/src/mesa/x86-64/ |
D | xform4.S | 65 movl V4F_COUNT(%rdx), %ecx /* count */ 66 movzbl V4F_STRIDE(%rdx), %eax /* stride */ 77 movq V4F_START(%rdx), %rdx /* ptr to first src vertex */ 80 prefetcht1 16(%rdx) 90 movups (%rdx), %xmm8 /* ox | oy | oz | ow */ 94 addq %rax, %rdx 104 prefetcht1 16(%rdx) 148 movl V4F_COUNT(%rdx), %ecx /* count */ 149 movzbl V4F_STRIDE(%rdx), %eax /* stride */ 158 movq V4F_START(%rdx), %rdx /* ptr to first src vertex */ [all …]
|
/third_party/openssl/crypto/ec/asm/ |
D | x25519-x86_64.pl | 123 mov 8*0(%rdx),%r11 # load g[0-4] 124 mov 8*1(%rdx),%r12 125 mov 8*2(%rdx),%r13 126 mov 8*3(%rdx),%rbp 127 mov 8*4(%rdx),%r14 135 mov %rdx,%rcx 141 mov %rdx,%r9 147 mov %rdx,%r11 151 mov %rdx,%r13 155 mov %rdx,%r15 [all …]
|
D | ecp_nistz256-x86_64.pl | 115 my ($t0,$t1,$t2,$t3,$t4)=("%rax","%rdx","%rcx","%r12","%r13"); 116 my ($r_ptr,$a_ptr,$b_ptr)=("%rdi","%rsi","%rdx"); 489 my ($r_ptr,$a_ptr,$b_org,$b_ptr)=("%rdi","%rsi","%rdx","%rbx"); 491 my ($t0,$t1,$t2,$t3,$t4)=("%rcx","%rbp","%rbx","%rdx","%rax"); 538 mov %rdx, $acc1 543 adc \$0, %rdx 544 mov %rdx, $acc2 549 adc \$0, %rdx 554 mov %rdx, $acc3 558 adc \$0, %rdx [all …]
|
/third_party/openssl/crypto/bn/asm/x86_64/ |
D | x86_64-mont.s | 18 cmpq %rsi,%rdx 72 movq %rdx,%r12 86 movq %rdx,%r11 91 adcq $0,%rdx 92 movq %rdx,%r13 101 adcq $0,%rdx 104 adcq $0,%rdx 106 movq %rdx,%r13 112 adcq $0,%rdx 114 movq %rdx,%r10 [all …]
|
D | rsaz-x86_64.s | 33 movq (%rsi),%rdx 46 movq %rdx,%rbx 48 mulq %rdx 51 movq %rdx,%r9 56 movq %rdx,%r10 62 movq %rdx,%r11 68 movq %rdx,%r12 74 movq %rdx,%r13 80 movq %rdx,%r14 86 adcq $0,%rdx [all …]
|
D | x86_64-mont5.s | 68 leaq 128(%rdx),%r12 211 movq %rdx,%r11 216 adcq $0,%rdx 217 movq %rdx,%r13 226 adcq $0,%rdx 229 adcq $0,%rdx 231 movq %rdx,%r13 237 adcq $0,%rdx 239 movq %rdx,%r10 247 adcq $0,%rdx [all …]
|
D | x86_64-gf2m.s | 21 movq %rax,%rdx 24 shrq $1,%rdx 32 xorq %rcx,%rdx 35 xorq %rbx,%rdx 91 xorq %rbx,%rdx 106 xorq %rbx,%rdx 121 xorq %rbx,%rdx 136 xorq %rbx,%rdx 151 xorq %rbx,%rdx 166 xorq %rbx,%rdx [all …]
|
/third_party/openssl/crypto/ec/asm/x86_64/ |
D | x25519-x86_64.s | 31 movq 0(%rdx),%r11 32 movq 8(%rdx),%r12 33 movq 16(%rdx),%r13 34 movq 24(%rdx),%rbp 35 movq 32(%rdx),%r14 43 movq %rdx,%rcx 49 movq %rdx,%r9 55 movq %rdx,%r11 59 movq %rdx,%r13 63 movq %rdx,%r15 [all …]
|
D | ecp_nistz256-x86_64.s | 2426 movq %r9,%rdx 2438 cmovcq %rdx,%r9 2479 movq %r9,%rdx 2492 cmovzq %rdx,%r9 2500 movq %r10,%rdx 2503 shlq $63,%rdx 2506 orq %rdx,%r9 2554 movq %r9,%rdx 2566 cmovcq %rdx,%r9 2576 movq %r9,%rdx [all …]
|
/third_party/musl/src/string/x86_64/ |
D | memset.s | 8 cmp $126,%rdx 15 mov %sil,-1(%rdi,%rdx) 20 mov %ax,(-1-2)(%rdi,%rdx) 25 mov %eax,(-1-2-4)(%rdi,%rdx) 30 mov %rax,(-1-2-4-8)(%rdi,%rdx) 36 mov %rax,(-1-2-4-8-16)(%rdi,%rdx) 37 mov %rax,(-1-2-4-8-8)(%rdi,%rdx) 45 mov %rax,(-1-2-4-8-16-32)(%rdi,%rdx) 46 mov %rax,(-1-2-4-8-16-24)(%rdi,%rdx) 47 mov %rax,(-1-2-4-8-16-16)(%rdi,%rdx) [all …]
|
/third_party/boost/tools/boost_install/test/iostreams/zlib-1.2.11/contrib/amd64/ |
D | amd64-match.S | 269 mov $(-MAX_MATCH_8), %rdx 275 prefetcht1 (%windowbestlen, %rdx) 276 prefetcht1 (%prev, %rdx) 293 movdqu (%windowbestlen, %rdx), %xmm1 294 movdqu (%prev, %rdx), %xmm2 296 movdqu 16(%windowbestlen, %rdx), %xmm3 297 movdqu 16(%prev, %rdx), %xmm4 299 movdqu 32(%windowbestlen, %rdx), %xmm5 300 movdqu 32(%prev, %rdx), %xmm6 302 movdqu 48(%windowbestlen, %rdx), %xmm7 [all …]
|
/third_party/boost/libs/beast/test/extern/zlib-1.2.11/contrib/amd64/ |
D | amd64-match.S | 269 mov $(-MAX_MATCH_8), %rdx 275 prefetcht1 (%windowbestlen, %rdx) 276 prefetcht1 (%prev, %rdx) 293 movdqu (%windowbestlen, %rdx), %xmm1 294 movdqu (%prev, %rdx), %xmm2 296 movdqu 16(%windowbestlen, %rdx), %xmm3 297 movdqu 16(%prev, %rdx), %xmm4 299 movdqu 32(%windowbestlen, %rdx), %xmm5 300 movdqu 32(%prev, %rdx), %xmm6 302 movdqu 48(%windowbestlen, %rdx), %xmm7 [all …]
|
/third_party/openssl/engines/asm/ |
D | e_padlock-x86_64.pl | 41 $ctx="%rdx"; 47 ($arg1,$arg2,$arg3,$arg4)=$win64?("%rcx","%rdx","%r8", "%r9") : # Win64 order 48 ("%rdi","%rsi","%rdx","%rcx"); # Unix order 167 mov %rdx,%rcx 168 mov %rdi,%rdx # put aside %rdi 180 movups %xmm0,(%rdx) # copy-out context 181 mov %eax,16(%rdx) 189 mov %rdx,%rcx 190 mov %rdi,%rdx # put aside %rdi 202 movups %xmm0,(%rdx) # copy-out context [all …]
|
/third_party/openssl/crypto/sha/asm/x86_64/ |
D | sha512-x86_64.s | 37 shlq $4,%rdx 39 leaq (%rsi,%rdx,8),%rdx 43 movq %rdx,128+16(%rsp) 51 movq 24(%rdi),%rdx 99 addq %r12,%rdx 105 movq %rdx,%r13 111 xorq %rdx,%r13 117 andq %rdx,%rdi 124 xorq %rdx,%r13 150 movq %rdx,%r15 [all …]
|
D | keccak1600-x86_64.s | 10 movq 84(%rdi),%rdx 22 xorq -76(%rdi),%rdx 32 xorq -36(%rdi),%rdx 38 xorq 4(%rdi),%rdx 45 xorq %r11,%rdx 48 xorq %rdx,%rax 51 rolq $1,%rdx 52 xorq %rbx,%rdx 61 xorq %rdx,%r10 102 xorq %rdx,%r12 [all …]
|
/third_party/openssl/crypto/whrlpool/asm/ |
D | wp-x86_64.pl | 91 mov %rdx,16(%r10) 100 xor %rdx,%rdx 125 lea (%rdx,%rdx),%rdi 132 lea (%rdx,%rdx),%rdi 139 lea (%rdx,%rdx),%rdi 146 lea (%rdx,%rdx),%rdi 159 lea (%rdx,%rdx),%rdi 166 lea (%rdx,%rdx),%rdi 173 lea (%rdx,%rdx),%rdi 180 lea (%rdx,%rdx),%rdi [all …]
|
/third_party/openssl/crypto/camellia/asm/ |
D | cmll-x86_64.pl | 157 mov %rdx,$key 284 mov %rdx,$keyend 460 mov %rdx,$out # keyTable 572 &_loadround (4,$out,"%rcx","%rdx"); # KR 582 &_rotl128 ("%rcx","%rdx",15); 583 &_saveround (4,$out,-128,"%rcx","%rdx"); # KR<<<15 586 &_rotl128 ("%rcx","%rdx",15); # 15+15=30 587 &_saveround (8,$out,-128,"%rcx","%rdx"); # KR<<<30 596 &_rotl128 ("%rcx","%rdx",30); # 30+30=60 597 &_saveround (18,$out,-128,"%rcx","%rdx"); # KR<<<60 [all …]
|