Home
last modified time | relevance | path

Searched +full:- +full:o0 (Results 1 – 25 of 1112) sorted by relevance

12345678910>>...45

/external/llvm/test/CodeGen/AArch64/
Dcxx-tlscc.ll1 ; RUN: llc < %s -mtriple=aarch64-apple-ios | FileCheck %s
2 ; RUN: llc < %s -mtriple=aarch64-apple-ios -enable-shrink-wrap=true | FileCheck %s
6 ; RUN: llc < %s -mtriple=aarch64-apple-ios -O0 | FileCheck --check-prefix=CHECK-O0 %s
33 ; CHECK-LABEL: _ZTW2sg
34 ; CHECK-NOT: stp d31, d30
35 ; CHECK-NOT: stp d29, d28
36 ; CHECK-NOT: stp d27, d26
37 ; CHECK-NOT: stp d25, d24
38 ; CHECK-NOT: stp d23, d22
39 ; CHECK-NOT: stp d21, d20
[all …]
Dswifterror.ll1 ; RUN: llc -verify-machineinstrs -disable-fp-elim < %s -mtriple=aarch64-apple-ios -disable-post-ra …
2 ; RUN: llc -verify-machineinstrs -disable-fp-elim -O0 < %s -mtriple=aarch64-apple-ios -disable-post
11 ; CHECK-APPLE-LABEL: foo:
12 ; CHECK-APPLE: orr w0, wzr, #0x10
13 ; CHECK-APPLE: malloc
14 ; CHECK-APPLE: orr [[ID:w[0-9]+]], wzr, #0x1
15 ; CHECK-APPLE: strb [[ID]], [x0, #8]
16 ; CHECK-APPLE: mov x19, x0
17 ; CHECK-APPLE-NOT: x19
19 ; CHECK-O0-LABEL: foo:
[all …]
/external/llvm/test/CodeGen/X86/
Dcxx_tlscc64.ll1 ; RUN: llc -verify-machineinstrs < %s -mtriple=x86_64-apple-darwin | FileCheck %s
2 ; TLS function were wrongly model and after fixing that, shrink-wrapping
5 ; Applying tricks on x86-64 similar to r255821.
6 ; RUN: llc < %s -mtriple=x86_64-apple-darwin -enable-shrink-wrap=true | FileCheck %s
7 ; RUN: llc < %s -mtriple=x86_64-apple-darwin -O0 | FileCheck %s --check-prefix=CHECK-O0
19 ; Every GPR should be saved - except rdi, rax, and rsp
20 ; CHECK-LABEL: _ZTW2sg
21 ; CHECK-NOT: pushq %r11
22 ; CHECK-NOT: pushq %r10
23 ; CHECK-NOT: pushq %r9
[all …]
Dswifterror.ll1 ; RUN: llc -verify-machineinstrs < %s -mtriple=x86_64-apple-darwin | FileCheck --check-prefix=CHECK
2 ; RUN: llc -verify-machineinstrs -O0 < %s -mtriple=x86_64-apple-darwin | FileCheck --check-prefix=C…
11 ; CHECK-APPLE-LABEL: foo:
12 ; CHECK-APPLE: movl $16, %edi
13 ; CHECK-APPLE: malloc
14 ; CHECK-APPLE: movb $1, 8(%rax)
15 ; CHECK-APPLE: movq %rax, %r12
17 ; CHECK-O0-LABEL: foo:
18 ; CHECK-O0: movl $16
19 ; CHECK-O0: malloc
[all …]
Dswift-return.ll1 ; RUN: llc -verify-machineinstrs < %s -mtriple=x86_64-unknown-unknown | FileCheck %s
2 ; RUN: llc -verify-machineinstrs < %s -mtriple=x86_64-unknown-unknown -O0 | FileCheck --check-prefi…
8 ; CHECK-LABEL: test:
13 ; CHECK-O0-LABEL: test
14 ; CHECK-O0: movl %edi
15 ; CHECK-O0: callq gen
16 ; CHECK-O0: movswl %ax
17 ; CHECK-O0: movsbl %dl
18 ; CHECK-O0: addl
19 ; CHECK-O0: movw %{{.*}}, %ax
[all …]
/external/llvm/test/CodeGen/SystemZ/
Dswifterror.ll1 ; RUN: llc < %s -mtriple=s390x-linux-gnu| FileCheck %s
2 ; RUN: llc < %s -O0 -mtriple=s390x-linux-gnu | FileCheck --check-prefix=CHECK-O0 %s
11 ; CHECK-LABEL: foo:
16 ; CHECK-O0-LABEL: foo:
17 ; CHECK-O0: lghi %r2, 16
18 ; CHECK-O0: brasl %r14, malloc
19 ; CHECK-O0: lgr %r[[REG1:[0-9]+]], %r2
20 ; CHECK-O0: mvi 8(%r2), 1
21 ; CHECK-O0: lgr %r9, %r[[REG1]]
33 ; CHECK-LABEL: caller:
[all …]
Dswift-return.ll1 ; RUN: llc < %s -mtriple=s390x-linux-gnu -verify-machineinstrs | FileCheck %s
2 ; RUN: llc < %s -mtriple=s390x-linux-gnu -O0 -verify-machineinstrs | FileCheck --check-prefix=CHECK
8 ; CHECK-LABEL: test:
11 ; CHECK-DAG: lhr %r2, %r2
12 ; CHECK-DAG: lbr %[[REG1:r[0-9]+]], %r3
14 ; CHECK-O0-LABEL: test
15 ; CHECK-O0: st %r2
16 ; CHECK-O0: brasl %r14, gen
17 ; CHECK-O0-DAG: lhr %[[REG1:r[0-9]+]], %r2
18 ; CHECK-O0-DAG: lbr %[[REG2:r[0-9]+]], %r3
[all …]
/external/llvm/test/CodeGen/ARM/
Dswifterror.ll1 ; RUN: llc -verify-machineinstrs < %s -mtriple=armv7-apple-ios | FileCheck --check-prefix=CHECK-APP…
2 ; RUN: llc -verify-machineinstrs -O0 < %s -mtriple=armv7-apple-ios | FileCheck --check-prefix=CHECK
12 ; CHECK-APPLE-LABEL: foo:
13 ; CHECK-APPLE: mov r0, #16
14 ; CHECK-APPLE: malloc
15 ; CHECK-APPLE-DAG: mov [[ID:r[0-9]+]], #1
16 ; CHECK-APPLE-DAG: mov r6, r{{.*}}
17 ; CHECK-APPLE-DAG: strb [[ID]], [r{{.*}}, #8]
19 ; CHECK-O0-LABEL: foo:
20 ; CHECK-O0: mov r{{.*}}, #16
[all …]
Dcxx-tlscc.ll1 ; RUN: llc < %s -mtriple=armv7k-apple-watchos2.0 | FileCheck %s
2 ; RUN: llc < %s -mtriple=armv7k-apple-watchos2.0 -enable-shrink-wrap=true | FileCheck %s
3 ; RUN: llc < %s -mtriple=armv7-apple-ios8.0 | FileCheck %s
4 ; RUN: llc < %s -mtriple=armv7-apple-ios8.0 -enable-shrink-wrap=true | FileCheck %s
6 ; RUN: llc < %s -mtriple=armv7k-apple-watchos2.0 -O0 | FileCheck --check-prefix=CHECK-O0 --check-pr…
7 ; RUN: llc < %s -mtriple=armv7-apple-ios8.0 -O0 | FileCheck --check-prefix=CHECK-O0 --check-prefix=…
9 ; RUN: llc < %s -mtriple=thumbv7-apple-ios8.0 | FileCheck --check-prefix=THUMB %s
25 ; Make sure Epilog does not overwrite an explicitly-handled CSR in CXX_FAST_TLS.
26 ; THUMB-LABEL: _ZTW2sg
29 ; THUMB: bne [[TH_end:.?LBB0_[0-9]+]]
[all …]
Dswift-return.ll1 ; RUN: llc -mtriple=armv7k-apple-ios8.0 -mcpu=cortex-a7 -verify-machineinstrs < %s | FileCheck %s
2 ; RUN: llc -mtriple=armv7k-apple-ios8.0 -mcpu=cortex-a7 -verify-machineinstrs < %s -O0 | FileCheck
4 ; RUN: llc -mtriple=armv7-apple-ios -verify-machineinstrs < %s | FileCheck %s
5 ; RUN: llc -mtriple=armv7-apple-ios -verify-machineinstrs < %s -O0 | FileCheck --check-prefix=CHECK
9 ; CHECK-LABEL: test:
13 ; CHECK-O0-LABEL: test:
14 ; CHECK-O0: bl {{.*}}gen
15 ; CHECK-O0: sxth r0, r0
16 ; CHECK-O0: sxtb r1, r1
17 ; CHECK-O0: add r0, r0, r1
[all …]
/external/XNNPACK/src/x24-transposec/gen/
D4x1-scalar.c1 // Auto-generated file. Do not edit!
2 // Template: src/x24-transposec/scalar.c.in
7 // This source code is licensed under the BSD-style license found in the
28 const size_t input_reset = 3 - round_down_po2(block_height, 4) * input_stride; in xnn_x24_transposec_ukernel__4x1_scalar()
29 const size_t output_reset = 1 * output_stride - block_height * 3; in xnn_x24_transposec_ukernel__4x1_scalar()
37 uint8_t* o0 = (uint8_t*) output; in xnn_x24_transposec_ukernel__4x1_scalar() local
41 for (; bh >= 4; bh -= 4) { in xnn_x24_transposec_ukernel__4x1_scalar()
42 o0[0] = i0[0]; in xnn_x24_transposec_ukernel__4x1_scalar()
43 o0[1] = i0[1]; in xnn_x24_transposec_ukernel__4x1_scalar()
44 o0[2] = i0[2]; in xnn_x24_transposec_ukernel__4x1_scalar()
[all …]
D4x2-scalar.c1 // Auto-generated file. Do not edit!
2 // Template: src/x24-transposec/scalar.c.in
7 // This source code is licensed under the BSD-style license found in the
28 const size_t input_reset = 6 - round_down_po2(block_height, 4) * input_stride; in xnn_x24_transposec_ukernel__4x2_scalar()
29 const size_t output_reset = 2 * output_stride - block_height * 3; in xnn_x24_transposec_ukernel__4x2_scalar()
37 uint8_t* o0 = (uint8_t*) output; in xnn_x24_transposec_ukernel__4x2_scalar() local
38 uint8_t* o1 = (uint8_t*) ((uintptr_t) o0 + output_stride); in xnn_x24_transposec_ukernel__4x2_scalar()
42 o1 = o0; in xnn_x24_transposec_ukernel__4x2_scalar()
45 for (; bh >= 4; bh -= 4) { in xnn_x24_transposec_ukernel__4x2_scalar()
59 o0[0] = i0[0]; in xnn_x24_transposec_ukernel__4x2_scalar()
[all …]
D4x4-scalar.c1 // Auto-generated file. Do not edit!
2 // Template: src/x24-transposec/scalar.c.in
7 // This source code is licensed under the BSD-style license found in the
28 const size_t input_reset = 12 - round_down_po2(block_height, 4) * input_stride; in xnn_x24_transposec_ukernel__4x4_scalar()
29 const size_t output_reset = 4 * output_stride - block_height * 3; in xnn_x24_transposec_ukernel__4x4_scalar()
37 uint8_t* o0 = (uint8_t*) output; in xnn_x24_transposec_ukernel__4x4_scalar() local
38 uint8_t* o1 = (uint8_t*) ((uintptr_t) o0 + output_stride); in xnn_x24_transposec_ukernel__4x4_scalar()
44 o1 = o0; in xnn_x24_transposec_ukernel__4x4_scalar()
47 o2 = o0; in xnn_x24_transposec_ukernel__4x4_scalar()
50 o3 = o0; in xnn_x24_transposec_ukernel__4x4_scalar()
[all …]
D2x2-scalar.c1 // Auto-generated file. Do not edit!
2 // Template: src/x24-transposec/scalar.c.in
7 // This source code is licensed under the BSD-style license found in the
28 const size_t input_reset = 6 - round_down_po2(block_height, 2) * input_stride; in xnn_x24_transposec_ukernel__2x2_scalar()
29 const size_t output_reset = 2 * output_stride - block_height * 3; in xnn_x24_transposec_ukernel__2x2_scalar()
35 uint8_t* o0 = (uint8_t*) output; in xnn_x24_transposec_ukernel__2x2_scalar() local
36 uint8_t* o1 = (uint8_t*) ((uintptr_t) o0 + output_stride); in xnn_x24_transposec_ukernel__2x2_scalar()
40 o1 = o0; in xnn_x24_transposec_ukernel__2x2_scalar()
43 for (; bh >= 2; bh -= 2) { in xnn_x24_transposec_ukernel__2x2_scalar()
51 o0[0] = i0[0]; in xnn_x24_transposec_ukernel__2x2_scalar()
[all …]
D2x1-scalar.c1 // Auto-generated file. Do not edit!
2 // Template: src/x24-transposec/scalar.c.in
7 // This source code is licensed under the BSD-style license found in the
28 const size_t input_reset = 3 - round_down_po2(block_height, 2) * input_stride; in xnn_x24_transposec_ukernel__2x1_scalar()
29 const size_t output_reset = 1 * output_stride - block_height * 3; in xnn_x24_transposec_ukernel__2x1_scalar()
35 uint8_t* o0 = (uint8_t*) output; in xnn_x24_transposec_ukernel__2x1_scalar() local
39 for (; bh >= 2; bh -= 2) { in xnn_x24_transposec_ukernel__2x1_scalar()
40 o0[0] = i0[0]; in xnn_x24_transposec_ukernel__2x1_scalar()
41 o0[1] = i0[1]; in xnn_x24_transposec_ukernel__2x1_scalar()
42 o0[2] = i0[2]; in xnn_x24_transposec_ukernel__2x1_scalar()
[all …]
D2x4-scalar.c1 // Auto-generated file. Do not edit!
2 // Template: src/x24-transposec/scalar.c.in
7 // This source code is licensed under the BSD-style license found in the
28 const size_t input_reset = 12 - round_down_po2(block_height, 2) * input_stride; in xnn_x24_transposec_ukernel__2x4_scalar()
29 const size_t output_reset = 4 * output_stride - block_height * 3; in xnn_x24_transposec_ukernel__2x4_scalar()
35 uint8_t* o0 = (uint8_t*) output; in xnn_x24_transposec_ukernel__2x4_scalar() local
36 uint8_t* o1 = (uint8_t*) ((uintptr_t) o0 + output_stride); in xnn_x24_transposec_ukernel__2x4_scalar()
42 o1 = o0; in xnn_x24_transposec_ukernel__2x4_scalar()
45 o2 = o0; in xnn_x24_transposec_ukernel__2x4_scalar()
48 o3 = o0; in xnn_x24_transposec_ukernel__2x4_scalar()
[all …]
/external/llvm/test/CodeGen/SPARC/
Dbasictest.ll1 ; RUN: llc < %s -march=sparc | FileCheck %s
6 ; CHECK-LABEL: test0:
7 ; CHECK: add %o0, 1, %o0
14 %B = xor i32 %A, -1
16 ; CHECK-LABEL: test1:
17 ; CHECK: xnor %o0, %o1, %o0
21 %A = xor i32 %X, -1
24 ; CHECK-LABEL: test2:
25 ; CHECK: xnor %o0, %o1, %o0
28 ; CHECK-LABEL: store_zero:
[all …]
/external/libffi/src/sparc/
Dv8.S1 /* -----------------------------------------------------------------------
2 v8.S - Copyright (c) 2013 The Written Word, Inc.
26 ----------------------------------------------------------------------- */
54 1: iflush %o0
63 .size C(ffi_flush_icache), . - C(ffi_flush_icache)
82 mov %i0, %o0 ! copy cif
89 and %o0, SPARC_FLAG_RET_MASK, %l0 ! save return type
90 srl %o0, SPARC_SIZEMASK_SHIFT, %l1 ! save return size
91 ld [%sp+64+4], %o0 ! load all argument registers
107 jmp %o7+(2f-0b)
[all …]
Dv9.S1 /* -----------------------------------------------------------------------
2 v9.S - Copyright (c) 2000, 2003, 2004, 2008 Red Hat, Inc.
4 SPARC 64-bit Foreign Function Interface
25 ----------------------------------------------------------------------- */
62 mov %i0, %o0 ! copy cif
68 andcc %o0, SPARC_FLAG_FP_ARGS, %g0 ! need fp regs?
71 mov %o0, %l0 ! save flags
90 1: ldx [%sp+STACK_BIAS+128], %o0 ! load all int arg regs
103 jmp %o7+(2f-0b)
112 add %sp, STACK_BIAS-64+128+48, %l2
[all …]
/external/XNNPACK/src/f32-prelu/gen/
Dneon-1x16.c1 // Auto-generated file. Do not edit!
2 // Template: src/f32-prelu/neon.c.in
7 // This source code is licensed under the BSD-style license found in the
32 float* o0 = output; in xnn_f32_prelu_ukernel__neon_1x16() local
34 const size_t input_increment = input_stride * 1 - channels; in xnn_f32_prelu_ukernel__neon_1x16()
35 const size_t output_increment = output_stride * 1 - channels; in xnn_f32_prelu_ukernel__neon_1x16()
41 for (; c >= 16 * sizeof(float); c -= 16 * sizeof(float)) { in xnn_f32_prelu_ukernel__neon_1x16()
66 vst1q_f32(o0, vacc0x0123); o0 += 4; in xnn_f32_prelu_ukernel__neon_1x16()
67 vst1q_f32(o0, vacc0x4567); o0 += 4; in xnn_f32_prelu_ukernel__neon_1x16()
68 vst1q_f32(o0, vacc0x89AB); o0 += 4; in xnn_f32_prelu_ukernel__neon_1x16()
[all …]
Dneon-2x16.c1 // Auto-generated file. Do not edit!
2 // Template: src/f32-prelu/neon.c.in
7 // This source code is licensed under the BSD-style license found in the
32 float* o0 = output; in xnn_f32_prelu_ukernel__neon_2x16() local
34 float* o1 = (float*) ((uintptr_t) o0 + output_stride); in xnn_f32_prelu_ukernel__neon_2x16()
36 const size_t input_increment = input_stride * 2 - channels; in xnn_f32_prelu_ukernel__neon_2x16()
37 const size_t output_increment = output_stride * 2 - channels; in xnn_f32_prelu_ukernel__neon_2x16()
42 o1 = o0; in xnn_f32_prelu_ukernel__neon_2x16()
47 for (; c >= 16 * sizeof(float); c -= 16 * sizeof(float)) { in xnn_f32_prelu_ukernel__neon_2x16()
88 vst1q_f32(o0, vacc0x0123); o0 += 4; in xnn_f32_prelu_ukernel__neon_2x16()
[all …]
Davx-2x16.c1 // Auto-generated file. Do not edit!
2 // Template: src/f32-prelu/avx.c.in
7 // This source code is licensed under the BSD-style license found in the
18 static const int32_t mask_table[14] = {-1, -1, -1, -1, -1, -1, -1, 0, 0, 0, 0, 0, 0, 0};
34 float* o0 = output; in xnn_f32_prelu_ukernel__avx_2x16() local
36 float* o1 = (float*) ((uintptr_t) o0 + output_stride); in xnn_f32_prelu_ukernel__avx_2x16()
38 const size_t input_increment = input_stride * 2 - channels; in xnn_f32_prelu_ukernel__avx_2x16()
39 const size_t output_increment = output_stride * 2 - channels; in xnn_f32_prelu_ukernel__avx_2x16()
44 o1 = o0; in xnn_f32_prelu_ukernel__avx_2x16()
49 for (; c >= 16 * sizeof(float); c -= 16 * sizeof(float)) { in xnn_f32_prelu_ukernel__avx_2x16()
[all …]
Dwasmsimd-bitselect-1x16.c1 // Auto-generated file. Do not edit!
2 // Template: src/f32-prelu/wasmsimd-bitselect.c.in
7 // This source code is licensed under the BSD-style license found in the
32 float* o0 = output; in xnn_f32_prelu_ukernel__wasmsimd_bitselect_1x16() local
34 const size_t input_increment = input_stride * 1 - channels; in xnn_f32_prelu_ukernel__wasmsimd_bitselect_1x16()
35 const size_t output_increment = output_stride * 1 - channels; in xnn_f32_prelu_ukernel__wasmsimd_bitselect_1x16()
41 for (; c >= 16 * sizeof(float); c -= 16 * sizeof(float)) { in xnn_f32_prelu_ukernel__wasmsimd_bitselect_1x16()
68 wasm_v128_store(o0, vacc0x0123); in xnn_f32_prelu_ukernel__wasmsimd_bitselect_1x16()
69 wasm_v128_store(o0 + 4, vacc0x4567); in xnn_f32_prelu_ukernel__wasmsimd_bitselect_1x16()
70 wasm_v128_store(o0 + 8, vacc0x89AB); in xnn_f32_prelu_ukernel__wasmsimd_bitselect_1x16()
[all …]
/external/XNNPACK/src/x24-transposec/
D2x2-neon-tbl.c3 // This source code is licensed under the BSD-style license found in the
31 const size_t tile_wbytes_minus_4 = tile_wbytes - 4; in xnn_x24_transposec_ukernel__2x2_neon_tbl()
32 const size_t input_reset = tile_wbytes - round_down_po2(block_height, tile_height) * input_stride; in xnn_x24_transposec_ukernel__2x2_neon_tbl()
33 const size_t output_reset = tile_height * output_stride - block_height * 3; in xnn_x24_transposec_ukernel__2x2_neon_tbl()
40 uint8_t* o0 = (uint8_t*) output; in xnn_x24_transposec_ukernel__2x2_neon_tbl() local
41 uint8_t* o1 = (uint8_t*) ((uintptr_t) o0 + output_stride); in xnn_x24_transposec_ukernel__2x2_neon_tbl()
47 o1 = o0; in xnn_x24_transposec_ukernel__2x2_neon_tbl()
50 for (; bh >= 2; bh -= 2) { in xnn_x24_transposec_ukernel__2x2_neon_tbl()
59 … vst1_lane_u32((void*) o0, vreinterpret_u32_u8(vres0), 0); o0 = (uint8_t*) ((uintptr_t) o0 + 4); in xnn_x24_transposec_ukernel__2x2_neon_tbl()
61 …vst1_lane_u16((void*) o0, vreinterpret_u16_u8(vres0), 2); o0 = (uint8_t*) ((uintptr_t) o0 + tile_w… in xnn_x24_transposec_ukernel__2x2_neon_tbl()
[all …]
/external/XNNPACK/src/f16-prelu/gen/
Dneonfp16arith-2x16.c1 // Auto-generated file. Do not edit!
2 // Template: src/f16-prelu/neonfp16arith.c.in
7 // This source code is licensed under the BSD-style license found in the
32 __fp16* o0 = (__fp16*) output; in xnn_f16_prelu_ukernel__neonfp16arith_2x16() local
34 __fp16* o1 = (__fp16*) ((uintptr_t) o0 + output_stride); in xnn_f16_prelu_ukernel__neonfp16arith_2x16()
36 const size_t input_increment = input_stride * 2 - channels; in xnn_f16_prelu_ukernel__neonfp16arith_2x16()
37 const size_t output_increment = output_stride * 2 - channels; in xnn_f16_prelu_ukernel__neonfp16arith_2x16()
42 o1 = o0; in xnn_f16_prelu_ukernel__neonfp16arith_2x16()
47 for (; c >= 16 * sizeof(__fp16); c -= 16 * sizeof(__fp16)) { in xnn_f16_prelu_ukernel__neonfp16arith_2x16()
70 vst1q_f16(o0, vacc0x001234567); o0 += 8; in xnn_f16_prelu_ukernel__neonfp16arith_2x16()
[all …]

12345678910>>...45