Home
last modified time | relevance | path

Searched refs:warp (Results 1 – 25 of 47) sorted by relevance

12

/external/python/cpython2/Tools/pybench/
Dpybench.py205 warp = 1 variable in Test
219 def __init__(self, warp=None, calibration_runs=None, timer=None): argument
222 if warp is not None:
223 self.rounds = int(self.rounds / warp)
226 self.warp = warp
403 warp = 1 # Warp factor variable in Benchmark
420 def __init__(self, name, verbose=None, timer=None, warp=None, argument
432 if warp is not None:
433 self.warp = warp
489 warp=self.warp,
[all …]
DREADME70 -w arg set warp factor to arg (10)
123 Running 10 round(s) of the suite at warp factor 10:
246 # 1-2 seconds (at warp 1).
350 100-200ms using warp 10
351 - changed default warp factor to 10 (from 20)
/external/llvm-project/llvm/test/CodeGen/NVPTX/
Dbarrier.ll3 declare void @llvm.nvvm.bar.warp.sync(i32)
26 ; CHECK: bar.warp.sync [[ID]];
27 call void @llvm.nvvm.bar.warp.sync(i32 %id)
28 ; CHECK: bar.warp.sync 6;
29 call void @llvm.nvvm.bar.warp.sync(i32 6)
/external/skqp/src/compute/hs/gen/
Dtarget_opencl.c67 hsg_transpose_reg_prefix(state->config->warp.lanes_log2), in hsg_transpose_remap()
181 config->warp.lanes_log2, // FIXME - may be different on a SIMD target in hsg_target_opencl()
182 config->warp.lanes_log2, in hsg_target_opencl()
213 for (uint32_t ii=1; ii<=config->warp.lanes_log2; ii++) in hsg_target_opencl()
224 hsg_transpose(config->warp.lanes_log2, in hsg_target_opencl()
305 m->warps * config->warp.lanes, in hsg_target_opencl()
334 m->warps * config->warp.lanes, in hsg_target_opencl()
500 ops->b * config->warp.lanes, in hsg_target_opencl()
508 ops->b * config->warp.lanes, in hsg_target_opencl()
518 ops->b * config->warp.lanes); in hsg_target_opencl()
[all …]
Dtarget_cuda.c67 hsg_transpose_reg_prefix(state->config->warp.lanes_log2), in hsg_transpose_remap()
179 config->warp.lanes_log2, in hsg_target_cuda()
180 config->warp.lanes_log2, in hsg_target_cuda()
212 for (uint32_t ii=1; ii<=config->warp.lanes_log2; ii++) in hsg_target_cuda()
223 hsg_transpose(config->warp.lanes_log2, in hsg_target_cuda()
336 m->warps * config->warp.lanes, in hsg_target_cuda()
373 m->warps * config->warp.lanes, in hsg_target_cuda()
569 ops->b * config->warp.lanes, in hsg_target_cuda()
577 ops->b * config->warp.lanes, in hsg_target_cuda()
587 ops->b * config->warp.lanes); in hsg_target_cuda()
[all …]
Dtarget_glsl.c67 hsg_transpose_reg_prefix(state->config->warp.lanes_log2), in hsg_transpose_remap()
192 config->warp.lanes_log2, // FIXME -- this matters for SIMD in hsg_target_glsl()
193 config->warp.lanes_log2, in hsg_target_glsl()
224 for (uint32_t ii=1; ii<=config->warp.lanes_log2; ii++) in hsg_target_glsl()
235 hsg_transpose(config->warp.lanes_log2, in hsg_target_glsl()
324 m->warps * config->warp.lanes, in hsg_target_glsl()
369 m->warps * config->warp.lanes, in hsg_target_glsl()
588 ops->b * config->warp.lanes, in hsg_target_glsl()
596 ops->b * config->warp.lanes, in hsg_target_glsl()
606 ops->b * config->warp.lanes); in hsg_target_glsl()
[all …]
Dmain.c149 .warp = {
227 hsg_config.warp.skpw_bs = bs_keys / hsg_merge[0].warps; in hsg_config_init_shared()
240 uint32_t const bs_threads = merge->warps << hsg_config.warp.lanes_log2; in hsg_merge_levels_init_shared()
270 uint32_t const bc_threads = bc_warps_min << hsg_config.warp.lanes_log2; in hsg_merge_levels_init_shared()
728 uint32_t const level = hsg_config.warp.lanes; in hsg_warp_merge()
1014 ops = hsg_warp_half(ops,hsg_config.warp.lanes); in hsg_bs_flip_merge()
1141 ops = hsg_warp_half(ops,hsg_config.warp.lanes); in hsg_bc_clean()
1461 hsg_config.warp.lanes = atoi(optarg); in main()
1462 hsg_config.warp.lanes_log2 = msb_idx_u32(hsg_config.warp.lanes); in main()
Dgen.h64 } warp; member
/external/tensorflow/tensorflow/compiler/tf2xla/kernels/
Dresampler_ops.cc195 XlaOp BoundSamples(XlaOpKernelContext* ctx, XlaOp warp, in BoundSamples() argument
201 xla::Gt(warp, in BoundSamples()
206 warp, in BoundSamples()
249 XlaOp gather_indices, XlaOp warp, in CalculateGradData() argument
284 reshaped_weights = BoundSamples(ctx, warp, warp_type, warp_shape, in CalculateGradData()
512 XlaOp warp = ctx->Input("warp"); in Compile() local
517 XlaOp top_left = xla::ConvertElementType(warp, xla::S32); in Compile()
526 XlaOp ratio = warp - xla::ConvertElementType(top_left, data_type); in Compile()
555 auto is_ge_zero = xla::Ge(warp, xla::ZerosLike(warp)); in Compile()
558 warp, in Compile()
[all …]
/external/llvm-project/openmp/libomptarget/deviceRTLs/nvptx/docs/
DReductionDesign.txt82 ReduceData that is already reduced within a warp to a lane in the first
83 warp with minimal shared memory footprint. This is an essential step to
96 On the warp level, we have three versions of the algorithms:
110 algorithm being used here, is set to 0 to signify full warp reduction.
123 An illustration of this algorithm operating on a hypothetical 8-lane full-warp
162 located in a contiguous subset of threads in a warp starting from lane 0.
171 warp woud be:
222 warp). This particular version of shuffle intrinsic we take accepts only
231 where the first half of the (partial) warp is reduced with the second half
232 of the (partial) warp. This is because, the mapping
[all …]
/external/libgav1/libgav1/src/dsp/
Dwarp.cc433 dsp->warp = Warp_C</*is_compound=*/false, 8, uint8_t>; in Init8bpp()
438 dsp->warp = Warp_C</*is_compound=*/false, 8, uint8_t>; in Init8bpp()
451 dsp->warp = Warp_C</*is_compound=*/false, 10, uint16_t>; in Init10bpp()
456 dsp->warp = Warp_C</*is_compound=*/false, 10, uint16_t>; in Init10bpp()
Dlibgav1_dsp.cmake71 "${libgav1_source}/dsp/warp.cc"
72 "${libgav1_source}/dsp/warp.h"
Ddsp.h854 WarpFunc warp; member
/external/aac/libSBRenc/src/
Dsbrenc_freq_sca.cpp428 FIXP_DBL warp = FL2FXCONST_DBL(0.0f); in FDKsbrEnc_UpdateFreqScale() local
450 warp = FL2FXCONST_DBL(0.5f); /* 1.0/(1.0*2.0) */ in FDKsbrEnc_UpdateFreqScale()
452 warp = FL2FXCONST_DBL(1.0f / 2.6f); /* 1.0/(1.3*2.0); */ in FDKsbrEnc_UpdateFreqScale()
460 num_bands1 = numberOfBands(b_p_o, k1, k2, warp); in FDKsbrEnc_UpdateFreqScale()
/external/rust/crates/tokio/
DREADME.md131 * [`warp`]: A super-easy, composable, web server framework for warp speeds.
146 [`warp`]: https://github.com/seanmonstar/warp
/external/autotest/client/tests/monotonic_time/
Dcontrol14 Based on time-warp-test.c by Ingo Molnar.
/external/llvm-project/openmp/libomptarget/deviceRTLs/amdgcn/src/
Dtarget_impl.hip18 // thread's lane number in the warp
27 // thread's lane number in the warp
/external/arm-trusted-firmware/docs/plat/
Dwarp7.rst88 cp /path/to/linux/arch/boot/dts/imx7s-warp.dtb fiptool_images
104 --hw-config fiptool_images/imx7s-warp.dtb
110 --hw-config fiptool_images/imx7s-warp.dtb \
/external/skqp/src/gpu/effects/
DGrRRectBlurEffect.fp170 // warp the fragment position to the appropriate part of the 9patch blur texture
/external/libgav1/libgav1/src/dsp/arm/
Dwarp_neon.cc434 dsp->warp = Warp_NEON</*is_compound=*/false>; in Init8bpp()
/external/skqp/src/compute/skc/platforms/cl_12/kernels/
Dfills_expand.cl226 // decrement prim_idx by 1 so we can use inclusive warp scan later
Drasterize.cl2275 // iteration of the warp of multi-pixel lines.
2279 // partial warp workloads in the final iteration of each stage. It
2936 // this is a subgroup/warp-centric kernel
3094 // this is a subgroup/warp-centric kernel
3203 // this is a subgroup/warp-centric kernel
3308 // this is a subgroup/warp-centric kernel
/external/libgav1/libgav1/src/dsp/x86/
Dwarp_sse4.cc505 dsp->warp = Warp_SSE4_1</*is_compound=*/false>; in Init8bpp()
/external/libgav1/
DAndroid.bp111 "libgav1/src/dsp/warp.cc",
/external/skqp/src/compute/hs/
DREADME.md290 intra-warp/inter-lane shuffling ― reenable this capability.

12