Searched refs:msb_idx_u32 (Results 1 – 9 of 9) sorted by relevance
60 return 1u << msb_idx_u32(n); in pow2_rd_u32()68 msb_idx_u32(uint32_t n) in msb_idx_u32() function
25 uint32_t msb_idx_u32(uint32_t n); // 0-based bit position
150 uint32_t const bc_max = msb_idx_u32(pow2_rd_u32(merge->warps)); in hsg_target_cuda()186 msb_idx_u32(pow2_ru_u32(merge->warps)), in hsg_target_cuda()311 uint32_t const msb = msb_idx_u32(bs); in hsg_target_cuda()357 uint32_t const msb = msb_idx_u32(m->warps); in hsg_target_cuda()407 uint32_t const msb = msb_idx_u32(pow2_ru_u32(merge[0].warps)); in hsg_target_cuda()
153 uint32_t const bc_max = msb_idx_u32(pow2_rd_u32(merge->warps)); in hsg_target_opencl()187 msb_idx_u32(pow2_ru_u32(merge->warps)), in hsg_target_opencl()289 uint32_t const msb = msb_idx_u32(bs); in hsg_target_opencl()318 uint32_t const msb = msb_idx_u32(m->warps); in hsg_target_opencl()
166 uint32_t const bc_max = msb_idx_u32(pow2_rd_u32(merge->warps)); in hsg_target_glsl()198 msb_idx_u32(pow2_ru_u32(merge->warps)), in hsg_target_glsl()303 uint32_t const msb = msb_idx_u32(bs); in hsg_target_glsl()348 uint32_t const msb = msb_idx_u32(m->warps); in hsg_target_glsl()
1235 ops = hsg_op(ops,FM_KERNEL_PROTO(scale_log2,msb_idx_u32(pow2_ru_u32(span_right)))); in hsg_fm_merge()1462 hsg_config.warp.lanes_log2 = msb_idx_u32(hsg_config.warp.lanes); in main()
411 hs->pipelines.fm[scale_log2][msb_idx_u32(frac_fm)]); in hs_fm()446 uint32_t const frac_idx = msb_idx_u32(frac_bs); in hs_bs()451 hs->pipelines.bs[msb_idx_u32(frac_bs)]); in hs_bs()829 uint32_t const bs_slabs_log2_ru = msb_idx_u32(pow2_ru_u32(target->config.block.slabs)); in hs_vk_create()830 uint32_t const bc_slabs_log2_max = msb_idx_u32(pow2_rd_u32(target->config.block.slabs)); in hs_vk_create()847 count_fm[scale] = msb_idx_u32(pow2_ru_u32(fm_left)) + 1; in hs_vk_create()
438 cl_kernel kernel_frac = hs->kernels.fm[scale_log2][msb_idx_u32(fm_frac)]; in hs_fm_enqueue()578 cl_kernel kernel_frac = hs->kernels.bs[msb_idx_u32(frac)]; in hs_bs_enqueue()1040 uint32_t const bs_slabs_log2_ru = msb_idx_u32(pow2_ru_u32(target->config.block.slabs)); in hs_cl_create()1041 uint32_t const bc_slabs_log2_max = msb_idx_u32(pow2_rd_u32(target->config.block.slabs)); in hs_cl_create()1058 count_fm[scale] = msb_idx_u32(pow2_ru_u32(fm_left)) + 1; in hs_cl_create()
776 hs_kernels_offset_fm[scale_log2-HS_FM_SCALE_MIN][msb_idx_u32(frac_fm)]820 hs_kernels_offset_bs[msb_idx_u32(frac_bs)]