Home
last modified time | relevance | path

Searched refs:lds_size (Results 1 – 25 of 27) sorted by relevance

12

/external/llvm-project/llvm/test/CodeGen/AMDGPU/GlobalISel/
Dpostlegalizercombiner-and.mir196 ; CHECK: %lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize)
198 ; CHECK: %and:_(s32) = G_AND %lds_size, %mask
201 %lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize)
203 %and:_(s32) = G_AND %lds_size, %mask
217 ; CHECK: %lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize)
218 ; CHECK: $vgpr0 = COPY %lds_size(s32)
220 %lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize)
222 %and:_(s32) = G_AND %lds_size, %mask
236 ; CHECK: %lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize)
238 ; CHECK: %and:_(s32) = G_AND %lds_size, %mask
[all …]
/external/mesa3d/src/amd/vulkan/
Dradv_shader.h227 uint32_t lds_size; member
529 unsigned lds_size = output_patch0_offset + output_patch_size * tcs_num_patches; in calculate_tess_lds_size() local
532 assert(lds_size <= 65536); in calculate_tess_lds_size()
533 lds_size = align(lds_size, 512) / 512; in calculate_tess_lds_size()
535 assert(lds_size <= 32768); in calculate_tess_lds_size()
536 lds_size = align(lds_size, 256) / 256; in calculate_tess_lds_size()
539 return lds_size; in calculate_tess_lds_size()
Dradv_shader.c1026 S_00B84C_LDS_SIZE(config_in->lds_size) | in radv_postprocess_config()
1067 S_00B22C_LDS_SIZE(config_in->lds_size) | in radv_postprocess_config()
1173 if (rtld_binary.lds_size > 0) { in radv_shader_variant_create()
1175 config.lds_size = align(rtld_binary.lds_size, alloc_granularity) / alloc_granularity; in radv_shader_variant_create()
1537 lds_per_wave = conf->lds_size * lds_increment + in radv_get_max_waves()
1543 lds_per_wave = (conf->lds_size * lds_increment) / in radv_get_max_waves()
1619 statistics.resourceUsage.ldsUsageSizeInBytes = conf->lds_size * lds_multiplier; in radv_GetShaderInfoAMD()
Dradv_rgp.c264 int32_t lds_size; member
388 chunk->lds_size = rad_info->lds_size_per_workgroup; in radv_fill_sqtt_asic_info()
Dradv_pipeline.c1892 out->lds_size = align(esgs_lds_size, 128) / 128; in gfx9_get_gs_info()
4649 radeon_emit(cs, gs->config.rsrc2 | S_00B22C_LDS_SIZE(gs_state->lds_size)); in radv_pipeline_generate_hw_gs()
5744 s->value.u64 = shader->config.lds_size * lds_increment; in radv_GetPipelineExecutableStatisticsKHR()
/external/mesa3d/src/amd/common/
Dac_binary.c65 conf->lds_size = MAX2(conf->lds_size, G_00B02C_EXTRA_LDS_SIZE(value)); in ac_parse_shader_binary_config()
83 conf->lds_size = MAX2(conf->lds_size, G_00B84C_LDS_SIZE(value)); in ac_parse_shader_binary_config()
Dac_rtld.c313 binary->lds_size = shared_lds_size; in ac_rtld_open()
393 binary->lds_size = MAX2(binary->lds_size, part_lds_size); in ac_rtld_open()
404 binary->lds_size = align(binary->lds_size, lds_end_align); in ac_rtld_open()
411 lds_end->offset = binary->lds_size; in ac_rtld_open()
415 if (binary->lds_size > max_lds_size) { in ac_rtld_open()
417 (unsigned)binary->lds_size, max_lds_size); in ac_rtld_open()
543 config->lds_size = MAX2(config->lds_size, c.lds_size); in ac_rtld_read_config()
Dac_binary.h43 unsigned lds_size; /* in HW allocation units; i.e 256 bytes on SI, 512 bytes on CI+ */ member
Dac_rtld.h73 uint32_t lds_size; member
/external/llvm/test/CodeGen/AMDGPU/
Dllvm.amdgcn.groupstaticgroup.ll11 define void @get_groupstaticsize_test0(float addrspace(1)* %out, i32 addrspace(1)* %lds_size) #0 {
15 store i32 %static_lds_size, i32 addrspace(1)* %lds_size, align 4
26 define void @groupstaticsize_test1(float addrspace(1)* %out, i32 %cond, i32 addrspace(1)* %lds_size
29 store i32 %static_lds_size, i32 addrspace(1)* %lds_size, align 4
/external/llvm-project/llvm/test/CodeGen/AMDGPU/
Dllvm.amdgcn.groupstaticsize.ll17 …dgpu_kernel void @groupstaticsize_test0(float addrspace(1)* %out, i32 addrspace(1)* %lds_size) #0 {
21 store i32 %static_lds_size, i32 addrspace(1)* %lds_size, align 4
32 …nel void @groupstaticsize_test1(float addrspace(1)* %out, i32 %cond, i32 addrspace(1)* %lds_size) {
35 store i32 %static_lds_size, i32 addrspace(1)* %lds_size, align 4
Dpal-userdata-regs.ll16 …mit\CD\01\00\A3.hs\82\AB.sgpr_limith\AB.vgpr_limit\CD\01\00\A3.ls\83\A9.lds_size\CD\03\00\AB.sgpr_…
/external/mesa3d/src/amd/compiler/
Daco_instruction_selection_setup.cpp392 unsigned lds_size = ctx->program->info->ngg_info.esgs_ring_size; in setup_vs_variables() local
393 ctx->program->config->lds_size = (lds_size + ctx->program->lds_alloc_granule - 1) / in setup_vs_variables()
401 …ctx->program->config->lds_size = ctx->program->info->gs_ring_info.lds_size; /* Already in units of… in setup_gs_variables()
419 …ctx->program->config->lds_size = (total_lds_bytes + ctx->program->lds_alloc_granule - 1) / ctx->pr… in setup_gs_variables()
471 unsigned lds_size = calculate_tess_lds_size( in setup_tcs_info() local
481 ctx->args->shader_info->tcs.num_lds_blocks = lds_size; in setup_tcs_info()
482 ctx->program->config->lds_size = (lds_size + ctx->program->lds_alloc_granule - 1) / in setup_tcs_info()
514 …ctx->program->config->lds_size = (nir->info.cs.shared_size + ctx->program->lds_alloc_granule - 1) / in setup_variables()
538 …assert((ctx->program->config->lds_size * ctx->program->lds_alloc_granule) <= ctx->program->lds_lim… in setup_variables()
Daco_live_var_analysis.cpp359 if (program->config->lds_size) { in update_vgpr_sgpr_demand()
360 unsigned lds = program->config->lds_size * program->lds_alloc_granule; in update_vgpr_sgpr_demand()
/external/mesa3d/src/gallium/drivers/radeonsi/
Dsi_state_draw.c86 unsigned perpatch_output_offset, lds_size; in si_emit_derived_tess_state() local
230 lds_size = output_patch0_offset + output_patch_size * *num_patches; in si_emit_derived_tess_state()
233 assert(lds_size <= 65536); in si_emit_derived_tess_state()
234 lds_size = align(lds_size, 512) / 512; in si_emit_derived_tess_state()
236 assert(lds_size <= 32768); in si_emit_derived_tess_state()
237 lds_size = align(lds_size, 256) / 256; in si_emit_derived_tess_state()
247 assert(ls_current->config.lds_size == 0); in si_emit_derived_tess_state()
253 hs_rsrc2 |= S_00B42C_LDS_SIZE_GFX10(lds_size); in si_emit_derived_tess_state()
255 hs_rsrc2 |= S_00B42C_LDS_SIZE_GFX9(lds_size); in si_emit_derived_tess_state()
268 si_multiwave_lds_size_workaround(sctx->screen, &lds_size); in si_emit_derived_tess_state()
[all …]
Dsi_shader.c839 if (rtld->lds_size > 0) { in si_shader_binary_open()
841 shader->config.lds_size = align(rtld->lds_size, alloc_granularity) / alloc_granularity; in si_shader_binary_open()
991 lds_per_wave = conf->lds_size * lds_increment + align(num_inputs * 48, lds_increment); in si_calculate_max_simd_waves()
995 lds_per_wave = (conf->lds_size * lds_increment) / in si_calculate_max_simd_waves()
1036 conf->lds_size, conf->scratch_bytes_per_wave, shader->info.max_simd_waves, in si_shader_dump_stats_for_shader_db()
1068 conf->lds_size, conf->scratch_bytes_per_wave, shader->info.max_simd_waves); in si_shader_dump_stats()
2414 void si_multiwave_lds_size_workaround(struct si_screen *sscreen, unsigned *lds_size) in si_multiwave_lds_size_workaround() argument
2426 *lds_size = MAX2(*lds_size, 8); in si_multiwave_lds_size_workaround()
2437 si_multiwave_lds_size_workaround(sscreen, &shader->config.lds_size); in si_fix_resource_usage()
Dsi_compute.c103 out_config->lds_size = MAX2(out_config->lds_size, G_00B84C_LDS_SIZE(rsrc2)); in code_object_to_config()
211 S_00B84C_LDS_SIZE(shader->config.lds_size); in si_create_compute_state_async()
465 lds_blocks = config->lds_size; in si_switch_compute_shader()
Dsi_shader_llvm.c366 unsigned lds_size = sel->info.base.cs.shared_size; in si_llvm_declare_compute_memory() local
373 var = LLVMAddGlobalInAddressSpace(ctx->ac.module, LLVMArrayType(ctx->ac.i8, lds_size), in si_llvm_declare_compute_memory()
Dsi_shader.h842 void si_multiwave_lds_size_workaround(struct si_screen *sscreen, unsigned *lds_size);
Dsi_state_shaders.c876 S_00B22C_LDS_SIZE(shader->config.lds_size) | in si_shader_gs()
1161 S_00B22C_LDS_SIZE(shader->config.lds_size)); in gfx10_shader_ngg()
1687 S_00B02C_EXTRA_LDS_SIZE(shader->config.lds_size) | in si_shader_ps()
Dsi_compute_prim_discard.c1389 S_00B84C_LDS_SIZE(shader->config.lds_size)); in si_dispatch_prim_discard_cs_and_draw()
/external/mesa3d/src/gallium/drivers/r600/
Devergreen_compute.c609 unsigned lds_size = shader->local_size / 4; in evergreen_emit_dispatch() local
613 lds_size += shader->bc.nlds_dw; in evergreen_emit_dispatch()
631 num_pipes, num_waves, lds_size); in evergreen_emit_dispatch()
649 assert(lds_size <= 8192); in evergreen_emit_dispatch()
653 assert(lds_size <= 8160); in evergreen_emit_dispatch()
657 lds_size | (num_waves << 14)); in evergreen_emit_dispatch()
Devergreen_state.c4517 unsigned output_patch0_offset, perpatch_output_offset, lds_size; in evergreen_setup_tess_constants() local
4566 lds_size = output_patch0_offset + output_patch_size * *num_patches; in evergreen_setup_tess_constants()
4582 rctx->lds_alloc = (lds_size | (num_waves << 14)); in evergreen_setup_tess_constants()
/external/llvm/lib/Target/AMDGPU/Utils/
DAMDKernelCodeTInfo.h115 COMPPGM2(lds_size, LDS_SIZE),
/external/mesa3d/src/amd/llvm/
Dac_llvm_build.c2948 unsigned lds_size = ctx->chip_class >= GFX7 ? 65536 : 32768; in ac_declare_lds_as_pointer() local
2951 LLVMPointerType(LLVMArrayType(ctx->i32, lds_size / 4), AC_ADDR_SPACE_LDS), "lds"); in ac_declare_lds_as_pointer()

12