/external/llvm-project/llvm/test/CodeGen/AMDGPU/GlobalISel/ |
D | postlegalizercombiner-and.mir | 196 ; CHECK: %lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize) 198 ; CHECK: %and:_(s32) = G_AND %lds_size, %mask 201 %lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize) 203 %and:_(s32) = G_AND %lds_size, %mask 217 ; CHECK: %lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize) 218 ; CHECK: $vgpr0 = COPY %lds_size(s32) 220 %lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize) 222 %and:_(s32) = G_AND %lds_size, %mask 236 ; CHECK: %lds_size:_(s32) = G_INTRINSIC intrinsic(@llvm.amdgcn.groupstaticsize) 238 ; CHECK: %and:_(s32) = G_AND %lds_size, %mask [all …]
|
/external/mesa3d/src/amd/vulkan/ |
D | radv_shader.h | 227 uint32_t lds_size; member 529 unsigned lds_size = output_patch0_offset + output_patch_size * tcs_num_patches; in calculate_tess_lds_size() local 532 assert(lds_size <= 65536); in calculate_tess_lds_size() 533 lds_size = align(lds_size, 512) / 512; in calculate_tess_lds_size() 535 assert(lds_size <= 32768); in calculate_tess_lds_size() 536 lds_size = align(lds_size, 256) / 256; in calculate_tess_lds_size() 539 return lds_size; in calculate_tess_lds_size()
|
D | radv_shader.c | 1026 S_00B84C_LDS_SIZE(config_in->lds_size) | in radv_postprocess_config() 1067 S_00B22C_LDS_SIZE(config_in->lds_size) | in radv_postprocess_config() 1173 if (rtld_binary.lds_size > 0) { in radv_shader_variant_create() 1175 config.lds_size = align(rtld_binary.lds_size, alloc_granularity) / alloc_granularity; in radv_shader_variant_create() 1537 lds_per_wave = conf->lds_size * lds_increment + in radv_get_max_waves() 1543 lds_per_wave = (conf->lds_size * lds_increment) / in radv_get_max_waves() 1619 statistics.resourceUsage.ldsUsageSizeInBytes = conf->lds_size * lds_multiplier; in radv_GetShaderInfoAMD()
|
D | radv_rgp.c | 264 int32_t lds_size; member 388 chunk->lds_size = rad_info->lds_size_per_workgroup; in radv_fill_sqtt_asic_info()
|
D | radv_pipeline.c | 1892 out->lds_size = align(esgs_lds_size, 128) / 128; in gfx9_get_gs_info() 4649 radeon_emit(cs, gs->config.rsrc2 | S_00B22C_LDS_SIZE(gs_state->lds_size)); in radv_pipeline_generate_hw_gs() 5744 s->value.u64 = shader->config.lds_size * lds_increment; in radv_GetPipelineExecutableStatisticsKHR()
|
/external/mesa3d/src/amd/common/ |
D | ac_binary.c | 65 conf->lds_size = MAX2(conf->lds_size, G_00B02C_EXTRA_LDS_SIZE(value)); in ac_parse_shader_binary_config() 83 conf->lds_size = MAX2(conf->lds_size, G_00B84C_LDS_SIZE(value)); in ac_parse_shader_binary_config()
|
D | ac_rtld.c | 313 binary->lds_size = shared_lds_size; in ac_rtld_open() 393 binary->lds_size = MAX2(binary->lds_size, part_lds_size); in ac_rtld_open() 404 binary->lds_size = align(binary->lds_size, lds_end_align); in ac_rtld_open() 411 lds_end->offset = binary->lds_size; in ac_rtld_open() 415 if (binary->lds_size > max_lds_size) { in ac_rtld_open() 417 (unsigned)binary->lds_size, max_lds_size); in ac_rtld_open() 543 config->lds_size = MAX2(config->lds_size, c.lds_size); in ac_rtld_read_config()
|
D | ac_binary.h | 43 unsigned lds_size; /* in HW allocation units; i.e 256 bytes on SI, 512 bytes on CI+ */ member
|
D | ac_rtld.h | 73 uint32_t lds_size; member
|
/external/llvm/test/CodeGen/AMDGPU/ |
D | llvm.amdgcn.groupstaticgroup.ll | 11 define void @get_groupstaticsize_test0(float addrspace(1)* %out, i32 addrspace(1)* %lds_size) #0 { 15 store i32 %static_lds_size, i32 addrspace(1)* %lds_size, align 4 26 define void @groupstaticsize_test1(float addrspace(1)* %out, i32 %cond, i32 addrspace(1)* %lds_size… 29 store i32 %static_lds_size, i32 addrspace(1)* %lds_size, align 4
|
/external/llvm-project/llvm/test/CodeGen/AMDGPU/ |
D | llvm.amdgcn.groupstaticsize.ll | 17 …dgpu_kernel void @groupstaticsize_test0(float addrspace(1)* %out, i32 addrspace(1)* %lds_size) #0 { 21 store i32 %static_lds_size, i32 addrspace(1)* %lds_size, align 4 32 …nel void @groupstaticsize_test1(float addrspace(1)* %out, i32 %cond, i32 addrspace(1)* %lds_size) { 35 store i32 %static_lds_size, i32 addrspace(1)* %lds_size, align 4
|
D | pal-userdata-regs.ll | 16 …mit\CD\01\00\A3.hs\82\AB.sgpr_limith\AB.vgpr_limit\CD\01\00\A3.ls\83\A9.lds_size\CD\03\00\AB.sgpr_…
|
/external/mesa3d/src/amd/compiler/ |
D | aco_instruction_selection_setup.cpp | 392 unsigned lds_size = ctx->program->info->ngg_info.esgs_ring_size; in setup_vs_variables() local 393 ctx->program->config->lds_size = (lds_size + ctx->program->lds_alloc_granule - 1) / in setup_vs_variables() 401 …ctx->program->config->lds_size = ctx->program->info->gs_ring_info.lds_size; /* Already in units of… in setup_gs_variables() 419 …ctx->program->config->lds_size = (total_lds_bytes + ctx->program->lds_alloc_granule - 1) / ctx->pr… in setup_gs_variables() 471 unsigned lds_size = calculate_tess_lds_size( in setup_tcs_info() local 481 ctx->args->shader_info->tcs.num_lds_blocks = lds_size; in setup_tcs_info() 482 ctx->program->config->lds_size = (lds_size + ctx->program->lds_alloc_granule - 1) / in setup_tcs_info() 514 …ctx->program->config->lds_size = (nir->info.cs.shared_size + ctx->program->lds_alloc_granule - 1) / in setup_variables() 538 …assert((ctx->program->config->lds_size * ctx->program->lds_alloc_granule) <= ctx->program->lds_lim… in setup_variables()
|
D | aco_live_var_analysis.cpp | 359 if (program->config->lds_size) { in update_vgpr_sgpr_demand() 360 unsigned lds = program->config->lds_size * program->lds_alloc_granule; in update_vgpr_sgpr_demand()
|
/external/mesa3d/src/gallium/drivers/radeonsi/ |
D | si_state_draw.c | 86 unsigned perpatch_output_offset, lds_size; in si_emit_derived_tess_state() local 230 lds_size = output_patch0_offset + output_patch_size * *num_patches; in si_emit_derived_tess_state() 233 assert(lds_size <= 65536); in si_emit_derived_tess_state() 234 lds_size = align(lds_size, 512) / 512; in si_emit_derived_tess_state() 236 assert(lds_size <= 32768); in si_emit_derived_tess_state() 237 lds_size = align(lds_size, 256) / 256; in si_emit_derived_tess_state() 247 assert(ls_current->config.lds_size == 0); in si_emit_derived_tess_state() 253 hs_rsrc2 |= S_00B42C_LDS_SIZE_GFX10(lds_size); in si_emit_derived_tess_state() 255 hs_rsrc2 |= S_00B42C_LDS_SIZE_GFX9(lds_size); in si_emit_derived_tess_state() 268 si_multiwave_lds_size_workaround(sctx->screen, &lds_size); in si_emit_derived_tess_state() [all …]
|
D | si_shader.c | 839 if (rtld->lds_size > 0) { in si_shader_binary_open() 841 shader->config.lds_size = align(rtld->lds_size, alloc_granularity) / alloc_granularity; in si_shader_binary_open() 991 lds_per_wave = conf->lds_size * lds_increment + align(num_inputs * 48, lds_increment); in si_calculate_max_simd_waves() 995 lds_per_wave = (conf->lds_size * lds_increment) / in si_calculate_max_simd_waves() 1036 conf->lds_size, conf->scratch_bytes_per_wave, shader->info.max_simd_waves, in si_shader_dump_stats_for_shader_db() 1068 conf->lds_size, conf->scratch_bytes_per_wave, shader->info.max_simd_waves); in si_shader_dump_stats() 2414 void si_multiwave_lds_size_workaround(struct si_screen *sscreen, unsigned *lds_size) in si_multiwave_lds_size_workaround() argument 2426 *lds_size = MAX2(*lds_size, 8); in si_multiwave_lds_size_workaround() 2437 si_multiwave_lds_size_workaround(sscreen, &shader->config.lds_size); in si_fix_resource_usage()
|
D | si_compute.c | 103 out_config->lds_size = MAX2(out_config->lds_size, G_00B84C_LDS_SIZE(rsrc2)); in code_object_to_config() 211 S_00B84C_LDS_SIZE(shader->config.lds_size); in si_create_compute_state_async() 465 lds_blocks = config->lds_size; in si_switch_compute_shader()
|
D | si_shader_llvm.c | 366 unsigned lds_size = sel->info.base.cs.shared_size; in si_llvm_declare_compute_memory() local 373 var = LLVMAddGlobalInAddressSpace(ctx->ac.module, LLVMArrayType(ctx->ac.i8, lds_size), in si_llvm_declare_compute_memory()
|
D | si_shader.h | 842 void si_multiwave_lds_size_workaround(struct si_screen *sscreen, unsigned *lds_size);
|
D | si_state_shaders.c | 876 S_00B22C_LDS_SIZE(shader->config.lds_size) | in si_shader_gs() 1161 S_00B22C_LDS_SIZE(shader->config.lds_size)); in gfx10_shader_ngg() 1687 S_00B02C_EXTRA_LDS_SIZE(shader->config.lds_size) | in si_shader_ps()
|
D | si_compute_prim_discard.c | 1389 S_00B84C_LDS_SIZE(shader->config.lds_size)); in si_dispatch_prim_discard_cs_and_draw()
|
/external/mesa3d/src/gallium/drivers/r600/ |
D | evergreen_compute.c | 609 unsigned lds_size = shader->local_size / 4; in evergreen_emit_dispatch() local 613 lds_size += shader->bc.nlds_dw; in evergreen_emit_dispatch() 631 num_pipes, num_waves, lds_size); in evergreen_emit_dispatch() 649 assert(lds_size <= 8192); in evergreen_emit_dispatch() 653 assert(lds_size <= 8160); in evergreen_emit_dispatch() 657 lds_size | (num_waves << 14)); in evergreen_emit_dispatch()
|
D | evergreen_state.c | 4517 unsigned output_patch0_offset, perpatch_output_offset, lds_size; in evergreen_setup_tess_constants() local 4566 lds_size = output_patch0_offset + output_patch_size * *num_patches; in evergreen_setup_tess_constants() 4582 rctx->lds_alloc = (lds_size | (num_waves << 14)); in evergreen_setup_tess_constants()
|
/external/llvm/lib/Target/AMDGPU/Utils/ |
D | AMDKernelCodeTInfo.h | 115 COMPPGM2(lds_size, LDS_SIZE),
|
/external/mesa3d/src/amd/llvm/ |
D | ac_llvm_build.c | 2948 unsigned lds_size = ctx->chip_class >= GFX7 ? 65536 : 32768; in ac_declare_lds_as_pointer() local 2951 LLVMPointerType(LLVMArrayType(ctx->i32, lds_size / 4), AC_ADDR_SPACE_LDS), "lds"); in ac_declare_lds_as_pointer()
|