Home
last modified time | relevance | path

Searched refs:num_waves (Results 1 – 12 of 12) sorted by relevance

/external/mesa3d/src/amd/compiler/
Daco_scheduler.cpp32 #define SMEM_WINDOW_SIZE (350 - ctx.num_waves * 35)
33 #define VMEM_WINDOW_SIZE (1024 - ctx.num_waves * 64)
35 #define SMEM_MAX_MOVES (64 - ctx.num_waves * 4)
36 #define VMEM_MAX_MOVES (128 - ctx.num_waves * 8)
38 #define VMEM_CLAUSE_MAX_GRAB_DIST ((ctx.num_waves - 1) * 8)
86 int16_t num_waves; member
651 ctx.last_SMEM_stall = 10 - ctx.num_waves - k; in schedule_SMEM()
904 if (program->num_waves <= 5) in schedule_program()
905 ctx.num_waves = program->num_waves; in schedule_program()
907 ctx.num_waves = 5; in schedule_program()
[all …]
Daco_live_var_analysis.cpp349 program->num_waves = 0; in update_vgpr_sgpr_demand()
352 program->num_waves = program->physical_sgprs / get_sgpr_alloc(program, new_demand.sgpr); in update_vgpr_sgpr_demand()
353 …program->num_waves = std::min<uint16_t>(program->num_waves, 256 / get_vgpr_alloc(program, new_dema… in update_vgpr_sgpr_demand()
372 program->num_waves = std::min<uint16_t>(program->num_waves, program->max_waves); in update_vgpr_sgpr_demand()
373 program->max_reg_demand.vgpr = get_addr_vgpr_from_waves(program, program->num_waves); in update_vgpr_sgpr_demand()
374 program->max_reg_demand.sgpr = get_addr_sgpr_from_waves(program, program->num_waves); in update_vgpr_sgpr_demand()
Daco_spill.cpp1770 if (program->num_waves > 0) in spill()
1802 assert(program->num_waves > 0); in spill()
Daco_ir.h1620 uint16_t num_waves = 0; variable
/external/llvm-project/openmp/libomptarget/deviceRTLs/amdgcn/src/
Dtarget_impl.hip78 uint32_t num_waves = num_threads / WARPSIZE;
87 assert(num_waves != 0);
88 assert(num_waves * WARPSIZE == num_threads);
89 assert(num_waves < 0xffffu);
102 if ((load & 0x0000ffffu) == (num_waves - 1)) {
103 // Reached num_waves in low bits so this is the last wave.
/external/mesa3d/src/amd/vulkan/
Dradv_debug.c300 unsigned num_waves, FILE *f) in radv_dump_annotated_shader() argument
312 for (i = 0; i < num_waves; i++) { in radv_dump_annotated_shader()
317 if (i == num_waves) in radv_dump_annotated_shader()
322 num_waves -= i; in radv_dump_annotated_shader()
344 while (num_waves && start_addr + inst->offset == waves->pc) { in radv_dump_annotated_shader()
361 num_waves--; in radv_dump_annotated_shader()
375 unsigned num_waves = ac_get_wave_info(chip_class, waves); in radv_dump_annotated_shaders() local
378 "\n\n", num_waves); in radv_dump_annotated_shaders()
385 stage, waves, num_waves, f); in radv_dump_annotated_shaders()
391 for (i = 0; i < num_waves; i++) { in radv_dump_annotated_shaders()
/external/mesa3d/src/gallium/drivers/radeonsi/
Dsi_debug.c923 unsigned num_waves, FILE *f) in si_print_annotated_shader() argument
935 for (i = 0; i < num_waves; i++) { in si_print_annotated_shader()
939 if (i == num_waves) in si_print_annotated_shader()
944 num_waves -= i; in si_print_annotated_shader()
986 while (num_waves && inst->addr == waves->pc) { in si_print_annotated_shader()
1000 num_waves--; in si_print_annotated_shader()
1013 unsigned num_waves = ac_get_wave_info(sctx->chip_class, waves); in si_dump_annotated_shaders() local
1015 fprintf(f, COLOR_CYAN "The number of active waves = %u" COLOR_RESET "\n\n", num_waves); in si_dump_annotated_shaders()
1017 si_print_annotated_shader(sctx->vs_shader.current, waves, num_waves, f); in si_dump_annotated_shaders()
1018 si_print_annotated_shader(sctx->tcs_shader.current, waves, num_waves, f); in si_dump_annotated_shaders()
[all …]
/external/mesa3d/src/amd/common/
Dac_debug.c777 unsigned num_waves = 0; in ac_get_wave_info() local
794 assert(num_waves < AC_MAX_WAVES_PER_CHIP); in ac_get_wave_info()
795 w = &waves[num_waves]; in ac_get_wave_info()
803 num_waves++; in ac_get_wave_info()
807 qsort(waves, num_waves, sizeof(struct ac_wave_info), compare_wave); in ac_get_wave_info()
810 return num_waves; in ac_get_wave_info()
/external/mesa3d/src/gallium/drivers/r600/
Devergreen_compute.c604 unsigned num_waves; in evergreen_emit_dispatch() local
625 num_waves = (info->block[0] * info->block[1] * info->block[2] + in evergreen_emit_dispatch()
631 num_pipes, num_waves, lds_size); in evergreen_emit_dispatch()
657 lds_size | (num_waves << 14)); in evergreen_emit_dispatch()
Devergreen_state.c4519 unsigned num_waves; in evergreen_setup_tess_constants() local
4580 num_waves = ceilf((float)(*num_patches * num_tcs_output_cp) / (float)wave_divisor); in evergreen_setup_tess_constants()
4582 rctx->lds_alloc = (lds_size | (num_waves << 14)); in evergreen_setup_tess_constants()
/external/mesa3d/docs/relnotes/
D20.3.1.rst160 - aco: Use program->num_waves as maximum in scheduler.
D19.3.0.rst2859 - aco: take LDS into account when calculating num_waves