Searched refs:max_waves (Results 1 - 18 of 18) sorted by relevance

/xsrc/external/mit/MesaLib/dist/src/freedreno/ir3/
H A Dir3_compiler.h129 uint32_t max_waves; member in struct:ir3_compiler
H A Dir3.c141 compiler->threadsize_base * compiler->max_waves;
177 unsigned max_waves = compiler->max_waves; local in function:ir3_get_reg_independent_max_waves
191 max_waves = MIN2(max_waves, waves_per_wg * wgs_per_core *
201 max_waves = MIN2(max_waves, branchstack_max_waves);
204 return max_waves;
216 : compiler->max_waves;
331 info->max_waves
[all...]
H A Dir3_compiler.c96 compiler->max_waves = 16;
H A Dir3.h72 int8_t max_waves; member in struct:ir3_info
/xsrc/external/mit/MesaLib/dist/src/amd/compiler/
H A Daco_live_var_analysis.cpp374 program->max_waves = max_waves_per_simd;
376 /* adjust max_waves for workgroup and LDS limits */
403 program->max_waves = std::min<uint16_t>(
404 program->max_waves,
407 /* incorporate max_waves and calculate max_reg_demand */
408 program->num_waves = std::min<uint16_t>(program->num_waves, program->max_waves);
H A Daco_ir.h2042 uint16_t max_waves = 0; /* maximum number of waves, regardless of register usage */ member in class:aco::Program
2229 /* return number of addressable sgprs/vgprs for max_waves */
2230 uint16_t get_addr_sgpr_from_waves(Program* program, uint16_t max_waves);
2231 uint16_t get_addr_vgpr_from_waves(Program* program, uint16_t max_waves);
/xsrc/external/mit/MesaLib.old/dist/src/amd/vulkan/
H A Dradv_pipeline.c147 unsigned max_waves = 0; local in function:radv_pipeline_scratch_init
160 max_waves = MAX2(max_waves, max_stage_waves);
172 max_waves = MIN2(max_waves, 0xffffffffu / scratch_bytes_per_wave);
174 if (scratch_bytes_per_wave && max_waves < min_waves) {
180 pipeline->max_waves = max_waves;
3494 S_0286E8_WAVES(pipeline->max_waves) |
3883 S_00B860_WAVES(pipeline->max_waves) |
[all...]
H A Dradv_private.h1410 unsigned max_waves; member in struct:radv_pipeline
H A Dradv_cmd_buffer.c898 pipeline->max_waves * pipeline->scratch_bytes_per_wave);
2988 pipeline->max_waves * pipeline->scratch_bytes_per_wave);
/xsrc/external/mit/MesaLib/dist/src/gallium/drivers/freedreno/ir3/
H A Dir3_gallium.c98 v->info.ss, v->info.sy, v->info.max_waves, v->max_sun, v->loops);
/xsrc/external/mit/MesaLib/dist/src/gallium/drivers/radeonsi/
H A Dgfx10_shader_ngg.c667 unsigned max_waves, LLVMValueRef tid,
673 unsigned num_i8vec4 = DIV_ROUND_UP(max_waves, 4);
698 if (max_waves > 4) {
713 LLVMTypeRef type = max_waves > 4 ? ctx->ac.i64 : ctx->ac.i32;
824 unsigned max_waves = DIV_ROUND_UP(ctx->screen->ngg_subgroup_size, ctx->ac.wave_size); local in function:gfx10_emit_ngg_culling_epilogue
1053 load_vertex_counts(ctx, ctx->gs_ngg_scratch, max_waves, tid, &new_num_es_threads,
666 load_vertex_counts(struct si_shader_context * ctx,LLVMValueRef lds,unsigned max_waves,LLVMValueRef tid,LLVMValueRef * total_count,LLVMValueRef * prefix_sum) argument
/xsrc/external/mit/MesaLib/dist/src/amd/vulkan/
H A Dradv_pipeline.c245 unsigned max_waves = 0; local in function:radv_pipeline_init_scratch
257 max_waves = MAX2(max_waves, max_stage_waves);
262 pipeline->max_waves = max_waves;
5992 unsigned max_waves = radv_get_max_waves(device, shader, stage); local in function:radv_GetPipelineExecutableStatisticsKHR
6058 s->value.u64 = max_waves;
H A Dradv_private.h1842 unsigned max_waves; member in struct:radv_pipeline
H A Dradv_cmd_buffer.c1317 cmd_buffer->scratch_waves_wanted = MAX2(cmd_buffer->scratch_waves_wanted, pipeline->max_waves);
4838 MAX2(cmd_buffer->compute_scratch_waves_wanted, pipeline->max_waves);
/xsrc/external/mit/MesaLib/dist/src/freedreno/vulkan/
H A Dtu_pipeline.c3479 stat->value.u64 = exe->stats.max_waves;
/xsrc/external/mit/MesaLib/dist/docs/relnotes/
H A D19.3.0.rst803 - aco: restrict scheduling depending on max_waves
2857 - radv: round vgprs/sgprs before calculating max_waves
H A D21.1.0.rst1312 - ir3: Calcuate max_waves and threadsize
1316 - freedreno: Report max_waves in shaderdb output
4703 - radv: fix max_waves estimation on GFX10.3
H A D21.2.0.rst3528 - radeonsi: set more precise max_waves in NGG code

Completed in 97 milliseconds