summaryrefslogtreecommitdiff
path: root/lib/mesa/src/gallium
diff options
context:
space:
mode:
authorJonathan Gray <jsg@cvs.openbsd.org>2023-04-06 10:23:47 +0000
committerJonathan Gray <jsg@cvs.openbsd.org>2023-04-06 10:23:47 +0000
commit500e30a5d7582b5570d25d9b471c9bc7d653eab0 (patch)
tree4704749be209373b1f7c18cea2c7f6de571f6720 /lib/mesa/src/gallium
parenta0d742befadcae89d35a2e4a5d65a85c53c886a5 (diff)
Merge Mesa 22.3.7
Diffstat (limited to 'lib/mesa/src/gallium')
-rw-r--r--lib/mesa/src/gallium/auxiliary/util/u_vbuf.c10
-rw-r--r--lib/mesa/src/gallium/drivers/etnaviv/etnaviv_resource.c12
-rw-r--r--lib/mesa/src/gallium/drivers/etnaviv/etnaviv_screen.c2
-rw-r--r--lib/mesa/src/gallium/drivers/iris/iris_screen.c2
-rw-r--r--lib/mesa/src/gallium/drivers/llvmpipe/lp_screen.c2
-rw-r--r--lib/mesa/src/gallium/drivers/nouveau/nouveau_screen.c2
-rw-r--r--lib/mesa/src/gallium/drivers/r600/sfn/sfn_nir.cpp35
-rw-r--r--lib/mesa/src/gallium/drivers/radeonsi/si_pipe.c2
-rw-r--r--lib/mesa/src/gallium/drivers/radeonsi/si_pm4.c3
-rw-r--r--lib/mesa/src/gallium/drivers/radeonsi/si_pm4.h1
-rw-r--r--lib/mesa/src/gallium/drivers/radeonsi/si_shader.c5
-rw-r--r--lib/mesa/src/gallium/drivers/radeonsi/si_shader_internal.h12
-rw-r--r--lib/mesa/src/gallium/drivers/radeonsi/si_shader_llvm.c14
-rw-r--r--lib/mesa/src/gallium/drivers/radeonsi/si_state.c12
-rw-r--r--lib/mesa/src/gallium/drivers/svga/svga_format.c6
-rw-r--r--lib/mesa/src/gallium/drivers/svga/svga_resource_texture.c15
-rw-r--r--lib/mesa/src/gallium/drivers/svga/svga_resource_texture.h19
-rw-r--r--lib/mesa/src/gallium/drivers/svga/svga_screen_cache.c6
-rw-r--r--lib/mesa/src/gallium/include/pipe/p_video_state.h3
19 files changed, 104 insertions, 59 deletions
diff --git a/lib/mesa/src/gallium/auxiliary/util/u_vbuf.c b/lib/mesa/src/gallium/auxiliary/util/u_vbuf.c
index 58db9e672..202fbed0a 100644
--- a/lib/mesa/src/gallium/auxiliary/util/u_vbuf.c
+++ b/lib/mesa/src/gallium/auxiliary/util/u_vbuf.c
@@ -1467,8 +1467,6 @@ void u_vbuf_draw_vbo(struct u_vbuf *mgr, const struct pipe_draw_info *info,
boolean unroll_indices = FALSE;
const uint32_t used_vb_mask = mgr->ve->used_vb_mask;
uint32_t user_vb_mask = mgr->user_vb_mask & used_vb_mask;
- struct pipe_draw_info new_info;
- struct pipe_draw_start_count_bias new_draw;
unsigned fixed_restart_index = info->index_size ? util_prim_restart_index_from_size(info->index_size) : 0;
uint32_t misaligned = 0;
@@ -1505,12 +1503,10 @@ void u_vbuf_draw_vbo(struct u_vbuf *mgr, const struct pipe_draw_info *info,
*/
if (num_draws > 1 && info->take_index_buffer_ownership)
p_atomic_add(&info->index.resource->reference.count, num_draws - 1);
- new_info = *info;
for (unsigned d = 0; d < num_draws; d++) {
- new_draw = draws[d];
- if (info->increment_draw_id)
- drawid_offset++;
+ struct pipe_draw_info new_info = *info;
+ struct pipe_draw_start_count_bias new_draw = draws[d];
/* Handle indirect (multi)draws. */
if (indirect && indirect->buffer) {
@@ -1786,6 +1782,8 @@ void u_vbuf_draw_vbo(struct u_vbuf *mgr, const struct pipe_draw_info *info,
util_primconvert_draw_vbo(mgr->pc, &new_info, drawid_offset, indirect, &new_draw, 1);
} else
pipe->draw_vbo(pipe, &new_info, drawid_offset, indirect, &new_draw, 1);
+ if (info->increment_draw_id)
+ drawid_offset++;
}
if (mgr->using_translate) {
diff --git a/lib/mesa/src/gallium/drivers/etnaviv/etnaviv_resource.c b/lib/mesa/src/gallium/drivers/etnaviv/etnaviv_resource.c
index f0c4fbe23..3a193fa69 100644
--- a/lib/mesa/src/gallium/drivers/etnaviv/etnaviv_resource.c
+++ b/lib/mesa/src/gallium/drivers/etnaviv/etnaviv_resource.c
@@ -570,15 +570,9 @@ etna_resource_from_handle(struct pipe_screen *pscreen,
goto fail;
}
- if (screen->ro) {
- struct pipe_resource *imp_prsc = prsc;
- do {
- etna_resource(imp_prsc)->scanout =
- renderonly_create_gpu_import_for_resource(imp_prsc, screen->ro,
- NULL);
- /* failure is expected for scanout incompatible buffers */
- } while ((imp_prsc = imp_prsc->next));
- }
+ if (screen->ro)
+ rsc->scanout = renderonly_create_gpu_import_for_resource(prsc, screen->ro,
+ NULL);
return prsc;
diff --git a/lib/mesa/src/gallium/drivers/etnaviv/etnaviv_screen.c b/lib/mesa/src/gallium/drivers/etnaviv/etnaviv_screen.c
index 795f1258a..7c20ad2bd 100644
--- a/lib/mesa/src/gallium/drivers/etnaviv/etnaviv_screen.c
+++ b/lib/mesa/src/gallium/drivers/etnaviv/etnaviv_screen.c
@@ -94,6 +94,8 @@ etna_screen_destroy(struct pipe_screen *pscreen)
if (screen->perfmon)
etna_perfmon_del(screen->perfmon);
+ util_dynarray_fini(&screen->supported_pm_queries);
+
etna_shader_screen_fini(pscreen);
if (screen->pipe)
diff --git a/lib/mesa/src/gallium/drivers/iris/iris_screen.c b/lib/mesa/src/gallium/drivers/iris/iris_screen.c
index 90a598df7..1c3d5f29c 100644
--- a/lib/mesa/src/gallium/drivers/iris/iris_screen.c
+++ b/lib/mesa/src/gallium/drivers/iris/iris_screen.c
@@ -774,7 +774,7 @@ iris_init_identifier_bo(struct iris_screen *screen)
screen->workaround_address = (struct iris_address) {
.bo = screen->workaround_bo,
.offset = ALIGN(
- intel_debug_write_identifiers(bo_map, 4096, "Iris") + 8, 8),
+ intel_debug_write_identifiers(bo_map, 4096, "Iris"), 32),
};
iris_bo_unmap(screen->workaround_bo);
diff --git a/lib/mesa/src/gallium/drivers/llvmpipe/lp_screen.c b/lib/mesa/src/gallium/drivers/llvmpipe/lp_screen.c
index a4d7b405a..5e594bb72 100644
--- a/lib/mesa/src/gallium/drivers/llvmpipe/lp_screen.c
+++ b/lib/mesa/src/gallium/drivers/llvmpipe/lp_screen.c
@@ -565,7 +565,7 @@ llvmpipe_get_compute_param(struct pipe_screen *_screen,
case PIPE_COMPUTE_CAP_ADDRESS_BITS:
if (ret) {
uint32_t *address_bits = ret;
- *address_bits = 64;
+ *address_bits = sizeof(void*) * 8;
}
return sizeof(uint32_t);
}
diff --git a/lib/mesa/src/gallium/drivers/nouveau/nouveau_screen.c b/lib/mesa/src/gallium/drivers/nouveau/nouveau_screen.c
index bdd2b903d..0daca9ea3 100644
--- a/lib/mesa/src/gallium/drivers/nouveau/nouveau_screen.c
+++ b/lib/mesa/src/gallium/drivers/nouveau/nouveau_screen.c
@@ -241,6 +241,8 @@ nouveau_pushbuf_create(struct nouveau_screen *screen, struct nouveau_context *co
void
nouveau_pushbuf_destroy(struct nouveau_pushbuf **push)
{
+ if (!*push)
+ return;
FREE((*push)->user_priv);
nouveau_pushbuf_del(push);
}
diff --git a/lib/mesa/src/gallium/drivers/r600/sfn/sfn_nir.cpp b/lib/mesa/src/gallium/drivers/r600/sfn/sfn_nir.cpp
index fa5a45dec..be959f350 100644
--- a/lib/mesa/src/gallium/drivers/r600/sfn/sfn_nir.cpp
+++ b/lib/mesa/src/gallium/drivers/r600/sfn/sfn_nir.cpp
@@ -443,23 +443,30 @@ r600_lower_clipvertex_to_clipdist(nir_shader *sh, pipe_stream_output_info& so_in
static bool
r600_nir_lower_atomics(nir_shader *shader)
{
- /* First re-do the offsets, in Hardware we start at zero for each new
- * binding, and we use an offset of one per counter */
- int current_binding = -1;
- int current_offset = 0;
- nir_foreach_variable_with_modes(var, shader, nir_var_uniform)
- {
- if (!var->type->contains_atomic())
- continue;
+ /* In Hardware we start at a zero index for each new
+ * binding, and we use an offset of one per counter. We also
+ * need to sort the atomics according to binding and offset. */
+ std::map<unsigned, unsigned> binding_offset;
+ std::map<unsigned, nir_variable *> sorted_var;
+
+ nir_foreach_variable_with_modes_safe(var, shader, nir_var_uniform) {
+ if (var->type->contains_atomic()) {
+ sorted_var[(var->data.binding << 16) | var->data.offset] = var;
+ exec_node_remove(&var->node);
+ }
+ }
- if (current_binding == (int)var->data.binding) {
- var->data.index = current_offset;
- current_offset += var->type->atomic_size() / ATOMIC_COUNTER_SIZE;
- } else {
- current_binding = var->data.binding;
+ for (auto& [dummy, var] : sorted_var) {
+ auto iindex = binding_offset.find(var->data.binding);
+ unsigned offset_update = var->type->atomic_size() / ATOMIC_COUNTER_SIZE;
+ if (iindex == binding_offset.end()) {
var->data.index = 0;
- current_offset = var->type->atomic_size() / ATOMIC_COUNTER_SIZE;
+ binding_offset[var->data.binding] = offset_update;
+ } else {
+ var->data.index = iindex->second;
+ iindex->second += offset_update;
}
+ shader->variables.push_tail(&var->node);
}
return nir_shader_instructions_pass(shader,
diff --git a/lib/mesa/src/gallium/drivers/radeonsi/si_pipe.c b/lib/mesa/src/gallium/drivers/radeonsi/si_pipe.c
index 999c0a3a8..971023f9b 100644
--- a/lib/mesa/src/gallium/drivers/radeonsi/si_pipe.c
+++ b/lib/mesa/src/gallium/drivers/radeonsi/si_pipe.c
@@ -1141,6 +1141,8 @@ static struct pipe_screen *radeonsi_screen_create_impl(struct radeon_winsys *ws,
sscreen->options.enable_sam,
sscreen->options.disable_sam);
+ sscreen->info.smart_access_memory = false; /* VRAM has slower CPU access */
+
if (sscreen->info.gfx_level >= GFX9) {
sscreen->se_tile_repeat = 32 * sscreen->info.max_se;
} else {
diff --git a/lib/mesa/src/gallium/drivers/radeonsi/si_pm4.c b/lib/mesa/src/gallium/drivers/radeonsi/si_pm4.c
index f8454cd30..857f60214 100644
--- a/lib/mesa/src/gallium/drivers/radeonsi/si_pm4.c
+++ b/lib/mesa/src/gallium/drivers/radeonsi/si_pm4.c
@@ -63,13 +63,14 @@ static void si_pm4_set_reg_custom(struct si_pm4_state *state, unsigned reg, uint
assert(state->ndw + 2 <= state->max_dw);
- if (opcode != state->last_opcode || reg != (state->last_reg + 1)) {
+ if (opcode != state->last_opcode || reg != (state->last_reg + 1) || idx != state->last_idx) {
si_pm4_cmd_begin(state, opcode);
state->pm4[state->ndw++] = reg | (idx << 28);
}
assert(reg <= UINT16_MAX);
state->last_reg = reg;
+ state->last_idx = idx;
state->pm4[state->ndw++] = val;
si_pm4_cmd_end(state, false);
}
diff --git a/lib/mesa/src/gallium/drivers/radeonsi/si_pm4.h b/lib/mesa/src/gallium/drivers/radeonsi/si_pm4.h
index 4d1770a96..a0c50e6a3 100644
--- a/lib/mesa/src/gallium/drivers/radeonsi/si_pm4.h
+++ b/lib/mesa/src/gallium/drivers/radeonsi/si_pm4.h
@@ -47,6 +47,7 @@ struct si_pm4_state {
uint16_t last_pm4;
uint16_t ndw; /* number of dwords in pm4 */
uint8_t last_opcode;
+ uint8_t last_idx;
/* For shader states only */
bool is_shader;
diff --git a/lib/mesa/src/gallium/drivers/radeonsi/si_shader.c b/lib/mesa/src/gallium/drivers/radeonsi/si_shader.c
index 4797f0f88..4908e2870 100644
--- a/lib/mesa/src/gallium/drivers/radeonsi/si_shader.c
+++ b/lib/mesa/src/gallium/drivers/radeonsi/si_shader.c
@@ -2005,7 +2005,8 @@ static struct si_shader_part *
si_get_shader_part(struct si_screen *sscreen, struct si_shader_part **list,
gl_shader_stage stage, bool prolog, union si_shader_part_key *key,
struct ac_llvm_compiler *compiler, struct util_debug_callback *debug,
- void (*build)(struct si_shader_context *, union si_shader_part_key *),
+ void (*build)(struct si_shader_context *, union si_shader_part_key *,
+ bool non_monolithic),
const char *name)
{
struct si_shader_part *result;
@@ -2062,7 +2063,7 @@ si_get_shader_part(struct si_screen *sscreen, struct si_shader_part **list,
ctx.shader = &shader;
ctx.stage = stage;
- build(&ctx, key);
+ build(&ctx, key, true);
/* Compile. */
si_llvm_optimize_module(&ctx);
diff --git a/lib/mesa/src/gallium/drivers/radeonsi/si_shader_internal.h b/lib/mesa/src/gallium/drivers/radeonsi/si_shader_internal.h
index 066943810..466f3b2bf 100644
--- a/lib/mesa/src/gallium/drivers/radeonsi/si_shader_internal.h
+++ b/lib/mesa/src/gallium/drivers/radeonsi/si_shader_internal.h
@@ -247,14 +247,17 @@ LLVMValueRef si_get_tcs_in_vertex_dw_stride(struct si_shader_context *ctx);
LLVMValueRef si_get_num_tcs_out_vertices(struct si_shader_context *ctx);
void si_llvm_preload_tess_rings(struct si_shader_context *ctx);
void si_llvm_ls_build_end(struct si_shader_context *ctx);
-void si_llvm_build_tcs_epilog(struct si_shader_context *ctx, union si_shader_part_key *key);
+void si_llvm_build_tcs_epilog(struct si_shader_context *ctx, union si_shader_part_key *key,
+ bool separate_epilog);
void si_llvm_tcs_build_end(struct si_shader_context *ctx);
void si_llvm_init_tcs_callbacks(struct si_shader_context *ctx);
/* si_shader_llvm_ps.c */
LLVMValueRef si_get_sample_id(struct si_shader_context *ctx);
-void si_llvm_build_ps_prolog(struct si_shader_context *ctx, union si_shader_part_key *key);
-void si_llvm_build_ps_epilog(struct si_shader_context *ctx, union si_shader_part_key *key);
+void si_llvm_build_ps_prolog(struct si_shader_context *ctx, union si_shader_part_key *key,
+ bool separate_prolog);
+void si_llvm_build_ps_epilog(struct si_shader_context *ctx, union si_shader_part_key *key,
+ bool separate_epilog);
void si_llvm_build_monolithic_ps(struct si_shader_context *ctx, struct si_shader *shader);
void si_llvm_ps_build_end(struct si_shader_context *ctx);
void si_llvm_init_ps_callbacks(struct si_shader_context *ctx);
@@ -274,7 +277,8 @@ void si_llvm_emit_streamout(struct si_shader_context *ctx, struct si_shader_outp
void si_llvm_build_vs_exports(struct si_shader_context *ctx, LLVMValueRef num_export_threads,
struct si_shader_output_values *outputs, unsigned noutput);
void si_llvm_vs_build_end(struct si_shader_context *ctx);
-void si_llvm_build_vs_prolog(struct si_shader_context *ctx, union si_shader_part_key *key);
+void si_llvm_build_vs_prolog(struct si_shader_context *ctx, union si_shader_part_key *key,
+ bool separate_prolog);
void si_llvm_init_vs_callbacks(struct si_shader_context *ctx, bool ngg_cull_shader);
#endif
diff --git a/lib/mesa/src/gallium/drivers/radeonsi/si_shader_llvm.c b/lib/mesa/src/gallium/drivers/radeonsi/si_shader_llvm.c
index f7817aff6..75b024481 100644
--- a/lib/mesa/src/gallium/drivers/radeonsi/si_shader_llvm.c
+++ b/lib/mesa/src/gallium/drivers/radeonsi/si_shader_llvm.c
@@ -1300,7 +1300,7 @@ bool si_llvm_compile_shader(struct si_screen *sscreen, struct ac_llvm_compiler *
si_get_vs_prolog_key(&sel->info, shader->info.num_input_sgprs, true,
&shader->key.ge.part.vs.prolog, shader, &prolog_key);
prolog_key.vs_prolog.is_monolithic = true;
- si_llvm_build_vs_prolog(&ctx, &prolog_key);
+ si_llvm_build_vs_prolog(&ctx, &prolog_key, false);
parts[num_parts++] = ctx.main_fn;
first_is_prolog = true;
}
@@ -1312,7 +1312,7 @@ bool si_llvm_compile_shader(struct si_screen *sscreen, struct ac_llvm_compiler *
si_get_vs_prolog_key(&sel->info, shader->info.num_input_sgprs, false,
&shader->key.ge.part.vs.prolog, shader, &prolog_key);
prolog_key.vs_prolog.is_monolithic = true;
- si_llvm_build_vs_prolog(&ctx, &prolog_key);
+ si_llvm_build_vs_prolog(&ctx, &prolog_key, false);
parts[num_parts++] = ctx.main_fn;
if (num_parts == 1)
first_is_prolog = true;
@@ -1337,7 +1337,7 @@ bool si_llvm_compile_shader(struct si_screen *sscreen, struct ac_llvm_compiler *
prolog_key.vs_prolog.as_ngg = 1;
prolog_key.vs_prolog.load_vgprs_after_culling = 1;
prolog_key.vs_prolog.is_monolithic = true;
- si_llvm_build_vs_prolog(&ctx, &prolog_key);
+ si_llvm_build_vs_prolog(&ctx, &prolog_key, false);
prolog = ctx.main_fn;
parts[0] = ngg_cull_main_fn;
@@ -1361,7 +1361,7 @@ bool si_llvm_compile_shader(struct si_screen *sscreen, struct ac_llvm_compiler *
/* TCS epilog */
union si_shader_part_key tcs_epilog_key;
si_get_tcs_epilog_key(shader, &tcs_epilog_key);
- si_llvm_build_tcs_epilog(&ctx, &tcs_epilog_key);
+ si_llvm_build_tcs_epilog(&ctx, &tcs_epilog_key, false);
parts[3] = ctx.main_fn;
struct si_shader shader_ls = {};
@@ -1393,7 +1393,7 @@ bool si_llvm_compile_shader(struct si_screen *sscreen, struct ac_llvm_compiler *
si_get_vs_prolog_key(&ls->info, shader_ls.info.num_input_sgprs, false,
&shader->key.ge.part.tcs.ls_prolog, shader, &vs_prolog_key);
vs_prolog_key.vs_prolog.is_monolithic = true;
- si_llvm_build_vs_prolog(&ctx, &vs_prolog_key);
+ si_llvm_build_vs_prolog(&ctx, &vs_prolog_key, false);
parts[0] = ctx.main_fn;
}
@@ -1417,7 +1417,7 @@ bool si_llvm_compile_shader(struct si_screen *sscreen, struct ac_llvm_compiler *
memset(&epilog_key, 0, sizeof(epilog_key));
epilog_key.tcs_epilog.states = shader->key.ge.part.tcs.epilog;
- si_llvm_build_tcs_epilog(&ctx, &epilog_key);
+ si_llvm_build_tcs_epilog(&ctx, &epilog_key, false);
parts[1] = ctx.main_fn;
si_build_wrapper_function(&ctx, parts, 2, 0, 0, main_arg_types, false);
@@ -1466,7 +1466,7 @@ bool si_llvm_compile_shader(struct si_screen *sscreen, struct ac_llvm_compiler *
si_get_vs_prolog_key(&es->info, shader_es.info.num_input_sgprs, false,
&shader->key.ge.part.gs.vs_prolog, shader, &vs_prolog_key);
vs_prolog_key.vs_prolog.is_monolithic = true;
- si_llvm_build_vs_prolog(&ctx, &vs_prolog_key);
+ si_llvm_build_vs_prolog(&ctx, &vs_prolog_key, false);
es_prolog = ctx.main_fn;
}
diff --git a/lib/mesa/src/gallium/drivers/radeonsi/si_state.c b/lib/mesa/src/gallium/drivers/radeonsi/si_state.c
index 3ab4216b7..54eb62c8f 100644
--- a/lib/mesa/src/gallium/drivers/radeonsi/si_state.c
+++ b/lib/mesa/src/gallium/drivers/radeonsi/si_state.c
@@ -114,7 +114,7 @@ static void si_emit_cb_render_state(struct si_context *sctx)
if (sctx->gfx_level >= GFX11) {
radeon_opt_set_context_reg(sctx, R_028424_CB_FDCC_CONTROL, SI_TRACKED_CB_DCC_CONTROL,
S_028424_SAMPLE_MASK_TRACKER_DISABLE(oc_disable) |
- S_028424_SAMPLE_MASK_TRACKER_WATERMARK(15));
+ S_028424_SAMPLE_MASK_TRACKER_WATERMARK(0));
} else {
radeon_opt_set_context_reg(
sctx, R_028424_CB_DCC_CONTROL, SI_TRACKED_CB_DCC_CONTROL,
@@ -193,7 +193,8 @@ static void si_emit_cb_render_state(struct si_context *sctx)
spi_format == V_028714_SPI_SHADER_UINT16_ABGR ||
spi_format == V_028714_SPI_SHADER_SINT16_ABGR) {
sx_ps_downconvert |= V_028754_SX_RT_EXPORT_8_8_8_8 << (i * 4);
- sx_blend_opt_epsilon |= V_028758_8BIT_FORMAT << (i * 4);
+ if (G_028C70_NUMBER_TYPE(surf->cb_color_info) != V_028C70_NUMBER_SRGB)
+ sx_blend_opt_epsilon |= V_028758_8BIT_FORMAT << (i * 4);
}
break;
@@ -3302,6 +3303,11 @@ static void si_emit_framebuffer_state(struct si_context *sctx)
S_028C78_DISABLE_CONSTANT_ENCODE_REG(1) |
S_028C78_FDCC_ENABLE(vi_dcc_enabled(tex, cb->base.u.tex.level));
+ if (sctx->family >= CHIP_GFX1103_R2) {
+ cb_fdcc_control |= S_028C78_ENABLE_MAX_COMP_FRAG_OVERRIDE(1) |
+ S_028C78_MAX_COMP_FRAGS(cb->base.texture->nr_samples >= 4);
+ }
+
radeon_set_context_reg_seq(R_028C6C_CB_COLOR0_VIEW + i * 0x3C, 4);
radeon_emit(cb->cb_color_view); /* CB_COLOR0_VIEW */
radeon_emit(cb_color_info); /* CB_COLOR0_INFO */
@@ -5587,9 +5593,9 @@ void si_init_cs_preamble_state(struct si_context *sctx, bool uses_reg_shadowing)
si_pm4_set_reg(pm4, R_028AC8_DB_PRELOAD_CONTROL, 0x0);
si_pm4_set_reg(pm4, R_02800C_DB_RENDER_OVERRIDE, 0);
si_pm4_set_reg(pm4, R_028A8C_VGT_PRIMITIVEID_RESET, 0x0);
- si_pm4_set_reg(pm4, R_028B98_VGT_STRMOUT_BUFFER_CONFIG, 0x0);
if (sctx->gfx_level < GFX11) {
+ si_pm4_set_reg(pm4, R_028B98_VGT_STRMOUT_BUFFER_CONFIG, 0x0);
si_pm4_set_reg(pm4, R_028A5C_VGT_GS_PER_VS, 0x2);
si_pm4_set_reg(pm4, R_028AB8_VGT_VTX_CNT_EN, 0x0);
}
diff --git a/lib/mesa/src/gallium/drivers/svga/svga_format.c b/lib/mesa/src/gallium/drivers/svga/svga_format.c
index 6cfc92b6f..75e41f37e 100644
--- a/lib/mesa/src/gallium/drivers/svga/svga_format.c
+++ b/lib/mesa/src/gallium/drivers/svga/svga_format.c
@@ -1438,7 +1438,10 @@ static const struct format_cap format_cap_table[] = {
static const SVGA3dSurfaceFormat compat_x8r8g8b8[] = {
SVGA3D_X8R8G8B8, SVGA3D_A8R8G8B8, SVGA3D_B8G8R8X8_UNORM,
- SVGA3D_B8G8R8A8_UNORM, 0
+ SVGA3D_B8G8R8A8_UNORM, SVGA3D_B8G8R8X8_TYPELESS, SVGA3D_B8G8R8A8_TYPELESS, 0
+};
+static const SVGA3dSurfaceFormat compat_r8g8b8a8[] = {
+ SVGA3D_R8G8B8A8_UNORM, SVGA3D_R8G8B8A8_TYPELESS, 0
};
static const SVGA3dSurfaceFormat compat_r8[] = {
SVGA3D_R8_UNORM, SVGA3D_NV12, SVGA3D_YV12, 0
@@ -1453,6 +1456,7 @@ static const SVGA3dSurfaceFormat compat_r5g6b5[] = {
static const struct format_compat_entry format_compats[] = {
{PIPE_FORMAT_B8G8R8X8_UNORM, compat_x8r8g8b8},
{PIPE_FORMAT_B8G8R8A8_UNORM, compat_x8r8g8b8},
+ {PIPE_FORMAT_R8G8B8A8_UNORM, compat_r8g8b8a8},
{PIPE_FORMAT_R8_UNORM, compat_r8},
{PIPE_FORMAT_R8G8_UNORM, compat_g8r8},
{PIPE_FORMAT_B5G6R5_UNORM, compat_r5g6b5}
diff --git a/lib/mesa/src/gallium/drivers/svga/svga_resource_texture.c b/lib/mesa/src/gallium/drivers/svga/svga_resource_texture.c
index f2ab20edb..d7d15f99e 100644
--- a/lib/mesa/src/gallium/drivers/svga/svga_resource_texture.c
+++ b/lib/mesa/src/gallium/drivers/svga/svga_resource_texture.c
@@ -1,5 +1,5 @@
/**********************************************************
- * Copyright 2008-2009 VMware, Inc. All rights reserved.
+ * Copyright 2008-2023 VMware, Inc. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person
* obtaining a copy of this software and associated documentation
@@ -209,7 +209,9 @@ svga_resource_get_handle(struct pipe_screen *screen,
if (texture->target == PIPE_BUFFER)
return false;
- assert(svga_texture(texture)->key.cachable == 0);
+ SVGA_DBG(DEBUG_DMA, "%s: texture=%p cachable=%d\n", __FUNCTION__,
+ texture, svga_texture(texture)->key.cachable);
+
svga_texture(texture)->key.cachable = 0;
stride = util_format_get_nblocksx(texture->format, texture->width0) *
@@ -355,7 +357,7 @@ svga_texture_transfer_map_direct(struct svga_context *svga,
else {
assert(usage & PIPE_MAP_WRITE);
if ((usage & PIPE_MAP_UNSYNCHRONIZED) == 0) {
- if (svga_is_texture_dirty(tex, st->slice, level)) {
+ if (svga_is_texture_level_dirty(tex, st->slice, level)) {
/*
* do a surface flush if the subresource has been modified
* in this command buffer.
@@ -565,14 +567,15 @@ svga_texture_transfer_map(struct pipe_context *pipe,
!(st->base.usage & PIPE_MAP_READ);
boolean was_rendered_to =
svga_was_texture_rendered_to(svga_texture(texture));
+ boolean is_dirty = svga_is_texture_dirty(svga_texture(texture));
- /* If the texture was already rendered to and upload buffer
- * is supported, then we will use upload buffer to
+ /* If the texture was already rendered to or has pending changes and
+ * upload buffer is supported, then we will use upload buffer to
* avoid the need to read back the texture content; otherwise,
* we'll first try to map directly to the GB surface, if it is blocked,
* then we'll try the upload buffer.
*/
- if (was_rendered_to && can_use_upload) {
+ if ((was_rendered_to || is_dirty) && can_use_upload) {
map = svga_texture_transfer_map_upload(svga, st);
}
else {
diff --git a/lib/mesa/src/gallium/drivers/svga/svga_resource_texture.h b/lib/mesa/src/gallium/drivers/svga/svga_resource_texture.h
index e1872faad..32b42dd0e 100644
--- a/lib/mesa/src/gallium/drivers/svga/svga_resource_texture.h
+++ b/lib/mesa/src/gallium/drivers/svga/svga_resource_texture.h
@@ -1,5 +1,5 @@
/**********************************************************
- * Copyright 2008-2009 VMware, Inc. All rights reserved.
+ * Copyright 2008-2023 VMware, Inc. All rights reserved.
*
* Permission is hereby granted, free of charge, to any person
* obtaining a copy of this software and associated documentation
@@ -85,6 +85,11 @@ struct svga_texture
*/
boolean can_use_upload;
+ /**
+ * Whether texture is modified. Set if any of the dirty bits is set.
+ */
+ boolean modified;
+
unsigned size; /**< Approximate size in bytes */
/** array indexed by cube face or 3D/array slice, one bit per mipmap level */
@@ -242,6 +247,7 @@ svga_set_texture_dirty(struct svga_texture *tex,
{
check_face_level(tex, face, level);
tex->dirty[face] |= 1 << level;
+ tex->modified = TRUE;
}
static inline void
@@ -251,16 +257,23 @@ svga_clear_texture_dirty(struct svga_texture *tex)
for (i = 0; i < tex->b.depth0 * tex->b.array_size; i++) {
tex->dirty[i] = 0;
}
+ tex->modified = FALSE;
}
static inline boolean
-svga_is_texture_dirty(const struct svga_texture *tex,
- unsigned face, unsigned level)
+svga_is_texture_level_dirty(const struct svga_texture *tex,
+ unsigned face, unsigned level)
{
check_face_level(tex, face, level);
return !!(tex->dirty[face] & (1 << level));
}
+static inline boolean
+svga_is_texture_dirty(const struct svga_texture *tex)
+{
+ return tex->modified;
+}
+
struct pipe_resource *
svga_texture_create(struct pipe_screen *screen,
const struct pipe_resource *template);
diff --git a/lib/mesa/src/gallium/drivers/svga/svga_screen_cache.c b/lib/mesa/src/gallium/drivers/svga/svga_screen_cache.c
index 38ec50c48..89705fb3a 100644
--- a/lib/mesa/src/gallium/drivers/svga/svga_screen_cache.c
+++ b/lib/mesa/src/gallium/drivers/svga/svga_screen_cache.c
@@ -573,7 +573,11 @@ svga_screen_surface_create(struct svga_screen *svgascreen,
/* Unable to recycle surface, allocate a new one */
unsigned usage = 0;
- if (!key->cachable)
+ /* mark the surface as shareable if the surface is not
+ * cachable or the RENDER_TARGET bind flag is set.
+ */
+ if (!key->cachable ||
+ ((bind_flags & PIPE_BIND_RENDER_TARGET) != 0))
usage |= SVGA_SURFACE_USAGE_SHARED;
if (key->scanout)
usage |= SVGA_SURFACE_USAGE_SCANOUT;
diff --git a/lib/mesa/src/gallium/include/pipe/p_video_state.h b/lib/mesa/src/gallium/include/pipe/p_video_state.h
index 0b7ed1ee7..988370704 100644
--- a/lib/mesa/src/gallium/include/pipe/p_video_state.h
+++ b/lib/mesa/src/gallium/include/pipe/p_video_state.h
@@ -862,12 +862,15 @@ struct pipe_vp9_picture_desc
struct {
uint16_t frame_width;
uint16_t frame_height;
+ uint16_t prev_frame_width;
+ uint16_t prev_frame_height;
struct {
uint32_t subsampling_x:1;
uint32_t subsampling_y:1;
uint32_t frame_type:1;
uint32_t show_frame:1;
+ uint32_t prev_show_frame:1;
uint32_t error_resilient_mode:1;
uint32_t intra_only:1;
uint32_t allow_high_precision_mv:1;