diff options
author | Alyssa Rosenzweig <alyssa@collabora.com> | 2022-01-15 15:24:17 -0500 |
---|---|---|
committer | Marge Bot <emma+marge@anholt.net> | 2022-01-15 21:51:57 +0000 |
commit | b8d37eb1bb99b795d370634a8eadcf83cf5a9d7d (patch) | |
tree | 37ca786d1961bd5d83c79a1b62983618719aa47a | |
parent | 77a1514a37884183a05389bc7ac47708f408b841 (diff) | |
download | mesa-b8d37eb1bb99b795d370634a8eadcf83cf5a9d7d.tar.gz mesa-b8d37eb1bb99b795d370634a8eadcf83cf5a9d7d.tar.bz2 mesa-b8d37eb1bb99b795d370634a8eadcf83cf5a9d7d.zip |
pan/bi: Schedule around blend shader register clobbering
By software ABI, a blend shader is permitted to clobber registers
R0-R15. The scheduler needs to be aware of this, to avoid moving a write
to one of these registers past the BLEND itself. Otherwise the schedule
is invalid.
This bug affects GLES3.0, but is rare enough in practice that we had
missed it. It requires a fragment shader to write to multiple render
targets with attached blend shaders, and have temporaries register
allocated to R0-R15 that are not read by the blend shader, but are sunk
past the BLEND instruction by the scheduler. Prevents a regression when
switching boolean representations on:
dEQP-GLES31.functional.shaders.builtin_functions.integer.uaddcarry.uvec4_lowp_fragment
Signed-off-by: Alyssa Rosenzweig <alyssa@collabora.com>
Cc: mesa-stable
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/14577>
-rw-r--r-- | src/panfrost/bifrost/bi_schedule.c | 20 |
1 files changed, 16 insertions, 4 deletions
diff --git a/src/panfrost/bifrost/bi_schedule.c b/src/panfrost/bifrost/bi_schedule.c index 7d73b2f9674..88162ecc86e 100644 --- a/src/panfrost/bifrost/bi_schedule.c +++ b/src/panfrost/bifrost/bi_schedule.c @@ -197,7 +197,7 @@ bi_is_sched_barrier(bi_instr *I) } static void -bi_create_dependency_graph(struct bi_worklist st, bool inorder) +bi_create_dependency_graph(struct bi_worklist st, bool inorder, bool is_blend) { struct util_dynarray last_read[64], last_write[64]; @@ -262,6 +262,17 @@ bi_create_dependency_graph(struct bi_worklist st, bool inorder) } } + /* Blend shaders are allowed to clobber R0-R15. Treat these + * registers like extra destinations for scheduling purposes. + */ + if (ins->op == BI_OPCODE_BLEND && !is_blend) { + for (unsigned c = 0; c < 16; ++c) { + add_dependency(last_read, c, i, st.dependents, st.dep_counts); + add_dependency(last_write, c, i, st.dependents, st.dep_counts); + mark_access(last_write, c, i); + } + } + bi_foreach_src(ins, s) { if (ins->src[s].type != BI_INDEX_REGISTER) continue; @@ -414,7 +425,7 @@ bi_flatten_block(bi_block *block, unsigned *len) */ static struct bi_worklist -bi_initialize_worklist(bi_block *block, bool inorder) +bi_initialize_worklist(bi_block *block, bool inorder, bool is_blend) { struct bi_worklist st = { }; st.instructions = bi_flatten_block(block, &st.count); @@ -425,7 +436,7 @@ bi_initialize_worklist(bi_block *block, bool inorder) st.dependents = calloc(st.count, sizeof(st.dependents[0])); st.dep_counts = calloc(st.count, sizeof(st.dep_counts[0])); - bi_create_dependency_graph(st, inorder); + bi_create_dependency_graph(st, inorder, is_blend); st.worklist = calloc(BITSET_WORDS(st.count), sizeof(BITSET_WORD)); for (unsigned i = 0; i < st.count; ++i) { @@ -1801,7 +1812,8 @@ bi_schedule_block(bi_context *ctx, bi_block *block) /* Copy list to dynamic array */ struct bi_worklist st = bi_initialize_worklist(block, - bifrost_debug & BIFROST_DBG_INORDER); + bifrost_debug & BIFROST_DBG_INORDER, + ctx->inputs->is_blend); if (!st.count) { bi_free_worklist(st); |