853 lines
34 KiB
C
853 lines
34 KiB
C
/*
|
|
* Copyright (C) 2018 Alyssa Rosenzweig
|
|
* Copyright (C) 2019-2021 Collabora, Ltd.
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
* to deal in the Software without restriction, including without limitation
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice (including the next
|
|
* paragraph) shall be included in all copies or substantial portions of the
|
|
* Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
* SOFTWARE.
|
|
*/
|
|
|
|
#include "pan_blend.h"
|
|
|
|
#ifdef PAN_ARCH
|
|
#include "pan_shader.h"
|
|
#endif
|
|
|
|
#include "pan_texture.h"
|
|
#include "panfrost/util/pan_lower_framebuffer.h"
|
|
#include "util/format/u_format.h"
|
|
#include "compiler/nir/nir.h"
|
|
#include "compiler/nir/nir_builder.h"
|
|
#include "compiler/nir/nir_conversion_builder.h"
|
|
#include "compiler/nir/nir_lower_blend.h"
|
|
|
|
#ifndef PAN_ARCH
|
|
|
|
/* Fixed function blending */
|
|
|
|
static bool
|
|
factor_is_supported(enum blend_factor factor)
|
|
{
|
|
return factor != BLEND_FACTOR_SRC_ALPHA_SATURATE &&
|
|
factor != BLEND_FACTOR_SRC1_COLOR &&
|
|
factor != BLEND_FACTOR_SRC1_ALPHA;
|
|
}
|
|
|
|
/* OpenGL allows encoding (src*dest + dest*src) which is incompatiblle with
|
|
* Midgard style blending since there are two multiplies. However, it may be
|
|
* factored as 2*src*dest = dest*(2*src), which can be encoded on Bifrost as 0
|
|
* + dest * (2*src) wih the new source_2 value of C. Detect this case. */
|
|
|
|
static bool
|
|
is_2srcdest(enum blend_func blend_func,
|
|
enum blend_factor src_factor,
|
|
bool invert_src,
|
|
enum blend_factor dest_factor,
|
|
bool invert_dest,
|
|
bool is_alpha)
|
|
{
|
|
return (blend_func == BLEND_FUNC_ADD) &&
|
|
((src_factor == BLEND_FACTOR_DST_COLOR) ||
|
|
((src_factor == BLEND_FACTOR_DST_ALPHA) && is_alpha)) &&
|
|
((dest_factor == BLEND_FACTOR_SRC_COLOR) ||
|
|
((dest_factor == BLEND_FACTOR_SRC_ALPHA) && is_alpha)) &&
|
|
!invert_src && !invert_dest;
|
|
}
|
|
|
|
static bool
|
|
can_fixed_function_equation(enum blend_func blend_func,
|
|
enum blend_factor src_factor,
|
|
bool invert_src,
|
|
enum blend_factor dest_factor,
|
|
bool invert_dest,
|
|
bool is_alpha,
|
|
bool supports_2src)
|
|
{
|
|
if (is_2srcdest(blend_func, src_factor, invert_src,
|
|
dest_factor, invert_dest, is_alpha)) {
|
|
|
|
return supports_2src;
|
|
}
|
|
|
|
if (blend_func != BLEND_FUNC_ADD &&
|
|
blend_func != BLEND_FUNC_SUBTRACT &&
|
|
blend_func != BLEND_FUNC_REVERSE_SUBTRACT)
|
|
return false;
|
|
|
|
if (!factor_is_supported(src_factor) ||
|
|
!factor_is_supported(dest_factor))
|
|
return false;
|
|
|
|
if (src_factor != dest_factor &&
|
|
src_factor != BLEND_FACTOR_ZERO &&
|
|
dest_factor != BLEND_FACTOR_ZERO)
|
|
return false;
|
|
|
|
return true;
|
|
}
|
|
|
|
static unsigned
|
|
blend_factor_constant_mask(enum blend_factor factor)
|
|
{
|
|
if (factor == BLEND_FACTOR_CONSTANT_COLOR)
|
|
return 0b0111; /* RGB */
|
|
else if (factor == BLEND_FACTOR_CONSTANT_ALPHA)
|
|
return 0b1000; /* A */
|
|
else
|
|
return 0b0000; /* - */
|
|
}
|
|
|
|
unsigned
|
|
pan_blend_constant_mask(const struct pan_blend_equation eq)
|
|
{
|
|
return blend_factor_constant_mask(eq.rgb_src_factor) |
|
|
blend_factor_constant_mask(eq.rgb_dst_factor) |
|
|
blend_factor_constant_mask(eq.alpha_src_factor) |
|
|
blend_factor_constant_mask(eq.alpha_dst_factor);
|
|
}
|
|
|
|
/* Only "homogenous" (scalar or vector with all components equal) constants are
|
|
* valid for fixed-function, so check for this condition */
|
|
|
|
bool
|
|
pan_blend_is_homogenous_constant(unsigned mask, const float *constants)
|
|
{
|
|
float constant = pan_blend_get_constant(mask, constants);
|
|
|
|
u_foreach_bit(i, mask) {
|
|
if (constants[i] != constant)
|
|
return false;
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
/* Determines if an equation can run in fixed function */
|
|
|
|
bool
|
|
pan_blend_can_fixed_function(const struct pan_blend_equation equation,
|
|
bool supports_2src)
|
|
{
|
|
return !equation.blend_enable ||
|
|
(can_fixed_function_equation(equation.rgb_func,
|
|
equation.rgb_src_factor,
|
|
equation.rgb_invert_src_factor,
|
|
equation.rgb_dst_factor,
|
|
equation.rgb_invert_dst_factor,
|
|
false, supports_2src) &&
|
|
can_fixed_function_equation(equation.alpha_func,
|
|
equation.alpha_src_factor,
|
|
equation.alpha_invert_src_factor,
|
|
equation.alpha_dst_factor,
|
|
equation.alpha_invert_dst_factor,
|
|
true, supports_2src));
|
|
}
|
|
|
|
static enum mali_blend_operand_c
|
|
to_c_factor(enum blend_factor factor)
|
|
{
|
|
switch (factor) {
|
|
case BLEND_FACTOR_ZERO:
|
|
return MALI_BLEND_OPERAND_C_ZERO;
|
|
|
|
case BLEND_FACTOR_SRC_ALPHA:
|
|
return MALI_BLEND_OPERAND_C_SRC_ALPHA;
|
|
|
|
case BLEND_FACTOR_DST_ALPHA:
|
|
return MALI_BLEND_OPERAND_C_DEST_ALPHA;
|
|
|
|
case BLEND_FACTOR_SRC_COLOR:
|
|
return MALI_BLEND_OPERAND_C_SRC;
|
|
|
|
case BLEND_FACTOR_DST_COLOR:
|
|
return MALI_BLEND_OPERAND_C_DEST;
|
|
|
|
case BLEND_FACTOR_CONSTANT_COLOR:
|
|
case BLEND_FACTOR_CONSTANT_ALPHA:
|
|
return MALI_BLEND_OPERAND_C_CONSTANT;
|
|
|
|
default:
|
|
unreachable("Unsupported blend factor");
|
|
}
|
|
}
|
|
|
|
static void
|
|
to_panfrost_function(enum blend_func blend_func,
|
|
enum blend_factor src_factor,
|
|
bool invert_src,
|
|
enum blend_factor dest_factor,
|
|
bool invert_dest,
|
|
bool is_alpha,
|
|
struct MALI_BLEND_FUNCTION *function)
|
|
{
|
|
assert(can_fixed_function_equation(blend_func, src_factor, invert_src,
|
|
dest_factor, invert_dest, is_alpha, true));
|
|
|
|
if (src_factor == BLEND_FACTOR_ZERO && !invert_src) {
|
|
function->a = MALI_BLEND_OPERAND_A_ZERO;
|
|
function->b = MALI_BLEND_OPERAND_B_DEST;
|
|
if (blend_func == BLEND_FUNC_SUBTRACT)
|
|
function->negate_b = true;
|
|
function->invert_c = invert_dest;
|
|
function->c = to_c_factor(dest_factor);
|
|
} else if (src_factor == BLEND_FACTOR_ZERO && invert_src) {
|
|
function->a = MALI_BLEND_OPERAND_A_SRC;
|
|
function->b = MALI_BLEND_OPERAND_B_DEST;
|
|
if (blend_func == BLEND_FUNC_SUBTRACT)
|
|
function->negate_b = true;
|
|
else if (blend_func == BLEND_FUNC_REVERSE_SUBTRACT)
|
|
function->negate_a = true;
|
|
function->invert_c = invert_dest;
|
|
function->c = to_c_factor(dest_factor);
|
|
} else if (dest_factor == BLEND_FACTOR_ZERO && !invert_dest) {
|
|
function->a = MALI_BLEND_OPERAND_A_ZERO;
|
|
function->b = MALI_BLEND_OPERAND_B_SRC;
|
|
if (blend_func == BLEND_FUNC_REVERSE_SUBTRACT)
|
|
function->negate_b = true;
|
|
function->invert_c = invert_src;
|
|
function->c = to_c_factor(src_factor);
|
|
} else if (dest_factor == BLEND_FACTOR_ZERO && invert_dest) {
|
|
function->a = MALI_BLEND_OPERAND_A_DEST;
|
|
function->b = MALI_BLEND_OPERAND_B_SRC;
|
|
if (blend_func == BLEND_FUNC_SUBTRACT)
|
|
function->negate_a = true;
|
|
else if (blend_func == BLEND_FUNC_REVERSE_SUBTRACT)
|
|
function->negate_b = true;
|
|
function->invert_c = invert_src;
|
|
function->c = to_c_factor(src_factor);
|
|
} else if (src_factor == dest_factor && invert_src == invert_dest) {
|
|
function->a = MALI_BLEND_OPERAND_A_ZERO;
|
|
function->invert_c = invert_src;
|
|
function->c = to_c_factor(src_factor);
|
|
|
|
switch (blend_func) {
|
|
case BLEND_FUNC_ADD:
|
|
function->b = MALI_BLEND_OPERAND_B_SRC_PLUS_DEST;
|
|
break;
|
|
case BLEND_FUNC_REVERSE_SUBTRACT:
|
|
function->negate_b = true;
|
|
FALLTHROUGH;
|
|
case BLEND_FUNC_SUBTRACT:
|
|
function->b = MALI_BLEND_OPERAND_B_SRC_MINUS_DEST;
|
|
break;
|
|
default:
|
|
unreachable("Invalid blend function");
|
|
}
|
|
} else if (is_2srcdest(blend_func, src_factor, invert_src, dest_factor,
|
|
invert_dest, is_alpha)) {
|
|
/* src*dest + dest*src = 2*src*dest = 0 + dest*(2*src) */
|
|
function->a = MALI_BLEND_OPERAND_A_ZERO;
|
|
function->b = MALI_BLEND_OPERAND_B_DEST;
|
|
function->c = MALI_BLEND_OPERAND_C_SRC_X_2;
|
|
} else {
|
|
assert(src_factor == dest_factor && invert_src != invert_dest);
|
|
|
|
function->a = MALI_BLEND_OPERAND_A_DEST;
|
|
function->invert_c = invert_src;
|
|
function->c = to_c_factor(src_factor);
|
|
|
|
switch (blend_func) {
|
|
case BLEND_FUNC_ADD:
|
|
function->b = MALI_BLEND_OPERAND_B_SRC_MINUS_DEST;
|
|
break;
|
|
case BLEND_FUNC_REVERSE_SUBTRACT:
|
|
function->b = MALI_BLEND_OPERAND_B_SRC_PLUS_DEST;
|
|
function->negate_b = true;
|
|
break;
|
|
case BLEND_FUNC_SUBTRACT:
|
|
function->b = MALI_BLEND_OPERAND_B_SRC_PLUS_DEST;
|
|
function->negate_a = true;
|
|
break;
|
|
default:
|
|
unreachable("Invalid blend function\n");
|
|
}
|
|
}
|
|
}
|
|
|
|
bool
|
|
pan_blend_is_opaque(const struct pan_blend_equation equation)
|
|
{
|
|
/* If a channel is masked out, we can't use opaque mode even if
|
|
* blending is disabled, since we need a tilebuffer read in there */
|
|
if (equation.color_mask != 0xF)
|
|
return false;
|
|
|
|
/* With nothing masked out, disabled bledning is opaque */
|
|
if (!equation.blend_enable)
|
|
return true;
|
|
|
|
/* Also detect open-coded opaque blending */
|
|
return equation.rgb_src_factor == BLEND_FACTOR_ZERO &&
|
|
equation.rgb_invert_src_factor &&
|
|
equation.rgb_dst_factor == BLEND_FACTOR_ZERO &&
|
|
!equation.rgb_invert_dst_factor &&
|
|
(equation.rgb_func == BLEND_FUNC_ADD ||
|
|
equation.rgb_func == BLEND_FUNC_SUBTRACT) &&
|
|
equation.alpha_src_factor == BLEND_FACTOR_ZERO &&
|
|
equation.alpha_invert_src_factor &&
|
|
equation.alpha_dst_factor == BLEND_FACTOR_ZERO &&
|
|
!equation.alpha_invert_dst_factor &&
|
|
(equation.alpha_func == BLEND_FUNC_ADD ||
|
|
equation.alpha_func == BLEND_FUNC_SUBTRACT);
|
|
}
|
|
|
|
/* Check if (factor, invert) represents a constant value of val, assuming
|
|
* src_alpha is the given constant.
|
|
*/
|
|
|
|
static inline bool
|
|
is_factor_01(unsigned factor, bool invert, unsigned val, unsigned srca)
|
|
{
|
|
assert(val == 0 || val == 1);
|
|
assert(srca == 0 || srca == 1);
|
|
|
|
return ((invert ^ !val) && factor == BLEND_FACTOR_ZERO) ||
|
|
((invert ^ srca ^ !val) && factor == BLEND_FACTOR_SRC_ALPHA);
|
|
}
|
|
|
|
/* Returns if src alpha = 0 implies the blended colour equals the destination
|
|
* colour. Suppose source alpha = 0 and consider cases.
|
|
*
|
|
* Additive blending: Equivalent to D = S * f_s + D * f_d for all D and all S
|
|
* with S_a = 0, for each component. For the alpha component (if it unmasked),
|
|
* we have S_a = 0 so this reduces to D = D * f_d <===> f_d = 1. For RGB
|
|
* components (if unmasked), we need f_s = 0 and f_d = 1.
|
|
*
|
|
* Subtractive blending: Fails in general (D = S * f_S - D * f_D). We
|
|
* would need f_S = 0 and f_D = -1, which is not valid in the APIs.
|
|
*
|
|
* Reverse subtractive blending (D = D * f_D - S * f_S), we need f_D = 1
|
|
* and f_S = 0 up to masking. This is the same as additive blending.
|
|
*
|
|
* Min/max: Fails in general on the RGB components.
|
|
*/
|
|
|
|
bool
|
|
pan_blend_alpha_zero_nop(const struct pan_blend_equation eq)
|
|
{
|
|
if (eq.rgb_func != BLEND_FUNC_ADD &&
|
|
eq.rgb_func != BLEND_FUNC_REVERSE_SUBTRACT)
|
|
return false;
|
|
|
|
if (eq.color_mask & 0x8) {
|
|
if (!is_factor_01(eq.alpha_dst_factor, eq.alpha_invert_dst_factor, 1, 0))
|
|
return false;
|
|
}
|
|
|
|
if (eq.color_mask & 0x7) {
|
|
if (!is_factor_01(eq.rgb_dst_factor, eq.rgb_invert_dst_factor, 1, 0))
|
|
return false;
|
|
|
|
if (!is_factor_01(eq.rgb_src_factor, eq.rgb_invert_src_factor, 0, 0))
|
|
return false;
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
/* Returns if src alpha = 1 implies the blended colour equals the source
|
|
* colour. Suppose source alpha = 1 and consider cases.
|
|
*
|
|
* Additive blending: S = S * f_s + D * f_d. We need f_s = 1 and f_d = 0.
|
|
*
|
|
* Subtractive blending: S = S * f_s - D * f_d. Same as additive blending.
|
|
*
|
|
* Reverse subtractive blending: S = D * f_d - S * f_s. Fails in general since
|
|
* it would require f_s = -1, which is not valid in the APIs.
|
|
*
|
|
* Min/max: Fails in general on the RGB components.
|
|
*
|
|
* Note if any component is masked, we can't use a store.
|
|
*/
|
|
|
|
bool
|
|
pan_blend_alpha_one_store(const struct pan_blend_equation eq)
|
|
{
|
|
if (eq.rgb_func != BLEND_FUNC_ADD &&
|
|
eq.rgb_func != BLEND_FUNC_SUBTRACT)
|
|
return false;
|
|
|
|
if (eq.color_mask != 0xf)
|
|
return false;
|
|
|
|
return is_factor_01(eq.rgb_src_factor, eq.rgb_invert_src_factor, 1, 1) &&
|
|
is_factor_01(eq.alpha_src_factor, eq.alpha_invert_src_factor, 1, 1) &&
|
|
is_factor_01(eq.rgb_dst_factor, eq.rgb_invert_dst_factor, 0, 1) &&
|
|
is_factor_01(eq.alpha_dst_factor, eq.alpha_invert_dst_factor, 0, 1);
|
|
}
|
|
|
|
static bool
|
|
is_dest_factor(enum blend_factor factor, bool alpha)
|
|
{
|
|
return factor == BLEND_FACTOR_DST_ALPHA ||
|
|
factor == BLEND_FACTOR_DST_COLOR ||
|
|
(factor == BLEND_FACTOR_SRC_ALPHA_SATURATE && !alpha);
|
|
}
|
|
|
|
/* Determines if a blend equation reads back the destination. This can occur by
|
|
* explicitly referencing the destination in the blend equation, or by using a
|
|
* partial writemask. */
|
|
|
|
bool
|
|
pan_blend_reads_dest(const struct pan_blend_equation equation)
|
|
{
|
|
return (equation.color_mask && equation.color_mask != 0xF) ||
|
|
is_dest_factor(equation.rgb_src_factor, false) ||
|
|
is_dest_factor(equation.alpha_src_factor, true) ||
|
|
equation.rgb_dst_factor != BLEND_FACTOR_ZERO ||
|
|
equation.rgb_invert_dst_factor ||
|
|
equation.alpha_dst_factor != BLEND_FACTOR_ZERO ||
|
|
equation.alpha_invert_dst_factor;
|
|
}
|
|
|
|
/* Create the descriptor for a fixed blend mode given the corresponding API
|
|
* state. Assumes the equation can be represented as fixed-function. */
|
|
|
|
void
|
|
pan_blend_to_fixed_function_equation(const struct pan_blend_equation equation,
|
|
struct MALI_BLEND_EQUATION *out)
|
|
{
|
|
/* If no blending is enabled, default back on `replace` mode */
|
|
if (!equation.blend_enable) {
|
|
out->color_mask = equation.color_mask;
|
|
out->rgb.a = MALI_BLEND_OPERAND_A_SRC;
|
|
out->rgb.b = MALI_BLEND_OPERAND_B_SRC;
|
|
out->rgb.c = MALI_BLEND_OPERAND_C_ZERO;
|
|
out->alpha.a = MALI_BLEND_OPERAND_A_SRC;
|
|
out->alpha.b = MALI_BLEND_OPERAND_B_SRC;
|
|
out->alpha.c = MALI_BLEND_OPERAND_C_ZERO;
|
|
return;
|
|
}
|
|
|
|
/* Compile the fixed-function blend */
|
|
to_panfrost_function(equation.rgb_func,
|
|
equation.rgb_src_factor,
|
|
equation.rgb_invert_src_factor,
|
|
equation.rgb_dst_factor,
|
|
equation.rgb_invert_dst_factor,
|
|
false, &out->rgb);
|
|
|
|
to_panfrost_function(equation.alpha_func,
|
|
equation.alpha_src_factor,
|
|
equation.alpha_invert_src_factor,
|
|
equation.alpha_dst_factor,
|
|
equation.alpha_invert_dst_factor,
|
|
true, &out->alpha);
|
|
out->color_mask = equation.color_mask;
|
|
}
|
|
|
|
uint32_t
|
|
pan_pack_blend(const struct pan_blend_equation equation)
|
|
{
|
|
STATIC_ASSERT(sizeof(uint32_t) == MALI_BLEND_EQUATION_LENGTH);
|
|
|
|
uint32_t out = 0;
|
|
|
|
pan_pack(&out, BLEND_EQUATION, cfg) {
|
|
pan_blend_to_fixed_function_equation(equation, &cfg);
|
|
}
|
|
|
|
return out;
|
|
}
|
|
|
|
static uint32_t pan_blend_shader_key_hash(const void *key)
|
|
{
|
|
return _mesa_hash_data(key, sizeof(struct pan_blend_shader_key));
|
|
}
|
|
|
|
static bool pan_blend_shader_key_equal(const void *a, const void *b)
|
|
{
|
|
return !memcmp(a, b, sizeof(struct pan_blend_shader_key));
|
|
}
|
|
|
|
void
|
|
pan_blend_shaders_init(struct panfrost_device *dev)
|
|
{
|
|
dev->blend_shaders.shaders =
|
|
_mesa_hash_table_create(NULL, pan_blend_shader_key_hash,
|
|
pan_blend_shader_key_equal);
|
|
pthread_mutex_init(&dev->blend_shaders.lock, NULL);
|
|
}
|
|
|
|
void
|
|
pan_blend_shaders_cleanup(struct panfrost_device *dev)
|
|
{
|
|
_mesa_hash_table_destroy(dev->blend_shaders.shaders, NULL);
|
|
}
|
|
|
|
#else /* ifndef PAN_ARCH */
|
|
|
|
static const char *
|
|
logicop_str(enum pipe_logicop logicop)
|
|
{
|
|
switch (logicop) {
|
|
case PIPE_LOGICOP_CLEAR: return "clear";
|
|
case PIPE_LOGICOP_NOR: return "nor";
|
|
case PIPE_LOGICOP_AND_INVERTED: return "and-inverted";
|
|
case PIPE_LOGICOP_COPY_INVERTED: return "copy-inverted";
|
|
case PIPE_LOGICOP_AND_REVERSE: return "and-reverse";
|
|
case PIPE_LOGICOP_INVERT: return "invert";
|
|
case PIPE_LOGICOP_XOR: return "xor";
|
|
case PIPE_LOGICOP_NAND: return "nand";
|
|
case PIPE_LOGICOP_AND: return "and";
|
|
case PIPE_LOGICOP_EQUIV: return "equiv";
|
|
case PIPE_LOGICOP_NOOP: return "noop";
|
|
case PIPE_LOGICOP_OR_INVERTED: return "or-inverted";
|
|
case PIPE_LOGICOP_COPY: return "copy";
|
|
case PIPE_LOGICOP_OR_REVERSE: return "or-reverse";
|
|
case PIPE_LOGICOP_OR: return "or";
|
|
case PIPE_LOGICOP_SET: return "set";
|
|
default: unreachable("Invalid logicop\n");
|
|
}
|
|
}
|
|
|
|
static void
|
|
get_equation_str(const struct pan_blend_rt_state *rt_state,
|
|
char *str, unsigned len)
|
|
{
|
|
const char *funcs[] = {
|
|
"add", "sub", "reverse_sub", "min", "max",
|
|
};
|
|
const char *factors[] = {
|
|
"zero", "src_color", "src1_color", "dst_color",
|
|
"src_alpha", "src1_alpha", "dst_alpha",
|
|
"const_color", "const_alpha", "src_alpha_sat",
|
|
};
|
|
int ret;
|
|
|
|
if (!rt_state->equation.blend_enable) {
|
|
ret = snprintf(str, len, "replace");
|
|
assert(ret > 0);
|
|
return;
|
|
}
|
|
|
|
if (rt_state->equation.color_mask & 7) {
|
|
assert(rt_state->equation.rgb_func < ARRAY_SIZE(funcs));
|
|
assert(rt_state->equation.rgb_src_factor < ARRAY_SIZE(factors));
|
|
assert(rt_state->equation.rgb_dst_factor < ARRAY_SIZE(factors));
|
|
ret = snprintf(str, len, "%s%s%s(func=%s,src_factor=%s%s,dst_factor=%s%s)%s",
|
|
(rt_state->equation.color_mask & 1) ? "R" : "",
|
|
(rt_state->equation.color_mask & 2) ? "G" : "",
|
|
(rt_state->equation.color_mask & 4) ? "B" : "",
|
|
funcs[rt_state->equation.rgb_func],
|
|
rt_state->equation.rgb_invert_src_factor ? "-" : "",
|
|
factors[rt_state->equation.rgb_src_factor],
|
|
rt_state->equation.rgb_invert_dst_factor ? "-" : "",
|
|
factors[rt_state->equation.rgb_dst_factor],
|
|
rt_state->equation.color_mask & 8 ? ";" : "");
|
|
assert(ret > 0);
|
|
str += ret;
|
|
len -= ret;
|
|
}
|
|
|
|
if (rt_state->equation.color_mask & 8) {
|
|
assert(rt_state->equation.alpha_func < ARRAY_SIZE(funcs));
|
|
assert(rt_state->equation.alpha_src_factor < ARRAY_SIZE(factors));
|
|
assert(rt_state->equation.alpha_dst_factor < ARRAY_SIZE(factors));
|
|
ret = snprintf(str, len, "A(func=%s,src_factor=%s%s,dst_factor=%s%s)",
|
|
funcs[rt_state->equation.alpha_func],
|
|
rt_state->equation.alpha_invert_src_factor ? "-" : "",
|
|
factors[rt_state->equation.alpha_src_factor],
|
|
rt_state->equation.alpha_invert_dst_factor ? "-" : "",
|
|
factors[rt_state->equation.alpha_dst_factor]);
|
|
assert(ret > 0);
|
|
str += ret;
|
|
len -= ret;
|
|
}
|
|
}
|
|
|
|
static bool
|
|
pan_inline_blend_constants(nir_builder *b, nir_instr *instr, void *data)
|
|
{
|
|
if (instr->type != nir_instr_type_intrinsic)
|
|
return false;
|
|
|
|
nir_intrinsic_instr *intr = nir_instr_as_intrinsic(instr);
|
|
if (intr->intrinsic != nir_intrinsic_load_blend_const_color_rgba)
|
|
return false;
|
|
|
|
float *floats = data;
|
|
const nir_const_value constants[4] = {
|
|
{ .f32 = floats[0] },
|
|
{ .f32 = floats[1] },
|
|
{ .f32 = floats[2] },
|
|
{ .f32 = floats[3] }
|
|
};
|
|
|
|
b->cursor = nir_after_instr(instr);
|
|
nir_ssa_def *constant = nir_build_imm(b, 4, 32, constants);
|
|
nir_ssa_def_rewrite_uses(&intr->dest.ssa, constant);
|
|
nir_instr_remove(instr);
|
|
return true;
|
|
}
|
|
|
|
nir_shader *
|
|
GENX(pan_blend_create_shader)(const struct panfrost_device *dev,
|
|
const struct pan_blend_state *state,
|
|
nir_alu_type src0_type,
|
|
nir_alu_type src1_type,
|
|
unsigned rt)
|
|
{
|
|
const struct pan_blend_rt_state *rt_state = &state->rts[rt];
|
|
char equation_str[128] = { 0 };
|
|
|
|
get_equation_str(rt_state, equation_str, sizeof(equation_str));
|
|
|
|
nir_builder b =
|
|
nir_builder_init_simple_shader(MESA_SHADER_FRAGMENT,
|
|
GENX(pan_shader_get_compiler_options)(),
|
|
"pan_blend(rt=%d,fmt=%s,nr_samples=%d,%s=%s)",
|
|
rt, util_format_name(rt_state->format),
|
|
rt_state->nr_samples,
|
|
state->logicop_enable ? "logicop" : "equation",
|
|
state->logicop_enable ?
|
|
logicop_str(state->logicop_func) : equation_str);
|
|
|
|
const struct util_format_description *format_desc =
|
|
util_format_description(rt_state->format);
|
|
nir_alu_type nir_type = pan_unpacked_type_for_format(format_desc);
|
|
enum glsl_base_type glsl_type = nir_get_glsl_base_type_for_nir_type(nir_type);
|
|
|
|
nir_lower_blend_options options = {
|
|
.logicop_enable = state->logicop_enable,
|
|
.logicop_func = state->logicop_func,
|
|
.rt[0].colormask = rt_state->equation.color_mask,
|
|
.format[0] = rt_state->format
|
|
};
|
|
|
|
if (!rt_state->equation.blend_enable) {
|
|
static const nir_lower_blend_channel replace = {
|
|
.func = BLEND_FUNC_ADD,
|
|
.src_factor = BLEND_FACTOR_ZERO,
|
|
.invert_src_factor = true,
|
|
.dst_factor = BLEND_FACTOR_ZERO,
|
|
.invert_dst_factor = false,
|
|
};
|
|
|
|
options.rt[0].rgb = replace;
|
|
options.rt[0].alpha = replace;
|
|
} else {
|
|
options.rt[0].rgb.func = rt_state->equation.rgb_func;
|
|
options.rt[0].rgb.src_factor = rt_state->equation.rgb_src_factor;
|
|
options.rt[0].rgb.invert_src_factor = rt_state->equation.rgb_invert_src_factor;
|
|
options.rt[0].rgb.dst_factor = rt_state->equation.rgb_dst_factor;
|
|
options.rt[0].rgb.invert_dst_factor = rt_state->equation.rgb_invert_dst_factor;
|
|
options.rt[0].alpha.func = rt_state->equation.alpha_func;
|
|
options.rt[0].alpha.src_factor = rt_state->equation.alpha_src_factor;
|
|
options.rt[0].alpha.invert_src_factor = rt_state->equation.alpha_invert_src_factor;
|
|
options.rt[0].alpha.dst_factor = rt_state->equation.alpha_dst_factor;
|
|
options.rt[0].alpha.invert_dst_factor = rt_state->equation.alpha_invert_dst_factor;
|
|
}
|
|
|
|
nir_alu_type src_types[] = { src0_type ?: nir_type_float32, src1_type ?: nir_type_float32 };
|
|
|
|
/* HACK: workaround buggy TGSI shaders (u_blitter) */
|
|
for (unsigned i = 0; i < ARRAY_SIZE(src_types); ++i) {
|
|
src_types[i] = nir_alu_type_get_base_type(nir_type) |
|
|
nir_alu_type_get_type_size(src_types[i]);
|
|
}
|
|
|
|
nir_variable *c_src =
|
|
nir_variable_create(b.shader, nir_var_shader_in,
|
|
glsl_vector_type(nir_get_glsl_base_type_for_nir_type(src_types[0]), 4),
|
|
"gl_Color");
|
|
c_src->data.location = VARYING_SLOT_COL0;
|
|
nir_variable *c_src1 =
|
|
nir_variable_create(b.shader, nir_var_shader_in,
|
|
glsl_vector_type(nir_get_glsl_base_type_for_nir_type(src_types[1]), 4),
|
|
"gl_Color1");
|
|
c_src1->data.location = VARYING_SLOT_VAR0;
|
|
c_src1->data.driver_location = 1;
|
|
nir_variable *c_out =
|
|
nir_variable_create(b.shader, nir_var_shader_out,
|
|
glsl_vector_type(glsl_type, 4),
|
|
"gl_FragColor");
|
|
c_out->data.location = FRAG_RESULT_DATA0;
|
|
|
|
nir_ssa_def *s_src[] = {nir_load_var(&b, c_src), nir_load_var(&b, c_src1)};
|
|
|
|
/* Saturate integer conversions */
|
|
for (int i = 0; i < ARRAY_SIZE(s_src); ++i) {
|
|
nir_alu_type T = nir_alu_type_get_base_type(nir_type);
|
|
s_src[i] = nir_convert_with_rounding(&b, s_src[i],
|
|
src_types[i], nir_type,
|
|
nir_rounding_mode_undef,
|
|
T != nir_type_float);
|
|
}
|
|
|
|
/* Build a trivial blend shader */
|
|
nir_store_var(&b, c_out, s_src[0], 0xFF);
|
|
|
|
options.src1 = s_src[1];
|
|
|
|
NIR_PASS_V(b.shader, nir_lower_blend, &options);
|
|
nir_shader_instructions_pass(b.shader, pan_inline_blend_constants,
|
|
nir_metadata_block_index | nir_metadata_dominance,
|
|
(void *) state->constants);
|
|
|
|
return b.shader;
|
|
}
|
|
|
|
#if PAN_ARCH >= 6
|
|
uint64_t
|
|
GENX(pan_blend_get_internal_desc)(const struct panfrost_device *dev,
|
|
enum pipe_format fmt, unsigned rt,
|
|
unsigned force_size, bool dithered)
|
|
{
|
|
const struct util_format_description *desc = util_format_description(fmt);
|
|
uint64_t res;
|
|
|
|
pan_pack(&res, INTERNAL_BLEND, cfg) {
|
|
cfg.mode = MALI_BLEND_MODE_OPAQUE;
|
|
cfg.fixed_function.num_comps = desc->nr_channels;
|
|
cfg.fixed_function.rt = rt;
|
|
|
|
nir_alu_type T = pan_unpacked_type_for_format(desc);
|
|
|
|
if (force_size)
|
|
T = nir_alu_type_get_base_type(T) | force_size;
|
|
|
|
switch (T) {
|
|
case nir_type_float16:
|
|
cfg.fixed_function.conversion.register_format =
|
|
MALI_REGISTER_FILE_FORMAT_F16;
|
|
break;
|
|
case nir_type_float32:
|
|
cfg.fixed_function.conversion.register_format =
|
|
MALI_REGISTER_FILE_FORMAT_F32;
|
|
break;
|
|
case nir_type_int8:
|
|
case nir_type_int16:
|
|
cfg.fixed_function.conversion.register_format =
|
|
MALI_REGISTER_FILE_FORMAT_I16;
|
|
break;
|
|
case nir_type_int32:
|
|
cfg.fixed_function.conversion.register_format =
|
|
MALI_REGISTER_FILE_FORMAT_I32;
|
|
break;
|
|
case nir_type_uint8:
|
|
case nir_type_uint16:
|
|
cfg.fixed_function.conversion.register_format =
|
|
MALI_REGISTER_FILE_FORMAT_U16;
|
|
break;
|
|
case nir_type_uint32:
|
|
cfg.fixed_function.conversion.register_format =
|
|
MALI_REGISTER_FILE_FORMAT_U32;
|
|
break;
|
|
default:
|
|
unreachable("Invalid format");
|
|
}
|
|
|
|
cfg.fixed_function.conversion.memory_format =
|
|
panfrost_format_to_bifrost_blend(dev, fmt, dithered);
|
|
}
|
|
|
|
return res;
|
|
}
|
|
#endif
|
|
|
|
struct pan_blend_shader_variant *
|
|
GENX(pan_blend_get_shader_locked)(const struct panfrost_device *dev,
|
|
const struct pan_blend_state *state,
|
|
nir_alu_type src0_type,
|
|
nir_alu_type src1_type,
|
|
unsigned rt)
|
|
{
|
|
struct pan_blend_shader_key key = {
|
|
.format = state->rts[rt].format,
|
|
.src0_type = src0_type,
|
|
.src1_type = src1_type,
|
|
.rt = rt,
|
|
.has_constants = pan_blend_constant_mask(state->rts[rt].equation) != 0,
|
|
.logicop_enable = state->logicop_enable,
|
|
.logicop_func = state->logicop_func,
|
|
.nr_samples = state->rts[rt].nr_samples,
|
|
.equation = state->rts[rt].equation,
|
|
};
|
|
|
|
struct hash_entry *he = _mesa_hash_table_search(dev->blend_shaders.shaders, &key);
|
|
struct pan_blend_shader *shader = he ? he->data : NULL;
|
|
|
|
if (!shader) {
|
|
shader = rzalloc(dev->blend_shaders.shaders, struct pan_blend_shader);
|
|
shader->key = key;
|
|
list_inithead(&shader->variants);
|
|
_mesa_hash_table_insert(dev->blend_shaders.shaders, &shader->key, shader);
|
|
}
|
|
|
|
list_for_each_entry(struct pan_blend_shader_variant, iter,
|
|
&shader->variants, node) {
|
|
if (!key.has_constants ||
|
|
!memcmp(iter->constants, state->constants, sizeof(iter->constants))) {
|
|
return iter;
|
|
}
|
|
}
|
|
|
|
struct pan_blend_shader_variant *variant = NULL;
|
|
|
|
if (shader->nvariants < PAN_BLEND_SHADER_MAX_VARIANTS) {
|
|
variant = rzalloc(shader, struct pan_blend_shader_variant);
|
|
util_dynarray_init(&variant->binary, variant);
|
|
list_add(&variant->node, &shader->variants);
|
|
shader->nvariants++;
|
|
} else {
|
|
variant = list_last_entry(&shader->variants, struct pan_blend_shader_variant, node);
|
|
list_del(&variant->node);
|
|
list_add(&variant->node, &shader->variants);
|
|
util_dynarray_clear(&variant->binary);
|
|
}
|
|
|
|
memcpy(variant->constants, state->constants, sizeof(variant->constants));
|
|
|
|
nir_shader *nir =
|
|
GENX(pan_blend_create_shader)(dev, state, src0_type, src1_type, rt);
|
|
|
|
/* Compile the NIR shader */
|
|
struct panfrost_compile_inputs inputs = {
|
|
.gpu_id = dev->gpu_id,
|
|
.is_blend = true,
|
|
.blend.rt = shader->key.rt,
|
|
.blend.nr_samples = key.nr_samples,
|
|
.fixed_sysval_ubo = -1,
|
|
.rt_formats = { key.format },
|
|
};
|
|
|
|
#if PAN_ARCH >= 6
|
|
inputs.blend.bifrost_blend_desc =
|
|
GENX(pan_blend_get_internal_desc)(dev, key.format, key.rt, 0, false);
|
|
#endif
|
|
|
|
struct pan_shader_info info;
|
|
|
|
GENX(pan_shader_compile)(nir, &inputs, &variant->binary, &info);
|
|
|
|
/* Blend shaders can't have sysvals */
|
|
assert(info.sysvals.sysval_count == 0);
|
|
|
|
variant->work_reg_count = info.work_reg_count;
|
|
|
|
#if PAN_ARCH <= 5
|
|
variant->first_tag = info.midgard.first_tag;
|
|
#endif
|
|
|
|
ralloc_free(nir);
|
|
|
|
return variant;
|
|
}
|
|
#endif /* ifndef PAN_ARCH */
|