vc4_nir_lower_blend.c revision c30b22c421d2139135519449a68bf3120710a552
/*
 * Copyright © 2015 Broadcom
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 */

/**
 * Implements most of the fixed function fragment pipeline in shader code.
 *
 * VC4 doesn't have any hardware support for blending, alpha test, logic ops,
 * or color mask.  Instead, you read the current contents of the destination
 * from the tile buffer after having waited for the scoreboard (which is
 * handled by vc4_qpu_emit.c), then do math using your output color and that
 * destination value, and update the output color appropriately.
 *
 * Once this pass is done, the color write will either have one component (for
 * single sample) with packed argb8888, or 4 components with the per-sample
 * argb8888 result.
36bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt */ 37bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 38bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt/** 39bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * Lowers fixed-function blending to a load of the destination color and a 40bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * series of ALU operations before the store of the output. 41bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt */ 42bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt#include "util/u_format.h" 43bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt#include "vc4_qir.h" 44a39a8fbbaa129f4e52f2a3ad2747182e9a74d910Emil Velikov#include "compiler/nir/nir_builder.h" 45bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt#include "vc4_context.h" 46bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 47a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtstatic bool 48a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtblend_depends_on_dst_color(struct vc4_compile *c) 49a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt{ 50a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt return (c->fs_key->blend.blend_enable || 51a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt c->fs_key->blend.colormask != 0xf || 52a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt c->fs_key->logicop_func != PIPE_LOGICOP_COPY); 53a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt} 54a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 55bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt/** Emits a load of the previous fragment color from the tile buffer. 
*/ 56bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def * 57a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtvc4_nir_get_dst_color(nir_builder *b, int sample) 58bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 59bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_intrinsic_instr *load = 60bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_intrinsic_instr_create(b->shader, 61bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_intrinsic_load_input); 62bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt load->num_components = 1; 63c30b22c421d2139135519449a68bf3120710a552Eric Anholt nir_intrinsic_set_base(load, VC4_NIR_TLB_COLOR_READ_INPUT + sample); 6478b81be627734ea7fa50ea246c07b0d4a3a1638aJason Ekstrand load->src[0] = nir_src_for_ssa(nir_imm_int(b, 0)); 653124ce699bb3844e793f00e00bfbea5c91744f90Connor Abbott nir_ssa_dest_init(&load->instr, &load->dest, 1, 32, NULL); 66bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_builder_instr_insert(b, &load->instr); 67bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return &load->dest.ssa; 68bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 69bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 70bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def * 71bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvc4_nir_srgb_decode(nir_builder *b, nir_ssa_def *srgb) 72bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 73bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *is_low = nir_flt(b, srgb, nir_imm_float(b, 0.04045)); 74bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *low = nir_fmul(b, srgb, nir_imm_float(b, 1.0 / 12.92)); 75bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *high = nir_fpow(b, 76bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_fmul(b, 77bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_fadd(b, srgb, 78bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_imm_float(b, 0.055)), 
79bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_imm_float(b, 1.0 / 1.055)), 80bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_imm_float(b, 2.4)); 81bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 82bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_bcsel(b, is_low, low, high); 83bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 84bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 85bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def * 86bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvc4_nir_srgb_encode(nir_builder *b, nir_ssa_def *linear) 87bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 88bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *is_low = nir_flt(b, linear, nir_imm_float(b, 0.0031308)); 89bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *low = nir_fmul(b, linear, nir_imm_float(b, 12.92)); 90bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *high = nir_fsub(b, 91bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_fmul(b, 92bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_imm_float(b, 1.055), 93bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_fpow(b, 94bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt linear, 95bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_imm_float(b, 0.41666))), 96bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_imm_float(b, 0.055)); 97bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 98bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_bcsel(b, is_low, low, high); 99bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 100bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 101bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def * 10270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_blend_channel_f(nir_builder *b, 10370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def **src, 10470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def **dst, 
10570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt unsigned factor, 10670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt int channel) 107bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 108bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt switch(factor) { 109bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_ONE: 110bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_imm_float(b, 1.0); 111bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_SRC_COLOR: 112bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return src[channel]; 113bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_SRC_ALPHA: 114bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return src[3]; 115bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_DST_ALPHA: 116bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return dst[3]; 117bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_DST_COLOR: 118bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return dst[channel]; 119bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_SRC_ALPHA_SATURATE: 120bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt if (channel != 3) { 121bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fmin(b, 122bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt src[3], 123bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_fsub(b, 124bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_imm_float(b, 1.0), 125bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt dst[3])); 126bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } else { 127bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_imm_float(b, 1.0); 128bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 129bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_CONST_COLOR: 130bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return vc4_nir_get_state_uniform(b, 
QUNIFORM_BLEND_CONST_COLOR_X + channel); 131bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_CONST_ALPHA: 132bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return vc4_nir_get_state_uniform(b, QUNIFORM_BLEND_CONST_COLOR_W); 133bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_ZERO: 134bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_imm_float(b, 0.0); 135bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_INV_SRC_COLOR: 136bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fsub(b, nir_imm_float(b, 1.0), src[channel]); 137bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_INV_SRC_ALPHA: 138bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fsub(b, nir_imm_float(b, 1.0), src[3]); 139bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_INV_DST_ALPHA: 140bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fsub(b, nir_imm_float(b, 1.0), dst[3]); 141bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_INV_DST_COLOR: 142bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fsub(b, nir_imm_float(b, 1.0), dst[channel]); 143bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_INV_CONST_COLOR: 144bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fsub(b, nir_imm_float(b, 1.0), 145bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt vc4_nir_get_state_uniform(b, QUNIFORM_BLEND_CONST_COLOR_X + channel)); 146bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_INV_CONST_ALPHA: 147bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fsub(b, nir_imm_float(b, 1.0), 148bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt vc4_nir_get_state_uniform(b, QUNIFORM_BLEND_CONST_COLOR_W)); 149bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 150bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt default: 
151bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_SRC1_COLOR: 152bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_SRC1_ALPHA: 153bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_INV_SRC1_COLOR: 154bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_INV_SRC1_ALPHA: 155bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt /* Unsupported. */ 156bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt fprintf(stderr, "Unknown blend factor %d\n", factor); 157bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_imm_float(b, 1.0); 158bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 159bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 160bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 161bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def * 16270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_nir_set_packed_chan(nir_builder *b, nir_ssa_def *src0, nir_ssa_def *src1, 16370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt int chan) 16470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{ 16570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt unsigned chan_mask = 0xff << (chan * 8); 16670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_ior(b, 16770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_iand(b, src0, nir_imm_int(b, ~chan_mask)), 16870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_iand(b, src1, nir_imm_int(b, chan_mask))); 16970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt} 17070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 17170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def * 17270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_blend_channel_i(nir_builder *b, 17370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *src, 17470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *dst, 17570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *src_a, 
17670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *dst_a, 17770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt unsigned factor, 17870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt int a_chan) 17970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{ 18070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt switch (factor) { 18170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_ONE: 18270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_imm_int(b, ~0); 18370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_SRC_COLOR: 18470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return src; 18570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_SRC_ALPHA: 18670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return src_a; 18770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_DST_ALPHA: 18870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return dst_a; 18970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_DST_COLOR: 19070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return dst; 19170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_SRC_ALPHA_SATURATE: 19270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return vc4_nir_set_packed_chan(b, 19370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_umin_4x8(b, 19470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_a, 19570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_inot(b, dst_a)), 19670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_imm_int(b, ~0), 19770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt a_chan); 19870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_CONST_COLOR: 19970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return vc4_nir_get_state_uniform(b, QUNIFORM_BLEND_CONST_COLOR_RGBA); 20070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_CONST_ALPHA: 
20170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return vc4_nir_get_state_uniform(b, QUNIFORM_BLEND_CONST_COLOR_AAAA); 20270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_ZERO: 20370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_imm_int(b, 0); 20470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_INV_SRC_COLOR: 20570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_inot(b, src); 20670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_INV_SRC_ALPHA: 20770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_inot(b, src_a); 20870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_INV_DST_ALPHA: 20970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_inot(b, dst_a); 21070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_INV_DST_COLOR: 21170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_inot(b, dst); 21270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_INV_CONST_COLOR: 21370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_inot(b, vc4_nir_get_state_uniform(b, QUNIFORM_BLEND_CONST_COLOR_RGBA)); 21470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_INV_CONST_ALPHA: 21570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_inot(b, vc4_nir_get_state_uniform(b, QUNIFORM_BLEND_CONST_COLOR_AAAA)); 21670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 21770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt default: 21870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_SRC1_COLOR: 21970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_SRC1_ALPHA: 22070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_INV_SRC1_COLOR: 22170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_INV_SRC1_ALPHA: 22270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt /* Unsupported. 
*/ 22370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt fprintf(stderr, "Unknown blend factor %d\n", factor); 22470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_imm_int(b, ~0); 22570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 22670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt} 22770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 22870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def * 22970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_blend_func_f(nir_builder *b, nir_ssa_def *src, nir_ssa_def *dst, 23070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt unsigned func) 231bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 232bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt switch (func) { 233bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLEND_ADD: 234bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fadd(b, src, dst); 235bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLEND_SUBTRACT: 236bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fsub(b, src, dst); 237bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLEND_REVERSE_SUBTRACT: 238bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fsub(b, dst, src); 239bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLEND_MIN: 240bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fmin(b, src, dst); 241bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLEND_MAX: 242bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fmax(b, src, dst); 243bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 244bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt default: 245bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt /* Unsupported. 
*/ 246bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt fprintf(stderr, "Unknown blend func %d\n", func); 247bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return src; 248bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 249bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 250bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 251bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 25270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def * 25370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_blend_func_i(nir_builder *b, nir_ssa_def *src, nir_ssa_def *dst, 25470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt unsigned func) 25570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{ 25670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt switch (func) { 25770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLEND_ADD: 25870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_usadd_4x8(b, src, dst); 25970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLEND_SUBTRACT: 26070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_ussub_4x8(b, src, dst); 26170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLEND_REVERSE_SUBTRACT: 26270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_ussub_4x8(b, dst, src); 26370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLEND_MIN: 26470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_umin_4x8(b, src, dst); 26570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLEND_MAX: 26670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_umax_4x8(b, src, dst); 26770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 26870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt default: 26970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt /* Unsupported. 
*/ 27070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt fprintf(stderr, "Unknown blend func %d\n", func); 27170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return src; 27270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 27370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 27470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt} 27570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 276bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic void 27770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_do_blending_f(struct vc4_compile *c, nir_builder *b, nir_ssa_def **result, 27870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def **src_color, nir_ssa_def **dst_color) 279bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 280bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt struct pipe_rt_blend_state *blend = &c->fs_key->blend; 281bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 282bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt if (!blend->blend_enable) { 283bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt for (int i = 0; i < 4; i++) 284bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt result[i] = src_color[i]; 285bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return; 286bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 287bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 288bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt /* Clamp the src color to [0, 1]. Dest is already clamped. */ 289bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt for (int i = 0; i < 4; i++) 290bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt src_color[i] = nir_fsat(b, src_color[i]); 291bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 292bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *src_blend[4], *dst_blend[4]; 293bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt for (int i = 0; i < 4; i++) { 294bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt int src_factor = ((i != 3) ? 
blend->rgb_src_factor : 295bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt blend->alpha_src_factor); 296bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt int dst_factor = ((i != 3) ? blend->rgb_dst_factor : 297bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt blend->alpha_dst_factor); 298bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt src_blend[i] = nir_fmul(b, src_color[i], 29970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt vc4_blend_channel_f(b, 30070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_color, dst_color, 30170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_factor, i)); 302bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt dst_blend[i] = nir_fmul(b, dst_color[i], 30370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt vc4_blend_channel_f(b, 30470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_color, dst_color, 30570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt dst_factor, i)); 306bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 307bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 308bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt for (int i = 0; i < 4; i++) { 30970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt result[i] = vc4_blend_func_f(b, src_blend[i], dst_blend[i], 31070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt ((i != 3) ? 
blend->rgb_func : 31170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt blend->alpha_func)); 31270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 31370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt} 31470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 31570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def * 31670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_nir_splat(nir_builder *b, nir_ssa_def *src) 31770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{ 31870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *or1 = nir_ior(b, src, nir_ishl(b, src, nir_imm_int(b, 8))); 31970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_ior(b, or1, nir_ishl(b, or1, nir_imm_int(b, 16))); 32070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt} 32170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 32270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def * 32370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_do_blending_i(struct vc4_compile *c, nir_builder *b, 32470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *src_color, nir_ssa_def *dst_color, 32570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *src_float_a) 32670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{ 32770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt struct pipe_rt_blend_state *blend = &c->fs_key->blend; 32870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 32970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt if (!blend->blend_enable) 33070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return src_color; 33170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 33270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt enum pipe_format color_format = c->fs_key->color_format; 33370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt const uint8_t *format_swiz = vc4_get_format_swizzle(color_format); 33470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *imm_0xff = nir_imm_int(b, 0xff); 
33570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *src_a = nir_pack_unorm_4x8(b, src_float_a); 33670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *dst_a; 33770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt int alpha_chan; 33870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt for (alpha_chan = 0; alpha_chan < 4; alpha_chan++) { 33970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt if (format_swiz[alpha_chan] == 3) 34070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt break; 34170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 34270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt if (alpha_chan != 4) { 34370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *shift = nir_imm_int(b, alpha_chan * 8); 34470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt dst_a = vc4_nir_splat(b, nir_iand(b, nir_ushr(b, dst_color, 34570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt shift), imm_0xff)); 34670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } else { 34770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt dst_a = nir_imm_int(b, ~0); 34870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 34970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 35070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *src_factor = vc4_blend_channel_i(b, 35170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_color, dst_color, 35270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_a, dst_a, 35370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt blend->rgb_src_factor, 35470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt alpha_chan); 35570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *dst_factor = vc4_blend_channel_i(b, 35670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_color, dst_color, 35770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_a, dst_a, 35870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt blend->rgb_dst_factor, 35970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 
alpha_chan); 36070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 36170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt if (alpha_chan != 4 && 36270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt blend->alpha_src_factor != blend->rgb_src_factor) { 36370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *src_alpha_factor = 36470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt vc4_blend_channel_i(b, 36570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_color, dst_color, 36670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_a, dst_a, 36770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt blend->alpha_src_factor, 36870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt alpha_chan); 36970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_factor = vc4_nir_set_packed_chan(b, src_factor, 37070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_alpha_factor, 37170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt alpha_chan); 37270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 37370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt if (alpha_chan != 4 && 37470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt blend->alpha_dst_factor != blend->rgb_dst_factor) { 37570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *dst_alpha_factor = 37670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt vc4_blend_channel_i(b, 37770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_color, dst_color, 37870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_a, dst_a, 37970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt blend->alpha_dst_factor, 38070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt alpha_chan); 38170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt dst_factor = vc4_nir_set_packed_chan(b, dst_factor, 38270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt dst_alpha_factor, 38370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt alpha_chan); 38470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 
38570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *src_blend = nir_umul_unorm_4x8(b, src_color, src_factor); 38670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *dst_blend = nir_umul_unorm_4x8(b, dst_color, dst_factor); 38770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 38870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *result = 38970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt vc4_blend_func_i(b, src_blend, dst_blend, blend->rgb_func); 39070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt if (alpha_chan != 4 && blend->alpha_func != blend->rgb_func) { 39170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *result_a = vc4_blend_func_i(b, 39270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_blend, 39370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt dst_blend, 39470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt blend->alpha_func); 39570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt result = vc4_nir_set_packed_chan(b, result, result_a, 39670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt alpha_chan); 397bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 39870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return result; 399bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 400bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 401bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def * 402bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvc4_logicop(nir_builder *b, int logicop_func, 403bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *src, nir_ssa_def *dst) 404bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 405bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt switch (logicop_func) { 406bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_CLEAR: 407bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_imm_int(b, 0); 408bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_NOR: 
409bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_inot(b, nir_ior(b, src, dst)); 410bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_AND_INVERTED: 411bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_iand(b, nir_inot(b, src), dst); 412bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_COPY_INVERTED: 413bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_inot(b, src); 414bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_AND_REVERSE: 415bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_iand(b, src, nir_inot(b, dst)); 416bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_INVERT: 417bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_inot(b, dst); 418bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_XOR: 419bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_ixor(b, src, dst); 420bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_NAND: 421bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_inot(b, nir_iand(b, src, dst)); 422bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_AND: 423bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_iand(b, src, dst); 424bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_EQUIV: 425bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_inot(b, nir_ixor(b, src, dst)); 426bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_NOOP: 427bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return dst; 428bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_OR_INVERTED: 429bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_ior(b, nir_inot(b, src), dst); 430bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_OR_REVERSE: 431bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_ior(b, src, nir_inot(b, dst)); 
432bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_OR: 433bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_ior(b, src, dst); 434bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_SET: 435bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_imm_int(b, ~0); 436bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt default: 437bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt fprintf(stderr, "Unknown logic op %d\n", logicop_func); 438bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt /* FALLTHROUGH */ 439bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_COPY: 440bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return src; 441bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 442bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 443bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 444bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def * 445bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvc4_nir_pipe_compare_func(nir_builder *b, int func, 446bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *src0, nir_ssa_def *src1) 447bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 448bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt switch (func) { 449bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt default: 450bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt fprintf(stderr, "Unknown compare func %d\n", func); 451bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt /* FALLTHROUGH */ 452bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_FUNC_NEVER: 453bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_imm_int(b, 0); 454bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_FUNC_ALWAYS: 455bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_imm_int(b, ~0); 456bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_FUNC_EQUAL: 457bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_feq(b, 
src0, src1); 458bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_FUNC_NOTEQUAL: 459bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fne(b, src0, src1); 460bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_FUNC_GREATER: 461bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_flt(b, src1, src0); 462bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_FUNC_GEQUAL: 463bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fge(b, src0, src1); 464bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_FUNC_LESS: 465bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_flt(b, src0, src1); 466bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_FUNC_LEQUAL: 467bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fge(b, src1, src0); 468bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 469bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 470bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 471bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic void 472bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvc4_nir_emit_alpha_test_discard(struct vc4_compile *c, nir_builder *b, 473bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *alpha) 474bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 475bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt if (!c->fs_key->alpha_test) 476bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return; 477bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 478bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *alpha_ref = 479bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt vc4_nir_get_state_uniform(b, QUNIFORM_ALPHA_REF); 480bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *condition = 481bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt vc4_nir_pipe_compare_func(b, c->fs_key->alpha_test_func, 482bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt alpha, alpha_ref); 
483bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 484bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_intrinsic_instr *discard = 485bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_intrinsic_instr_create(b->shader, 486bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_intrinsic_discard_if); 487bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt discard->num_components = 1; 488bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt discard->src[0] = nir_src_for_ssa(nir_inot(b, condition)); 489bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_builder_instr_insert(b, &discard->instr); 490bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 491bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 49270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def * 49370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_nir_swizzle_and_pack(struct vc4_compile *c, nir_builder *b, 49470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def **colors) 49570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{ 49670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt enum pipe_format color_format = c->fs_key->color_format; 49770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt const uint8_t *format_swiz = vc4_get_format_swizzle(color_format); 49870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 49970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *swizzled[4]; 50070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt for (int i = 0; i < 4; i++) { 50170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt swizzled[i] = vc4_nir_get_swizzled_channel(b, colors, 50270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt format_swiz[i]); 50370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 50470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 50570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_pack_unorm_4x8(b, 50670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_vec4(b, 50770b06fb5d55d639fd74596a2ff6971cb57c030caEric 
Anholt swizzled[0], swizzled[1], 50870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt swizzled[2], swizzled[3])); 50970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 51070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt} 51170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 512a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtstatic nir_ssa_def * 513a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtvc4_nir_blend_pipeline(struct vc4_compile *c, nir_builder *b, nir_ssa_def *src, 514a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt int sample) 515bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 516bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt enum pipe_format color_format = c->fs_key->color_format; 517bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt const uint8_t *format_swiz = vc4_get_format_swizzle(color_format); 51870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt bool srgb = util_format_is_srgb(color_format); 519bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 520bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt /* Pull out the float src/dst color components. 
*/ 521a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *packed_dst_color = vc4_nir_get_dst_color(b, sample); 522bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *dst_vec4 = nir_unpack_unorm_4x8(b, packed_dst_color); 523bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *src_color[4], *unpacked_dst_color[4]; 524bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt for (unsigned i = 0; i < 4; i++) { 525a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt src_color[i] = nir_channel(b, src, i); 5264cff16bc3a84569da05e672c8226931678aa62c0Eric Anholt unpacked_dst_color[i] = nir_channel(b, dst_vec4, i); 527bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 528bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 529a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt if (c->fs_key->sample_alpha_to_one && c->fs_key->msaa) 530a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt src_color[3] = nir_imm_float(b, 1.0); 531a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 532bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt vc4_nir_emit_alpha_test_discard(c, b, src_color[3]); 533bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 53470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *packed_color; 53570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt if (srgb) { 53670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt /* Unswizzle the destination color. 
*/ 53770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *dst_color[4]; 53870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt for (unsigned i = 0; i < 4; i++) { 53970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt dst_color[i] = vc4_nir_get_swizzled_channel(b, 54070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt unpacked_dst_color, 54170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt format_swiz[i]); 54270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 54370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 54470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt /* Turn dst color to linear. */ 545bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt for (int i = 0; i < 3; i++) 546bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt dst_color[i] = vc4_nir_srgb_decode(b, dst_color[i]); 547bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 54870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *blend_color[4]; 54970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt vc4_do_blending_f(c, b, blend_color, src_color, dst_color); 550bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 55170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt /* sRGB encode the output color */ 552bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt for (int i = 0; i < 3; i++) 553bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt blend_color[i] = vc4_nir_srgb_encode(b, blend_color[i]); 554bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 55570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt packed_color = vc4_nir_swizzle_and_pack(c, b, blend_color); 55670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } else { 55770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *packed_src_color = 55870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt vc4_nir_swizzle_and_pack(c, b, src_color); 559bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 56070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt packed_color = 56170b06fb5d55d639fd74596a2ff6971cb57c030caEric 
Anholt vc4_do_blending_i(c, b, 56270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt packed_src_color, packed_dst_color, 56370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_color[3]); 56470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 565bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 566bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt packed_color = vc4_logicop(b, c->fs_key->logicop_func, 567bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt packed_color, packed_dst_color); 568bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 569bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt /* If the bit isn't set in the color mask, then just return the 570bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * original dst color, instead. 571bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt */ 572bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt uint32_t colormask = 0xffffffff; 573bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt for (int i = 0; i < 4; i++) { 574bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt if (format_swiz[i] < 4 && 575bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt !(c->fs_key->blend.colormask & (1 << format_swiz[i]))) { 576bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt colormask &= ~(0xff << (i * 8)); 577bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 578bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 579bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 580a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt return nir_ior(b, 581a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_iand(b, packed_color, 582a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_imm_int(b, colormask)), 583a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_iand(b, packed_dst_color, 584a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_imm_int(b, ~colormask))); 585a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt} 586a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 
587a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtstatic int 588a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtvc4_nir_next_output_driver_location(nir_shader *s) 589a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt{ 590a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt int maxloc = -1; 591a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 59253b2523c6ed8202ba44596bee7ec7ba8420c4e92Eric Anholt nir_foreach_variable(var, &s->outputs) 59353b2523c6ed8202ba44596bee7ec7ba8420c4e92Eric Anholt maxloc = MAX2(maxloc, (int)var->data.driver_location); 594a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 59553b2523c6ed8202ba44596bee7ec7ba8420c4e92Eric Anholt return maxloc + 1; 596a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt} 597a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 598a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtstatic void 599a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtvc4_nir_store_sample_mask(struct vc4_compile *c, nir_builder *b, 600a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *val) 601a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt{ 602a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_variable *sample_mask = nir_variable_create(c->s, nir_var_shader_out, 603a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt glsl_uint_type(), 604a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt "sample_mask"); 605a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt sample_mask->data.driver_location = 606a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt vc4_nir_next_output_driver_location(c->s); 607a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt sample_mask->data.location = FRAG_RESULT_SAMPLE_MASK; 608a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 609a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_intrinsic_instr *intr = 610a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_intrinsic_instr_create(c->s, nir_intrinsic_store_output); 611bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 
intr->num_components = 1; 612c30b22c421d2139135519449a68bf3120710a552Eric Anholt nir_intrinsic_set_base(intr, sample_mask->data.driver_location); 613a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 614a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt intr->src[0] = nir_src_for_ssa(val); 61578b81be627734ea7fa50ea246c07b0d4a3a1638aJason Ekstrand intr->src[1] = nir_src_for_ssa(nir_imm_int(b, 0)); 616a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_builder_instr_insert(b, &intr->instr); 617a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt} 618a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 619a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtstatic void 620a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtvc4_nir_lower_blend_instr(struct vc4_compile *c, nir_builder *b, 621a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_intrinsic_instr *intr) 622a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt{ 623a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *frag_color = intr->src[0].ssa; 624a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 625a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt if (c->fs_key->sample_coverage) { 626a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_intrinsic_instr *load = 627a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_intrinsic_instr_create(b->shader, 628a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_intrinsic_load_sample_mask_in); 629a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt load->num_components = 1; 6303124ce699bb3844e793f00e00bfbea5c91744f90Connor Abbott nir_ssa_dest_init(&load->instr, &load->dest, 1, 32, NULL); 631a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_builder_instr_insert(b, &load->instr); 632a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 633a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *bitmask = &load->dest.ssa; 634a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 635a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 
vc4_nir_store_sample_mask(c, b, bitmask); 636a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt } else if (c->fs_key->sample_alpha_to_coverage) { 637a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *a = nir_channel(b, frag_color, 3); 638a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 639a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt /* XXX: We should do a nice dither based on the fragment 640a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt * coordinate, instead. 641a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt */ 642a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *num_samples = nir_imm_float(b, VC4_MAX_SAMPLES); 643a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *num_bits = nir_f2i(b, nir_fmul(b, a, num_samples)); 644a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *bitmask = nir_isub(b, 645a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ishl(b, 646a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_imm_int(b, 1), 647a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt num_bits), 648a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_imm_int(b, 1)); 649a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt vc4_nir_store_sample_mask(c, b, bitmask); 650a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt } 651a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 652a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt /* The TLB color read returns each sample in turn, so if our blending 653a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt * depends on the destination color, we're going to have to run the 654a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt * blending function separately for each destination sample value, and 655a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt * then output the per-sample color using TLB_COLOR_MS. 
656a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt */ 657a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *blend_output; 658a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt if (c->fs_key->msaa && blend_depends_on_dst_color(c)) { 659a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt c->msaa_per_sample_output = true; 660a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 661a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *samples[4]; 662a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt for (int i = 0; i < VC4_MAX_SAMPLES; i++) 663a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt samples[i] = vc4_nir_blend_pipeline(c, b, frag_color, i); 664a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt blend_output = nir_vec4(b, 665a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt samples[0], samples[1], 666a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt samples[2], samples[3]); 667a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt } else { 668a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt blend_output = vc4_nir_blend_pipeline(c, b, frag_color, 0); 669a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt } 670a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 671a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_instr_rewrite_src(&intr->instr, &intr->src[0], 672a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_src_for_ssa(blend_output)); 673a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt intr->num_components = blend_output->num_components; 674bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 675bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 676bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic bool 6777c36f9eb52ead4cb5cd0f81d1f282e0568223ca3Connor Abbottvc4_nir_lower_blend_block(nir_block *block, struct vc4_compile *c) 678bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 679707e72f13bb78869ee95d3286980bf1709cba6cfJason Ekstrand nir_foreach_instr_safe(instr, block) { 
680bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt if (instr->type != nir_instr_type_intrinsic) 681bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt continue; 682bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_intrinsic_instr *intr = nir_instr_as_intrinsic(instr); 683bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt if (intr->intrinsic != nir_intrinsic_store_output) 684bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt continue; 685bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 686bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_variable *output_var = NULL; 6876bd9e0351205dc475f45b58979702b5cf414aa07Boyan Ding nir_foreach_variable(var, &c->s->outputs) { 688c30b22c421d2139135519449a68bf3120710a552Eric Anholt if (var->data.driver_location == 689c30b22c421d2139135519449a68bf3120710a552Eric Anholt nir_intrinsic_base(intr)) { 690bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt output_var = var; 691bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt break; 692bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 693bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 694bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt assert(output_var); 6958fd3e53f3dc40e4013348e63a0cc7a2787410899Eric Anholt 696cfa980f49356eb2d94178f8cc9d67d01b4e3d695Eric Anholt if (output_var->data.location != FRAG_RESULT_COLOR && 697cfa980f49356eb2d94178f8cc9d67d01b4e3d695Eric Anholt output_var->data.location != FRAG_RESULT_DATA0) { 698bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt continue; 699cfa980f49356eb2d94178f8cc9d67d01b4e3d695Eric Anholt } 700bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 701bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_function_impl *impl = 702bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_cf_node_get_function(&block->cf_node); 703bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_builder b; 704bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_builder_init(&b, impl); 
7050a913a9d85f2eb772be6a133965c5b8a4aa3c800Kenneth Graunke b.cursor = nir_before_instr(&intr->instr); 706bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt vc4_nir_lower_blend_instr(c, &b, intr); 707bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 708bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return true; 709bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 710bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 711bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvoid 71299a759a4a3c29c283ae93612017d2f31c0ddbe73Eric Anholtvc4_nir_lower_blend(nir_shader *s, struct vc4_compile *c) 713bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 7149464d8c49813aba77285e7465b96e92a91ed327cJason Ekstrand nir_foreach_function(function, s) { 715237f2f2d8b45d9d956102eec6f9be63193e5269bJason Ekstrand if (function->impl) { 7167c36f9eb52ead4cb5cd0f81d1f282e0568223ca3Connor Abbott nir_foreach_block(block, function->impl) { 7177c36f9eb52ead4cb5cd0f81d1f282e0568223ca3Connor Abbott vc4_nir_lower_blend_block(block, c); 7187c36f9eb52ead4cb5cd0f81d1f282e0568223ca3Connor Abbott } 719bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 720237f2f2d8b45d9d956102eec6f9be63193e5269bJason Ekstrand nir_metadata_preserve(function->impl, 721bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_metadata_block_index | 722bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_metadata_dominance); 723bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 724bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 725bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 726