1bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt/* 2bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * Copyright © 2015 Broadcom 3bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * 4bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * Permission is hereby granted, free of charge, to any person obtaining a 5bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * copy of this software and associated documentation files (the "Software"), 6bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * to deal in the Software without restriction, including without limitation 7bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * and/or sell copies of the Software, and to permit persons to whom the 9bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * Software is furnished to do so, subject to the following conditions: 10bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * 11bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * The above copyright notice and this permission notice (including the next 12bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * paragraph) shall be included in all copies or substantial portions of the 13bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * Software. 14bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * 15bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 18bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING 20bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS 21bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * IN THE SOFTWARE. 22bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt */ 23bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 24bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt/** 25bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * Implements most of the fixed function fragment pipeline in shader code. 26bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * 27bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * VC4 doesn't have any hardware support for blending, alpha test, logic ops, 28bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * or color mask. Instead, you read the current contents of the destination 29bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * from the tile buffer after having waited for the scoreboard (which is 30bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * handled by vc4_qpu_emit.c), then do math using your output color and that 31bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * destination value, and update the output color appropriately. 32a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt * 33a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt * Once this pass is done, the color write will either have one component (for 34a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt * single sample) with packed argb8888, or 4 components with the per-sample 35a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt * argb8888 result. 36bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt */ 37bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 38bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt/** 39bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * Lowers fixed-function blending to a load of the destination color and a 40bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * series of ALU operations before the store of the output. 41bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt */ 42bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt#include "util/u_format.h" 43bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt#include "vc4_qir.h" 44a39a8fbbaa129f4e52f2a3ad2747182e9a74d910Emil Velikov#include "compiler/nir/nir_builder.h" 45bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt#include "vc4_context.h" 46bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 47a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtstatic bool 48a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtblend_depends_on_dst_color(struct vc4_compile *c) 49a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt{ 50a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt return (c->fs_key->blend.blend_enable || 51a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt c->fs_key->blend.colormask != 0xf || 52a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt c->fs_key->logicop_func != PIPE_LOGICOP_COPY); 53a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt} 54a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 55bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt/** Emits a load of the previous fragment color from the tile buffer. */ 56bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def * 57a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtvc4_nir_get_dst_color(nir_builder *b, int sample) 58bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 59bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_intrinsic_instr *load = 60bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_intrinsic_instr_create(b->shader, 61bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_intrinsic_load_input); 62bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt load->num_components = 1; 63c30b22c421d2139135519449a68bf3120710a552Eric Anholt nir_intrinsic_set_base(load, VC4_NIR_TLB_COLOR_READ_INPUT + sample); 6478b81be627734ea7fa50ea246c07b0d4a3a1638aJason Ekstrand load->src[0] = nir_src_for_ssa(nir_imm_int(b, 0)); 653124ce699bb3844e793f00e00bfbea5c91744f90Connor Abbott nir_ssa_dest_init(&load->instr, &load->dest, 1, 32, NULL); 66bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_builder_instr_insert(b, &load->instr); 67bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return &load->dest.ssa; 68bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 69bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 70bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def * 71bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvc4_nir_srgb_decode(nir_builder *b, nir_ssa_def *srgb) 72bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 73bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *is_low = nir_flt(b, srgb, nir_imm_float(b, 0.04045)); 74bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *low = nir_fmul(b, srgb, nir_imm_float(b, 1.0 / 12.92)); 75bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *high = nir_fpow(b, 76bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_fmul(b, 77bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_fadd(b, srgb, 78bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_imm_float(b, 0.055)), 79bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_imm_float(b, 1.0 / 1.055)), 80bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_imm_float(b, 2.4)); 81bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 82bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_bcsel(b, is_low, low, high); 83bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 84bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 85bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def * 86bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvc4_nir_srgb_encode(nir_builder *b, nir_ssa_def *linear) 87bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 88bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *is_low = nir_flt(b, linear, nir_imm_float(b, 0.0031308)); 89bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *low = nir_fmul(b, linear, nir_imm_float(b, 12.92)); 90bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *high = nir_fsub(b, 91bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_fmul(b, 92bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_imm_float(b, 1.055), 93bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_fpow(b, 94bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt linear, 95bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_imm_float(b, 0.41666))), 96bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_imm_float(b, 0.055)); 97bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 98bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_bcsel(b, is_low, low, high); 99bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 100bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 101bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def * 10270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_blend_channel_f(nir_builder *b, 10370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def **src, 10470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def **dst, 10570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt unsigned factor, 10670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt int channel) 107bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 108bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt switch(factor) { 109bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_ONE: 110bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_imm_float(b, 1.0); 111bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_SRC_COLOR: 112bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return src[channel]; 113bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_SRC_ALPHA: 114bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return src[3]; 115bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_DST_ALPHA: 116bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return dst[3]; 117bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_DST_COLOR: 118bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return dst[channel]; 119bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_SRC_ALPHA_SATURATE: 120bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt if (channel != 3) { 121bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fmin(b, 122bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt src[3], 123bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_fsub(b, 124bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_imm_float(b, 1.0), 125bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt dst[3])); 126bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } else { 127bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_imm_float(b, 1.0); 128bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 129bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_CONST_COLOR: 130e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt return nir_load_system_value(b, 131e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt nir_intrinsic_load_blend_const_color_r_float + 132e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt channel, 133e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt 0); 134bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_CONST_ALPHA: 135e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt return nir_load_blend_const_color_a_float(b); 136bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_ZERO: 137bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_imm_float(b, 0.0); 138bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_INV_SRC_COLOR: 139bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fsub(b, nir_imm_float(b, 1.0), src[channel]); 140bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_INV_SRC_ALPHA: 141bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fsub(b, nir_imm_float(b, 1.0), src[3]); 142bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_INV_DST_ALPHA: 143bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fsub(b, nir_imm_float(b, 1.0), dst[3]); 144bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_INV_DST_COLOR: 145bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fsub(b, nir_imm_float(b, 1.0), dst[channel]); 146bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_INV_CONST_COLOR: 147bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fsub(b, nir_imm_float(b, 1.0), 148e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt nir_load_system_value(b, 149e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt nir_intrinsic_load_blend_const_color_r_float + 150e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt channel, 151e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt 0)); 152bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_INV_CONST_ALPHA: 153bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fsub(b, nir_imm_float(b, 1.0), 154e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt nir_load_blend_const_color_a_float(b)); 155bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 156bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt default: 157bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_SRC1_COLOR: 158bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_SRC1_ALPHA: 159bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_INV_SRC1_COLOR: 160bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLENDFACTOR_INV_SRC1_ALPHA: 161bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt /* Unsupported. */ 162bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt fprintf(stderr, "Unknown blend factor %d\n", factor); 163bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_imm_float(b, 1.0); 164bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 165bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 166bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 167bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def * 16870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_nir_set_packed_chan(nir_builder *b, nir_ssa_def *src0, nir_ssa_def *src1, 16970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt int chan) 17070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{ 17170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt unsigned chan_mask = 0xff << (chan * 8); 17270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_ior(b, 17370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_iand(b, src0, nir_imm_int(b, ~chan_mask)), 17470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_iand(b, src1, nir_imm_int(b, chan_mask))); 17570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt} 17670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 17770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def * 17870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_blend_channel_i(nir_builder *b, 17970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *src, 18070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *dst, 18170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *src_a, 18270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *dst_a, 18370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt unsigned factor, 18470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt int a_chan) 18570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{ 18670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt switch (factor) { 18770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_ONE: 18870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_imm_int(b, ~0); 18970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_SRC_COLOR: 19070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return src; 19170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_SRC_ALPHA: 19270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return src_a; 19370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_DST_ALPHA: 19470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return dst_a; 19570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_DST_COLOR: 19670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return dst; 19770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_SRC_ALPHA_SATURATE: 19870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return vc4_nir_set_packed_chan(b, 19970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_umin_4x8(b, 20070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_a, 20170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_inot(b, dst_a)), 20270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_imm_int(b, ~0), 20370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt a_chan); 20470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_CONST_COLOR: 205e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt return nir_load_blend_const_color_rgba8888_unorm(b); 20670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_CONST_ALPHA: 207e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt return nir_load_blend_const_color_aaaa8888_unorm(b); 20870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_ZERO: 20970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_imm_int(b, 0); 21070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_INV_SRC_COLOR: 21170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_inot(b, src); 21270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_INV_SRC_ALPHA: 21370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_inot(b, src_a); 21470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_INV_DST_ALPHA: 21570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_inot(b, dst_a); 21670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_INV_DST_COLOR: 21770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_inot(b, dst); 21870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_INV_CONST_COLOR: 219e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt return nir_inot(b, 220e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt nir_load_blend_const_color_rgba8888_unorm(b)); 22170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_INV_CONST_ALPHA: 222e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt return nir_inot(b, 223e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt nir_load_blend_const_color_aaaa8888_unorm(b)); 22470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 22570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt default: 22670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_SRC1_COLOR: 22770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_SRC1_ALPHA: 22870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_INV_SRC1_COLOR: 22970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLENDFACTOR_INV_SRC1_ALPHA: 23070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt /* Unsupported. */ 23170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt fprintf(stderr, "Unknown blend factor %d\n", factor); 23270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_imm_int(b, ~0); 23370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 23470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt} 23570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 23670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def * 23770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_blend_func_f(nir_builder *b, nir_ssa_def *src, nir_ssa_def *dst, 23870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt unsigned func) 239bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 240bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt switch (func) { 241bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLEND_ADD: 242bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fadd(b, src, dst); 243bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLEND_SUBTRACT: 244bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fsub(b, src, dst); 245bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLEND_REVERSE_SUBTRACT: 246bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fsub(b, dst, src); 247bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLEND_MIN: 248bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fmin(b, src, dst); 249bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_BLEND_MAX: 250bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fmax(b, src, dst); 251bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 252bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt default: 253bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt /* Unsupported. */ 254bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt fprintf(stderr, "Unknown blend func %d\n", func); 255bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return src; 256bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 257bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 258bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 259bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 26070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def * 26170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_blend_func_i(nir_builder *b, nir_ssa_def *src, nir_ssa_def *dst, 26270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt unsigned func) 26370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{ 26470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt switch (func) { 26570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLEND_ADD: 26670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_usadd_4x8(b, src, dst); 26770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLEND_SUBTRACT: 26870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_ussub_4x8(b, src, dst); 26970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLEND_REVERSE_SUBTRACT: 27070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_ussub_4x8(b, dst, src); 27170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLEND_MIN: 27270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_umin_4x8(b, src, dst); 27370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt case PIPE_BLEND_MAX: 27470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_umax_4x8(b, src, dst); 27570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 27670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt default: 27770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt /* Unsupported. */ 27870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt fprintf(stderr, "Unknown blend func %d\n", func); 27970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return src; 28070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 28170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 28270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt} 28370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 284bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic void 28570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_do_blending_f(struct vc4_compile *c, nir_builder *b, nir_ssa_def **result, 28670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def **src_color, nir_ssa_def **dst_color) 287bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 288bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt struct pipe_rt_blend_state *blend = &c->fs_key->blend; 289bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 290bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt if (!blend->blend_enable) { 291bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt for (int i = 0; i < 4; i++) 292bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt result[i] = src_color[i]; 293bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return; 294bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 295bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 296bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt /* Clamp the src color to [0, 1]. Dest is already clamped. */ 297bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt for (int i = 0; i < 4; i++) 298bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt src_color[i] = nir_fsat(b, src_color[i]); 299bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 300bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *src_blend[4], *dst_blend[4]; 301bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt for (int i = 0; i < 4; i++) { 302bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt int src_factor = ((i != 3) ? blend->rgb_src_factor : 303bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt blend->alpha_src_factor); 304bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt int dst_factor = ((i != 3) ? blend->rgb_dst_factor : 305bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt blend->alpha_dst_factor); 306bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt src_blend[i] = nir_fmul(b, src_color[i], 30770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt vc4_blend_channel_f(b, 30870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_color, dst_color, 30970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_factor, i)); 310bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt dst_blend[i] = nir_fmul(b, dst_color[i], 31170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt vc4_blend_channel_f(b, 31270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_color, dst_color, 31370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt dst_factor, i)); 314bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 315bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 316bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt for (int i = 0; i < 4; i++) { 31770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt result[i] = vc4_blend_func_f(b, src_blend[i], dst_blend[i], 31870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt ((i != 3) ? blend->rgb_func : 31970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt blend->alpha_func)); 32070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 32170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt} 32270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 32370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def * 32470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_nir_splat(nir_builder *b, nir_ssa_def *src) 32570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{ 32670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *or1 = nir_ior(b, src, nir_ishl(b, src, nir_imm_int(b, 8))); 32770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_ior(b, or1, nir_ishl(b, or1, nir_imm_int(b, 16))); 32870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt} 32970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 33070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def * 33170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_do_blending_i(struct vc4_compile *c, nir_builder *b, 33270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *src_color, nir_ssa_def *dst_color, 33370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *src_float_a) 33470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{ 33570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt struct pipe_rt_blend_state *blend = &c->fs_key->blend; 33670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 33770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt if (!blend->blend_enable) 33870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return src_color; 33970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 34070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt enum pipe_format color_format = c->fs_key->color_format; 34170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt const uint8_t *format_swiz = vc4_get_format_swizzle(color_format); 34270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *imm_0xff = nir_imm_int(b, 0xff); 34370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *src_a = nir_pack_unorm_4x8(b, src_float_a); 34470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *dst_a; 34570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt int alpha_chan; 34670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt for (alpha_chan = 0; alpha_chan < 4; alpha_chan++) { 34770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt if (format_swiz[alpha_chan] == 3) 34870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt break; 34970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 35070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt if (alpha_chan != 4) { 35170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *shift = nir_imm_int(b, alpha_chan * 8); 35270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt dst_a = vc4_nir_splat(b, nir_iand(b, nir_ushr(b, dst_color, 35370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt shift), imm_0xff)); 35470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } else { 35570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt dst_a = nir_imm_int(b, ~0); 35670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 35770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 35870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *src_factor = vc4_blend_channel_i(b, 35970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_color, dst_color, 36070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_a, dst_a, 36170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt blend->rgb_src_factor, 36270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt alpha_chan); 36370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *dst_factor = vc4_blend_channel_i(b, 36470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_color, dst_color, 36570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_a, dst_a, 36670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt blend->rgb_dst_factor, 36770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt alpha_chan); 36870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 36970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt if (alpha_chan != 4 && 37070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt blend->alpha_src_factor != blend->rgb_src_factor) { 37170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *src_alpha_factor = 37270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt vc4_blend_channel_i(b, 37370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_color, dst_color, 37470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_a, dst_a, 37570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt blend->alpha_src_factor, 37670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt alpha_chan); 37770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_factor = vc4_nir_set_packed_chan(b, src_factor, 37870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_alpha_factor, 37970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt alpha_chan); 38070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 38170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt if (alpha_chan != 4 && 38270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt blend->alpha_dst_factor != blend->rgb_dst_factor) { 38370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *dst_alpha_factor = 38470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt vc4_blend_channel_i(b, 38570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_color, dst_color, 38670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_a, dst_a, 38770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt blend->alpha_dst_factor, 38870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt alpha_chan); 38970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt dst_factor = vc4_nir_set_packed_chan(b, dst_factor, 39070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt dst_alpha_factor, 39170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt alpha_chan); 39270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 39370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *src_blend = nir_umul_unorm_4x8(b, src_color, src_factor); 39470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *dst_blend = nir_umul_unorm_4x8(b, dst_color, dst_factor); 39570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 39670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *result = 39770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt vc4_blend_func_i(b, src_blend, dst_blend, blend->rgb_func); 39870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt if (alpha_chan != 4 && blend->alpha_func != blend->rgb_func) { 39970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *result_a = vc4_blend_func_i(b, 40070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_blend, 40170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt dst_blend, 40270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt blend->alpha_func); 40370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt result = vc4_nir_set_packed_chan(b, result, result_a, 40470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt alpha_chan); 405bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 40670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return result; 407bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 408bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 409bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def * 410bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvc4_logicop(nir_builder *b, int logicop_func, 411bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *src, nir_ssa_def *dst) 412bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 413bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt switch (logicop_func) { 414bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_CLEAR: 415bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_imm_int(b, 0); 416bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_NOR: 417bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_inot(b, nir_ior(b, src, dst)); 418bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_AND_INVERTED: 419bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_iand(b, nir_inot(b, src), dst); 420bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_COPY_INVERTED: 421bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_inot(b, src); 422bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_AND_REVERSE: 423bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_iand(b, src, nir_inot(b, dst)); 424bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_INVERT: 425bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_inot(b, dst); 426bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_XOR: 427bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_ixor(b, src, dst); 428bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_NAND: 429bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_inot(b, nir_iand(b, src, dst)); 430bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_AND: 431bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_iand(b, src, dst); 432bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_EQUIV: 433bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_inot(b, nir_ixor(b, src, dst)); 434bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_NOOP: 435bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return dst; 436bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_OR_INVERTED: 437bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_ior(b, nir_inot(b, src), dst); 438bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_OR_REVERSE: 439bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_ior(b, src, nir_inot(b, dst)); 440bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_OR: 441bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_ior(b, src, dst); 442bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_SET: 443bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_imm_int(b, ~0); 444bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt default: 445bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt fprintf(stderr, "Unknown logic op %d\n", logicop_func); 446bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt /* FALLTHROUGH */ 447bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_LOGICOP_COPY: 448bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return src; 449bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 450bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 451bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 452bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def * 453bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvc4_nir_pipe_compare_func(nir_builder *b, int func, 454bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *src0, nir_ssa_def *src1) 455bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 456bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt switch (func) { 457bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt default: 458bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt fprintf(stderr, "Unknown compare func %d\n", func); 459bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt /* FALLTHROUGH */ 460bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_FUNC_NEVER: 461bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_imm_int(b, 0); 462bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_FUNC_ALWAYS: 463bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_imm_int(b, ~0); 464bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_FUNC_EQUAL: 465bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_feq(b, src0, src1); 466bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_FUNC_NOTEQUAL: 467bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fne(b, src0, src1); 468bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_FUNC_GREATER: 469bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_flt(b, src1, src0); 470bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_FUNC_GEQUAL: 471bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fge(b, src0, src1); 472bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_FUNC_LESS: 473bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_flt(b, src0, src1); 474bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt case PIPE_FUNC_LEQUAL: 475bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return nir_fge(b, src1, src0); 476bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 477bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 478bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 479bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic void 480bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvc4_nir_emit_alpha_test_discard(struct vc4_compile *c, nir_builder *b, 481bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *alpha) 482bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 483bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt if (!c->fs_key->alpha_test) 484bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return; 485bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 486bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *condition = 487bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt vc4_nir_pipe_compare_func(b, c->fs_key->alpha_test_func, 488e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt alpha, 489e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt nir_load_alpha_ref_float(b)); 490bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 491bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_intrinsic_instr *discard = 492bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_intrinsic_instr_create(b->shader, 493bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_intrinsic_discard_if); 494bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt discard->num_components = 1; 495bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt discard->src[0] = nir_src_for_ssa(nir_inot(b, condition)); 496bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_builder_instr_insert(b, &discard->instr); 497e1af20f18a86f52a9640faf2d4ff8a71b0a4fa9bTimothy Arceri c->s->info->fs.uses_discard = true; 498bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 499bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 50070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def * 50170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_nir_swizzle_and_pack(struct vc4_compile *c, nir_builder *b, 50270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def **colors) 50370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{ 50470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt enum pipe_format color_format = c->fs_key->color_format; 50570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt const uint8_t *format_swiz = vc4_get_format_swizzle(color_format); 50670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 50770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *swizzled[4]; 50870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt for (int i = 0; i < 4; i++) { 50970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt swizzled[i] = vc4_nir_get_swizzled_channel(b, colors, 51070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt format_swiz[i]); 51170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 51270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 51370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt return nir_pack_unorm_4x8(b, 51470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_vec4(b, 51570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt swizzled[0], swizzled[1], 51670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt swizzled[2], swizzled[3])); 51770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 51870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt} 51970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 520a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtstatic nir_ssa_def * 521a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtvc4_nir_blend_pipeline(struct vc4_compile *c, nir_builder *b, nir_ssa_def *src, 522a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt int sample) 523bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 524bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt enum pipe_format color_format = c->fs_key->color_format; 525bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt const uint8_t *format_swiz = vc4_get_format_swizzle(color_format); 52670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt bool srgb = util_format_is_srgb(color_format); 527bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 528bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt /* Pull out the float src/dst color components. */ 529a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *packed_dst_color = vc4_nir_get_dst_color(b, sample); 530bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *dst_vec4 = nir_unpack_unorm_4x8(b, packed_dst_color); 531bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_ssa_def *src_color[4], *unpacked_dst_color[4]; 532bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt for (unsigned i = 0; i < 4; i++) { 533a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt src_color[i] = nir_channel(b, src, i); 5344cff16bc3a84569da05e672c8226931678aa62c0Eric Anholt unpacked_dst_color[i] = nir_channel(b, dst_vec4, i); 535bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 536bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 537a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt if (c->fs_key->sample_alpha_to_one && c->fs_key->msaa) 538a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt src_color[3] = nir_imm_float(b, 1.0); 539a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 540bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt vc4_nir_emit_alpha_test_discard(c, b, src_color[3]); 541bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 54270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *packed_color; 54370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt if (srgb) { 54470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt /* Unswizzle the destination color. */ 54570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *dst_color[4]; 54670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt for (unsigned i = 0; i < 4; i++) { 54770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt dst_color[i] = vc4_nir_get_swizzled_channel(b, 54870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt unpacked_dst_color, 54970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt format_swiz[i]); 55070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 55170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt 55270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt /* Turn dst color to linear. */ 553bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt for (int i = 0; i < 3; i++) 554bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt dst_color[i] = vc4_nir_srgb_decode(b, dst_color[i]); 555bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 55670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *blend_color[4]; 55770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt vc4_do_blending_f(c, b, blend_color, src_color, dst_color); 558bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 55970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt /* sRGB encode the output color */ 560bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt for (int i = 0; i < 3; i++) 561bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt blend_color[i] = vc4_nir_srgb_encode(b, blend_color[i]); 562bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 56370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt packed_color = vc4_nir_swizzle_and_pack(c, b, blend_color); 56470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } else { 56570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt nir_ssa_def *packed_src_color = 56670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt vc4_nir_swizzle_and_pack(c, b, src_color); 567bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 56870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt packed_color = 56970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt vc4_do_blending_i(c, b, 57070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt packed_src_color, packed_dst_color, 57170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt src_color[3]); 57270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt } 573bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 574bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt packed_color = vc4_logicop(b, c->fs_key->logicop_func, 575bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt packed_color, packed_dst_color); 576bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 577bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt /* If the bit isn't set in the color mask, then just return the 578bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * original dst color, instead. 579bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt */ 580bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt uint32_t colormask = 0xffffffff; 581bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt for (int i = 0; i < 4; i++) { 582bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt if (format_swiz[i] < 4 && 583bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt !(c->fs_key->blend.colormask & (1 << format_swiz[i]))) { 584bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt colormask &= ~(0xff << (i * 8)); 585bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 586bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 587bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 588a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt return nir_ior(b, 589a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_iand(b, packed_color, 590a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_imm_int(b, colormask)), 591a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_iand(b, packed_dst_color, 592a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_imm_int(b, ~colormask))); 593a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt} 594a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 595a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtstatic int 596a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtvc4_nir_next_output_driver_location(nir_shader *s) 597a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt{ 598a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt int maxloc = -1; 599a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 60053b2523c6ed8202ba44596bee7ec7ba8420c4e92Eric Anholt nir_foreach_variable(var, &s->outputs) 60153b2523c6ed8202ba44596bee7ec7ba8420c4e92Eric Anholt maxloc = MAX2(maxloc, (int)var->data.driver_location); 602a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 60353b2523c6ed8202ba44596bee7ec7ba8420c4e92Eric Anholt return maxloc + 1; 604a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt} 605a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 606a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtstatic void 607a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtvc4_nir_store_sample_mask(struct vc4_compile *c, nir_builder *b, 608a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *val) 609a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt{ 610a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_variable *sample_mask = nir_variable_create(c->s, nir_var_shader_out, 611a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt glsl_uint_type(), 612a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt "sample_mask"); 613a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt sample_mask->data.driver_location = 614a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt vc4_nir_next_output_driver_location(c->s); 615a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt sample_mask->data.location = FRAG_RESULT_SAMPLE_MASK; 616a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 617a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_intrinsic_instr *intr = 618a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_intrinsic_instr_create(c->s, nir_intrinsic_store_output); 619bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt intr->num_components = 1; 620c30b22c421d2139135519449a68bf3120710a552Eric Anholt nir_intrinsic_set_base(intr, sample_mask->data.driver_location); 621a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 622a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt intr->src[0] = nir_src_for_ssa(val); 62378b81be627734ea7fa50ea246c07b0d4a3a1638aJason Ekstrand intr->src[1] = nir_src_for_ssa(nir_imm_int(b, 0)); 624a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_builder_instr_insert(b, &intr->instr); 625a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt} 626a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 627a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtstatic void 628a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtvc4_nir_lower_blend_instr(struct vc4_compile *c, nir_builder *b, 629a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_intrinsic_instr *intr) 630a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt{ 631a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *frag_color = intr->src[0].ssa; 632a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 633a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt if (c->fs_key->sample_coverage) { 634a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_intrinsic_instr *load = 635a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_intrinsic_instr_create(b->shader, 636a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_intrinsic_load_sample_mask_in); 637a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt load->num_components = 1; 6383124ce699bb3844e793f00e00bfbea5c91744f90Connor Abbott nir_ssa_dest_init(&load->instr, &load->dest, 1, 32, NULL); 639a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_builder_instr_insert(b, &load->instr); 640a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 641a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *bitmask = &load->dest.ssa; 642a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 643a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt vc4_nir_store_sample_mask(c, b, bitmask); 644a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt } else if (c->fs_key->sample_alpha_to_coverage) { 645a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *a = nir_channel(b, frag_color, 3); 646a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 647a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt /* XXX: We should do a nice dither based on the fragment 648a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt * coordinate, instead. 649a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt */ 650a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *num_samples = nir_imm_float(b, VC4_MAX_SAMPLES); 651a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *num_bits = nir_f2i(b, nir_fmul(b, a, num_samples)); 652a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *bitmask = nir_isub(b, 653a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ishl(b, 654a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_imm_int(b, 1), 655a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt num_bits), 656a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_imm_int(b, 1)); 657a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt vc4_nir_store_sample_mask(c, b, bitmask); 658a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt } 659a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 660a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt /* The TLB color read returns each sample in turn, so if our blending 661a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt * depends on the destination color, we're going to have to run the 662a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt * blending function separately for each destination sample value, and 663a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt * then output the per-sample color using TLB_COLOR_MS. 664a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt */ 665a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *blend_output; 666a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt if (c->fs_key->msaa && blend_depends_on_dst_color(c)) { 667a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt c->msaa_per_sample_output = true; 668a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 669a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_ssa_def *samples[4]; 670a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt for (int i = 0; i < VC4_MAX_SAMPLES; i++) 671a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt samples[i] = vc4_nir_blend_pipeline(c, b, frag_color, i); 672a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt blend_output = nir_vec4(b, 673a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt samples[0], samples[1], 674a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt samples[2], samples[3]); 675a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt } else { 676a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt blend_output = vc4_nir_blend_pipeline(c, b, frag_color, 0); 677a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt } 678a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt 679a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_instr_rewrite_src(&intr->instr, &intr->src[0], 680a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt nir_src_for_ssa(blend_output)); 681a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt intr->num_components = blend_output->num_components; 682bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 683bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 684bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic bool 6857c36f9eb52ead4cb5cd0f81d1f282e0568223ca3Connor Abbottvc4_nir_lower_blend_block(nir_block *block, struct vc4_compile *c) 686bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 687707e72f13bb78869ee95d3286980bf1709cba6cfJason Ekstrand nir_foreach_instr_safe(instr, block) { 688bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt if (instr->type != nir_instr_type_intrinsic) 689bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt continue; 690bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_intrinsic_instr *intr = nir_instr_as_intrinsic(instr); 691bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt if (intr->intrinsic != nir_intrinsic_store_output) 692bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt continue; 693bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 694bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_variable *output_var = NULL; 6956bd9e0351205dc475f45b58979702b5cf414aa07Boyan Ding nir_foreach_variable(var, &c->s->outputs) { 696c30b22c421d2139135519449a68bf3120710a552Eric Anholt if (var->data.driver_location == 697c30b22c421d2139135519449a68bf3120710a552Eric Anholt nir_intrinsic_base(intr)) { 698bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt output_var = var; 699bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt break; 700bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 701bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 702bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt assert(output_var); 7038fd3e53f3dc40e4013348e63a0cc7a2787410899Eric Anholt 704cfa980f49356eb2d94178f8cc9d67d01b4e3d695Eric Anholt if (output_var->data.location != FRAG_RESULT_COLOR && 705cfa980f49356eb2d94178f8cc9d67d01b4e3d695Eric Anholt output_var->data.location != FRAG_RESULT_DATA0) { 706bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt continue; 707cfa980f49356eb2d94178f8cc9d67d01b4e3d695Eric Anholt } 708bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 709bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_function_impl *impl = 710bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_cf_node_get_function(&block->cf_node); 711bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_builder b; 712bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_builder_init(&b, impl); 7130a913a9d85f2eb772be6a133965c5b8a4aa3c800Kenneth Graunke b.cursor = nir_before_instr(&intr->instr); 714bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt vc4_nir_lower_blend_instr(c, &b, intr); 715bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 716bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt return true; 717bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 718bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 719bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvoid 72099a759a4a3c29c283ae93612017d2f31c0ddbe73Eric Anholtvc4_nir_lower_blend(nir_shader *s, struct vc4_compile *c) 721bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{ 7229464d8c49813aba77285e7465b96e92a91ed327cJason Ekstrand nir_foreach_function(function, s) { 723237f2f2d8b45d9d956102eec6f9be63193e5269bJason Ekstrand if (function->impl) { 7247c36f9eb52ead4cb5cd0f81d1f282e0568223ca3Connor Abbott nir_foreach_block(block, function->impl) { 7257c36f9eb52ead4cb5cd0f81d1f282e0568223ca3Connor Abbott vc4_nir_lower_blend_block(block, c); 7267c36f9eb52ead4cb5cd0f81d1f282e0568223ca3Connor Abbott } 727bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt 728237f2f2d8b45d9d956102eec6f9be63193e5269bJason Ekstrand nir_metadata_preserve(function->impl, 729bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_metadata_block_index | 730bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt nir_metadata_dominance); 731bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 732bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt } 733bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt} 734