1bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt/*
2bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * Copyright © 2015 Broadcom
3bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt *
4bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * Permission is hereby granted, free of charge, to any person obtaining a
5bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * copy of this software and associated documentation files (the "Software"),
6bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * to deal in the Software without restriction, including without limitation
7bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * and/or sell copies of the Software, and to permit persons to whom the
9bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * Software is furnished to do so, subject to the following conditions:
10bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt *
11bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * The above copyright notice and this permission notice (including the next
12bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * paragraph) shall be included in all copies or substantial portions of the
13bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * Software.
14bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt *
15bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * IN THE SOFTWARE.
22bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt */
23bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
24bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt/**
25bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * Implements most of the fixed function fragment pipeline in shader code.
26bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt *
27bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * VC4 doesn't have any hardware support for blending, alpha test, logic ops,
28bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * or color mask.  Instead, you read the current contents of the destination
29bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * from the tile buffer after having waited for the scoreboard (which is
30bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * handled by vc4_qpu_emit.c), then do math using your output color and that
31bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * destination value, and update the output color appropriately.
32a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt *
33a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt * Once this pass is done, the color write will either have one component (for
34a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt * single sample) with packed argb8888, or 4 components with the per-sample
35a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt * argb8888 result.
36bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt */
37bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
38bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt/**
39bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * Lowers fixed-function blending to a load of the destination color and a
40bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt * series of ALU operations before the store of the output.
41bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt */
42bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt#include "util/u_format.h"
43bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt#include "vc4_qir.h"
44a39a8fbbaa129f4e52f2a3ad2747182e9a74d910Emil Velikov#include "compiler/nir/nir_builder.h"
45bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt#include "vc4_context.h"
46bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
47a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtstatic bool
48a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtblend_depends_on_dst_color(struct vc4_compile *c)
49a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt{
50a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        return (c->fs_key->blend.blend_enable ||
51a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                c->fs_key->blend.colormask != 0xf ||
52a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                c->fs_key->logicop_func != PIPE_LOGICOP_COPY);
53a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt}
54a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt
55bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt/** Emits a load of the previous fragment color from the tile buffer. */
56bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def *
57a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtvc4_nir_get_dst_color(nir_builder *b, int sample)
58bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{
59bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        nir_intrinsic_instr *load =
60bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                nir_intrinsic_instr_create(b->shader,
61bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                           nir_intrinsic_load_input);
62bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        load->num_components = 1;
63c30b22c421d2139135519449a68bf3120710a552Eric Anholt        nir_intrinsic_set_base(load, VC4_NIR_TLB_COLOR_READ_INPUT + sample);
6478b81be627734ea7fa50ea246c07b0d4a3a1638aJason Ekstrand        load->src[0] = nir_src_for_ssa(nir_imm_int(b, 0));
653124ce699bb3844e793f00e00bfbea5c91744f90Connor Abbott        nir_ssa_dest_init(&load->instr, &load->dest, 1, 32, NULL);
66bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        nir_builder_instr_insert(b, &load->instr);
67bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        return &load->dest.ssa;
68bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt}
69bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
70bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic  nir_ssa_def *
71bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvc4_nir_srgb_decode(nir_builder *b, nir_ssa_def *srgb)
72bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{
73bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        nir_ssa_def *is_low = nir_flt(b, srgb, nir_imm_float(b, 0.04045));
74bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        nir_ssa_def *low = nir_fmul(b, srgb, nir_imm_float(b, 1.0 / 12.92));
75bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        nir_ssa_def *high = nir_fpow(b,
76bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                     nir_fmul(b,
77bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                              nir_fadd(b, srgb,
78bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                                       nir_imm_float(b, 0.055)),
79bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                              nir_imm_float(b, 1.0 / 1.055)),
80bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                     nir_imm_float(b, 2.4));
81bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
82bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        return nir_bcsel(b, is_low, low, high);
83bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt}
84bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
85bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic  nir_ssa_def *
86bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvc4_nir_srgb_encode(nir_builder *b, nir_ssa_def *linear)
87bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{
88bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        nir_ssa_def *is_low = nir_flt(b, linear, nir_imm_float(b, 0.0031308));
89bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        nir_ssa_def *low = nir_fmul(b, linear, nir_imm_float(b, 12.92));
90bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        nir_ssa_def *high = nir_fsub(b,
91bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                     nir_fmul(b,
92bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                              nir_imm_float(b, 1.055),
93bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                              nir_fpow(b,
94bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                                       linear,
95bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                                       nir_imm_float(b, 0.41666))),
96bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                     nir_imm_float(b, 0.055));
97bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
98bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        return nir_bcsel(b, is_low, low, high);
99bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt}
100bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
101bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def *
10270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_blend_channel_f(nir_builder *b,
10370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                    nir_ssa_def **src,
10470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                    nir_ssa_def **dst,
10570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                    unsigned factor,
10670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                    int channel)
107bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{
108bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        switch(factor) {
109bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_ONE:
110bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_imm_float(b, 1.0);
111bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_SRC_COLOR:
112bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return src[channel];
113bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_SRC_ALPHA:
114bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return src[3];
115bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_DST_ALPHA:
116bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return dst[3];
117bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_DST_COLOR:
118bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return dst[channel];
119bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_SRC_ALPHA_SATURATE:
120bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                if (channel != 3) {
121bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                        return nir_fmin(b,
122bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                        src[3],
123bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                        nir_fsub(b,
124bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                                 nir_imm_float(b, 1.0),
125bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                                 dst[3]));
126bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                } else {
127bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                        return nir_imm_float(b, 1.0);
128bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                }
129bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_CONST_COLOR:
130e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                return nir_load_system_value(b,
131e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                                             nir_intrinsic_load_blend_const_color_r_float +
132e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                                             channel,
133e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                                             0);
134bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_CONST_ALPHA:
135e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                return nir_load_blend_const_color_a_float(b);
136bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_ZERO:
137bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_imm_float(b, 0.0);
138bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_INV_SRC_COLOR:
139bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_fsub(b, nir_imm_float(b, 1.0), src[channel]);
140bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_INV_SRC_ALPHA:
141bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_fsub(b, nir_imm_float(b, 1.0), src[3]);
142bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_INV_DST_ALPHA:
143bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_fsub(b, nir_imm_float(b, 1.0), dst[3]);
144bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_INV_DST_COLOR:
145bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_fsub(b, nir_imm_float(b, 1.0), dst[channel]);
146bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_INV_CONST_COLOR:
147bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_fsub(b, nir_imm_float(b, 1.0),
148e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                                nir_load_system_value(b,
149e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                                                      nir_intrinsic_load_blend_const_color_r_float +
150e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                                                      channel,
151e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                                                      0));
152bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_INV_CONST_ALPHA:
153bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_fsub(b, nir_imm_float(b, 1.0),
154e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                                nir_load_blend_const_color_a_float(b));
155bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
156bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        default:
157bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_SRC1_COLOR:
158bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_SRC1_ALPHA:
159bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_INV_SRC1_COLOR:
160bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLENDFACTOR_INV_SRC1_ALPHA:
161bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                /* Unsupported. */
162bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                fprintf(stderr, "Unknown blend factor %d\n", factor);
163bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_imm_float(b, 1.0);
164bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        }
165bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt}
166bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
167bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def *
16870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_nir_set_packed_chan(nir_builder *b, nir_ssa_def *src0, nir_ssa_def *src1,
16970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                        int chan)
17070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{
17170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        unsigned chan_mask = 0xff << (chan * 8);
17270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        return nir_ior(b,
17370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                       nir_iand(b, src0, nir_imm_int(b, ~chan_mask)),
17470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                       nir_iand(b, src1, nir_imm_int(b, chan_mask)));
17570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt}
17670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
17770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def *
17870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_blend_channel_i(nir_builder *b,
17970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                    nir_ssa_def *src,
18070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                    nir_ssa_def *dst,
18170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                    nir_ssa_def *src_a,
18270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                    nir_ssa_def *dst_a,
18370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                    unsigned factor,
18470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                    int a_chan)
18570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{
18670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        switch (factor) {
18770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_ONE:
18870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return nir_imm_int(b, ~0);
18970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_SRC_COLOR:
19070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return src;
19170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_SRC_ALPHA:
19270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return src_a;
19370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_DST_ALPHA:
19470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return dst_a;
19570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_DST_COLOR:
19670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return dst;
19770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_SRC_ALPHA_SATURATE:
19870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return vc4_nir_set_packed_chan(b,
19970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                               nir_umin_4x8(b,
20070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                            src_a,
20170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                            nir_inot(b, dst_a)),
20270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                               nir_imm_int(b, ~0),
20370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                               a_chan);
20470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_CONST_COLOR:
205e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                return nir_load_blend_const_color_rgba8888_unorm(b);
20670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_CONST_ALPHA:
207e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                return nir_load_blend_const_color_aaaa8888_unorm(b);
20870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_ZERO:
20970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return nir_imm_int(b, 0);
21070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_INV_SRC_COLOR:
21170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return nir_inot(b, src);
21270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_INV_SRC_ALPHA:
21370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return nir_inot(b, src_a);
21470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_INV_DST_ALPHA:
21570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return nir_inot(b, dst_a);
21670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_INV_DST_COLOR:
21770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return nir_inot(b, dst);
21870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_INV_CONST_COLOR:
219e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                return nir_inot(b,
220e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                                nir_load_blend_const_color_rgba8888_unorm(b));
22170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_INV_CONST_ALPHA:
222e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                return nir_inot(b,
223e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                                nir_load_blend_const_color_aaaa8888_unorm(b));
22470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
22570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        default:
22670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_SRC1_COLOR:
22770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_SRC1_ALPHA:
22870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_INV_SRC1_COLOR:
22970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLENDFACTOR_INV_SRC1_ALPHA:
23070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                /* Unsupported. */
23170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                fprintf(stderr, "Unknown blend factor %d\n", factor);
23270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return nir_imm_int(b, ~0);
23370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        }
23470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt}
23570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
23670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def *
23770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_blend_func_f(nir_builder *b, nir_ssa_def *src, nir_ssa_def *dst,
23870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                 unsigned func)
239bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{
240bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        switch (func) {
241bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLEND_ADD:
242bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_fadd(b, src, dst);
243bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLEND_SUBTRACT:
244bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_fsub(b, src, dst);
245bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLEND_REVERSE_SUBTRACT:
246bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_fsub(b, dst, src);
247bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLEND_MIN:
248bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_fmin(b, src, dst);
249bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_BLEND_MAX:
250bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_fmax(b, src, dst);
251bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
252bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        default:
253bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                /* Unsupported. */
254bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                fprintf(stderr, "Unknown blend func %d\n", func);
255bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return src;
256bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
257bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        }
258bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt}
259bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
26070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def *
26170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_blend_func_i(nir_builder *b, nir_ssa_def *src, nir_ssa_def *dst,
26270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                 unsigned func)
26370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{
26470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        switch (func) {
26570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLEND_ADD:
26670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return nir_usadd_4x8(b, src, dst);
26770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLEND_SUBTRACT:
26870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return nir_ussub_4x8(b, src, dst);
26970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLEND_REVERSE_SUBTRACT:
27070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return nir_ussub_4x8(b, dst, src);
27170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLEND_MIN:
27270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return nir_umin_4x8(b, src, dst);
27370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        case PIPE_BLEND_MAX:
27470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return nir_umax_4x8(b, src, dst);
27570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
27670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        default:
27770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                /* Unsupported. */
27870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                fprintf(stderr, "Unknown blend func %d\n", func);
27970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return src;
28070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
28170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        }
28270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt}
28370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
284bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic void
28570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_do_blending_f(struct vc4_compile *c, nir_builder *b, nir_ssa_def **result,
28670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                  nir_ssa_def **src_color, nir_ssa_def **dst_color)
287bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{
288bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        struct pipe_rt_blend_state *blend = &c->fs_key->blend;
289bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
290bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        if (!blend->blend_enable) {
291bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                for (int i = 0; i < 4; i++)
292bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                        result[i] = src_color[i];
293bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return;
294bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        }
295bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
296bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        /* Clamp the src color to [0, 1].  Dest is already clamped. */
297bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        for (int i = 0; i < 4; i++)
298bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                src_color[i] = nir_fsat(b, src_color[i]);
299bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
300bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        nir_ssa_def *src_blend[4], *dst_blend[4];
301bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        for (int i = 0; i < 4; i++) {
302bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                int src_factor = ((i != 3) ? blend->rgb_src_factor :
303bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                  blend->alpha_src_factor);
304bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                int dst_factor = ((i != 3) ? blend->rgb_dst_factor :
305bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                  blend->alpha_dst_factor);
306bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                src_blend[i] = nir_fmul(b, src_color[i],
30770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                        vc4_blend_channel_f(b,
30870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                            src_color, dst_color,
30970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                            src_factor, i));
310bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                dst_blend[i] = nir_fmul(b, dst_color[i],
31170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                        vc4_blend_channel_f(b,
31270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                            src_color, dst_color,
31370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                            dst_factor, i));
314bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        }
315bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
316bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        for (int i = 0; i < 4; i++) {
31770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                result[i] = vc4_blend_func_f(b, src_blend[i], dst_blend[i],
31870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                             ((i != 3) ? blend->rgb_func :
31970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                              blend->alpha_func));
32070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        }
32170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt}
32270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
32370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def *
32470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_nir_splat(nir_builder *b, nir_ssa_def *src)
32570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{
32670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        nir_ssa_def *or1 = nir_ior(b, src, nir_ishl(b, src, nir_imm_int(b, 8)));
32770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        return nir_ior(b, or1, nir_ishl(b, or1, nir_imm_int(b, 16)));
32870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt}
32970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
33070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def *
33170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_do_blending_i(struct vc4_compile *c, nir_builder *b,
33270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                  nir_ssa_def *src_color, nir_ssa_def *dst_color,
33370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                  nir_ssa_def *src_float_a)
33470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{
33570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        struct pipe_rt_blend_state *blend = &c->fs_key->blend;
33670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
33770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        if (!blend->blend_enable)
33870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                return src_color;
33970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
34070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        enum pipe_format color_format = c->fs_key->color_format;
34170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        const uint8_t *format_swiz = vc4_get_format_swizzle(color_format);
34270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        nir_ssa_def *imm_0xff = nir_imm_int(b, 0xff);
34370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        nir_ssa_def *src_a = nir_pack_unorm_4x8(b, src_float_a);
34470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        nir_ssa_def *dst_a;
34570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        int alpha_chan;
34670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        for (alpha_chan = 0; alpha_chan < 4; alpha_chan++) {
34770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                if (format_swiz[alpha_chan] == 3)
34870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                        break;
34970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        }
35070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        if (alpha_chan != 4) {
35170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                nir_ssa_def *shift = nir_imm_int(b, alpha_chan * 8);
35270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                dst_a = vc4_nir_splat(b, nir_iand(b, nir_ushr(b, dst_color,
35370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                              shift), imm_0xff));
35470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        } else {
35570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                dst_a = nir_imm_int(b, ~0);
35670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        }
35770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
35870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        nir_ssa_def *src_factor = vc4_blend_channel_i(b,
35970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                      src_color, dst_color,
36070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                      src_a, dst_a,
36170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                      blend->rgb_src_factor,
36270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                      alpha_chan);
36370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        nir_ssa_def *dst_factor = vc4_blend_channel_i(b,
36470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                      src_color, dst_color,
36570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                      src_a, dst_a,
36670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                      blend->rgb_dst_factor,
36770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                      alpha_chan);
36870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
36970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        if (alpha_chan != 4 &&
37070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt            blend->alpha_src_factor != blend->rgb_src_factor) {
37170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                nir_ssa_def *src_alpha_factor =
37270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                        vc4_blend_channel_i(b,
37370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                            src_color, dst_color,
37470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                            src_a, dst_a,
37570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                            blend->alpha_src_factor,
37670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                            alpha_chan);
37770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                src_factor = vc4_nir_set_packed_chan(b, src_factor,
37870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                     src_alpha_factor,
37970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                     alpha_chan);
38070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        }
38170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        if (alpha_chan != 4 &&
38270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt            blend->alpha_dst_factor != blend->rgb_dst_factor) {
38370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                nir_ssa_def *dst_alpha_factor =
38470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                        vc4_blend_channel_i(b,
38570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                            src_color, dst_color,
38670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                            src_a, dst_a,
38770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                            blend->alpha_dst_factor,
38870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                            alpha_chan);
38970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                dst_factor = vc4_nir_set_packed_chan(b, dst_factor,
39070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                     dst_alpha_factor,
39170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                     alpha_chan);
39270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        }
39370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        nir_ssa_def *src_blend = nir_umul_unorm_4x8(b, src_color, src_factor);
39470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        nir_ssa_def *dst_blend = nir_umul_unorm_4x8(b, dst_color, dst_factor);
39570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
39670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        nir_ssa_def *result =
39770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                vc4_blend_func_i(b, src_blend, dst_blend, blend->rgb_func);
39870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        if (alpha_chan != 4 && blend->alpha_func != blend->rgb_func) {
39970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                nir_ssa_def *result_a = vc4_blend_func_i(b,
40070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                         src_blend,
40170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                         dst_blend,
40270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                         blend->alpha_func);
40370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                result = vc4_nir_set_packed_chan(b, result, result_a,
40470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                 alpha_chan);
405bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        }
40670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        return result;
407bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt}
408bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
409bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def *
410bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvc4_logicop(nir_builder *b, int logicop_func,
411bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt            nir_ssa_def *src, nir_ssa_def *dst)
412bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{
413bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        switch (logicop_func) {
414bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_LOGICOP_CLEAR:
415bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_imm_int(b, 0);
416bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_LOGICOP_NOR:
417bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_inot(b, nir_ior(b, src, dst));
418bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_LOGICOP_AND_INVERTED:
419bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_iand(b, nir_inot(b, src), dst);
420bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_LOGICOP_COPY_INVERTED:
421bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_inot(b, src);
422bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_LOGICOP_AND_REVERSE:
423bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_iand(b, src, nir_inot(b, dst));
424bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_LOGICOP_INVERT:
425bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_inot(b, dst);
426bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_LOGICOP_XOR:
427bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_ixor(b, src, dst);
428bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_LOGICOP_NAND:
429bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_inot(b, nir_iand(b, src, dst));
430bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_LOGICOP_AND:
431bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_iand(b, src, dst);
432bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_LOGICOP_EQUIV:
433bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_inot(b, nir_ixor(b, src, dst));
434bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_LOGICOP_NOOP:
435bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return dst;
436bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_LOGICOP_OR_INVERTED:
437bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_ior(b, nir_inot(b, src), dst);
438bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_LOGICOP_OR_REVERSE:
439bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_ior(b, src, nir_inot(b, dst));
440bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_LOGICOP_OR:
441bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_ior(b, src, dst);
442bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_LOGICOP_SET:
443bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_imm_int(b, ~0);
444bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        default:
445bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                fprintf(stderr, "Unknown logic op %d\n", logicop_func);
446bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                /* FALLTHROUGH */
447bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_LOGICOP_COPY:
448bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return src;
449bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        }
450bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt}
451bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
452bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic nir_ssa_def *
453bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvc4_nir_pipe_compare_func(nir_builder *b, int func,
454bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                          nir_ssa_def *src0, nir_ssa_def *src1)
455bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{
456bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        switch (func) {
457bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        default:
458bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                fprintf(stderr, "Unknown compare func %d\n", func);
459bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                /* FALLTHROUGH */
460bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_FUNC_NEVER:
461bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_imm_int(b, 0);
462bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_FUNC_ALWAYS:
463bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_imm_int(b, ~0);
464bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_FUNC_EQUAL:
465bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_feq(b, src0, src1);
466bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_FUNC_NOTEQUAL:
467bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_fne(b, src0, src1);
468bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_FUNC_GREATER:
469bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_flt(b, src1, src0);
470bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_FUNC_GEQUAL:
471bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_fge(b, src0, src1);
472bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_FUNC_LESS:
473bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_flt(b, src0, src1);
474bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        case PIPE_FUNC_LEQUAL:
475bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return nir_fge(b, src1, src0);
476bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        }
477bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt}
478bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
479bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic void
480bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvc4_nir_emit_alpha_test_discard(struct vc4_compile *c, nir_builder *b,
481bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                nir_ssa_def *alpha)
482bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{
483bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        if (!c->fs_key->alpha_test)
484bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                return;
485bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
486bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        nir_ssa_def *condition =
487bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                vc4_nir_pipe_compare_func(b, c->fs_key->alpha_test_func,
488e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                                          alpha,
489e8378fee0c20ecd26451c079c725420077606cb9Eric Anholt                                          nir_load_alpha_ref_float(b));
490bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
491bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        nir_intrinsic_instr *discard =
492bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                nir_intrinsic_instr_create(b->shader,
493bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                           nir_intrinsic_discard_if);
494bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        discard->num_components = 1;
495bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        discard->src[0] = nir_src_for_ssa(nir_inot(b, condition));
496bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        nir_builder_instr_insert(b, &discard->instr);
497e1af20f18a86f52a9640faf2d4ff8a71b0a4fa9bTimothy Arceri        c->s->info->fs.uses_discard = true;
498bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt}
499bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
50070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtstatic nir_ssa_def *
50170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholtvc4_nir_swizzle_and_pack(struct vc4_compile *c, nir_builder *b,
50270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                         nir_ssa_def **colors)
50370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt{
50470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        enum pipe_format color_format = c->fs_key->color_format;
50570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        const uint8_t *format_swiz = vc4_get_format_swizzle(color_format);
50670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
50770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        nir_ssa_def *swizzled[4];
50870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        for (int i = 0; i < 4; i++) {
50970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                swizzled[i] = vc4_nir_get_swizzled_channel(b, colors,
51070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                           format_swiz[i]);
51170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        }
51270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
51370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        return nir_pack_unorm_4x8(b,
51470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                  nir_vec4(b,
51570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                           swizzled[0], swizzled[1],
51670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                           swizzled[2], swizzled[3]));
51770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
51870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt}
51970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
520a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtstatic nir_ssa_def *
521a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtvc4_nir_blend_pipeline(struct vc4_compile *c, nir_builder *b, nir_ssa_def *src,
522a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                       int sample)
523bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{
524bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        enum pipe_format color_format = c->fs_key->color_format;
525bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        const uint8_t *format_swiz = vc4_get_format_swizzle(color_format);
52670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        bool srgb = util_format_is_srgb(color_format);
527bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
528bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        /* Pull out the float src/dst color components. */
529a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        nir_ssa_def *packed_dst_color = vc4_nir_get_dst_color(b, sample);
530bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        nir_ssa_def *dst_vec4 = nir_unpack_unorm_4x8(b, packed_dst_color);
531bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        nir_ssa_def *src_color[4], *unpacked_dst_color[4];
532bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        for (unsigned i = 0; i < 4; i++) {
533a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                src_color[i] = nir_channel(b, src, i);
5344cff16bc3a84569da05e672c8226931678aa62c0Eric Anholt                unpacked_dst_color[i] = nir_channel(b, dst_vec4, i);
535bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        }
536bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
537a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        if (c->fs_key->sample_alpha_to_one && c->fs_key->msaa)
538a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                src_color[3] = nir_imm_float(b, 1.0);
539a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt
540bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        vc4_nir_emit_alpha_test_discard(c, b, src_color[3]);
541bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
54270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        nir_ssa_def *packed_color;
54370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        if (srgb) {
54470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                /* Unswizzle the destination color. */
54570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                nir_ssa_def *dst_color[4];
54670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                for (unsigned i = 0; i < 4; i++) {
54770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                        dst_color[i] = vc4_nir_get_swizzled_channel(b,
54870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                                    unpacked_dst_color,
54970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                                                    format_swiz[i]);
55070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                }
55170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt
55270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                /* Turn dst color to linear. */
553bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                for (int i = 0; i < 3; i++)
554bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                        dst_color[i] = vc4_nir_srgb_decode(b, dst_color[i]);
555bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
55670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                nir_ssa_def *blend_color[4];
55770b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                vc4_do_blending_f(c, b, blend_color, src_color, dst_color);
558bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
55970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                /* sRGB encode the output color */
560bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                for (int i = 0; i < 3; i++)
561bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                        blend_color[i] = vc4_nir_srgb_encode(b, blend_color[i]);
562bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
56370b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                packed_color = vc4_nir_swizzle_and_pack(c, b, blend_color);
56470b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        } else {
56570b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                nir_ssa_def *packed_src_color =
56670b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                        vc4_nir_swizzle_and_pack(c, b, src_color);
567bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
56870b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                packed_color =
56970b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                        vc4_do_blending_i(c, b,
57070b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                          packed_src_color, packed_dst_color,
57170b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt                                          src_color[3]);
57270b06fb5d55d639fd74596a2ff6971cb57c030caEric Anholt        }
573bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
574bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        packed_color = vc4_logicop(b, c->fs_key->logicop_func,
575bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                   packed_color, packed_dst_color);
576bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
577bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        /* If the bit isn't set in the color mask, then just return the
578bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt         * original dst color, instead.
579bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt         */
580bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        uint32_t colormask = 0xffffffff;
581bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        for (int i = 0; i < 4; i++) {
582bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                if (format_swiz[i] < 4 &&
583bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                    !(c->fs_key->blend.colormask & (1 << format_swiz[i]))) {
584bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                        colormask &= ~(0xff << (i * 8));
585bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                }
586bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        }
587bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
588a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        return nir_ior(b,
589a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                       nir_iand(b, packed_color,
590a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                                nir_imm_int(b, colormask)),
591a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                       nir_iand(b, packed_dst_color,
592a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                                nir_imm_int(b, ~colormask)));
593a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt}
594a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt
595a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtstatic int
596a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtvc4_nir_next_output_driver_location(nir_shader *s)
597a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt{
598a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        int maxloc = -1;
599a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt
60053b2523c6ed8202ba44596bee7ec7ba8420c4e92Eric Anholt        nir_foreach_variable(var, &s->outputs)
60153b2523c6ed8202ba44596bee7ec7ba8420c4e92Eric Anholt                maxloc = MAX2(maxloc, (int)var->data.driver_location);
602a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt
60353b2523c6ed8202ba44596bee7ec7ba8420c4e92Eric Anholt        return maxloc + 1;
604a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt}
605a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt
606a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtstatic void
607a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtvc4_nir_store_sample_mask(struct vc4_compile *c, nir_builder *b,
608a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                          nir_ssa_def *val)
609a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt{
610a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        nir_variable *sample_mask = nir_variable_create(c->s, nir_var_shader_out,
611a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                                                        glsl_uint_type(),
612a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                                                        "sample_mask");
613a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        sample_mask->data.driver_location =
614a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                vc4_nir_next_output_driver_location(c->s);
615a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        sample_mask->data.location = FRAG_RESULT_SAMPLE_MASK;
616a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt
617a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        nir_intrinsic_instr *intr =
618a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                nir_intrinsic_instr_create(c->s, nir_intrinsic_store_output);
619bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        intr->num_components = 1;
620c30b22c421d2139135519449a68bf3120710a552Eric Anholt        nir_intrinsic_set_base(intr, sample_mask->data.driver_location);
621a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt
622a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        intr->src[0] = nir_src_for_ssa(val);
62378b81be627734ea7fa50ea246c07b0d4a3a1638aJason Ekstrand        intr->src[1] = nir_src_for_ssa(nir_imm_int(b, 0));
624a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        nir_builder_instr_insert(b, &intr->instr);
625a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt}
626a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt
627a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtstatic void
628a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholtvc4_nir_lower_blend_instr(struct vc4_compile *c, nir_builder *b,
629a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                          nir_intrinsic_instr *intr)
630a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt{
631a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        nir_ssa_def *frag_color = intr->src[0].ssa;
632a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt
633a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        if (c->fs_key->sample_coverage) {
634a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                nir_intrinsic_instr *load =
635a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                        nir_intrinsic_instr_create(b->shader,
636a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                                                   nir_intrinsic_load_sample_mask_in);
637a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                load->num_components = 1;
6383124ce699bb3844e793f00e00bfbea5c91744f90Connor Abbott                nir_ssa_dest_init(&load->instr, &load->dest, 1, 32, NULL);
639a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                nir_builder_instr_insert(b, &load->instr);
640a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt
641a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                nir_ssa_def *bitmask = &load->dest.ssa;
642a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt
643a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                vc4_nir_store_sample_mask(c, b, bitmask);
644a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        } else if (c->fs_key->sample_alpha_to_coverage) {
645a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                nir_ssa_def *a = nir_channel(b, frag_color, 3);
646a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt
647a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                /* XXX: We should do a nice dither based on the fragment
648a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                 * coordinate, instead.
649a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                 */
650a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                nir_ssa_def *num_samples = nir_imm_float(b, VC4_MAX_SAMPLES);
651a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                nir_ssa_def *num_bits = nir_f2i(b, nir_fmul(b, a, num_samples));
652a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                nir_ssa_def *bitmask = nir_isub(b,
653a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                                                nir_ishl(b,
654a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                                                         nir_imm_int(b, 1),
655a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                                                         num_bits),
656a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                                                nir_imm_int(b, 1));
657a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                vc4_nir_store_sample_mask(c, b, bitmask);
658a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        }
659a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt
660a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        /* The TLB color read returns each sample in turn, so if our blending
661a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt         * depends on the destination color, we're going to have to run the
662a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt         * blending function separately for each destination sample value, and
663a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt         * then output the per-sample color using TLB_COLOR_MS.
664a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt         */
665a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        nir_ssa_def *blend_output;
666a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        if (c->fs_key->msaa && blend_depends_on_dst_color(c)) {
667a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                c->msaa_per_sample_output = true;
668a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt
669a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                nir_ssa_def *samples[4];
670a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                for (int i = 0; i < VC4_MAX_SAMPLES; i++)
671a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                        samples[i] = vc4_nir_blend_pipeline(c, b, frag_color, i);
672a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                blend_output = nir_vec4(b,
673a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                                        samples[0], samples[1],
674a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                                        samples[2], samples[3]);
675a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        } else {
676a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                blend_output = vc4_nir_blend_pipeline(c, b, frag_color, 0);
677a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        }
678a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt
679a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        nir_instr_rewrite_src(&intr->instr, &intr->src[0],
680a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt                              nir_src_for_ssa(blend_output));
681a97b40dca4949b5b8b3320e76768e54f430c9e78Eric Anholt        intr->num_components = blend_output->num_components;
682bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt}
683bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
684bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtstatic bool
6857c36f9eb52ead4cb5cd0f81d1f282e0568223ca3Connor Abbottvc4_nir_lower_blend_block(nir_block *block, struct vc4_compile *c)
686bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{
687707e72f13bb78869ee95d3286980bf1709cba6cfJason Ekstrand        nir_foreach_instr_safe(instr, block) {
688bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                if (instr->type != nir_instr_type_intrinsic)
689bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                        continue;
690bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                nir_intrinsic_instr *intr = nir_instr_as_intrinsic(instr);
691bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                if (intr->intrinsic != nir_intrinsic_store_output)
692bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                        continue;
693bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
694bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                nir_variable *output_var = NULL;
6956bd9e0351205dc475f45b58979702b5cf414aa07Boyan Ding                nir_foreach_variable(var, &c->s->outputs) {
696c30b22c421d2139135519449a68bf3120710a552Eric Anholt                        if (var->data.driver_location ==
697c30b22c421d2139135519449a68bf3120710a552Eric Anholt                            nir_intrinsic_base(intr)) {
698bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                output_var = var;
699bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                break;
700bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                        }
701bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                }
702bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                assert(output_var);
7038fd3e53f3dc40e4013348e63a0cc7a2787410899Eric Anholt
704cfa980f49356eb2d94178f8cc9d67d01b4e3d695Eric Anholt                if (output_var->data.location != FRAG_RESULT_COLOR &&
705cfa980f49356eb2d94178f8cc9d67d01b4e3d695Eric Anholt                    output_var->data.location != FRAG_RESULT_DATA0) {
706bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                        continue;
707cfa980f49356eb2d94178f8cc9d67d01b4e3d695Eric Anholt                }
708bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
709bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                nir_function_impl *impl =
710bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                        nir_cf_node_get_function(&block->cf_node);
711bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                nir_builder b;
712bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                nir_builder_init(&b, impl);
7130a913a9d85f2eb772be6a133965c5b8a4aa3c800Kenneth Graunke                b.cursor = nir_before_instr(&intr->instr);
714bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                vc4_nir_lower_blend_instr(c, &b, intr);
715bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        }
716bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        return true;
717bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt}
718bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
719bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholtvoid
72099a759a4a3c29c283ae93612017d2f31c0ddbe73Eric Anholtvc4_nir_lower_blend(nir_shader *s, struct vc4_compile *c)
721bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt{
7229464d8c49813aba77285e7465b96e92a91ed327cJason Ekstrand        nir_foreach_function(function, s) {
723237f2f2d8b45d9d956102eec6f9be63193e5269bJason Ekstrand                if (function->impl) {
7247c36f9eb52ead4cb5cd0f81d1f282e0568223ca3Connor Abbott                        nir_foreach_block(block, function->impl) {
7257c36f9eb52ead4cb5cd0f81d1f282e0568223ca3Connor Abbott                                vc4_nir_lower_blend_block(block, c);
7267c36f9eb52ead4cb5cd0f81d1f282e0568223ca3Connor Abbott                        }
727bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt
728237f2f2d8b45d9d956102eec6f9be63193e5269bJason Ekstrand                        nir_metadata_preserve(function->impl,
729bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                              nir_metadata_block_index |
730bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                                              nir_metadata_dominance);
731bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt                }
732bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt        }
733bf3c50fba221f216e38d3f60f89161ced4c684c0Eric Anholt}
734