blob: c73bb4211d20fd1d7ef96814c86c250de1b4a540 [file] [log] [blame]
// Copyright 2016 The SwiftShader Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//    http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
14
#include "PixelProgram.hpp"

#include "Constants.hpp"
#include "SamplerCore.hpp"
#include "Device/Primitive.hpp"
#include "Device/Renderer.hpp"
#include "Vulkan/VkDevice.hpp"
Nicolas Capens68a82382018-10-02 13:16:55 -040022
Nicolas Capens157ba262019-12-10 17:49:14 -050023namespace sw {
24
Nicolas Capens28556362021-07-24 02:36:09 -040025PixelProgram::PixelProgram(
26 const PixelProcessor::State &state,
27 const vk::PipelineLayout *pipelineLayout,
28 const SpirvShader *spirvShader,
29 const vk::DescriptorSet::Bindings &descriptorSets)
30 : PixelRoutine(state, pipelineLayout, spirvShader, descriptorSets)
31{
32}
33
Nicolas Capensafdb5122022-06-30 11:31:35 -040034// Union all cMask and return it as Booleans
35SIMD::Int PixelProgram::maskAny(Int cMask[4], const SampleSet &samples)
Nicolas Capens68a82382018-10-02 13:16:55 -040036{
Nicolas Capens157ba262019-12-10 17:49:14 -050037 // See if at least 1 sample is used
Nicolas Capens28556362021-07-24 02:36:09 -040038 Int maskUnion = 0;
39 for(unsigned int q : samples)
Alexis Hetu920100c2019-07-15 17:25:02 -040040 {
Nicolas Capens28556362021-07-24 02:36:09 -040041 maskUnion |= cMask[q];
Nicolas Capens157ba262019-12-10 17:49:14 -050042 }
Alexis Hetu920100c2019-07-15 17:25:02 -040043
Nicolas Capensafdb5122022-06-30 11:31:35 -040044 // Convert to Booleans
Nicolas Capens02658a72022-07-03 01:20:37 -040045 SIMD::Int laneBits = SIMD::Int([](int i) { return 1 << i; }); // 1, 2, 4, 8, ...
Nicolas Capensafdb5122022-06-30 11:31:35 -040046 SIMD::Int mask(maskUnion);
Nicolas Capens02658a72022-07-03 01:20:37 -040047 mask = CmpNEQ(mask & laneBits, 0);
Nicolas Capens157ba262019-12-10 17:49:14 -050048 return mask;
49}
50
Nicolas Capensafdb5122022-06-30 11:31:35 -040051// Union all cMask/sMask/zMask and return it as Booleans
52SIMD::Int PixelProgram::maskAny(Int cMask[4], Int sMask[4], Int zMask[4], const SampleSet &samples)
Nicolas Capens157ba262019-12-10 17:49:14 -050053{
54 // See if at least 1 sample is used
Nicolas Capens28556362021-07-24 02:36:09 -040055 Int maskUnion = 0;
56 for(unsigned int q : samples)
Nicolas Capens157ba262019-12-10 17:49:14 -050057 {
Nicolas Capens28556362021-07-24 02:36:09 -040058 maskUnion |= (cMask[q] & sMask[q] & zMask[q]);
Nicolas Capens157ba262019-12-10 17:49:14 -050059 }
60
Nicolas Capensafdb5122022-06-30 11:31:35 -040061 // Convert to Booleans
Nicolas Capens02658a72022-07-03 01:20:37 -040062 SIMD::Int laneBits = SIMD::Int([](int i) { return 1 << i; }); // 1, 2, 4, 8, ...
Nicolas Capensafdb5122022-06-30 11:31:35 -040063 SIMD::Int mask(maskUnion);
Nicolas Capens02658a72022-07-03 01:20:37 -040064 mask = CmpNEQ(mask & laneBits, 0);
Nicolas Capens157ba262019-12-10 17:49:14 -050065 return mask;
66}
67
Nicolas Capensafdb5122022-06-30 11:31:35 -040068void PixelProgram::setBuiltins(Int &x, Int &y, SIMD::Float (&z)[4], SIMD::Float &w, Int cMask[4], const SampleSet &samples)
Nicolas Capens157ba262019-12-10 17:49:14 -050069{
70 routine.setImmutableInputBuiltins(spirvShader);
71
Ben Clayton5beaef92019-12-03 12:23:35 +000072 // TODO(b/146486064): Consider only assigning these to the SpirvRoutine iff
73 // they are ever going to be read.
Alexis Hetu09df3eb2021-01-14 10:46:33 -050074 float x0 = 0.5f;
75 float y0 = 0.5f;
76 float x1 = 1.5f;
77 float y1 = 1.5f;
Nicolas Capens28556362021-07-24 02:36:09 -040078
79 // "When Sample Shading is enabled, the x and y components of FragCoord reflect the
80 // location of one of the samples corresponding to the shader invocation. Otherwise,
81 // the x and y components of FragCoord reflect the location of the center of the fragment."
82 if(state.sampleShadingEnabled && state.multiSampleCount > 1)
Alexis Hetu09df3eb2021-01-14 10:46:33 -050083 {
Nicolas Capens1c8155a2022-06-29 03:13:02 -040084 x0 = VkSampleLocations4[samples[0]][0];
85 y0 = VkSampleLocations4[samples[0]][1];
Alexis Hetu09df3eb2021-01-14 10:46:33 -050086 x1 = 1.0f + x0;
87 y1 = 1.0f + y0;
88 }
Nicolas Capens28556362021-07-24 02:36:09 -040089
Alexis Hetu09df3eb2021-01-14 10:46:33 -050090 routine.fragCoord[0] = SIMD::Float(Float(x)) + SIMD::Float(x0, x1, x0, x1);
91 routine.fragCoord[1] = SIMD::Float(Float(y)) + SIMD::Float(y0, y0, y1, y1);
Ben Clayton5beaef92019-12-03 12:23:35 +000092 routine.fragCoord[2] = z[0]; // sample 0
93 routine.fragCoord[3] = w;
Marc-Antoine Desrochesb44162f2020-03-05 13:35:43 -050094
Ben Clayton5beaef92019-12-03 12:23:35 +000095 routine.invocationsPerSubgroup = SIMD::Width;
Nicolas Capens28556362021-07-24 02:36:09 -040096 routine.helperInvocation = ~maskAny(cMask, samples);
Nicolas Capens3edbc042022-03-01 16:02:18 -050097 routine.windowSpacePosition[0] = SIMD::Int(x) + SIMD::Int(0, 1, 0, 1);
98 routine.windowSpacePosition[1] = SIMD::Int(y) + SIMD::Int(0, 0, 1, 1);
Alexis Hetu310874c2022-02-23 10:57:58 -050099 routine.layer = *Pointer<Int>(data + OFFSET(DrawData, layer));
Ben Clayton5beaef92019-12-03 12:23:35 +0000100
Ben Clayton200a4632020-09-25 17:33:17 +0100101 // PointCoord formula reference: https://www.khronos.org/registry/vulkan/specs/1.2/html/vkspec.html#primsrast-points-basic
102 // Note we don't add a 0.5 offset to x and y here (like for fragCoord) because pointCoordX/Y have 0.5 subtracted as part of the viewport transform.
103 SIMD::Float pointSizeInv = SIMD::Float(*Pointer<Float>(primitive + OFFSET(Primitive, pointSizeInv)));
Nicolas Capensdb643372022-08-10 22:28:12 -0400104 routine.pointCoord[0] = SIMD::Float(0.5f) + pointSizeInv * (((SIMD::Float(Float(x)) + SIMD::Float(0.0f, 1.0f, 0.0f, 1.0f)) - SIMD::Float(*Pointer<Float>(primitive + OFFSET(Primitive, x0)))));
105 routine.pointCoord[1] = SIMD::Float(0.5f) + pointSizeInv * (((SIMD::Float(Float(y)) + SIMD::Float(0.0f, 0.0f, 1.0f, 1.0f)) - SIMD::Float(*Pointer<Float>(primitive + OFFSET(Primitive, y0)))));
Ben Clayton200a4632020-09-25 17:33:17 +0100106
Nicolas Capens71134742022-10-12 12:44:16 -0400107 routine.setInputBuiltin(spirvShader, spv::BuiltInViewIndex, [&](const Spirv::BuiltinMapping &builtin, Array<SIMD::Float> &value) {
Nicolas Capens157ba262019-12-10 17:49:14 -0500108 assert(builtin.SizeInComponents == 1);
Alexis Hetu310874c2022-02-23 10:57:58 -0500109 value[builtin.FirstComponent] = As<SIMD::Float>(SIMD::Int(routine.layer));
Nicolas Capens157ba262019-12-10 17:49:14 -0500110 });
111
Nicolas Capens71134742022-10-12 12:44:16 -0400112 routine.setInputBuiltin(spirvShader, spv::BuiltInFragCoord, [&](const Spirv::BuiltinMapping &builtin, Array<SIMD::Float> &value) {
Nicolas Capens157ba262019-12-10 17:49:14 -0500113 assert(builtin.SizeInComponents == 4);
Ben Clayton5beaef92019-12-03 12:23:35 +0000114 value[builtin.FirstComponent + 0] = routine.fragCoord[0];
115 value[builtin.FirstComponent + 1] = routine.fragCoord[1];
116 value[builtin.FirstComponent + 2] = routine.fragCoord[2];
117 value[builtin.FirstComponent + 3] = routine.fragCoord[3];
Nicolas Capens157ba262019-12-10 17:49:14 -0500118 });
119
Nicolas Capens71134742022-10-12 12:44:16 -0400120 routine.setInputBuiltin(spirvShader, spv::BuiltInPointCoord, [&](const Spirv::BuiltinMapping &builtin, Array<SIMD::Float> &value) {
Nicolas Capens157ba262019-12-10 17:49:14 -0500121 assert(builtin.SizeInComponents == 2);
Ben Clayton200a4632020-09-25 17:33:17 +0100122 value[builtin.FirstComponent + 0] = routine.pointCoord[0];
123 value[builtin.FirstComponent + 1] = routine.pointCoord[1];
Nicolas Capens157ba262019-12-10 17:49:14 -0500124 });
125
Nicolas Capens71134742022-10-12 12:44:16 -0400126 routine.setInputBuiltin(spirvShader, spv::BuiltInSubgroupSize, [&](const Spirv::BuiltinMapping &builtin, Array<SIMD::Float> &value) {
Nicolas Capens157ba262019-12-10 17:49:14 -0500127 assert(builtin.SizeInComponents == 1);
128 value[builtin.FirstComponent] = As<SIMD::Float>(SIMD::Int(SIMD::Width));
129 });
130
Nicolas Capens71134742022-10-12 12:44:16 -0400131 routine.setInputBuiltin(spirvShader, spv::BuiltInHelperInvocation, [&](const Spirv::BuiltinMapping &builtin, Array<SIMD::Float> &value) {
Nicolas Capens157ba262019-12-10 17:49:14 -0500132 assert(builtin.SizeInComponents == 1);
Ben Clayton5beaef92019-12-03 12:23:35 +0000133 value[builtin.FirstComponent] = As<SIMD::Float>(routine.helperInvocation);
Nicolas Capens157ba262019-12-10 17:49:14 -0500134 });
Nicolas Capens157ba262019-12-10 17:49:14 -0500135}
136
Nicolas Capens28556362021-07-24 02:36:09 -0400137void PixelProgram::executeShader(Int cMask[4], Int sMask[4], Int zMask[4], const SampleSet &samples)
Nicolas Capens157ba262019-12-10 17:49:14 -0500138{
Nicolas Capens06aaffa2021-11-10 10:19:50 -0500139 routine.device = device;
Nicolas Capens157ba262019-12-10 17:49:14 -0500140 routine.descriptorSets = data + OFFSET(DrawData, descriptorSets);
141 routine.descriptorDynamicOffsets = data + OFFSET(DrawData, descriptorDynamicOffsets);
142 routine.pushConstants = data + OFFSET(DrawData, pushConstants);
Nicolas Capens678d3932021-11-04 16:01:31 -0400143 routine.constants = device + OFFSET(vk::Device, constants);
Nicolas Capens157ba262019-12-10 17:49:14 -0500144
145 auto it = spirvShader->inputBuiltins.find(spv::BuiltInFrontFacing);
Nicolas Capens81bc9d92019-12-16 15:05:57 -0500146 if(it != spirvShader->inputBuiltins.end())
Nicolas Capens157ba262019-12-10 17:49:14 -0500147 {
148 ASSERT(it->second.SizeInComponents == 1);
Nicolas Capensafdb5122022-06-30 11:31:35 -0400149 auto frontFacing = SIMD::Int(*Pointer<Int>(primitive + OFFSET(Primitive, clockwiseMask)));
150 routine.getVariable(it->second.Id)[it->second.FirstComponent] = As<SIMD::Float>(frontFacing);
Nicolas Capens157ba262019-12-10 17:49:14 -0500151 }
152
153 it = spirvShader->inputBuiltins.find(spv::BuiltInSampleMask);
Nicolas Capens81bc9d92019-12-16 15:05:57 -0500154 if(it != spirvShader->inputBuiltins.end())
Nicolas Capens157ba262019-12-10 17:49:14 -0500155 {
Nicolas Capensafdb5122022-06-30 11:31:35 -0400156 ASSERT(SIMD::Width == 4);
157 SIMD::Int laneBits = SIMD::Int(1, 2, 4, 8);
Nicolas Capens157ba262019-12-10 17:49:14 -0500158
Nicolas Capensafdb5122022-06-30 11:31:35 -0400159 SIMD::Int inputSampleMask = 0;
Nicolas Capens28556362021-07-24 02:36:09 -0400160 for(unsigned int q : samples)
Nicolas Capens157ba262019-12-10 17:49:14 -0500161 {
Nicolas Capensafdb5122022-06-30 11:31:35 -0400162 inputSampleMask |= SIMD::Int(1 << q) & CmpNEQ(SIMD::Int(cMask[q]) & laneBits, 0);
Nicolas Capens157ba262019-12-10 17:49:14 -0500163 }
164
Nicolas Capensafdb5122022-06-30 11:31:35 -0400165 routine.getVariable(it->second.Id)[it->second.FirstComponent] = As<SIMD::Float>(inputSampleMask);
Nicolas Capens157ba262019-12-10 17:49:14 -0500166 // Sample mask input is an array, as the spec contemplates MSAA levels higher than 32.
167 // Fill any non-zero indices with 0.
Nicolas Capens81bc9d92019-12-16 15:05:57 -0500168 for(auto i = 1u; i < it->second.SizeInComponents; i++)
Nicolas Capens28556362021-07-24 02:36:09 -0400169 {
Nicolas Capensafdb5122022-06-30 11:31:35 -0400170 routine.getVariable(it->second.Id)[it->second.FirstComponent + i] = 0;
Nicolas Capens28556362021-07-24 02:36:09 -0400171 }
Alexis Hetu920100c2019-07-15 17:25:02 -0400172 }
173
Alexis Hetu377716d2021-01-14 11:16:05 -0500174 it = spirvShader->inputBuiltins.find(spv::BuiltInSampleId);
175 if(it != spirvShader->inputBuiltins.end())
176 {
Nicolas Capens28556362021-07-24 02:36:09 -0400177 ASSERT(samples.size() == 1);
178 int sampleId = samples[0];
Alexis Hetu377716d2021-01-14 11:16:05 -0500179 routine.getVariable(it->second.Id)[it->second.FirstComponent] =
Nicolas Capens28556362021-07-24 02:36:09 -0400180 As<SIMD::Float>(SIMD::Int(sampleId));
Alexis Hetu377716d2021-01-14 11:16:05 -0500181 }
182
183 it = spirvShader->inputBuiltins.find(spv::BuiltInSamplePosition);
184 if(it != spirvShader->inputBuiltins.end())
185 {
Nicolas Capens28556362021-07-24 02:36:09 -0400186 ASSERT(samples.size() == 1);
187 int sampleId = samples[0];
Alexis Hetu377716d2021-01-14 11:16:05 -0500188 routine.getVariable(it->second.Id)[it->second.FirstComponent + 0] =
Nicolas Capens1c8155a2022-06-29 03:13:02 -0400189 SIMD::Float((state.multiSampleCount > 1) ? VkSampleLocations4[sampleId][0] : 0.5f);
Alexis Hetu377716d2021-01-14 11:16:05 -0500190 routine.getVariable(it->second.Id)[it->second.FirstComponent + 1] =
Nicolas Capens1c8155a2022-06-29 03:13:02 -0400191 SIMD::Float((state.multiSampleCount > 1) ? VkSampleLocations4[sampleId][1] : 0.5f);
Alexis Hetu377716d2021-01-14 11:16:05 -0500192 }
193
Nicolas Capens157ba262019-12-10 17:49:14 -0500194 // Note: all lanes initially active to facilitate derivatives etc. Actual coverage is
195 // handled separately, through the cMask.
Nicolas Capensafdb5122022-06-30 11:31:35 -0400196 SIMD::Int activeLaneMask = 0xFFFFFFFF;
197 SIMD::Int storesAndAtomicsMask = maskAny(cMask, sMask, zMask, samples);
Nicolas Capens23ccff72022-04-05 13:00:22 -0400198 routine.discardMask = 0;
Alexis Hetu920100c2019-07-15 17:25:02 -0400199
Alexis Hetu0bcb71f2021-01-14 12:05:12 -0500200 spirvShader->emit(&routine, activeLaneMask, storesAndAtomicsMask, descriptorSets, state.multiSampleCount);
Nicolas Capens157ba262019-12-10 17:49:14 -0500201 spirvShader->emitEpilog(&routine);
202
Nicolas Capens91ec7752021-09-11 00:30:57 -0400203 for(int i = 0; i < MAX_COLOR_BUFFERS; i++)
Nicolas Capens157ba262019-12-10 17:49:14 -0500204 {
Nicolas Capens8c5df9c2021-10-27 16:29:54 -0400205 c[i].x = routine.outputs[i * 4 + 0];
Nicolas Capens157ba262019-12-10 17:49:14 -0500206 c[i].y = routine.outputs[i * 4 + 1];
207 c[i].z = routine.outputs[i * 4 + 2];
208 c[i].w = routine.outputs[i * 4 + 3];
Alexis Hetu920100c2019-07-15 17:25:02 -0400209 }
210
Nicolas Capens157ba262019-12-10 17:49:14 -0500211 clampColor(c);
212
Nicolas Capens23ccff72022-04-05 13:00:22 -0400213 if(spirvShader->getAnalysis().ContainsDiscard)
Nicolas Capens68a82382018-10-02 13:16:55 -0400214 {
Nicolas Capens28556362021-07-24 02:36:09 -0400215 for(unsigned int q : samples)
Chris Forbes02d4c0d2019-08-21 12:04:34 -0700216 {
Nicolas Capens23ccff72022-04-05 13:00:22 -0400217 cMask[q] &= ~routine.discardMask;
Nicolas Capens68a82382018-10-02 13:16:55 -0400218 }
219 }
220
Nicolas Capens157ba262019-12-10 17:49:14 -0500221 it = spirvShader->outputBuiltins.find(spv::BuiltInSampleMask);
Nicolas Capens81bc9d92019-12-16 15:05:57 -0500222 if(it != spirvShader->outputBuiltins.end())
Nicolas Capens68a82382018-10-02 13:16:55 -0400223 {
Nicolas Capens157ba262019-12-10 17:49:14 -0500224 auto outputSampleMask = As<SIMD::Int>(routine.getVariable(it->second.Id)[it->second.FirstComponent]);
225
Nicolas Capens28556362021-07-24 02:36:09 -0400226 for(unsigned int q : samples)
Nicolas Capens68a82382018-10-02 13:16:55 -0400227 {
Nicolas Capens28556362021-07-24 02:36:09 -0400228 cMask[q] &= SignMask(CmpNEQ(outputSampleMask & SIMD::Int(1 << q), SIMD::Int(0)));
Nicolas Capens68a82382018-10-02 13:16:55 -0400229 }
230 }
231
Nicolas Capens157ba262019-12-10 17:49:14 -0500232 it = spirvShader->outputBuiltins.find(spv::BuiltInFragDepth);
Nicolas Capens81bc9d92019-12-16 15:05:57 -0500233 if(it != spirvShader->outputBuiltins.end())
Nicolas Capens68a82382018-10-02 13:16:55 -0400234 {
Nicolas Capensdcfc0a62021-07-26 19:50:09 -0400235 for(unsigned int q : samples)
Sean Risser024bf322021-05-18 13:58:37 -0400236 {
Nicolas Capensdcfc0a62021-07-26 19:50:09 -0400237 z[q] = routine.getVariable(it->second.Id)[it->second.FirstComponent];
Sean Risser024bf322021-05-18 13:58:37 -0400238 }
Nicolas Capens68a82382018-10-02 13:16:55 -0400239 }
Nicolas Capens68a82382018-10-02 13:16:55 -0400240}
Nicolas Capens157ba262019-12-10 17:49:14 -0500241
Nicolas Capens28556362021-07-24 02:36:09 -0400242Bool PixelProgram::alphaTest(Int cMask[4], const SampleSet &samples)
Nicolas Capens157ba262019-12-10 17:49:14 -0500243{
244 if(!state.alphaToCoverage)
245 {
246 return true;
247 }
248
Nicolas Capens28556362021-07-24 02:36:09 -0400249 alphaToCoverage(cMask, c[0].w, samples);
Alexis Hetu09df3eb2021-01-14 10:46:33 -0500250
Nicolas Capens28556362021-07-24 02:36:09 -0400251 Int pass = 0;
252 for(unsigned int q : samples)
Nicolas Capens157ba262019-12-10 17:49:14 -0500253 {
254 pass = pass | cMask[q];
255 }
256
257 return pass != 0x0;
258}
259
Nicolas Capensefbbb2f2021-09-22 14:20:09 -0400260void PixelProgram::blendColor(Pointer<Byte> cBuffer[4], Int &x, Int sMask[4], Int zMask[4], Int cMask[4], const SampleSet &samples)
Nicolas Capens157ba262019-12-10 17:49:14 -0500261{
Nicolas Capens91ec7752021-09-11 00:30:57 -0400262 for(int index = 0; index < MAX_COLOR_BUFFERS; index++)
Nicolas Capens157ba262019-12-10 17:49:14 -0500263 {
264 if(!state.colorWriteActive(index))
265 {
266 continue;
267 }
268
Nicolas Capens91ec7752021-09-11 00:30:57 -0400269 auto format = state.colorFormat[index];
Nicolas Capens157ba262019-12-10 17:49:14 -0500270 switch(format)
271 {
Sean Risser584c2cf2021-09-14 04:07:02 -0400272 case VK_FORMAT_R4G4B4A4_UNORM_PACK16:
273 case VK_FORMAT_B4G4R4A4_UNORM_PACK16:
Alexis Hetu4c696962022-03-09 09:28:03 -0500274 case VK_FORMAT_A4R4G4B4_UNORM_PACK16:
275 case VK_FORMAT_A4B4G4R4_UNORM_PACK16:
Sean Risser584c2cf2021-09-14 04:07:02 -0400276 case VK_FORMAT_B5G6R5_UNORM_PACK16:
277 case VK_FORMAT_R5G5B5A1_UNORM_PACK16:
278 case VK_FORMAT_B5G5R5A1_UNORM_PACK16:
Nicolas Capens112faf42019-12-13 17:32:26 -0500279 case VK_FORMAT_A1R5G5B5_UNORM_PACK16:
280 case VK_FORMAT_R5G6B5_UNORM_PACK16:
281 case VK_FORMAT_B8G8R8A8_UNORM:
282 case VK_FORMAT_B8G8R8A8_SRGB:
283 case VK_FORMAT_R8G8B8A8_UNORM:
284 case VK_FORMAT_R8G8B8A8_SRGB:
285 case VK_FORMAT_R8G8_UNORM:
286 case VK_FORMAT_R8_UNORM:
Nicolas Capens112faf42019-12-13 17:32:26 -0500287 case VK_FORMAT_A8B8G8R8_UNORM_PACK32:
288 case VK_FORMAT_A8B8G8R8_SRGB_PACK32:
289 case VK_FORMAT_A2B10G10R10_UNORM_PACK32:
290 case VK_FORMAT_A2R10G10B10_UNORM_PACK32:
Nicolas Capens28556362021-07-24 02:36:09 -0400291 for(unsigned int q : samples)
Nicolas Capens112faf42019-12-13 17:32:26 -0500292 {
Nicolas Capens28556362021-07-24 02:36:09 -0400293 Pointer<Byte> buffer = cBuffer[index] + q * *Pointer<Int>(data + OFFSET(DrawData, colorSliceB[index]));
Alexis Hetu7a571322021-10-27 16:20:28 -0400294
Nicolas Capensd1116fa2022-06-29 10:39:18 -0400295 SIMD::Float4 colorf = alphaBlend(index, buffer, c[index], x);
Alexis Hetu7a571322021-10-27 16:20:28 -0400296
Nicolas Capensd1116fa2022-06-29 10:39:18 -0400297 ASSERT(SIMD::Width == 4);
Nicolas Capens28556362021-07-24 02:36:09 -0400298 Vector4s color;
Nicolas Capense8c074d2022-07-25 10:38:12 -0400299 color.x = UShort4(Extract128(colorf.x, 0) * 0xFFFF, true); // Saturating
300 color.y = UShort4(Extract128(colorf.y, 0) * 0xFFFF, true); // Saturating
301 color.z = UShort4(Extract128(colorf.z, 0) * 0xFFFF, true); // Saturating
302 color.w = UShort4(Extract128(colorf.w, 0) * 0xFFFF, true); // Saturating
Nicolas Capens28556362021-07-24 02:36:09 -0400303 writeColor(index, buffer, x, color, sMask[q], zMask[q], cMask[q]);
Nicolas Capens112faf42019-12-13 17:32:26 -0500304 }
305 break;
306 case VK_FORMAT_R16_SFLOAT:
307 case VK_FORMAT_R16G16_SFLOAT:
308 case VK_FORMAT_R16G16B16A16_SFLOAT:
309 case VK_FORMAT_B10G11R11_UFLOAT_PACK32:
310 case VK_FORMAT_R32_SFLOAT:
311 case VK_FORMAT_R32G32_SFLOAT:
312 case VK_FORMAT_R32G32B32A32_SFLOAT:
313 case VK_FORMAT_R32_SINT:
314 case VK_FORMAT_R32G32_SINT:
315 case VK_FORMAT_R32G32B32A32_SINT:
316 case VK_FORMAT_R32_UINT:
317 case VK_FORMAT_R32G32_UINT:
318 case VK_FORMAT_R32G32B32A32_UINT:
Nicolas Capens542593f2021-10-27 16:29:54 -0400319 case VK_FORMAT_R16_UNORM:
320 case VK_FORMAT_R16G16_UNORM:
321 case VK_FORMAT_R16G16B16A16_UNORM:
Nicolas Capens112faf42019-12-13 17:32:26 -0500322 case VK_FORMAT_R16_SINT:
323 case VK_FORMAT_R16G16_SINT:
324 case VK_FORMAT_R16G16B16A16_SINT:
325 case VK_FORMAT_R16_UINT:
326 case VK_FORMAT_R16G16_UINT:
327 case VK_FORMAT_R16G16B16A16_UINT:
328 case VK_FORMAT_R8_SINT:
329 case VK_FORMAT_R8G8_SINT:
330 case VK_FORMAT_R8G8B8A8_SINT:
331 case VK_FORMAT_R8_UINT:
332 case VK_FORMAT_R8G8_UINT:
333 case VK_FORMAT_R8G8B8A8_UINT:
334 case VK_FORMAT_A8B8G8R8_UINT_PACK32:
335 case VK_FORMAT_A8B8G8R8_SINT_PACK32:
336 case VK_FORMAT_A2B10G10R10_UINT_PACK32:
337 case VK_FORMAT_A2R10G10B10_UINT_PACK32:
Nicolas Capens28556362021-07-24 02:36:09 -0400338 for(unsigned int q : samples)
Nicolas Capens112faf42019-12-13 17:32:26 -0500339 {
Nicolas Capens28556362021-07-24 02:36:09 -0400340 Pointer<Byte> buffer = cBuffer[index] + q * *Pointer<Int>(data + OFFSET(DrawData, colorSliceB[index]));
Nicolas Capens157ba262019-12-10 17:49:14 -0500341
Nicolas Capensd1116fa2022-06-29 10:39:18 -0400342 SIMD::Float4 C = alphaBlend(index, buffer, c[index], x);
343 ASSERT(SIMD::Width == 4);
344 Vector4f color;
345 color.x = Extract128(C.x, 0);
346 color.y = Extract128(C.y, 0);
347 color.z = Extract128(C.z, 0);
348 color.w = Extract128(C.w, 0);
Nicolas Capens28556362021-07-24 02:36:09 -0400349 writeColor(index, buffer, x, color, sMask[q], zMask[q], cMask[q]);
Nicolas Capens112faf42019-12-13 17:32:26 -0500350 }
351 break;
352 default:
353 UNSUPPORTED("VkFormat: %d", int(format));
Nicolas Capens157ba262019-12-10 17:49:14 -0500354 }
355 }
356}
357
Nicolas Capensd1116fa2022-06-29 10:39:18 -0400358void PixelProgram::clampColor(SIMD::Float4 color[MAX_COLOR_BUFFERS])
Nicolas Capens157ba262019-12-10 17:49:14 -0500359{
Nicolas Capens8c5df9c2021-10-27 16:29:54 -0400360 // "If the color attachment is fixed-point, the components of the source and destination values and blend factors
361 // are each clamped to [0,1] or [-1,1] respectively for an unsigned normalized or signed normalized color attachment
362 // prior to evaluating the blend operations. If the color attachment is floating-point, no clamping occurs."
363
Nicolas Capens91ec7752021-09-11 00:30:57 -0400364 for(int index = 0; index < MAX_COLOR_BUFFERS; index++)
Nicolas Capens157ba262019-12-10 17:49:14 -0500365 {
366 if(!state.colorWriteActive(index) && !(index == 0 && state.alphaToCoverage))
367 {
368 continue;
369 }
370
Nicolas Capens91ec7752021-09-11 00:30:57 -0400371 switch(state.colorFormat[index])
Nicolas Capens157ba262019-12-10 17:49:14 -0500372 {
Nicolas Capens112faf42019-12-13 17:32:26 -0500373 case VK_FORMAT_UNDEFINED:
374 break;
Sean Risser584c2cf2021-09-14 04:07:02 -0400375 case VK_FORMAT_R4G4B4A4_UNORM_PACK16:
376 case VK_FORMAT_B4G4R4A4_UNORM_PACK16:
Alexis Hetu4c696962022-03-09 09:28:03 -0500377 case VK_FORMAT_A4R4G4B4_UNORM_PACK16:
378 case VK_FORMAT_A4B4G4R4_UNORM_PACK16:
Sean Risser584c2cf2021-09-14 04:07:02 -0400379 case VK_FORMAT_B5G6R5_UNORM_PACK16:
380 case VK_FORMAT_R5G5B5A1_UNORM_PACK16:
381 case VK_FORMAT_B5G5R5A1_UNORM_PACK16:
Nicolas Capens112faf42019-12-13 17:32:26 -0500382 case VK_FORMAT_A1R5G5B5_UNORM_PACK16:
383 case VK_FORMAT_R5G6B5_UNORM_PACK16:
384 case VK_FORMAT_B8G8R8A8_UNORM:
385 case VK_FORMAT_B8G8R8A8_SRGB:
386 case VK_FORMAT_R8G8B8A8_UNORM:
387 case VK_FORMAT_R8G8B8A8_SRGB:
388 case VK_FORMAT_R8G8_UNORM:
389 case VK_FORMAT_R8_UNORM:
Nicolas Capens542593f2021-10-27 16:29:54 -0400390 case VK_FORMAT_R16_UNORM:
Nicolas Capens112faf42019-12-13 17:32:26 -0500391 case VK_FORMAT_R16G16_UNORM:
392 case VK_FORMAT_R16G16B16A16_UNORM:
393 case VK_FORMAT_A8B8G8R8_UNORM_PACK32:
394 case VK_FORMAT_A8B8G8R8_SRGB_PACK32:
395 case VK_FORMAT_A2B10G10R10_UNORM_PACK32:
396 case VK_FORMAT_A2R10G10B10_UNORM_PACK32:
Nicolas Capensafdb5122022-06-30 11:31:35 -0400397 color[index].x = Min(Max(color[index].x, 0.0f), 1.0f);
398 color[index].y = Min(Max(color[index].y, 0.0f), 1.0f);
399 color[index].z = Min(Max(color[index].z, 0.0f), 1.0f);
400 color[index].w = Min(Max(color[index].w, 0.0f), 1.0f);
Nicolas Capens112faf42019-12-13 17:32:26 -0500401 break;
402 case VK_FORMAT_R32_SFLOAT:
403 case VK_FORMAT_R32G32_SFLOAT:
404 case VK_FORMAT_R32G32B32A32_SFLOAT:
405 case VK_FORMAT_R32_SINT:
406 case VK_FORMAT_R32G32_SINT:
407 case VK_FORMAT_R32G32B32A32_SINT:
408 case VK_FORMAT_R32_UINT:
409 case VK_FORMAT_R32G32_UINT:
410 case VK_FORMAT_R32G32B32A32_UINT:
411 case VK_FORMAT_R16_SFLOAT:
412 case VK_FORMAT_R16G16_SFLOAT:
413 case VK_FORMAT_R16G16B16A16_SFLOAT:
414 case VK_FORMAT_B10G11R11_UFLOAT_PACK32:
415 case VK_FORMAT_R16_SINT:
416 case VK_FORMAT_R16G16_SINT:
417 case VK_FORMAT_R16G16B16A16_SINT:
418 case VK_FORMAT_R16_UINT:
419 case VK_FORMAT_R16G16_UINT:
420 case VK_FORMAT_R16G16B16A16_UINT:
421 case VK_FORMAT_R8_SINT:
422 case VK_FORMAT_R8G8_SINT:
423 case VK_FORMAT_R8G8B8A8_SINT:
424 case VK_FORMAT_R8_UINT:
425 case VK_FORMAT_R8G8_UINT:
426 case VK_FORMAT_R8G8B8A8_UINT:
427 case VK_FORMAT_A8B8G8R8_UINT_PACK32:
428 case VK_FORMAT_A8B8G8R8_SINT_PACK32:
429 case VK_FORMAT_A2B10G10R10_UINT_PACK32:
430 case VK_FORMAT_A2R10G10B10_UINT_PACK32:
431 break;
432 default:
Nicolas Capens91ec7752021-09-11 00:30:57 -0400433 UNSUPPORTED("VkFormat: %d", int(state.colorFormat[index]));
Nicolas Capens157ba262019-12-10 17:49:14 -0500434 }
435 }
436}
437
Ben Claytonbc1c067be2019-12-17 20:37:37 +0000438} // namespace sw