// Copyright 2016 The SwiftShader Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#include "PixelShader.hpp"
#include "Common/Debug.hpp"
#include <string.h>
namespace sw
{
PixelShader::PixelShader(const PixelShader *ps) : Shader()
{
shaderModel = 0x0300;
vPosDeclared = false;
vFaceDeclared = false;
centroid = false;
if(ps) // Make a copy
{
for(size_t i = 0; i < ps->getLength(); i++)
{
append(new sw::Shader::Instruction(*ps->getInstruction(i)));
}
memcpy(input, ps->input, sizeof(input));
vPosDeclared = ps->vPosDeclared;
vFaceDeclared = ps->vFaceDeclared;
usedSamplers = ps->usedSamplers;
optimize();
analyze();
}
}
PixelShader::PixelShader(const unsigned long *token) : Shader()
{
parse(token);
vPosDeclared = false;
vFaceDeclared = false;
centroid = false;
optimize();
analyze();
}
PixelShader::~PixelShader()
{
}
int PixelShader::validate(const unsigned long *const token)
{
if(!token)
{
return 0;
}
unsigned short version = (unsigned short)(token[0] & 0x0000FFFF);
// unsigned char minorVersion = (unsigned char)(token[0] & 0x000000FF);
unsigned char majorVersion = (unsigned char)((token[0] & 0x0000FF00) >> 8);
ShaderType shaderType = (ShaderType)((token[0] & 0xFFFF0000) >> 16);
if(shaderType != SHADER_PIXEL || majorVersion > 3)
{
return 0;
}
int instructionCount = 1;
for(int i = 0; token[i] != 0x0000FFFF; i++)
{
if((token[i] & 0x0000FFFF) == 0x0000FFFE) // Comment token
{
int length = (token[i] & 0x7FFF0000) >> 16;
i += length;
}
else
{
Shader::Opcode opcode = (Shader::Opcode)(token[i] & 0x0000FFFF);
switch(opcode)
{
case Shader::OPCODE_RESERVED0:
case Shader::OPCODE_MOVA:
return 0; // Unsupported operation
default:
instructionCount++;
break;
}
i += size(token[i], version);
}
}
return instructionCount;
}
bool PixelShader::depthOverride() const
{
return zOverride;
}
bool PixelShader::containsKill() const
{
return kill;
}
bool PixelShader::containsCentroid() const
{
return centroid;
}
bool PixelShader::usesDiffuse(int component) const
{
return input[0][component].active();
}
bool PixelShader::usesSpecular(int component) const
{
return input[1][component].active();
}
bool PixelShader::usesTexture(int coordinate, int component) const
{
return input[2 + coordinate][component].active();
}
void PixelShader::setInput(int inputIdx, int nbComponents, const sw::Shader::Semantic& semantic)
{
for(int i = 0; i < nbComponents; ++i)
{
input[inputIdx][i] = semantic;
}
}
const sw::Shader::Semantic& PixelShader::getInput(int inputIdx, int component) const
{
return input[inputIdx][component];
}
void PixelShader::analyze()
{
analyzeZOverride();
analyzeKill();
analyzeInterpolants();
analyzeDirtyConstants();
analyzeDynamicBranching();
analyzeSamplers();
analyzeCallSites();
analyzeDynamicIndexing();
}
void PixelShader::analyzeZOverride()
{
zOverride = false;
for(const auto &inst : instruction)
{
if(inst->opcode == Shader::OPCODE_TEXM3X2DEPTH ||
inst->opcode == Shader::OPCODE_TEXDEPTH ||
inst->dst.type == Shader::PARAMETER_DEPTHOUT)
{
zOverride = true;
break;
}
}
}
void PixelShader::analyzeKill()
{
kill = false;
for(const auto &inst : instruction)
{
if(inst->opcode == Shader::OPCODE_TEXKILL ||
inst->opcode == Shader::OPCODE_DISCARD)
{
kill = true;
break;
}
}
}
void PixelShader::analyzeInterpolants()
{
if(shaderModel < 0x0300)
{
// Set default mapping; disable unused interpolants below
input[0][0] = Semantic(Shader::USAGE_COLOR, 0);
input[0][1] = Semantic(Shader::USAGE_COLOR, 0);
input[0][2] = Semantic(Shader::USAGE_COLOR, 0);
input[0][3] = Semantic(Shader::USAGE_COLOR, 0);
input[1][0] = Semantic(Shader::USAGE_COLOR, 1);
input[1][1] = Semantic(Shader::USAGE_COLOR, 1);
input[1][2] = Semantic(Shader::USAGE_COLOR, 1);
input[1][3] = Semantic(Shader::USAGE_COLOR, 1);
for(int i = 0; i < 8; i++)
{
input[2 + i][0] = Semantic(Shader::USAGE_TEXCOORD, i);
input[2 + i][1] = Semantic(Shader::USAGE_TEXCOORD, i);
input[2 + i][2] = Semantic(Shader::USAGE_TEXCOORD, i);
input[2 + i][3] = Semantic(Shader::USAGE_TEXCOORD, i);
}
Shader::SamplerType samplerType[16];
for(int i = 0; i < 16; i++)
{
samplerType[i] = Shader::SAMPLER_UNKNOWN;
}
for(const auto &inst : instruction)
{
if(inst->dst.type == Shader::PARAMETER_SAMPLER)
{
int sampler = inst->dst.index;
samplerType[sampler] = inst->samplerType;
}
}
bool interpolant[MAX_FRAGMENT_INPUTS][4] = {{false}}; // Interpolants in use
for(const auto &inst : instruction)
{
if(inst->dst.type == Shader::PARAMETER_TEXTURE)
{
int index = inst->dst.index + 2;
switch(inst->opcode)
{
case Shader::OPCODE_TEX:
case Shader::OPCODE_TEXBEM:
case Shader::OPCODE_TEXBEML:
case Shader::OPCODE_TEXCOORD:
case Shader::OPCODE_TEXDP3:
case Shader::OPCODE_TEXDP3TEX:
case Shader::OPCODE_TEXM3X2DEPTH:
case Shader::OPCODE_TEXM3X2PAD:
case Shader::OPCODE_TEXM3X2TEX:
case Shader::OPCODE_TEXM3X3:
case Shader::OPCODE_TEXM3X3PAD:
case Shader::OPCODE_TEXM3X3TEX:
interpolant[index][0] = true;
interpolant[index][1] = true;
interpolant[index][2] = true;
break;
case Shader::OPCODE_TEXKILL:
if(majorVersion < 2)
{
interpolant[index][0] = true;
interpolant[index][1] = true;
interpolant[index][2] = true;
}
else
{
interpolant[index][0] = true;
interpolant[index][1] = true;
interpolant[index][2] = true;
interpolant[index][3] = true;
}
break;
case Shader::OPCODE_TEXM3X3VSPEC:
interpolant[index][0] = true;
interpolant[index][1] = true;
interpolant[index][2] = true;
interpolant[index - 2][3] = true;
interpolant[index - 1][3] = true;
interpolant[index - 0][3] = true;
break;
case Shader::OPCODE_DCL:
break; // Ignore
default: // Arithmetic instruction
if(shaderModel >= 0x0104)
{
ASSERT(false);
}
}
}
for(int argument = 0; argument < 4; argument++)
{
if(inst->src[argument].type == Shader::PARAMETER_INPUT ||
inst->src[argument].type == Shader::PARAMETER_TEXTURE)
{
int index = inst->src[argument].index;
int swizzle = inst->src[argument].swizzle;
int mask = inst->dst.mask;
if(inst->src[argument].type == Shader::PARAMETER_TEXTURE)
{
index += 2;
}
switch(inst->opcode)
{
case Shader::OPCODE_TEX:
case Shader::OPCODE_TEXLDD:
case Shader::OPCODE_TEXLDL:
case Shader::OPCODE_TEXLOD:
case Shader::OPCODE_TEXBIAS:
case Shader::OPCODE_TEXOFFSET:
case Shader::OPCODE_TEXOFFSETBIAS:
case Shader::OPCODE_TEXLODOFFSET:
case Shader::OPCODE_TEXELFETCH:
case Shader::OPCODE_TEXELFETCHOFFSET:
case Shader::OPCODE_TEXGRAD:
case Shader::OPCODE_TEXGRADOFFSET:
{
int sampler = inst->src[1].index;
switch(samplerType[sampler])
{
case Shader::SAMPLER_UNKNOWN:
if(shaderModel == 0x0104)
{
if((inst->src[0].swizzle & 0x30) == 0x20) // .xyz
{
interpolant[index][0] = true;
interpolant[index][1] = true;
interpolant[index][2] = true;
}
else // .xyw
{
interpolant[index][0] = true;
interpolant[index][1] = true;
interpolant[index][3] = true;
}
}
else
{
ASSERT(false);
}
break;
case Shader::SAMPLER_1D:
interpolant[index][0] = true;
break;
case Shader::SAMPLER_2D:
interpolant[index][0] = true;
interpolant[index][1] = true;
break;
case Shader::SAMPLER_CUBE:
interpolant[index][0] = true;
interpolant[index][1] = true;
interpolant[index][2] = true;
break;
case Shader::SAMPLER_VOLUME:
interpolant[index][0] = true;
interpolant[index][1] = true;
interpolant[index][2] = true;
break;
default:
ASSERT(false);
}
if(inst->bias)
{
interpolant[index][3] = true;
}
if(inst->project)
{
interpolant[index][3] = true;
}
if(shaderModel == 0x0104 && inst->opcode == Shader::OPCODE_TEX)
{
if(inst->src[0].modifier == Shader::MODIFIER_DZ)
{
interpolant[index][2] = true;
}
if(inst->src[0].modifier == Shader::MODIFIER_DW)
{
interpolant[index][3] = true;
}
}
}
break;
case Shader::OPCODE_M3X2:
if(mask & 0x1)
{
interpolant[index][0] |= swizzleContainsComponentMasked(swizzle, 0, 0x7);
interpolant[index][1] |= swizzleContainsComponentMasked(swizzle, 1, 0x7);
interpolant[index][2] |= swizzleContainsComponentMasked(swizzle, 2, 0x7);
interpolant[index][3] |= swizzleContainsComponentMasked(swizzle, 3, 0x7);
}
if(argument == 1)
{
if(mask & 0x2)
{
interpolant[index + 1][0] |= swizzleContainsComponentMasked(swizzle, 0, 0x7);
interpolant[index + 1][1] |= swizzleContainsComponentMasked(swizzle, 1, 0x7);
interpolant[index + 1][2] |= swizzleContainsComponentMasked(swizzle, 2, 0x7);
interpolant[index + 1][3] |= swizzleContainsComponentMasked(swizzle, 3, 0x7);
}
}
break;
case Shader::OPCODE_M3X3:
if(mask & 0x1)
{
interpolant[index][0] |= swizzleContainsComponentMasked(swizzle, 0, 0x7);
interpolant[index][1] |= swizzleContainsComponentMasked(swizzle, 1, 0x7);
interpolant[index][2] |= swizzleContainsComponentMasked(swizzle, 2, 0x7);
interpolant[index][3] |= swizzleContainsComponentMasked(swizzle, 3, 0x7);
}
if(argument == 1)
{
if(mask & 0x2)
{
interpolant[index + 1][0] |= swizzleContainsComponentMasked(swizzle, 0, 0x7);
interpolant[index + 1][1] |= swizzleContainsComponentMasked(swizzle, 1, 0x7);
interpolant[index + 1][2] |= swizzleContainsComponentMasked(swizzle, 2, 0x7);
interpolant[index + 1][3] |= swizzleContainsComponentMasked(swizzle, 3, 0x7);
}
if(mask & 0x4)
{
interpolant[index + 2][0] |= swizzleContainsComponentMasked(swizzle, 0, 0x7);
interpolant[index + 2][1] |= swizzleContainsComponentMasked(swizzle, 1, 0x7);
interpolant[index + 2][2] |= swizzleContainsComponentMasked(swizzle, 2, 0x7);
interpolant[index + 2][3] |= swizzleContainsComponentMasked(swizzle, 3, 0x7);
}
}
break;
case Shader::OPCODE_M3X4:
if(mask & 0x1)
{
interpolant[index][0] |= swizzleContainsComponentMasked(swizzle, 0, 0x7);
interpolant[index][1] |= swizzleContainsComponentMasked(swizzle, 1, 0x7);
interpolant[index][2] |= swizzleContainsComponentMasked(swizzle, 2, 0x7);
interpolant[index][3] |= swizzleContainsComponentMasked(swizzle, 3, 0x7);
}
if(argument == 1)
{
if(mask & 0x2)
{
interpolant[index + 1][0] |= swizzleContainsComponentMasked(swizzle, 0, 0x7);
interpolant[index + 1][1] |= swizzleContainsComponentMasked(swizzle, 1, 0x7);
interpolant[index + 1][2] |= swizzleContainsComponentMasked(swizzle, 2, 0x7);
interpolant[index + 1][3] |= swizzleContainsComponentMasked(swizzle, 3, 0x7);
}
if(mask & 0x4)
{
interpolant[index + 2][0] |= swizzleContainsComponentMasked(swizzle, 0, 0x7);
interpolant[index + 2][1] |= swizzleContainsComponentMasked(swizzle, 1, 0x7);
interpolant[index + 2][2] |= swizzleContainsComponentMasked(swizzle, 2, 0x7);
interpolant[index + 2][3] |= swizzleContainsComponentMasked(swizzle, 3, 0x7);
}
if(mask & 0x8)
{
interpolant[index + 3][0] |= swizzleContainsComponentMasked(swizzle, 0, 0x7);
interpolant[index + 3][1] |= swizzleContainsComponentMasked(swizzle, 1, 0x7);
interpolant[index + 3][2] |= swizzleContainsComponentMasked(swizzle, 2, 0x7);
interpolant[index + 3][3] |= swizzleContainsComponentMasked(swizzle, 3, 0x7);
}
}
break;
case Shader::OPCODE_M4X3:
if(mask & 0x1)
{
interpolant[index][0] |= swizzleContainsComponent(swizzle, 0);
interpolant[index][1] |= swizzleContainsComponent(swizzle, 1);
interpolant[index][2] |= swizzleContainsComponent(swizzle, 2);
interpolant[index][3] |= swizzleContainsComponent(swizzle, 3);
}
if(argument == 1)
{
if(mask & 0x2)
{
interpolant[index + 1][0] |= swizzleContainsComponent(swizzle, 0);
interpolant[index + 1][1] |= swizzleContainsComponent(swizzle, 1);
interpolant[index + 1][2] |= swizzleContainsComponent(swizzle, 2);
interpolant[index + 1][3] |= swizzleContainsComponent(swizzle, 3);
}
if(mask & 0x4)
{
interpolant[index + 2][0] |= swizzleContainsComponent(swizzle, 0);
interpolant[index + 2][1] |= swizzleContainsComponent(swizzle, 1);
interpolant[index + 2][2] |= swizzleContainsComponent(swizzle, 2);
interpolant[index + 2][3] |= swizzleContainsComponent(swizzle, 3);
}
}
break;
case Shader::OPCODE_M4X4:
if(mask & 0x1)
{
interpolant[index][0] |= swizzleContainsComponent(swizzle, 0);
interpolant[index][1] |= swizzleContainsComponent(swizzle, 1);
interpolant[index][2] |= swizzleContainsComponent(swizzle, 2);
interpolant[index][3] |= swizzleContainsComponent(swizzle, 3);
}
if(argument == 1)
{
if(mask & 0x2)
{
interpolant[index + 1][0] |= swizzleContainsComponent(swizzle, 0);
interpolant[index + 1][1] |= swizzleContainsComponent(swizzle, 1);
interpolant[index + 1][2] |= swizzleContainsComponent(swizzle, 2);
interpolant[index + 1][3] |= swizzleContainsComponent(swizzle, 3);
}
if(mask & 0x4)
{
interpolant[index + 2][0] |= swizzleContainsComponent(swizzle, 0);
interpolant[index + 2][1] |= swizzleContainsComponent(swizzle, 1);
interpolant[index + 2][2] |= swizzleContainsComponent(swizzle, 2);
interpolant[index + 2][3] |= swizzleContainsComponent(swizzle, 3);
}
if(mask & 0x8)
{
interpolant[index + 3][0] |= swizzleContainsComponent(swizzle, 0);
interpolant[index + 3][1] |= swizzleContainsComponent(swizzle, 1);
interpolant[index + 3][2] |= swizzleContainsComponent(swizzle, 2);
interpolant[index + 3][3] |= swizzleContainsComponent(swizzle, 3);
}
}
break;
case Shader::OPCODE_CRS:
if(mask & 0x1)
{
interpolant[index][0] |= swizzleContainsComponentMasked(swizzle, 0, 0x6);
interpolant[index][1] |= swizzleContainsComponentMasked(swizzle, 1, 0x6);
interpolant[index][2] |= swizzleContainsComponentMasked(swizzle, 2, 0x6);
interpolant[index][3] |= swizzleContainsComponentMasked(swizzle, 3, 0x6);
}
if(mask & 0x2)
{
interpolant[index][0] |= swizzleContainsComponentMasked(swizzle, 0, 0x5);
interpolant[index][1] |= swizzleContainsComponentMasked(swizzle, 1, 0x5);
interpolant[index][2] |= swizzleContainsComponentMasked(swizzle, 2, 0x5);
interpolant[index][3] |= swizzleContainsComponentMasked(swizzle, 3, 0x5);
}
if(mask & 0x4)
{
interpolant[index][0] |= swizzleContainsComponentMasked(swizzle, 0, 0x3);
interpolant[index][1] |= swizzleContainsComponentMasked(swizzle, 1, 0x3);
interpolant[index][2] |= swizzleContainsComponentMasked(swizzle, 2, 0x3);
interpolant[index][3] |= swizzleContainsComponentMasked(swizzle, 3, 0x3);
}
break;
case Shader::OPCODE_DP2ADD:
if(argument == 0 || argument == 1)
{
interpolant[index][0] |= swizzleContainsComponentMasked(swizzle, 0, 0x3);
interpolant[index][1] |= swizzleContainsComponentMasked(swizzle, 1, 0x3);
interpolant[index][2] |= swizzleContainsComponentMasked(swizzle, 2, 0x3);
interpolant[index][3] |= swizzleContainsComponentMasked(swizzle, 3, 0x3);
}
else // argument == 2
{
interpolant[index][0] |= swizzleContainsComponent(swizzle, 0);
interpolant[index][1] |= swizzleContainsComponent(swizzle, 1);
interpolant[index][2] |= swizzleContainsComponent(swizzle, 2);
interpolant[index][3] |= swizzleContainsComponent(swizzle, 3);
}
break;
case Shader::OPCODE_DP3:
interpolant[index][0] |= swizzleContainsComponentMasked(swizzle, 0, 0x7);
interpolant[index][1] |= swizzleContainsComponentMasked(swizzle, 1, 0x7);
interpolant[index][2] |= swizzleContainsComponentMasked(swizzle, 2, 0x7);
interpolant[index][3] |= swizzleContainsComponentMasked(swizzle, 3, 0x7);
break;
case Shader::OPCODE_DP4:
interpolant[index][0] |= swizzleContainsComponent(swizzle, 0);
interpolant[index][1] |= swizzleContainsComponent(swizzle, 1);
interpolant[index][2] |= swizzleContainsComponent(swizzle, 2);
interpolant[index][3] |= swizzleContainsComponent(swizzle, 3);
break;
case Shader::OPCODE_SINCOS:
case Shader::OPCODE_EXP2X:
case Shader::OPCODE_LOG2X:
case Shader::OPCODE_POWX:
case Shader::OPCODE_RCPX:
case Shader::OPCODE_RSQX:
interpolant[index][0] |= swizzleContainsComponent(swizzle, 0);
interpolant[index][1] |= swizzleContainsComponent(swizzle, 1);
interpolant[index][2] |= swizzleContainsComponent(swizzle, 2);
interpolant[index][3] |= swizzleContainsComponent(swizzle, 3);
break;
case Shader::OPCODE_NRM3:
interpolant[index][0] |= swizzleContainsComponentMasked(swizzle, 0, 0x7 | mask);
interpolant[index][1] |= swizzleContainsComponentMasked(swizzle, 1, 0x7 | mask);
interpolant[index][2] |= swizzleContainsComponentMasked(swizzle, 2, 0x7 | mask);
interpolant[index][3] |= swizzleContainsComponentMasked(swizzle, 3, 0x7 | mask);
break;
case Shader::OPCODE_MOV:
case Shader::OPCODE_ADD:
case Shader::OPCODE_SUB:
case Shader::OPCODE_MUL:
case Shader::OPCODE_MAD:
case Shader::OPCODE_ABS:
case Shader::OPCODE_CMP0:
case Shader::OPCODE_CND:
case Shader::OPCODE_FRC:
case Shader::OPCODE_LRP:
case Shader::OPCODE_MAX:
case Shader::OPCODE_MIN:
case Shader::OPCODE_CMP:
case Shader::OPCODE_BREAKC:
case Shader::OPCODE_DFDX:
case Shader::OPCODE_DFDY:
interpolant[index][0] |= swizzleContainsComponentMasked(swizzle, 0, mask);
interpolant[index][1] |= swizzleContainsComponentMasked(swizzle, 1, mask);
interpolant[index][2] |= swizzleContainsComponentMasked(swizzle, 2, mask);
interpolant[index][3] |= swizzleContainsComponentMasked(swizzle, 3, mask);
break;
case Shader::OPCODE_TEXCOORD:
interpolant[index][0] = true;
interpolant[index][1] = true;
interpolant[index][2] = true;
interpolant[index][3] = true;
break;
case Shader::OPCODE_TEXDP3:
case Shader::OPCODE_TEXDP3TEX:
case Shader::OPCODE_TEXM3X2PAD:
case Shader::OPCODE_TEXM3X3PAD:
case Shader::OPCODE_TEXM3X2TEX:
case Shader::OPCODE_TEXM3X3SPEC:
case Shader::OPCODE_TEXM3X3VSPEC:
case Shader::OPCODE_TEXBEM:
case Shader::OPCODE_TEXBEML:
case Shader::OPCODE_TEXM3X2DEPTH:
case Shader::OPCODE_TEXM3X3:
case Shader::OPCODE_TEXM3X3TEX:
interpolant[index][0] = true;
interpolant[index][1] = true;
interpolant[index][2] = true;
break;
case Shader::OPCODE_TEXREG2AR:
case Shader::OPCODE_TEXREG2GB:
case Shader::OPCODE_TEXREG2RGB:
break;
default:
// ASSERT(false); // Refine component usage
interpolant[index][0] = true;
interpolant[index][1] = true;
interpolant[index][2] = true;
interpolant[index][3] = true;
}
}
}
}
for(int index = 0; index < MAX_FRAGMENT_INPUTS; index++)
{
for(int component = 0; component < 4; component++)
{
if(!interpolant[index][component])
{
input[index][component] = Semantic();
}
}
}
}
else // Shader Model 3.0 input declaration; v# indexable
{
for(const auto &inst : instruction)
{
if(inst->opcode == Shader::OPCODE_DCL)
{
if(inst->dst.type == Shader::PARAMETER_INPUT)
{
unsigned char usage = inst->usage;
unsigned char index = inst->usageIndex;
unsigned char mask = inst->dst.mask;
unsigned char reg = inst->dst.index;
if(mask & 0x01) input[reg][0] = Semantic(usage, index);
if(mask & 0x02) input[reg][1] = Semantic(usage, index);
if(mask & 0x04) input[reg][2] = Semantic(usage, index);
if(mask & 0x08) input[reg][3] = Semantic(usage, index);
}
else if(inst->dst.type == Shader::PARAMETER_MISCTYPE)
{
unsigned char index = inst->dst.index;
if(index == Shader::VPosIndex)
{
vPosDeclared = true;
}
else if(index == Shader::VFaceIndex)
{
vFaceDeclared = true;
}
else ASSERT(false);
}
}
}
}
if(shaderModel >= 0x0200)
{
for(const auto &inst : instruction)
{
if(inst->opcode == Shader::OPCODE_DCL)
{
bool centroid = inst->dst.centroid;
unsigned char reg = inst->dst.index;
switch(inst->dst.type)
{
case Shader::PARAMETER_INPUT:
input[reg][0].centroid = centroid;
break;
case Shader::PARAMETER_TEXTURE:
input[2 + reg][0].centroid = centroid;
break;
default:
break;
}
this->centroid = this->centroid || centroid;
}
}
}
}
}