| 1 | // Copyright (c) 2017 The ANGLE Project Authors. All rights reserved. |
| 2 | // Use of this source code is governed by a BSD-style license that can be |
| 3 | // found in the LICENSE file. |
| 4 | // |
| 5 | // VectorizeVectorScalarArithmetic.cpp: Turn some arithmetic operations that operate on a float |
| 6 | // vector-scalar pair into vector-vector operations. This is done recursively. Some scalar binary |
| 7 | // operations inside vector constructors are also turned into vector operations. |
| 8 | // |
| 9 | // This is targeted to work around a bug in NVIDIA OpenGL drivers that was reproducible on NVIDIA |
| 10 | // driver version 387.92. It works around the most common occurrences of the bug. |
| 11 | |
| 12 | #include "compiler/translator/tree_ops/VectorizeVectorScalarArithmetic.h" |
| 13 | |
| 14 | #include <set> |
| 15 | |
| 16 | #include "compiler/translator/IntermNode.h" |
| 17 | #include "compiler/translator/tree_util/IntermNode_util.h" |
| 18 | #include "compiler/translator/tree_util/IntermTraverse.h" |
| 19 | |
| 20 | namespace sh |
| 21 | { |
| 22 | |
| 23 | namespace |
| 24 | { |
| 25 | |
| 26 | class VectorizeVectorScalarArithmeticTraverser : public TIntermTraverser |
| 27 | { |
| 28 | public: |
| 29 | VectorizeVectorScalarArithmeticTraverser(TSymbolTable *symbolTable) |
| 30 | : TIntermTraverser(true, false, false, symbolTable), mReplaced(false) |
| 31 | {} |
| 32 | |
| 33 | bool didReplaceScalarsWithVectors() { return mReplaced; } |
| 34 | void nextIteration() |
| 35 | { |
| 36 | mReplaced = false; |
| 37 | mModifiedBlocks.clear(); |
| 38 | } |
| 39 | |
| 40 | protected: |
| 41 | bool visitBinary(Visit visit, TIntermBinary *node) override; |
| 42 | bool visitAggregate(Visit visit, TIntermAggregate *node) override; |
| 43 | |
| 44 | private: |
| 45 | // These helpers should only be called from visitAggregate when visiting a constructor. |
| 46 | // argBinary is the only argument of the constructor. |
| 47 | void replaceMathInsideConstructor(TIntermAggregate *node, TIntermBinary *argBinary); |
| 48 | void replaceAssignInsideConstructor(const TIntermAggregate *node, |
| 49 | const TIntermBinary *argBinary); |
| 50 | |
| 51 | static TIntermTyped *Vectorize(TIntermTyped *node, |
| 52 | TType vectorType, |
| 53 | TIntermTraverser::OriginalNode *originalNodeFate); |
| 54 | |
| 55 | bool mReplaced; |
| 56 | std::set<const TIntermBlock *> mModifiedBlocks; |
| 57 | }; |
| 58 | |
| 59 | TIntermTyped *VectorizeVectorScalarArithmeticTraverser::Vectorize( |
| 60 | TIntermTyped *node, |
| 61 | TType vectorType, |
| 62 | TIntermTraverser::OriginalNode *originalNodeFate) |
| 63 | { |
| 64 | ASSERT(node->isScalar()); |
| 65 | vectorType.setQualifier(EvqTemporary); |
| 66 | TIntermSequence vectorConstructorArgs; |
| 67 | vectorConstructorArgs.push_back(node); |
| 68 | TIntermAggregate *vectorized = |
| 69 | TIntermAggregate::CreateConstructor(vectorType, &vectorConstructorArgs); |
| 70 | TIntermTyped *vectorizedFolded = vectorized->fold(nullptr); |
| 71 | if (originalNodeFate != nullptr) |
| 72 | { |
| 73 | if (vectorizedFolded != vectorized) |
| 74 | { |
| 75 | *originalNodeFate = OriginalNode::IS_DROPPED; |
| 76 | } |
| 77 | else |
| 78 | { |
| 79 | *originalNodeFate = OriginalNode::BECOMES_CHILD; |
| 80 | } |
| 81 | } |
| 82 | return vectorizedFolded; |
| 83 | } |
| 84 | |
| 85 | bool VectorizeVectorScalarArithmeticTraverser::visitBinary(Visit /*visit*/, TIntermBinary *node) |
| 86 | { |
| 87 | TIntermTyped *left = node->getLeft(); |
| 88 | TIntermTyped *right = node->getRight(); |
| 89 | ASSERT(left); |
| 90 | ASSERT(right); |
| 91 | switch (node->getOp()) |
| 92 | { |
| 93 | case EOpAdd: |
| 94 | case EOpAddAssign: |
| 95 | // Only these specific ops are necessary to turn into vector ops. |
| 96 | break; |
| 97 | default: |
| 98 | return true; |
| 99 | } |
| 100 | if (node->getBasicType() != EbtFloat) |
| 101 | { |
| 102 | // Only float ops have reproduced the bug. |
| 103 | return true; |
| 104 | } |
| 105 | if (left->isScalar() && right->isVector()) |
| 106 | { |
| 107 | ASSERT(!node->isAssignment()); |
| 108 | ASSERT(!right->isArray()); |
| 109 | OriginalNode originalNodeFate; |
| 110 | TIntermTyped *leftVectorized = Vectorize(left, right->getType(), &originalNodeFate); |
| 111 | queueReplacementWithParent(node, left, leftVectorized, originalNodeFate); |
| 112 | mReplaced = true; |
| 113 | // Don't replace more nodes in the same subtree on this traversal. However, nodes elsewhere |
| 114 | // in the tree may still be replaced. |
| 115 | return false; |
| 116 | } |
| 117 | else if (left->isVector() && right->isScalar()) |
| 118 | { |
| 119 | OriginalNode originalNodeFate; |
| 120 | TIntermTyped *rightVectorized = Vectorize(right, left->getType(), &originalNodeFate); |
| 121 | queueReplacementWithParent(node, right, rightVectorized, originalNodeFate); |
| 122 | mReplaced = true; |
| 123 | // Don't replace more nodes in the same subtree on this traversal. However, nodes elsewhere |
| 124 | // in the tree may still be replaced. |
| 125 | return false; |
| 126 | } |
| 127 | return true; |
| 128 | } |
| 129 | |
| 130 | void VectorizeVectorScalarArithmeticTraverser::replaceMathInsideConstructor( |
| 131 | TIntermAggregate *node, |
| 132 | TIntermBinary *argBinary) |
| 133 | { |
| 134 | // Turn: |
| 135 | // a * b |
| 136 | // into: |
| 137 | // gvec(a) * gvec(b) |
| 138 | |
| 139 | TIntermTyped *left = argBinary->getLeft(); |
| 140 | TIntermTyped *right = argBinary->getRight(); |
| 141 | ASSERT(left->isScalar() && right->isScalar()); |
| 142 | |
| 143 | TType leftVectorizedType = left->getType(); |
| 144 | leftVectorizedType.setPrimarySize(static_cast<unsigned char>(node->getType().getNominalSize())); |
| 145 | TIntermTyped *leftVectorized = Vectorize(left, leftVectorizedType, nullptr); |
| 146 | TType rightVectorizedType = right->getType(); |
| 147 | rightVectorizedType.setPrimarySize( |
| 148 | static_cast<unsigned char>(node->getType().getNominalSize())); |
| 149 | TIntermTyped *rightVectorized = Vectorize(right, rightVectorizedType, nullptr); |
| 150 | |
| 151 | TIntermBinary *newArg = new TIntermBinary(argBinary->getOp(), leftVectorized, rightVectorized); |
| 152 | queueReplacementWithParent(node, argBinary, newArg, OriginalNode::IS_DROPPED); |
| 153 | } |
| 154 | |
| 155 | void VectorizeVectorScalarArithmeticTraverser::replaceAssignInsideConstructor( |
| 156 | const TIntermAggregate *node, |
| 157 | const TIntermBinary *argBinary) |
| 158 | { |
| 159 | // Turn: |
| 160 | // gvec(a *= b); |
| 161 | // into: |
| 162 | // // This is inserted into the parent block: |
| 163 | // gvec s0 = gvec(a); |
| 164 | // |
| 165 | // // This goes where the gvec constructor used to be: |
| 166 | // ((s0 *= b, a = s0.x), s0); |
| 167 | |
| 168 | TIntermTyped *left = argBinary->getLeft(); |
| 169 | TIntermTyped *right = argBinary->getRight(); |
| 170 | ASSERT(left->isScalar() && right->isScalar()); |
| 171 | ASSERT(!left->hasSideEffects()); |
| 172 | |
| 173 | TType vecType = node->getType(); |
| 174 | vecType.setQualifier(EvqTemporary); |
| 175 | |
| 176 | // gvec s0 = gvec(a); |
| 177 | // s0 is called "tempAssignmentTarget" below. |
| 178 | TIntermTyped *tempAssignmentTargetInitializer = Vectorize(left->deepCopy(), vecType, nullptr); |
| 179 | TIntermDeclaration *tempAssignmentTargetDeclaration = nullptr; |
| 180 | TVariable *tempAssignmentTarget = |
| 181 | DeclareTempVariable(mSymbolTable, tempAssignmentTargetInitializer, EvqTemporary, |
| 182 | &tempAssignmentTargetDeclaration); |
| 183 | |
| 184 | // s0 *= b |
| 185 | TOperator compoundAssignmentOp = argBinary->getOp(); |
| 186 | if (compoundAssignmentOp == EOpMulAssign) |
| 187 | { |
| 188 | compoundAssignmentOp = EOpVectorTimesScalarAssign; |
| 189 | } |
| 190 | TIntermBinary *replacementCompoundAssignment = new TIntermBinary( |
| 191 | compoundAssignmentOp, CreateTempSymbolNode(tempAssignmentTarget), right->deepCopy()); |
| 192 | |
| 193 | // s0.x |
| 194 | TVector<int> swizzleXOffset; |
| 195 | swizzleXOffset.push_back(0); |
| 196 | TIntermSwizzle *tempAssignmentTargetX = |
| 197 | new TIntermSwizzle(CreateTempSymbolNode(tempAssignmentTarget), swizzleXOffset); |
| 198 | // a = s0.x |
| 199 | TIntermBinary *replacementAssignBackToTarget = |
| 200 | new TIntermBinary(EOpAssign, left->deepCopy(), tempAssignmentTargetX); |
| 201 | |
| 202 | // s0 *= b, a = s0.x |
| 203 | TIntermBinary *replacementSequenceLeft = |
| 204 | new TIntermBinary(EOpComma, replacementCompoundAssignment, replacementAssignBackToTarget); |
| 205 | // (s0 *= b, a = s0.x), s0 |
| 206 | // Note that the created comma node is not const qualified in any case, so we can always pass |
| 207 | // shader version 300 here. |
| 208 | TIntermBinary *replacementSequence = TIntermBinary::CreateComma( |
| 209 | replacementSequenceLeft, CreateTempSymbolNode(tempAssignmentTarget), 300); |
| 210 | |
| 211 | insertStatementInParentBlock(tempAssignmentTargetDeclaration); |
| 212 | queueReplacement(replacementSequence, OriginalNode::IS_DROPPED); |
| 213 | } |
| 214 | |
| 215 | bool VectorizeVectorScalarArithmeticTraverser::visitAggregate(Visit /*visit*/, |
| 216 | TIntermAggregate *node) |
| 217 | { |
| 218 | // Transform scalar binary expressions inside vector constructors. |
| 219 | if (!node->isConstructor() || !node->isVector() || node->getSequence()->size() != 1) |
| 220 | { |
| 221 | return true; |
| 222 | } |
| 223 | TIntermTyped *argument = node->getSequence()->back()->getAsTyped(); |
| 224 | ASSERT(argument); |
| 225 | if (!argument->isScalar() || argument->getBasicType() != EbtFloat) |
| 226 | { |
| 227 | return true; |
| 228 | } |
| 229 | TIntermBinary *argBinary = argument->getAsBinaryNode(); |
| 230 | if (!argBinary) |
| 231 | { |
| 232 | return true; |
| 233 | } |
| 234 | |
| 235 | // Only specific ops are necessary to change. |
| 236 | switch (argBinary->getOp()) |
| 237 | { |
| 238 | case EOpMul: |
| 239 | case EOpDiv: |
| 240 | { |
| 241 | replaceMathInsideConstructor(node, argBinary); |
| 242 | mReplaced = true; |
| 243 | // Don't replace more nodes in the same subtree on this traversal. However, nodes |
| 244 | // elsewhere in the tree may still be replaced. |
| 245 | return false; |
| 246 | } |
| 247 | case EOpMulAssign: |
| 248 | case EOpDivAssign: |
| 249 | { |
| 250 | // The case where the left side has side effects is too complicated to deal with, so we |
| 251 | // leave that be. |
| 252 | if (!argBinary->getLeft()->hasSideEffects()) |
| 253 | { |
| 254 | const TIntermBlock *parentBlock = getParentBlock(); |
| 255 | // We can't do more than one insertion to the same block on the same traversal. |
| 256 | if (mModifiedBlocks.find(parentBlock) == mModifiedBlocks.end()) |
| 257 | { |
| 258 | replaceAssignInsideConstructor(node, argBinary); |
| 259 | mModifiedBlocks.insert(parentBlock); |
| 260 | mReplaced = true; |
| 261 | // Don't replace more nodes in the same subtree on this traversal. |
| 262 | // However, nodes elsewhere in the tree may still be replaced. |
| 263 | return false; |
| 264 | } |
| 265 | } |
| 266 | break; |
| 267 | } |
| 268 | default: |
| 269 | return true; |
| 270 | } |
| 271 | return true; |
| 272 | } |
| 273 | |
| 274 | } // anonymous namespace |
| 275 | |
| 276 | void VectorizeVectorScalarArithmetic(TIntermBlock *root, TSymbolTable *symbolTable) |
| 277 | { |
| 278 | VectorizeVectorScalarArithmeticTraverser traverser(symbolTable); |
| 279 | do |
| 280 | { |
| 281 | traverser.nextIteration(); |
| 282 | root->traverse(&traverser); |
| 283 | traverser.updateTree(); |
| 284 | } while (traverser.didReplaceScalarsWithVectors()); |
| 285 | } |
| 286 | |
| 287 | } // namespace sh |