doe300 · long-long-float · May 17, 2020 · May 23, 2020 · May 25, 2020 · May 25, 2020
diff --git a/src/Expression.cpp b/src/Expression.cpp
@@ -6,6 +6,8 @@
 using namespace vc4c;
 
 constexpr OpCode Expression::FAKEOP_UMUL;
+constexpr OpCode Expression::FAKEOP_MUL;
+constexpr OpCode Expression::FAKEOP_DIV;
 
 SubExpression::SubExpression(const Optional<Value>& val) : Base(VariantNamespace::monostate{})
 {

diff --git a/src/Expression.h b/src/Expression.h
@@ -109,6 +109,9 @@ namespace vc4c
         // A fake operation to indicate an unsigned multiplication
         static constexpr OpCode FAKEOP_UMUL{"umul", 132, 132, 2, false, false, FlagBehavior::NONE};
 
+        static constexpr OpCode FAKEOP_MUL{"mul", 132, 132, 2, false, false, FlagBehavior::NONE}; // presumably a fake operation indicating a multiplication; NOTE(review): same 132/132 values as FAKEOP_UMUL - confirm the two stay distinguishable
+        static constexpr OpCode FAKEOP_DIV{"div", 132, 132, 2, false, false, FlagBehavior::NONE}; // presumably a fake operation indicating a division; NOTE(review): same 132/132 values as FAKEOP_UMUL - confirm the two stay distinguishable
+
         OpCode code;
         SubExpression arg0;
         SubExpression arg1{};

diff --git a/src/normalization/Normalizer.cpp b/src/normalization/Normalizer.cpp
@@ -16,20 +16,25 @@
 #include "../optimization/ControlFlow.h"
 #include "../optimization/Eliminator.h"
 #include "../optimization/Reordering.h"
+#include "../intermediate/operators.h"
 #include "../spirv/SPIRVBuiltins.h"
 #include "Inliner.h"
 #include "LiteralValues.h"
 #include "LongOperations.h"
 #include "MemoryAccess.h"
 #include "Rewrite.h"
 
+#include "../optimization/Combiner.h"
+
 #include "log.h"
 
 #include <string>
 #include <vector>
 
 using namespace vc4c;
 using namespace vc4c::normalization;
+using namespace vc4c::periphery;
+using namespace vc4c::operators;
 
 static bool checkWorkGroupUniform(const Value& arg)
 {
@@ -253,6 +258,16 @@ void Normalizer::normalize(Module& module) const
         PROFILE_COUNTER_WITH_PREV(vc4c::profiler::COUNTER_NORMALIZATION + 2, "Eliminate Phi-nodes (after)",
             method->countInstructions(), vc4c::profiler::COUNTER_NORMALIZATION + 1);
     }
+
+    {
+        // TODO: move this optimization to an appropriate location
+        auto kernels = module.getKernels();
+        for(Method* kernelFunc : kernels)
+        {
+            optimizations::combineDMALoads(module, *kernelFunc, config);
+        }
+    }
+
     auto kernels = module.getKernels();
     // 2. inline kernel-functions
     for(Method* kernelFunc : kernels)
@@ -266,6 +281,7 @@ void Normalizer::normalize(Module& module) const
         PROFILE_COUNTER_WITH_PREV(vc4c::profiler::COUNTER_NORMALIZATION + 5, "Inline (after)",
             kernel.countInstructions(), vc4c::profiler::COUNTER_NORMALIZATION + 4);
     }
+
     // 3. run other normalization steps on kernel functions
     const auto f = [&module, this](Method* kernelFunc) -> void { normalizeMethod(module, *kernelFunc); };
     ThreadPool::scheduleAll<Method*>("Normalization", kernels, f, THREAD_LOGGER.get());