Win32-specific optimization in Points module

2018-10-08 18:50:03 +02:00
parent d9015da662
commit dbb96de677
2 changed files with 19 additions and 2 deletions
--- a/src/Mod/Points/App/Points.cpp
+++ b/src/Mod/Points/App/Points.cpp
@@ -85,17 +85,25 @@ Data::Segment* PointKernel::getSubElement(const char* /*Type*/, unsigned long /*
 void PointKernel::transformGeometry(const Base::Matrix4D &rclMat)
 {
    std::vector<value_type>& kernel = getBasicPoints();
+#ifdef _WIN32
+    // Win32-only at the moment since ppl.h is a Microsoft library. Points is not using Qt so we cannot use QtConcurrent
+    // We could also rewrite Points to leverage SIMD instructions
+    // Other option: openMP. But with VC2013 results in high CPU usage even after computation (busy-waits for >100ms)
+    Concurrency::parallel_for_each(kernel.begin(), kernel.end(), [rclMat](value_type& value) {
+        value = rclMat * value;
+    });
+#else
    QtConcurrent::blockingMap(kernel, [rclMat](value_type& value) {
        rclMat.multVec(value, value);
    });
+#endif
 }

 Base::BoundBox3d PointKernel::getBoundBox(void)const
 {
    Base::BoundBox3d bnd;

-    //FIXME: VS 2015 or later causes a linker error
-#if defined _WIN32 
+#ifdef _WIN32
    // Thread-local bounding boxes
    Concurrency::combinable<Base::BoundBox3d> bbs;
    // Cannot use a const_point_iterator here as it is *not* a proper iterator (fails the for_each template)
--- a/src/Mod/Points/App/Properties.cpp
+++ b/src/Mod/Points/App/Properties.cpp
@@ -40,6 +40,9 @@
 #include "PointsPy.h"

 #include <QtConcurrentMap>
+#ifdef _WIN32
+# include <ppl.h>
+#endif

 using namespace Points;
 using namespace std;
@@ -389,9 +392,15 @@ void PropertyNormalList::transformGeometry(const Base::Matrix4D &mat)
    aboutToSetValue();

    // Rotate the normal vectors
+#ifdef _WIN32
+    Concurrency::parallel_for_each(_lValueList.begin(), _lValueList.end(), [rot](Base::Vector3f& value) {
+        value = rot * value;
+    });
+#else
    QtConcurrent::blockingMap(_lValueList, [rot](Base::Vector3f& value) {
        rot.multVec(value, value);
    });
+#endif

    hasSetValue();
 }