浏览代码

refactored generator types and precision

Nicolas Winkler 5 年之前
父节点
当前提交
139f4d17fa

+ 3 - 2
libmandel/include/Generators.h

@@ -48,7 +48,6 @@ namespace mnd
     std::string toString(CpuExtension);
     std::string toString(CpuExtension);
 
 
     Real getPrecision(Precision p);
     Real getPrecision(Precision p);
-    Real getPrecision(GeneratorType p);
     
     
     template<typename T>
     template<typename T>
     Real getPrecision(void);
     Real getPrecision(void);
@@ -82,7 +81,7 @@ namespace mnd
     class MandelDevice;
     class MandelDevice;
 }
 }
 
 
-
+/*
 enum class mnd::GeneratorType : int
 enum class mnd::GeneratorType : int
 {
 {
     UNSPECIFIED,
     UNSPECIFIED,
@@ -113,6 +112,7 @@ enum class mnd::GeneratorType : int
     FIXED128,
     FIXED128,
     FIXED512
     FIXED512
 };
 };
+*/
 
 
 
 
 class mnd::MandelGenerator
 class mnd::MandelGenerator
@@ -175,6 +175,7 @@ public:
 
 
     void addGenerator(const Real& precision, MandelGenerator& generator);
     void addGenerator(const Real& precision, MandelGenerator& generator);
     void addGenerator(Precision p, MandelGenerator& generator);
     void addGenerator(Precision p, MandelGenerator& generator);
+    void addGenerator(MandelGenerator& generator);
     
     
     const std::map<Real, MandelGenerator*, std::greater<Real>>& getGenerators(void) const { return generators; }
     const std::map<Real, MandelGenerator*, std::greater<Real>>& getGenerators(void) const { return generators; }
     inline void clear(void) { generators.clear(); }
     inline void clear(void) { generators.clear(); }

+ 7 - 7
libmandel/include/Mandel.h

@@ -32,9 +32,6 @@ namespace mnd
     struct ClDeviceWrapper;
     struct ClDeviceWrapper;
 
 
     extern MandelContext initializeContext(void);
     extern MandelContext initializeContext(void);
-
-    const std::string& getGeneratorName(mnd::GeneratorType);
-    GeneratorType getTypeFromName(const std::string& name);
 }
 }
 
 
 
 
@@ -49,7 +46,7 @@ private:
     std::string extensions;
     std::string extensions;
     std::unique_ptr<ClDeviceWrapper> clDevice;
     std::unique_ptr<ClDeviceWrapper> clDevice;
 
 
-    std::map<GeneratorType, std::unique_ptr<MandelGenerator>> mandelGenerators;
+    std::map<Precision, std::unique_ptr<MandelGenerator>> mandelGenerators;
 
 
 public:
 public:
     MandelDevice(ClDeviceWrapper, const std::string& platformName);
     MandelDevice(ClDeviceWrapper, const std::string& platformName);
@@ -61,11 +58,11 @@ public:
     inline const std::string& getVendor(void) const { return vendor; }
     inline const std::string& getVendor(void) const { return vendor; }
     inline const std::string& getName(void) const { return name; }
     inline const std::string& getName(void) const { return name; }
 
 
-    MandelGenerator* getGenerator(GeneratorType type) const;
+    MandelGenerator* getGenerator(Precision type) const;
     inline ClDeviceWrapper& getClDevice(void) { return *clDevice; }
     inline ClDeviceWrapper& getClDevice(void) { return *clDevice; }
     inline const ClDeviceWrapper& getClDevice(void) const { return *clDevice; }
     inline const ClDeviceWrapper& getClDevice(void) const { return *clDevice; }
 
 
-    std::vector<GeneratorType> getSupportedTypes(void) const;
+    std::vector<Precision> getSupportedTypes(void) const;
     bool supportsDouble(void) const;
     bool supportsDouble(void) const;
 };
 };
 
 
@@ -75,6 +72,8 @@ class mnd::MandelContext
 private:
 private:
     friend MandelContext mnd::initializeContext(void);
     friend MandelContext mnd::initializeContext(void);
 
 
+    using GeneratorType = std::pair<Precision, CpuExtension>;
+
     CpuInfo cpuInfo;
     CpuInfo cpuInfo;
     std::unique_ptr<asmjit::JitRuntime> jitRuntime;
     std::unique_ptr<asmjit::JitRuntime> jitRuntime;
 
 
@@ -100,8 +99,9 @@ public:
 
 
     asmjit::JitRuntime& getJitRuntime(void);
     asmjit::JitRuntime& getJitRuntime(void);
 
 
-    MandelGenerator* getCpuGenerator(mnd::GeneratorType type);
+    MandelGenerator* getCpuGenerator(mnd::Precision type, mnd::CpuExtension ex);
     std::vector<GeneratorType> getSupportedTypes(void) const;
     std::vector<GeneratorType> getSupportedTypes(void) const;
+    std::vector<MandelGenerator*> getCpuGenerators(mnd::Precision prec) const;
 
 
     const CpuInfo& getCpuInfo(void) const { return cpuInfo; }
     const CpuInfo& getCpuInfo(void) const { return cpuInfo; }
 };
 };

+ 6 - 46
libmandel/src/Generators.cpp

@@ -71,6 +71,12 @@ void AdaptiveGenerator::addGenerator(mnd::Precision p, MandelGenerator& generato
 }
 }
 
 
 
 
+void AdaptiveGenerator::addGenerator(MandelGenerator& generator)
+{
+    generators.insert({ generator.getPrecision(), &generator });
+}
+
+
 void AdaptiveGenerator::generate(const mnd::MandelInfo& info, float* data)
 void AdaptiveGenerator::generate(const mnd::MandelInfo& info, float* data)
 {
 {
     Real pixelW = info.view.width / info.bWidth;
     Real pixelW = info.view.width / info.bWidth;
@@ -188,52 +194,6 @@ namespace mnd
         return precs.at(p);
         return precs.at(p);
     }
     }
 
 
-    Real getPrecision(GeneratorType t)
-    {
-        switch(t) {
-        case GeneratorType::FLOAT:
-        case GeneratorType::FLOAT_SSE2:
-        case GeneratorType::FLOAT_AVX:
-        case GeneratorType::FLOAT_AVX_FMA:
-        case GeneratorType::FLOAT_AVX512:
-        case GeneratorType::FLOAT_NEON:
-            return getPrecision<float>();
-        case GeneratorType::DOUBLE_FLOAT:
-            return getPrecision(Precision::DOUBLE_FLOAT);
-        case GeneratorType::DOUBLE:
-        case GeneratorType::DOUBLE_SSE2:
-        case GeneratorType::DOUBLE_AVX:
-        case GeneratorType::DOUBLE_AVX_FMA:
-        case GeneratorType::DOUBLE_AVX512:
-        case GeneratorType::DOUBLE_NEON:
-            return getPrecision<double>();
-        case GeneratorType::DOUBLE_DOUBLE:
-        case GeneratorType::DOUBLE_DOUBLE_AVX:
-        case GeneratorType::DOUBLE_DOUBLE_AVX_FMA:
-            return getPrecision<DoubleDouble>();
-        case GeneratorType::TRIPLE_DOUBLE:
-        case GeneratorType::TRIPLE_DOUBLE_AVX:
-            return getPrecision<TripleDouble>();
-        case GeneratorType::QUAD_DOUBLE:
-            return getPrecision<QuadDouble>();
-        case GeneratorType::FLOAT128:
-            return getPrecision<Float128>();
-        case GeneratorType::FLOAT256:
-            return getPrecision<Float256>();
-        case GeneratorType::FIXED64:
-            return getPrecision<Fixed64>();
-        case GeneratorType::FIXED128:
-            return getPrecision<Fixed128>();
-        case GeneratorType::FIXED512:
-            return getPrecision<Fixed512>();
-
-        case GeneratorType::UNSPECIFIED:
-        default:
-            return Real(0);
-        }
-    }
-
-
     template<>
     template<>
     Real getPrecision<float>() {
     Real getPrecision<float>() {
         return Real("1.0e-7");
         return Real("1.0e-7");

+ 80 - 156
libmandel/src/Mandel.cpp

@@ -11,73 +11,13 @@
 #endif // WITH_ASMJIT
 #endif // WITH_ASMJIT
 
 
 #include <map>
 #include <map>
+#include <array>
 
 
 using mnd::MandelDevice;
 using mnd::MandelDevice;
 using mnd::MandelContext;
 using mnd::MandelContext;
 using mnd::MandelGenerator;
 using mnd::MandelGenerator;
 using mnd::AdaptiveGenerator;
 using mnd::AdaptiveGenerator;
 
 
-template<typename T, typename U>
-static std::map<U, T> invertMap(const std::map<T, U>& m)
-{
-    std::map<U, T> res;
-    std::transform(m.begin(), m.end(), std::inserter(res, res.end()), [](auto& pair) {
-        return std::pair{ pair.second, pair.first };
-    });
-    return res;
-}
-
-
-static const std::map<mnd::GeneratorType, std::string> typeNames =
-{
-    { mnd::GeneratorType::FLOAT, "float" },
-    { mnd::GeneratorType::FLOAT_SSE2, "float SSE2" },
-    { mnd::GeneratorType::FLOAT_AVX, "float AVX" },
-    { mnd::GeneratorType::FLOAT_AVX_FMA, "float AVX+FMA" },
-    { mnd::GeneratorType::FLOAT_AVX512, "float AVX512" },
-    { mnd::GeneratorType::FLOAT_NEON, "float NEON" },
-    { mnd::GeneratorType::DOUBLE_FLOAT, "double float" },
-    { mnd::GeneratorType::DOUBLE, "double" },
-    { mnd::GeneratorType::DOUBLE_SSE2, "double SSE2" },
-    { mnd::GeneratorType::DOUBLE_AVX, "double AVX" },
-    { mnd::GeneratorType::DOUBLE_AVX_FMA, "double AVX+FMA" },
-    { mnd::GeneratorType::DOUBLE_AVX512, "double AVX512" },
-    { mnd::GeneratorType::DOUBLE_NEON, "double NEON" },
-    { mnd::GeneratorType::DOUBLE_DOUBLE, "double double" },
-    { mnd::GeneratorType::DOUBLE_DOUBLE_AVX, "double double AVX" },
-    { mnd::GeneratorType::DOUBLE_DOUBLE_AVX_FMA, "double double AVX+FMA" },
-    { mnd::GeneratorType::DOUBLE_DOUBLE_NEON, "double double NEON" },
-    { mnd::GeneratorType::TRIPLE_DOUBLE, "triple double" },
-    { mnd::GeneratorType::TRIPLE_DOUBLE_AVX, "triple double AVX" },
-    { mnd::GeneratorType::QUAD_DOUBLE, "quad double" },
-    { mnd::GeneratorType::QUAD_DOUBLE_AVX_FMA, "quad double AVX+FMA" },
-    { mnd::GeneratorType::FLOAT128, "float128" },
-    { mnd::GeneratorType::FLOAT256, "float256" },
-    { mnd::GeneratorType::FIXED64, "fixed64" },
-    { mnd::GeneratorType::FIXED128, "fixed128" },
-    { mnd::GeneratorType::FIXED512, "fixed512" },
-};
-
-
-static const std::map<std::string, mnd::GeneratorType> nameTypes = invertMap(typeNames);
-
-
-namespace mnd
-{
-
-    const std::string& getGeneratorName(mnd::GeneratorType type)
-    {
-        return typeNames.at(type);
-    }
-
-
-    mnd::GeneratorType getTypeFromName(const std::string& name)
-    {
-        return nameTypes.at(name);
-    }
-
-}
-
 
 
 MandelContext mnd::initializeContext(void)
 MandelContext mnd::initializeContext(void)
 {
 {
@@ -95,7 +35,7 @@ MandelDevice::MandelDevice(mnd::ClDeviceWrapper device, const std::string& platf
 }
 }
 
 
 
 
-mnd::MandelGenerator* MandelDevice::getGenerator(mnd::GeneratorType type) const
+mnd::MandelGenerator* MandelDevice::getGenerator(mnd::Precision type) const
 {
 {
     auto it = mandelGenerators.find(type);
     auto it = mandelGenerators.find(type);
     if (it != mandelGenerators.end())
     if (it != mandelGenerators.end())
@@ -105,9 +45,9 @@ mnd::MandelGenerator* MandelDevice::getGenerator(mnd::GeneratorType type) const
 }
 }
 
 
 
 
-std::vector<mnd::GeneratorType> MandelDevice::getSupportedTypes(void) const
+std::vector<mnd::Precision> MandelDevice::getSupportedTypes(void) const
 {
 {
-    std::vector<GeneratorType> types;
+    std::vector<Precision> types;
     for (auto& [type, gen] : mandelGenerators) {
     for (auto& [type, gen] : mandelGenerators) {
         types.push_back(type);
         types.push_back(type);
     }
     }
@@ -132,8 +72,8 @@ MandelContext::MandelContext(void)
     if (cpuInfo.hasAvx512()) {
     if (cpuInfo.hasAvx512()) {
         auto fl = std::make_unique<CpuGenerator<float, mnd::X86_AVX_512, true>>();
         auto fl = std::make_unique<CpuGenerator<float, mnd::X86_AVX_512, true>>();
         //auto db = std::make_unique<CpuGenerator<double, mnd::X86_AVX_512, true>>();
         //auto db = std::make_unique<CpuGenerator<double, mnd::X86_AVX_512, true>>();
-        cpuGenerators.insert({ GeneratorType::FLOAT_AVX512, std::move(fl) });
-        //cpuGenerators.insert({ GeneratorType::DOUBLE_AVX512, std::move(db) });
+        cpuGenerators.insert({ { Precision::FLOAT, CpuExtension::X86_AVX_512 }, std::move(fl) });
+        //cpuGenerators.insert({ { Precision::DOUBLE, CpuExtension::X86_AVX_512 }, std::move(db) });
     }
     }
 #   endif
 #   endif
     if (cpuInfo.hasAvx()) {
     if (cpuInfo.hasAvx()) {
@@ -141,66 +81,66 @@ MandelContext::MandelContext(void)
         auto db = std::make_unique<CpuGenerator<double, mnd::X86_AVX, true>>();
         auto db = std::make_unique<CpuGenerator<double, mnd::X86_AVX, true>>();
         auto ddb = std::make_unique<CpuGenerator<DoubleDouble, mnd::X86_AVX, true>>();
         auto ddb = std::make_unique<CpuGenerator<DoubleDouble, mnd::X86_AVX, true>>();
         auto tdb = std::make_unique<CpuGenerator<TripleDouble, mnd::X86_AVX, true>>();
         auto tdb = std::make_unique<CpuGenerator<TripleDouble, mnd::X86_AVX, true>>();
-        cpuGenerators.insert({ GeneratorType::FLOAT_AVX, std::move(fl) });
-        cpuGenerators.insert({ GeneratorType::DOUBLE_AVX, std::move(db) });
-        cpuGenerators.insert({ GeneratorType::DOUBLE_DOUBLE_AVX, std::move(ddb) });
-        cpuGenerators.insert({ GeneratorType::TRIPLE_DOUBLE_AVX, std::move(tdb) });
+        cpuGenerators.insert({ { Precision::FLOAT, CpuExtension::X86_AVX }, std::move(fl) });
+        cpuGenerators.insert({ { Precision::DOUBLE, CpuExtension::X86_AVX }, std::move(db) });
+        cpuGenerators.insert({ { Precision::DOUBLE_DOUBLE, CpuExtension::X86_AVX }, std::move(ddb) });
+        cpuGenerators.insert({ { Precision::TRIPLE_DOUBLE, CpuExtension::X86_AVX }, std::move(tdb) });
     }
     }
     if (cpuInfo.hasAvx2() && cpuInfo.hasFma()) {
     if (cpuInfo.hasAvx2() && cpuInfo.hasFma()) {
         auto favxfma = std::make_unique<CpuGenerator<float, mnd::X86_AVX_FMA, true>>();
         auto favxfma = std::make_unique<CpuGenerator<float, mnd::X86_AVX_FMA, true>>();
         auto davxfma = std::make_unique<CpuGenerator<double, mnd::X86_AVX_FMA, true>>();
         auto davxfma = std::make_unique<CpuGenerator<double, mnd::X86_AVX_FMA, true>>();
         auto ddavxfma = std::make_unique<CpuGenerator<DoubleDouble, mnd::X86_AVX_FMA, true>>();
         auto ddavxfma = std::make_unique<CpuGenerator<DoubleDouble, mnd::X86_AVX_FMA, true>>();
         auto qdavxfma = std::make_unique<CpuGenerator<QuadDouble, mnd::X86_AVX_FMA, true>>();
         auto qdavxfma = std::make_unique<CpuGenerator<QuadDouble, mnd::X86_AVX_FMA, true>>();
-        cpuGenerators.insert({ GeneratorType::FLOAT_AVX_FMA, std::move(favxfma) });
-        cpuGenerators.insert({ GeneratorType::DOUBLE_AVX_FMA, std::move(davxfma) });
-        cpuGenerators.insert({ GeneratorType::DOUBLE_DOUBLE_AVX_FMA, std::move(ddavxfma) });
-        cpuGenerators.insert({ GeneratorType::QUAD_DOUBLE_AVX_FMA, std::move(qdavxfma) });
+        cpuGenerators.insert({ { Precision::FLOAT, CpuExtension::X86_AVX_FMA }, std::move(favxfma) });
+        cpuGenerators.insert({ { Precision::DOUBLE, CpuExtension::X86_AVX_FMA }, std::move(davxfma) });
+        cpuGenerators.insert({ { Precision::DOUBLE_DOUBLE, CpuExtension::X86_AVX_FMA }, std::move(ddavxfma) });
+        cpuGenerators.insert({ { Precision::QUAD_DOUBLE, CpuExtension::X86_AVX_FMA }, std::move(qdavxfma) });
     }
     }
     if (cpuInfo.hasSse2()) {
     if (cpuInfo.hasSse2()) {
         auto fl = std::make_unique<CpuGenerator<float, mnd::X86_SSE2, true>>();
         auto fl = std::make_unique<CpuGenerator<float, mnd::X86_SSE2, true>>();
         auto db = std::make_unique<CpuGenerator<double, mnd::X86_SSE2, true>>();
         auto db = std::make_unique<CpuGenerator<double, mnd::X86_SSE2, true>>();
-        cpuGenerators.insert({ GeneratorType::FLOAT_SSE2, std::move(fl) });
-        cpuGenerators.insert({ GeneratorType::DOUBLE_SSE2, std::move(db) });
+        cpuGenerators.insert({ { Precision::FLOAT, CpuExtension::X86_SSE2 }, std::move(fl) });
+        cpuGenerators.insert({ { Precision::DOUBLE, CpuExtension::X86_SSE2 }, std::move(db) });
     }
     }
 #elif defined(__arm__) || defined(__aarch64__) || defined(_M_ARM) 
 #elif defined(__arm__) || defined(__aarch64__) || defined(_M_ARM) 
     if (cpuInfo.hasNeon()) {
     if (cpuInfo.hasNeon()) {
         auto fl = std::make_unique<CpuGenerator<float, mnd::ARM_NEON, true>>();
         auto fl = std::make_unique<CpuGenerator<float, mnd::ARM_NEON, true>>();
         auto db = std::make_unique<CpuGenerator<double, mnd::ARM_NEON, true>>();
         auto db = std::make_unique<CpuGenerator<double, mnd::ARM_NEON, true>>();
         auto ddb = std::make_unique<CpuGenerator<mnd::DoubleDouble, mnd::ARM_NEON, true>>();
         auto ddb = std::make_unique<CpuGenerator<mnd::DoubleDouble, mnd::ARM_NEON, true>>();
-        cpuGenerators.insert({ GeneratorType::FLOAT_NEON, std::move(fl) });
-        cpuGenerators.insert({ GeneratorType::DOUBLE_NEON, std::move(db) });
-        cpuGenerators.insert({ GeneratorType::DOUBLE_DOUBLE_NEON, std::move(ddb) });
+        cpuGenerators.insert({ { Precision::FLOAT, CpuExtension::ARM_NEON }, std::move(fl) });
+        cpuGenerators.insert({ { Precision::DOUBLE, CpuExtension::ARM_NEON }, std::move(db) });
+        cpuGenerators.insert({ { Precision::DOUBLE_DOUBLE, CpuExtension::ARM_NEON }, std::move(ddb) });
     }
     }
 #endif
 #endif
     {
     {
         auto fl = std::make_unique<CpuGenerator<float, mnd::NONE, true>>();
         auto fl = std::make_unique<CpuGenerator<float, mnd::NONE, true>>();
         auto db = std::make_unique<CpuGenerator<double, mnd::NONE, true>>();
         auto db = std::make_unique<CpuGenerator<double, mnd::NONE, true>>();
-        cpuGenerators.insert({ GeneratorType::FLOAT, std::move(fl) });
-        cpuGenerators.insert({ GeneratorType::DOUBLE, std::move(db) });
+        cpuGenerators.insert({ { Precision::FLOAT, CpuExtension::NONE }, std::move(fl) });
+        cpuGenerators.insert({ { Precision::DOUBLE, CpuExtension::NONE }, std::move(db) });
 
 
         auto fx64 = std::make_unique<CpuGenerator<Fixed64, mnd::NONE, true>>();
         auto fx64 = std::make_unique<CpuGenerator<Fixed64, mnd::NONE, true>>();
         auto fx128 = std::make_unique<CpuGenerator<Fixed128, mnd::NONE, true>>();
         auto fx128 = std::make_unique<CpuGenerator<Fixed128, mnd::NONE, true>>();
-        cpuGenerators.insert({ GeneratorType::FIXED64, std::move(fx64) });
-        cpuGenerators.insert({ GeneratorType::FIXED128, std::move(fx128) });
+        cpuGenerators.insert({ { Precision::FIXED64, CpuExtension::NONE }, std::move(fx64) });
+        cpuGenerators.insert({ { Precision::FIXED128, CpuExtension::NONE }, std::move(fx128) });
     }
     }
 
 
 #ifdef WITH_BOOST
 #ifdef WITH_BOOST
     auto quad = std::make_unique<CpuGenerator<Float128, mnd::NONE, true>>();
     auto quad = std::make_unique<CpuGenerator<Float128, mnd::NONE, true>>();
     auto oct = std::make_unique<CpuGenerator<Float256, mnd::NONE, true>>();
     auto oct = std::make_unique<CpuGenerator<Float256, mnd::NONE, true>>();
-    cpuGenerators.insert({ GeneratorType::FLOAT128, std::move(quad) });
-    cpuGenerators.insert({ GeneratorType::FLOAT256, std::move(oct) });
+    cpuGenerators.insert({ { Precision::FLOAT128, CpuExtension::NONE }, std::move(quad) });
+    cpuGenerators.insert({ { Precision::FLOAT256, CpuExtension::NONE }, std::move(oct) });
 #endif // WITH_BOOST
 #endif // WITH_BOOST
 
 
     auto dd = std::make_unique<CpuGenerator<DoubleDouble, mnd::NONE, true>>();
     auto dd = std::make_unique<CpuGenerator<DoubleDouble, mnd::NONE, true>>();
     auto qd = std::make_unique<CpuGenerator<QuadDouble, mnd::NONE, true>>();
     auto qd = std::make_unique<CpuGenerator<QuadDouble, mnd::NONE, true>>();
-    cpuGenerators.insert({ GeneratorType::DOUBLE_DOUBLE, std::move(dd) });
-    cpuGenerators.insert({ GeneratorType::QUAD_DOUBLE, std::move(qd) });
+    cpuGenerators.insert({ { Precision::DOUBLE_DOUBLE, CpuExtension::NONE }, std::move(dd) });
+    cpuGenerators.insert({ { Precision::QUAD_DOUBLE, CpuExtension::NONE }, std::move(qd) });
 
 
     auto td = std::make_unique<CpuGenerator<TripleDouble, mnd::NONE, true>>();
     auto td = std::make_unique<CpuGenerator<TripleDouble, mnd::NONE, true>>();
-    cpuGenerators.insert({ GeneratorType::TRIPLE_DOUBLE, std::move(td) });
+    cpuGenerators.insert({ { Precision::TRIPLE_DOUBLE, CpuExtension::NONE }, std::move(td) });
 
 
     auto fix512 = std::make_unique<CpuGenerator<Fixed512, mnd::NONE, true>>();
     auto fix512 = std::make_unique<CpuGenerator<Fixed512, mnd::NONE, true>>();
-    cpuGenerators.insert({ GeneratorType::FIXED512, std::move(fix512) });
+    cpuGenerators.insert({ { Precision::FIXED512, CpuExtension::NONE }, std::move(fix512) });
 
 
     devices = createDevices();
     devices = createDevices();
 
 
@@ -210,68 +150,41 @@ MandelContext::MandelContext(void)
 
 
 std::unique_ptr<mnd::AdaptiveGenerator> MandelContext::createAdaptiveGenerator(void)
 std::unique_ptr<mnd::AdaptiveGenerator> MandelContext::createAdaptiveGenerator(void)
 {
 {
-    auto* floatGen = getCpuGenerator(GeneratorType::FLOAT);
-    auto* doubleGen = getCpuGenerator(GeneratorType::DOUBLE);
-    auto* doubleDoubleGen = getCpuGenerator(GeneratorType::DOUBLE_DOUBLE);
-    auto* tripleDoubleGen = getCpuGenerator(GeneratorType::TRIPLE_DOUBLE);
-    auto* quadDoubleGen = getCpuGenerator(GeneratorType::QUAD_DOUBLE);
-    auto* f256Gen = getCpuGenerator(GeneratorType::FLOAT256);
-    auto* fix512 = getCpuGenerator(GeneratorType::FIXED512);
 
 
-    if (cpuInfo.hasAvx()) {
-        floatGen = getCpuGenerator(GeneratorType::FLOAT_AVX);
-        doubleGen = getCpuGenerator(GeneratorType::DOUBLE_AVX);
-    }
-    else if (cpuInfo.hasSse2()) {
-        floatGen = getCpuGenerator(GeneratorType::FLOAT_SSE2);
-        doubleGen = getCpuGenerator(GeneratorType::DOUBLE_SSE2);
-    }
-    if (cpuInfo.hasAvx2() && cpuInfo.hasFma()) {
-        floatGen = getCpuGenerator(GeneratorType::FLOAT_AVX_FMA);
-        doubleGen = getCpuGenerator(GeneratorType::DOUBLE_AVX_FMA);
-        doubleDoubleGen = getCpuGenerator(GeneratorType::DOUBLE_DOUBLE_AVX_FMA);
-        quadDoubleGen = getCpuGenerator(GeneratorType::QUAD_DOUBLE_AVX_FMA);
-    }
-    if (cpuInfo.hasAvx512()) {
-        floatGen = getCpuGenerator(GeneratorType::FLOAT_AVX512);
-        doubleGen = getCpuGenerator(GeneratorType::DOUBLE_AVX512);
-    }
+    std::vector<Precision> types {
+        Precision::FLOAT,
+        Precision::DOUBLE_FLOAT,
+        Precision::DOUBLE,
+        Precision::DOUBLE_DOUBLE,
+        Precision::TRIPLE_DOUBLE,
+        Precision::QUAD_DOUBLE,
+        Precision::FLOAT256,
+        Precision::FLOAT512
+    };
 
 
-    if (cpuInfo.hasNeon()) {
-        floatGen = getCpuGenerator(GeneratorType::FLOAT_NEON);
-        doubleGen = getCpuGenerator(GeneratorType::DOUBLE_NEON);
-        doubleDoubleGen = getCpuGenerator(GeneratorType::DOUBLE_DOUBLE_NEON);
-    }
+    auto ag = std::make_unique<AdaptiveGenerator>();
 
 
-    if (!devices.empty()) {
-        auto& device = devices[0];
-        auto* fGen = device->getGenerator(GeneratorType::FLOAT);
-        auto* dGen = device->getGenerator(GeneratorType::DOUBLE);
-        auto* ddGen = device->getGenerator(GeneratorType::DOUBLE_DOUBLE);
-        auto* tdGen = device->getGenerator(GeneratorType::TRIPLE_DOUBLE);
-        auto* qdGen = device->getGenerator(GeneratorType::QUAD_DOUBLE);
-
-        if (fGen)
-            floatGen = fGen;
-        if (dGen)
-            doubleGen = dGen;
-        if (ddGen)
-            doubleDoubleGen = ddGen;
-        if (tdGen)
-            tripleDoubleGen = tdGen;
-        if (qdGen)
-            quadDoubleGen = qdGen;
+    for (auto type : types) {
+        MandelGenerator* chosenGen = nullptr;
+        auto generators = getCpuGenerators(type);
+        CpuExtension ex = CpuExtension::NONE;
+        for (auto* generator : generators) {
+            if (generator->getExtension() >= ex) {
+                ex = generator->getExtension();
+                chosenGen = generator;
+            }
+        }
+        for (auto& device : getDevices()) {
+            auto* clGen = device->getGenerator(type);
+            if (clGen != nullptr) {
+                chosenGen = clGen;
+            }
+        }
+        if (chosenGen != nullptr) {
+            ag->addGenerator(mnd::getPrecision(type), *chosenGen);
+        }
     }
     }
 
 
-    auto ag = std::make_unique<AdaptiveGenerator>();
-    ag->addGenerator(getPrecision<float>(), *floatGen);
-    ag->addGenerator(getPrecision<double>(), *doubleGen);
-    ag->addGenerator(getPrecision<DoubleDouble>(), *doubleDoubleGen);
-    ag->addGenerator(getPrecision<TripleDouble>(), *tripleDoubleGen);
-    ag->addGenerator(getPrecision<QuadDouble>(), *quadDoubleGen);
-    ag->addGenerator(getPrecision<Float256>(), *f256Gen);
-    ag->addGenerator(Precision::INF_PREC, *fix512);
-
     return ag;
     return ag;
 }
 }
 
 
@@ -320,15 +233,15 @@ std::vector<std::unique_ptr<MandelDevice>> MandelContext::createDevices(void)
 
 
             //printf("    using opencl device: %s\n", md.name.c_str());
             //printf("    using opencl device: %s\n", md.name.c_str());
             try {
             try {
-                md.mandelGenerators.insert({ GeneratorType::FLOAT, std::make_unique<ClGeneratorFloat>(md) });
-                md.mandelGenerators.insert({ GeneratorType::FIXED64, std::make_unique<ClGenerator64>(md) });
+                md.mandelGenerators.insert({ Precision::FLOAT, std::make_unique<ClGeneratorFloat>(md) });
+                md.mandelGenerators.insert({ Precision::FIXED64, std::make_unique<ClGenerator64>(md) });
                 //md.mandelGenerators.insert({ GeneratorType::FIXED128, std::make_unique<ClGenerator128>(md) });
                 //md.mandelGenerators.insert({ GeneratorType::FIXED128, std::make_unique<ClGenerator128>(md) });
             }
             }
             catch (const std::string& err) {
             catch (const std::string& err) {
                 printf("err: %s", err.c_str());
                 printf("err: %s", err.c_str());
             }
             }
             try {
             try {
-                md.mandelGenerators.insert({ GeneratorType::DOUBLE_FLOAT, std::make_unique<ClGeneratorDoubleFloat>(md) });
+                md.mandelGenerators.insert({ Precision::DOUBLE_FLOAT, std::make_unique<ClGeneratorDoubleFloat>(md) });
             }
             }
             catch (const std::string& err) {
             catch (const std::string& err) {
                 printf("err: %s", err.c_str());
                 printf("err: %s", err.c_str());
@@ -336,10 +249,10 @@ std::vector<std::unique_ptr<MandelDevice>> MandelContext::createDevices(void)
 
 
             if (supportsDouble) {
             if (supportsDouble) {
                 try {
                 try {
-                    md.mandelGenerators.insert({ GeneratorType::DOUBLE, std::make_unique<ClGeneratorDouble>(md) });
-                    md.mandelGenerators.insert({ GeneratorType::DOUBLE_DOUBLE, std::make_unique<ClGeneratorDoubleDouble>(md) });
-                    md.mandelGenerators.insert({ GeneratorType::TRIPLE_DOUBLE, std::make_unique<ClGeneratorTripleDouble>(md) });
-                    md.mandelGenerators.insert({ GeneratorType::QUAD_DOUBLE, std::make_unique<ClGeneratorQuadDouble>(md) });
+                    md.mandelGenerators.insert({ Precision::DOUBLE, std::make_unique<ClGeneratorDouble>(md) });
+                    md.mandelGenerators.insert({ Precision::DOUBLE_DOUBLE, std::make_unique<ClGeneratorDoubleDouble>(md) });
+                    md.mandelGenerators.insert({ Precision::TRIPLE_DOUBLE, std::make_unique<ClGeneratorTripleDouble>(md) });
+                    md.mandelGenerators.insert({ Precision::QUAD_DOUBLE, std::make_unique<ClGeneratorQuadDouble>(md) });
                 }
                 }
                 catch (const std::string& err) {
                 catch (const std::string& err) {
                     printf("err: %s", err.c_str());
                     printf("err: %s", err.c_str());
@@ -386,9 +299,9 @@ asmjit::JitRuntime& MandelContext::getJitRuntime(void)
 }
 }
 
 
 
 
-MandelGenerator* MandelContext::getCpuGenerator(mnd::GeneratorType type)
+MandelGenerator* MandelContext::getCpuGenerator(mnd::Precision type, mnd::CpuExtension ex)
 {
 {
-    auto it = cpuGenerators.find(type);
+    auto it = cpuGenerators.find({ type, ex });
     if (it != cpuGenerators.end())
     if (it != cpuGenerators.end())
         return it->second.get();
         return it->second.get();
     else
     else
@@ -396,7 +309,7 @@ MandelGenerator* MandelContext::getCpuGenerator(mnd::GeneratorType type)
 }
 }
 
 
 
 
-std::vector<mnd::GeneratorType> MandelContext::getSupportedTypes(void) const
+std::vector<MandelContext::GeneratorType> MandelContext::getSupportedTypes(void) const
 {
 {
     std::vector<GeneratorType> types;
     std::vector<GeneratorType> types;
     for (auto& [type, gen] : cpuGenerators) {
     for (auto& [type, gen] : cpuGenerators) {
@@ -406,3 +319,14 @@ std::vector<mnd::GeneratorType> MandelContext::getSupportedTypes(void) const
 }
 }
 
 
 
 
+std::vector<MandelGenerator*> MandelContext::getCpuGenerators(mnd::Precision prec) const
+{
+    std::vector<MandelGenerator*> generators;
+    for (const auto& [type, gen] : cpuGenerators) {
+        if (type.first == prec)
+            generators.push_back(gen.get());
+    }
+    return generators;
+}
+
+

+ 5 - 3
mandelbench/mandelbench.cpp

@@ -117,8 +117,10 @@ int main()
     std::cout << "Benchmarking CPU [" << mc.getCpuInfo().getBrand() << "]" << std::endl;
     std::cout << "Benchmarking CPU [" << mc.getCpuInfo().getBrand() << "]" << std::endl;
 
 
     auto types = mc.getSupportedTypes();
     auto types = mc.getSupportedTypes();
-    for (auto type : types) {
-        REPORT_PERFORMANCE(mnd::getGeneratorName(type) + " [MIps]: ", benchmark(*mc.getCpuGenerator(type)));
+    for (auto [type, extension] : types) {
+        std::string extInfo = extension != mnd::CpuExtension::NONE ?
+            std::string(" ") + mnd::toString(extension) : "";
+        REPORT_PERFORMANCE(mnd::toString(type) + extInfo + " [MIps]: ", benchmark(*mc.getCpuGenerator(type, extension)));
     }
     }
     
     
     std::cout << std::endl;
     std::cout << std::endl;
@@ -127,7 +129,7 @@ int main()
 
 
         auto types = device->getSupportedTypes();
         auto types = device->getSupportedTypes();
         for (auto type : types) {
         for (auto type : types) {
-            REPORT_PERFORMANCE(mnd::getGeneratorName(type) + " [MIps]: ", benchmark(*device->getGenerator(type)));
+            REPORT_PERFORMANCE(mnd::toString(type) + " [MIps]: ", benchmark(*device->getGenerator(type)));
         }
         }
         std::cout << std::endl;
         std::cout << std::endl;
     }
     }

+ 6 - 15
src/choosegenerators.cpp

@@ -181,28 +181,19 @@ ChooseGenerators::ChooseGenerators(mnd::MandelContext& mndCtxt, mnd::AdaptiveGen
     QRegExp floatingpoint{ "^[-+]?(\\d*\\.?\\d+|\\d+\\.?\\d*)([eE][-+]\\d+)?$" };
     QRegExp floatingpoint{ "^[-+]?(\\d*\\.?\\d+|\\d+\\.?\\d*)([eE][-+]\\d+)?$" };
     floatValidator = std::make_unique<QRegExpValidator>(floatingpoint, this);
     floatValidator = std::make_unique<QRegExpValidator>(floatingpoint, this);
 
 
-    for (auto genType : mndCtxt.getSupportedTypes()) {
-        const std::string& typeName = mnd::getGeneratorName(genType);
-        generators.insert({ QString::fromStdString(typeName), mndCtxt.getCpuGenerator(genType) });
+    for (auto [type, extension] : mndCtxt.getSupportedTypes()) {
+        const std::string& typeName = mnd::toString(type);
+        const std::string& extName = mnd::toString(extension);
+        const std::string& name = typeName + (extName != "" ? " " : "") + extName;
+        generators.insert({ QString::fromStdString(name), mndCtxt.getCpuGenerator(type, extension) });
     }
     }
     for (auto& device : mndCtxt.getDevices()) {
     for (auto& device : mndCtxt.getDevices()) {
         for (auto genType : device->getSupportedTypes()) {
         for (auto genType : device->getSupportedTypes()) {
-            const std::string& typeName = mnd::getGeneratorName(genType) + " [" + device->getName() + "]";
+            const std::string& typeName = mnd::toString(genType) + " [" + device->getName() + "]";
             generators.insert({ QString::fromStdString(typeName), device->getGenerator(genType) });
             generators.insert({ QString::fromStdString(typeName), device->getGenerator(genType) });
         }
         }
     }
     }
 
 
-    std::vector<mnd::MandelGenerator*> allGenerators;
-
-    /*for (auto genType : mndCtxt.getSupportedTypes()) {
-        allGenerators.push_back(mndCtxt.getCpuGenerator(genType));
-    }
-    for (auto& device : mndCtxt.getDevices()) {
-        for (auto genType : device.getSupportedTypes()) {
-            allGenerators.push_back(device.getGenerator(genType));
-        }
-    }*/
-
     initializeTables();
     initializeTables();
 
 
     //ui->addRow->setIcon(ui->addRow->style()->standardIcon(QStyle::SP_));
     //ui->addRow->setIcon(ui->addRow->style()->standardIcon(QStyle::SP_));