Mandel.cpp 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369
  1. #include "Mandel.h"
  2. #include "Fixed.h"
  3. #include "CpuGenerators.h"
  4. #include "ClGenerators.h"
  5. #include "OpenClInternal.h"
  6. #include "OpenClCode.h"
  7. #include <asmjit/asmjit.h>
  8. #include <map>
  9. using mnd::MandelDevice;
  10. using mnd::MandelContext;
  11. using mnd::MandelGenerator;
  12. using mnd::AdaptiveGenerator;
  13. template<typename T, typename U>
  14. static std::map<U, T> invertMap(const std::map<T, U>& m)
  15. {
  16. std::map<U, T> res;
  17. std::transform(m.begin(), m.end(), std::inserter(res, res.end()), [](auto& pair) {
  18. return std::pair{ pair.second, pair.first };
  19. });
  20. return res;
  21. }
  22. static const std::map<mnd::GeneratorType, std::string> typeNames =
  23. {
  24. { mnd::GeneratorType::FLOAT, "float" },
  25. { mnd::GeneratorType::FLOAT_SSE2, "float SSE2" },
  26. { mnd::GeneratorType::FLOAT_AVX, "float AVX" },
  27. { mnd::GeneratorType::FLOAT_AVX_FMA, "float AVX+FMA" },
  28. { mnd::GeneratorType::FLOAT_AVX512, "float AVX512" },
  29. { mnd::GeneratorType::FLOAT_NEON, "float NEON" },
  30. { mnd::GeneratorType::DOUBLE_FLOAT, "double float" },
  31. { mnd::GeneratorType::DOUBLE, "double" },
  32. { mnd::GeneratorType::DOUBLE_SSE2, "double SSE2" },
  33. { mnd::GeneratorType::DOUBLE_AVX, "double AVX" },
  34. { mnd::GeneratorType::DOUBLE_AVX_FMA, "double AVX+FMA" },
  35. { mnd::GeneratorType::DOUBLE_AVX512, "double AVX512" },
  36. { mnd::GeneratorType::DOUBLE_NEON, "double NEON" },
  37. { mnd::GeneratorType::DOUBLE_DOUBLE, "double double" },
  38. { mnd::GeneratorType::DOUBLE_DOUBLE_AVX, "double double AVX" },
  39. { mnd::GeneratorType::DOUBLE_DOUBLE_AVX_FMA, "double double AVX+FMA" },
  40. { mnd::GeneratorType::QUAD_DOUBLE, "quad double" },
  41. { mnd::GeneratorType::QUAD_DOUBLE_AVX_FMA, "quad double AVX+FMA" },
  42. { mnd::GeneratorType::FLOAT128, "float128" },
  43. { mnd::GeneratorType::FLOAT256, "float256" },
  44. { mnd::GeneratorType::FIXED64, "fixed64" },
  45. { mnd::GeneratorType::FIXED128, "fixed128" },
  46. { mnd::GeneratorType::FIXED512, "fixed512" },
  47. };
  48. static const std::map<std::string, mnd::GeneratorType> nameTypes = invertMap(typeNames);
  49. namespace mnd
  50. {
  51. const std::string& getGeneratorName(mnd::GeneratorType type)
  52. {
  53. return typeNames.at(type);
  54. }
  55. mnd::GeneratorType getTypeFromName(const std::string& name)
  56. {
  57. return nameTypes.at(name);
  58. }
  59. }
  60. MandelContext mnd::initializeContext(void)
  61. {
  62. return MandelContext();
  63. }
  64. MandelDevice::MandelDevice(mnd::ClDeviceWrapper device) :
  65. clDevice{ std::make_unique<ClDeviceWrapper>(std::move(device)) }
  66. {
  67. extensions = clDevice->device.getInfo<CL_DEVICE_EXTENSIONS>();
  68. }
  69. mnd::MandelGenerator* MandelDevice::getGenerator(mnd::GeneratorType type) const
  70. {
  71. auto it = mandelGenerators.find(type);
  72. if (it != mandelGenerators.end())
  73. return it->second.get();
  74. else
  75. return nullptr;
  76. }
  77. std::vector<mnd::GeneratorType> MandelDevice::getSupportedTypes(void) const
  78. {
  79. std::vector<GeneratorType> types;
  80. for (auto& [type, gen] : mandelGenerators) {
  81. types.push_back(type);
  82. }
  83. return types;
  84. }
  85. bool MandelDevice::supportsDouble(void) const
  86. {
  87. return extensions.find("cl_khr_fp64") != std::string::npos;
  88. }
  89. MandelContext::MandelContext(void) :
  90. jitRuntime{ std::make_unique<asmjit::JitRuntime>() }
  91. {
  92. #if defined(__x86_64__) || defined(_M_X64) || defined(__i386) || defined(_M_IX86)
  93. if (cpuInfo.hasAvx512()) {
  94. auto fl = std::make_unique<CpuGenerator<float, mnd::X86_AVX_512, true>>();
  95. auto db = std::make_unique<CpuGenerator<double, mnd::X86_AVX_512, true>>();
  96. cpuGenerators.insert({ GeneratorType::FLOAT_AVX512, std::move(fl) });
  97. cpuGenerators.insert({ GeneratorType::DOUBLE_AVX512, std::move(db) });
  98. }
  99. if (cpuInfo.hasAvx()) {
  100. auto fl = std::make_unique<CpuGenerator<float, mnd::X86_AVX, true>>();
  101. auto db = std::make_unique<CpuGenerator<double, mnd::X86_AVX, true>>();
  102. auto ddb = std::make_unique<CpuGenerator<DoubleDouble, mnd::X86_AVX, true>>();
  103. cpuGenerators.insert({ GeneratorType::FLOAT_AVX, std::move(fl) });
  104. cpuGenerators.insert({ GeneratorType::DOUBLE_AVX, std::move(db) });
  105. cpuGenerators.insert({ GeneratorType::DOUBLE_DOUBLE_AVX, std::move(ddb) });
  106. if (cpuInfo.hasFma()) {
  107. auto favxfma = std::make_unique<CpuGenerator<float, mnd::X86_AVX_FMA, true>>();
  108. auto davxfma = std::make_unique<CpuGenerator<double, mnd::X86_AVX_FMA, true>>();
  109. auto ddavxfma = std::make_unique<CpuGenerator<DoubleDouble, mnd::X86_AVX_FMA, true>>();
  110. auto qdavxfma = std::make_unique<CpuGenerator<QuadDouble, mnd::X86_AVX_FMA, true>>();
  111. cpuGenerators.insert({ GeneratorType::FLOAT_AVX_FMA, std::move(favxfma) });
  112. cpuGenerators.insert({ GeneratorType::DOUBLE_AVX_FMA, std::move(davxfma) });
  113. cpuGenerators.insert({ GeneratorType::DOUBLE_DOUBLE_AVX_FMA, std::move(ddavxfma) });
  114. cpuGenerators.insert({ GeneratorType::QUAD_DOUBLE_AVX_FMA, std::move(qdavxfma) });
  115. }
  116. }
  117. if (cpuInfo.hasSse2()) {
  118. auto fl = std::make_unique<CpuGenerator<float, mnd::X86_SSE2, true>>();
  119. auto db = std::make_unique<CpuGenerator<double, mnd::X86_SSE2, true>>();
  120. cpuGenerators.insert({ GeneratorType::FLOAT_SSE2, std::move(fl) });
  121. cpuGenerators.insert({ GeneratorType::DOUBLE_SSE2, std::move(db) });
  122. }
  123. #elif defined(__arm__) || defined(__aarch64__) || defined(_M_ARM)
  124. if (cpuInfo.hasNeon()) {
  125. auto fl = std::make_unique<CpuGenerator<float, mnd::ARM_NEON, true>>();
  126. auto db = std::make_unique<CpuGenerator<double, mnd::ARM_NEON, true>>();
  127. cpuGenerators.insert({ GeneratorType::FLOAT_NEON, std::move(fl) });
  128. cpuGenerators.insert({ GeneratorType::DOUBLE_NEON, std::move(db) });
  129. }
  130. #endif
  131. {
  132. auto fl = std::make_unique<CpuGenerator<float, mnd::NONE, true>>();
  133. auto db = std::make_unique<CpuGenerator<double, mnd::NONE, true>>();
  134. cpuGenerators.insert({ GeneratorType::FLOAT, std::move(fl) });
  135. cpuGenerators.insert({ GeneratorType::DOUBLE, std::move(db) });
  136. auto fx64 = std::make_unique<CpuGenerator<Fixed64, mnd::NONE, true>>();
  137. auto fx128 = std::make_unique<CpuGenerator<Fixed128, mnd::NONE, true>>();
  138. cpuGenerators.insert({ GeneratorType::FIXED64, std::move(fx64) });
  139. cpuGenerators.insert({ GeneratorType::FIXED128, std::move(fx128) });
  140. }
  141. #ifdef WITH_BOOST
  142. auto quad = std::make_unique<CpuGenerator<Float128, mnd::NONE, true>>();
  143. auto oct = std::make_unique<CpuGenerator<Float256, mnd::NONE, true>>();
  144. cpuGenerators.insert({ GeneratorType::FLOAT128, std::move(quad) });
  145. cpuGenerators.insert({ GeneratorType::FLOAT256, std::move(oct) });
  146. #endif // WITH_BOOST
  147. auto dd = std::make_unique<CpuGenerator<DoubleDouble, mnd::NONE, true>>();
  148. auto qd = std::make_unique<CpuGenerator<QuadDouble, mnd::NONE, true>>();
  149. cpuGenerators.insert({ GeneratorType::DOUBLE_DOUBLE, std::move(dd) });
  150. cpuGenerators.insert({ GeneratorType::QUAD_DOUBLE, std::move(qd) });
  151. auto fix512 = std::make_unique<CpuGenerator<Fixed512, mnd::NONE, true>>();
  152. cpuGenerators.insert({ GeneratorType::FIXED512, std::move(fix512) });
  153. devices = createDevices();
  154. adaptiveGenerator = createAdaptiveGenerator();
  155. }
  156. std::unique_ptr<mnd::AdaptiveGenerator> MandelContext::createAdaptiveGenerator(void)
  157. {
  158. auto* floatGen = getCpuGenerator(GeneratorType::FLOAT);
  159. auto* doubleGen = getCpuGenerator(GeneratorType::DOUBLE);
  160. auto* doubleDoubleGen = getCpuGenerator(GeneratorType::DOUBLE_DOUBLE);
  161. auto* quadDoubleGen = getCpuGenerator(GeneratorType::QUAD_DOUBLE);
  162. auto* f256Gen = getCpuGenerator(GeneratorType::FLOAT256);
  163. auto* fix512 = getCpuGenerator(GeneratorType::FIXED512);
  164. if (cpuInfo.hasAvx()) {
  165. floatGen = getCpuGenerator(GeneratorType::FLOAT_AVX);
  166. doubleGen = getCpuGenerator(GeneratorType::DOUBLE_AVX);
  167. }
  168. else if (cpuInfo.hasSse2()) {
  169. floatGen = getCpuGenerator(GeneratorType::FLOAT_SSE2);
  170. doubleGen = getCpuGenerator(GeneratorType::DOUBLE_SSE2);
  171. }
  172. if (cpuInfo.hasAvx() && cpuInfo.hasFma()) {
  173. floatGen = getCpuGenerator(GeneratorType::FLOAT_AVX_FMA);
  174. doubleGen = getCpuGenerator(GeneratorType::DOUBLE_AVX_FMA);
  175. doubleDoubleGen = getCpuGenerator(GeneratorType::DOUBLE_DOUBLE_AVX_FMA);
  176. }
  177. if (cpuInfo.hasAvx512()) {
  178. floatGen = getCpuGenerator(GeneratorType::FLOAT_AVX512);
  179. doubleGen = getCpuGenerator(GeneratorType::DOUBLE_AVX512);
  180. }
  181. if (cpuInfo.hasNeon()) {
  182. floatGen = getCpuGenerator(GeneratorType::FLOAT_NEON);
  183. doubleGen = getCpuGenerator(GeneratorType::DOUBLE_NEON);
  184. }
  185. if (!devices.empty()) {
  186. auto& device = devices[0];
  187. auto* fGen = device->getGenerator(GeneratorType::FLOAT);
  188. auto* dGen = device->getGenerator(GeneratorType::DOUBLE);
  189. auto* ddGen = device->getGenerator(GeneratorType::DOUBLE_DOUBLE);
  190. auto* qdGen = device->getGenerator(GeneratorType::QUAD_DOUBLE);
  191. if (fGen)
  192. floatGen = fGen;
  193. if (dGen)
  194. doubleGen = dGen;
  195. if (ddGen)
  196. doubleDoubleGen = ddGen;
  197. if (qdGen)
  198. quadDoubleGen = qdGen;
  199. }
  200. auto ag = std::make_unique<AdaptiveGenerator>();
  201. ag->addGenerator(getPrecision<float>(), *floatGen);
  202. ag->addGenerator(getPrecision<double>(), *doubleGen);
  203. ag->addGenerator(getPrecision<DoubleDouble>(), *doubleDoubleGen);
  204. ag->addGenerator(getPrecision<QuadDouble>(), *quadDoubleGen);
  205. ag->addGenerator(getPrecision<Float256>(), *f256Gen);
  206. ag->addGenerator(Precision::INF_PREC, *fix512);
  207. return ag;
  208. }
  209. std::vector<std::unique_ptr<MandelDevice>> MandelContext::createDevices(void)
  210. {
  211. std::vector<std::unique_ptr<MandelDevice>> mandelDevices;
  212. #ifdef WITH_OPENCL
  213. std::vector<cl::Platform> platforms;
  214. cl::Platform::get(&platforms);
  215. //platforms.erase(platforms.begin() + 1);
  216. for (auto& platform : platforms) {
  217. std::string name = platform.getInfo<CL_PLATFORM_NAME>();
  218. std::string profile = platform.getInfo<CL_PLATFORM_PROFILE>();
  219. //printf("using opencl platform: %s\n", name.c_str());
  220. //std::string ext = platform.getInfo<CL_PLATFORM_EXTENSIONS>();
  221. //printf("Platform extensions: %s\n", ext.c_str());
  222. //printf("Platform: %s, %s\n", name.c_str(), profile.c_str());
  223. std::vector<cl::Device> devices;
  224. platform.getDevices(CL_DEVICE_TYPE_GPU, &devices);
  225. for (auto& device : devices) {
  226. //printf("Device: %s\n", device.getInfo<CL_DEVICE_NAME>().c_str());
  227. //printf("preferred float width: %d\n", device.getInfo<CL_DEVICE_PREFERRED_VECTOR_WIDTH_FLOAT>());
  228. //printf("vendor: %s\n", device.getInfo<CL_DEVICE_VENDOR>().c_str());
  229. //printf("Device extensions: %s\n", ext.c_str());
  230. auto mandelDevice = std::make_unique<mnd::MandelDevice>(
  231. ClDeviceWrapper{ device, cl::Context{ device } });
  232. MandelDevice& md = *mandelDevice;
  233. auto supportsDouble = md.supportsDouble();
  234. //printf("clock: %d", device.getInfo<CL_DEVICE_MAX_CLOCK_FREQUENCY>());
  235. md.name = device.getInfo<CL_DEVICE_NAME>();
  236. md.vendor = device.getInfo<CL_DEVICE_VENDOR>();
  237. //printf(" using opencl device: %s\n", md.name.c_str());
  238. try {
  239. md.mandelGenerators.insert({ GeneratorType::FLOAT, std::make_unique<ClGeneratorFloat>(md) });
  240. md.mandelGenerators.insert({ GeneratorType::FIXED64, std::make_unique<ClGenerator64>(md) });
  241. md.mandelGenerators.insert({ GeneratorType::DOUBLE_FLOAT, std::make_unique<ClGeneratorDoubleFloat>(md) });
  242. }
  243. catch (const std::string& err) {
  244. printf("err: %s", err.c_str());
  245. }
  246. if (supportsDouble) {
  247. try {
  248. md.mandelGenerators.insert({ GeneratorType::DOUBLE, std::make_unique<ClGeneratorDouble>(md) });
  249. md.mandelGenerators.insert({ GeneratorType::DOUBLE_DOUBLE, std::make_unique<ClGeneratorDoubleDouble>(md) });
  250. md.mandelGenerators.insert({ GeneratorType::QUAD_DOUBLE, std::make_unique<ClGeneratorQuadDouble>(md) });
  251. }
  252. catch (const std::string& err) {
  253. printf("err: %s", err.c_str());
  254. fflush(stdout);
  255. }
  256. }
  257. try {
  258. //md.generator128 = std::make_unique<ClGenerator128>(device);
  259. }
  260. catch (const std::string& /*err*/) {
  261. //fprintf(stderr, "error creating 128bit cl generator: %s\n", err.c_str());
  262. }
  263. mandelDevices.push_back(std::move(mandelDevice));
  264. }
  265. }
  266. #endif // WITH_OPENCL
  267. return mandelDevices;
  268. }
  269. MandelContext::~MandelContext(void)
  270. {
  271. }
  272. AdaptiveGenerator& MandelContext::getDefaultGenerator(void)
  273. {
  274. return *adaptiveGenerator;
  275. }
  276. std::vector<std::unique_ptr<mnd::MandelDevice>>& MandelContext::getDevices(void)
  277. {
  278. return devices;
  279. }
  280. asmjit::JitRuntime& MandelContext::getJitRuntime(void)
  281. {
  282. return *jitRuntime;
  283. }
  284. MandelGenerator* MandelContext::getCpuGenerator(mnd::GeneratorType type)
  285. {
  286. auto it = cpuGenerators.find(type);
  287. if (it != cpuGenerators.end())
  288. return it->second.get();
  289. else
  290. return nullptr;
  291. }
  292. std::vector<mnd::GeneratorType> MandelContext::getSupportedTypes(void) const
  293. {
  294. std::vector<GeneratorType> types;
  295. for (auto& [type, gen] : cpuGenerators) {
  296. types.push_back(type);
  297. }
  298. return types;
  299. }