You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

dgemv_thread_safety.cpp 4.6 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119
  1. #include <iostream>
  2. #include <vector>
  3. #include <random>
  4. #include <future>
  5. #include <omp.h>
  6. #include "../cblas.h"
  7. #include "cpp_thread_safety_common.h"
  8. void launch_cblas_dgemv(double* A, double* x, double* y, const blasint randomMatSize)
  9. {
  10. const blasint inc = 1;
  11. cblas_dgemv(CblasColMajor, CblasNoTrans, randomMatSize, randomMatSize, 1.0, A, randomMatSize, x, inc, 0.1, y, inc);
  12. }
  13. int main(int argc, char* argv[])
  14. {
  15. blasint randomMatSize = 1024; //dimension of the random square matrices and vectors being used
  16. uint32_t numConcurrentThreads = 52; //number of concurrent calls of the functions being tested
  17. uint32_t numTestRounds = 16; //number of testing rounds before success exit
  18. uint32_t maxHwThreads = omp_get_max_threads();
  19. if (maxHwThreads < 52)
  20. numConcurrentThreads = maxHwThreads;
  21. if (argc > 4)
  22. {
  23. std::cout<<"ERROR: too many arguments for thread safety tester"<<std::endl;
  24. abort();
  25. }
  26. if(argc == 4)
  27. {
  28. std::vector<std::string> cliArgs;
  29. for (int i = 1; i < argc; i++)
  30. {
  31. cliArgs.push_back(argv[i]);
  32. std::cout<<argv[i]<<std::endl;
  33. }
  34. randomMatSize = std::stoul(cliArgs.at(0));
  35. numConcurrentThreads = std::stoul(cliArgs.at(1));
  36. numTestRounds = std::stoul(cliArgs.at(2));
  37. }
  38. std::uniform_real_distribution<double> rngdist{-1.0, 1.0};
  39. std::vector<std::vector<double>> matBlock(numConcurrentThreads);
  40. std::vector<std::vector<double>> vecBlock(numConcurrentThreads*2);
  41. std::vector<std::future<void>> futureBlock(numConcurrentThreads);
  42. std::cout<<"*----------------------------*\n";
  43. std::cout<<"| DGEMV thread safety tester |\n";
  44. std::cout<<"*----------------------------*\n";
  45. std::cout<<"Size of random matrices and vectors(N=M): "<<randomMatSize<<'\n';
  46. std::cout<<"Number of concurrent calls into OpenBLAS : "<<numConcurrentThreads<<'\n';
  47. std::cout<<"Number of testing rounds : "<<numTestRounds<<'\n';
  48. std::cout<<"This test will need "<<((static_cast<uint64_t>(randomMatSize*randomMatSize)*numConcurrentThreads*8)+(static_cast<uint64_t>(randomMatSize)*numConcurrentThreads*8*2))/static_cast<double>(1024*1024)<<" MiB of RAM\n"<<std::endl;
  49. FailIfThreadsAreZero(numConcurrentThreads);
  50. std::cout<<"Initializing random number generator..."<<std::flush;
  51. std::mt19937_64 PRNG = InitPRNG();
  52. std::cout<<"done\n";
  53. std::cout<<"Preparing to test CBLAS DGEMV thread safety\n";
  54. std::cout<<"Allocating matrices..."<<std::flush;
  55. for(uint32_t i=0; i<numConcurrentThreads; i++)
  56. {
  57. matBlock.at(i).resize(randomMatSize*randomMatSize);
  58. }
  59. std::cout<<"done\n";
  60. std::cout<<"Allocating vectors..."<<std::flush;
  61. for(uint32_t i=0; i<(numConcurrentThreads*2); i++)
  62. {
  63. vecBlock.at(i).resize(randomMatSize);
  64. }
  65. std::cout<<"done\n";
  66. //pauser();
  67. std::cout<<"Filling matrices with random numbers..."<<std::flush;
  68. FillMatrices(matBlock, PRNG, rngdist, randomMatSize, numConcurrentThreads, 1);
  69. //PrintMatrices(matBlock, randomMatSize, numConcurrentThreads);
  70. std::cout<<"done\n";
  71. std::cout<<"Filling vectors with random numbers..."<<std::flush;
  72. FillVectors(vecBlock, PRNG, rngdist, randomMatSize, numConcurrentThreads, 2);
  73. std::cout<<"done\n";
  74. std::cout<<"Testing CBLAS DGEMV thread safety"<<std::endl;
  75. omp_set_num_threads(numConcurrentThreads);
  76. for(uint32_t R=0; R<numTestRounds; R++)
  77. {
  78. std::cout<<"DGEMV round #"<<R<<std::endl;
  79. std::cout<<"Launching "<<numConcurrentThreads<<" threads simultaneously using OpenMP..."<<std::flush;
  80. #pragma omp parallel for default(none) shared(futureBlock, matBlock, vecBlock, randomMatSize, numConcurrentThreads)
  81. for(uint32_t i=0; i<numConcurrentThreads; i++)
  82. {
  83. futureBlock[i] = std::async(std::launch::async, launch_cblas_dgemv, &matBlock[i][0], &vecBlock[i*2][0], &vecBlock[i*2+1][0], randomMatSize);
  84. }
  85. std::cout<<"done\n";
  86. std::cout<<"Waiting for threads to finish..."<<std::flush;
  87. for(uint32_t i=0; i<numConcurrentThreads; i++)
  88. {
  89. futureBlock[i].get();
  90. }
  91. std::cout<<"done\n";
  92. std::cout<<"Comparing results from different threads..."<<std::flush;
  93. for(uint32_t i=2; i<(numConcurrentThreads*2); i+=2){ //i is the index of vector x, for a given thread
  94. for(uint32_t j = 0; j < static_cast<uint32_t>(randomMatSize); j++)
  95. {
  96. if (std::abs(vecBlock[i+1][j] - vecBlock[1][j]) > 1.0E-13){ //i+1 is the index of vector y, for a given thread
  97. std::cout<<"ERROR: one of the threads returned a different result! Index : "<<i+1<<std::endl;
  98. std::cout<<"CBLAS DGEMV thread safety test FAILED!"<<std::endl;
  99. return -1;
  100. }
  101. }
  102. }
  103. std::cout<<"OK!\n"<<std::endl;
  104. }
  105. std::cout<<"CBLAS DGEMV thread safety test PASSED!\n"<<std::endl;
  106. return 0;
  107. }