speed-test.cc 9.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237
  1. //**********************************************************************************//
  2. // Copyright (C) 2009-2015 Ovidio Pena <ovidio@bytesfall.com> //
  3. // Copyright (C) 2013-2015 Konstantin Ladutenko <kostyfisik@gmail.com> //
  4. // //
  5. // This file is part of scattnlay //
  6. // //
  7. // This program is free software: you can redistribute it and/or modify //
  8. // it under the terms of the GNU General Public License as published by //
  9. // the Free Software Foundation, either version 3 of the License, or //
  10. // (at your option) any later version. //
  11. // //
  12. // This program is distributed in the hope that it will be useful, //
  13. // but WITHOUT ANY WARRANTY; without even the implied warranty of //
  14. // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the //
  15. // GNU General Public License for more details. //
  16. // //
  17. // The only additional remark is that we expect that all publications //
  18. // describing work using this software, or all commercial products //
  19. // using it, cite the following reference: //
  20. // [1] O. Pena and U. Pal, "Scattering of electromagnetic radiation by //
  21. // a multilayered sphere," Computer Physics Communications, //
  22. // vol. 180, Nov. 2009, pp. 2348-2354. //
  23. // //
  24. // You should have received a copy of the GNU General Public License //
  25. // along with this program. If not, see <http://www.gnu.org/licenses/>. //
  26. //**********************************************************************************//
  27. #include <algorithm>
  28. #include <complex>
  29. #include <functional>
  30. #include <iostream>
  31. #include <stdexcept>
  32. #include <string>
  33. #include <vector>
  34. #include <stdlib.h>
  35. #include <stdio.h>
  36. #include <time.h>
  37. #include <string.h>
  38. //sudo aptitude install libgoogle-perftools-dev
  39. //#include <google/heap-profiler.h>
  40. #include "../../src/nmie.h"
  41. timespec diff(timespec start, timespec end);
  42. const double PI=3.14159265358979323846;
  43. template<class T> inline T pow2(const T value) {return value*value;}
  44. //***********************************************************************************//
  45. // This is the main function of 'scattnlay', here we read the parameters as //
  46. // arguments passed to the program which should be executed with the following //
  47. // syntaxis: //
  48. // ./scattnlay -l Layers x1 m1.r m1.i [x2 m2.r m2.i ...] [-t ti tf nt] [-c comment] //
  49. // //
  50. // When all the parameters were correctly passed we setup the integer L (the //
  51. // number of layers) and the arrays x and m, containing the size parameters and //
  52. // refractive indexes of the layers, respectively and call the function nMie. //
  53. // If the calculation is successful the results are printed with the following //
  54. // format: //
  55. // //
  56. // * If no comment was passed: //
  57. // 'Qext, Qsca, Qabs, Qbk, Qpr, g, Albedo' //
  58. // //
  59. // * If a comment was passed: //
  60. // 'comment, Qext, Qsca, Qabs, Qbk, Qpr, g, Albedo' //
  61. //***********************************************************************************//
  62. int main(int argc, char *argv[]) {
  63. try {
  64. std::vector<std::string> args;
  65. args.assign(argv, argv + argc);
  66. std::string error_msg(std::string("Insufficient parameters.\nUsage: ") + args[0]
  67. + " -l Layers x1 m1.r m1.i [x2 m2.r m2.i ...] "
  68. + "[-t ti tf nt] [-c comment]\n");
  69. enum mode_states {read_L, read_x, read_mr, read_mi, read_ti, read_tf, read_nt, read_comment};
  70. // for (auto arg : args) std::cout<< arg <<std::endl;
  71. std::string comment;
  72. int has_comment = 0;
  73. int i, l, L = 0;
  74. std::vector<double> x, Theta;
  75. std::vector<std::complex<double> > m, S1, S2;
  76. double Qext, Qabs, Qsca, Qbk, Qpr, g, Albedo;
  77. std::vector<std::complex<double> > mw, S1w, S2w;
  78. double Qextw, Qabsw, Qscaw, Qbkw, Qprw, gw, Albedow;
  79. double ti = 0.0, tf = 90.0;
  80. int nt = 0;
  81. if (argc < 5) throw std::invalid_argument(error_msg);
  82. //strcpy(comment, "");
  83. // for (i = 1; i < argc; i++) {
  84. int mode = -1;
  85. double tmp_mr;
  86. for (auto arg : args) {
  87. // For each arg in args list we detect the change of the current
  88. // read mode or read the arg. The reading args algorithm works
  89. // as a finite-state machine.
  90. // Detecting new read mode (if it is a valid -key)
  91. if (arg == "-l") {
  92. mode = read_L;
  93. continue;
  94. }
  95. if (arg == "-t") {
  96. if ((mode != read_x) && (mode != read_comment))
  97. throw std::invalid_argument(std::string("Unfinished layer!\n")
  98. +error_msg);
  99. mode = read_ti;
  100. continue;
  101. }
  102. if (arg == "-c") {
  103. if ((mode != read_x) && (mode != read_nt))
  104. throw std::invalid_argument(std::string("Unfinished layer or theta!\n") + error_msg);
  105. mode = read_comment;
  106. continue;
  107. }
  108. // Reading data. For invalid date the exception will be thrown
  109. // with the std:: and catched in the end.
  110. if (mode == read_L) {
  111. L = std::stoi(arg);
  112. mode = read_x;
  113. continue;
  114. }
  115. if (mode == read_x) {
  116. x.push_back(std::stod(arg));
  117. mode = read_mr;
  118. continue;
  119. }
  120. if (mode == read_mr) {
  121. tmp_mr = std::stod(arg);
  122. mode = read_mi;
  123. continue;
  124. }
  125. if (mode == read_mi) {
  126. m.push_back(std::complex<double>( tmp_mr,std::stod(arg) ));
  127. mode = read_x;
  128. continue;
  129. }
  130. if (mode == read_ti) {
  131. ti = std::stod(arg);
  132. mode = read_tf;
  133. continue;
  134. }
  135. if (mode == read_tf) {
  136. tf = std::stod(arg);
  137. mode = read_nt;
  138. continue;
  139. }
  140. if (mode == read_nt) {
  141. nt = std::stoi(arg);
  142. Theta.resize(nt);
  143. S1.resize(nt);
  144. S2.resize(nt);
  145. S1w.resize(nt);
  146. S2w.resize(nt);
  147. continue;
  148. }
  149. if (mode == read_comment) {
  150. comment = arg;
  151. has_comment = 1;
  152. continue;
  153. }
  154. }
  155. if ( (x.size() != m.size()) || (L != x.size()) )
  156. throw std::invalid_argument(std::string("Broken structure!\n")
  157. +error_msg);
  158. if ( (0 == m.size()) || ( 0 == x.size()) )
  159. throw std::invalid_argument(std::string("Empty structure!\n")
  160. +error_msg);
  161. if (nt < 0) {
  162. printf("Error reading Theta.\n");
  163. return -1;
  164. } else if (nt == 1) {
  165. Theta[0] = ti*PI/180.0;
  166. } else {
  167. for (i = 0; i < nt; i++) {
  168. Theta[i] = (ti + (double)i*(tf - ti)/(nt - 1))*PI/180.0;
  169. }
  170. }
  171. timespec time1, time2;
  172. long cpptime_nsec, best_cpp;
  173. long ctime_nsec, best_c;
  174. long cpptime_sec, ctime_sec;
  175. long repeats = 150;
  176. //HeapProfilerStart("heapprof");
  177. do {
  178. clock_gettime(CLOCK_PROCESS_CPUTIME_ID, &time1);
  179. for (int i = 0; i<repeats; ++i) {
  180. nmie::nMie(L, x, m, nt, Theta, &Qextw, &Qscaw,
  181. &Qabsw, &Qbkw, &Qprw, &gw, &Albedow, S1w, S2w);
  182. }
  183. clock_gettime(CLOCK_PROCESS_CPUTIME_ID, &time2);
  184. cpptime_nsec = diff(time1,time2).tv_nsec;
  185. cpptime_sec = diff(time1,time2).tv_sec;
  186. printf("-- C++ time consumed %lg sec\n", (cpptime_nsec/1e9));
  187. repeats *= 10;
  188. } while (cpptime_nsec < 1e8 && ctime_nsec < 1e8);
  189. printf("\n");
  190. if (has_comment) {
  191. printf("%6s, %+.5e, %+.5e, %+.5e, %+.5e, %+.5e, %+.5e, %+.5e \n", comment.c_str(), Qextw, Qscaw, Qabsw, Qbkw, Qprw, gw, Albedow);
  192. } else {
  193. printf("%+.5e, %+.5e, %+.5e, %+.5e, %+.5e, %+.5e, %+.5e \n", Qextw, Qscaw, Qabsw, Qbkw, Qprw, gw, Albedow);
  194. }
  195. if (nt > 0) {
  196. printf(" Theta, S1.r, S1.i, S2.r, S2.i\n");
  197. for (i = 0; i < nt; i++) {
  198. printf("%6.2f, %+.5e, %+.5e, %+.5e, %+.5e \n", Theta[i]*180.0/PI, S1w[i].real(), S1w[i].imag(), S2w[i].real(), S2w[i].imag());
  199. }
  200. }
  201. } catch( const std::invalid_argument& ia ) {
  202. // Will catch if multi_layer_mie fails or other errors.
  203. std::cerr << "Invalid argument: " << ia.what() << std::endl;
  204. return -1;
  205. }
  206. return 0;
  207. }
  208. timespec diff(timespec start, timespec end)
  209. {
  210. timespec temp;
  211. if ((end.tv_nsec-start.tv_nsec)<0) {
  212. temp.tv_sec = end.tv_sec-start.tv_sec-1;
  213. temp.tv_nsec = 1000000000+end.tv_nsec-start.tv_nsec;
  214. } else {
  215. temp.tv_sec = end.tv_sec-start.tv_sec;
  216. temp.tv_nsec = end.tv_nsec-start.tv_nsec;
  217. }
  218. return temp;
  219. }