BaseBenchmark.cpp 9.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371
  1. /*
  2. * Copyright 2014-present Facebook, Inc.
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include <atomic>
  17. #include <glog/logging.h>
  18. #include <folly/Benchmark.h>
  19. #include <folly/gen/Base.h>
  20. using namespace folly::gen;
  21. using folly::fbstring;
  22. using std::pair;
  23. using std::set;
  24. using std::tuple;
  25. using std::vector;
  26. static std::atomic<int> testSize(1000);
  27. // clang-format off
  28. static vector<int> testVector =
  29. seq(1, testSize.load())
  30. | mapped([](int) { return rand(); })
  31. | as<vector>();
  32. static vector<vector<int>> testVectorVector =
  33. seq(1, 100)
  34. | map([](int i) {
  35. return seq(1, i) | as<vector>();
  36. })
  37. | as<vector>();
  38. static vector<fbstring> strings =
  39. from(testVector)
  40. | eachTo<fbstring>()
  41. | as<vector>();
  42. // clang-format on
  43. auto square = [](int x) { return x * x; };
  44. BENCHMARK(Sum_Basic_NoGen, iters) {
  45. int limit = testSize.load();
  46. int s = 0;
  47. while (iters--) {
  48. for (int i = 0; i < limit; ++i) {
  49. s += i;
  50. }
  51. }
  52. folly::doNotOptimizeAway(s);
  53. }
  54. BENCHMARK_RELATIVE(Sum_Basic_Gen, iters) {
  55. int limit = testSize.load();
  56. int s = 0;
  57. while (iters--) {
  58. s += range(0, limit) | sum;
  59. }
  60. folly::doNotOptimizeAway(s);
  61. }
  62. BENCHMARK_DRAW_LINE();
  63. BENCHMARK(Sum_Vector_NoGen, iters) {
  64. int s = 0;
  65. while (iters--) {
  66. for (auto& i : testVector) {
  67. s += i;
  68. }
  69. }
  70. folly::doNotOptimizeAway(s);
  71. }
  72. BENCHMARK_RELATIVE(Sum_Vector_Gen, iters) {
  73. int s = 0;
  74. while (iters--) {
  75. s += from(testVector) | sum;
  76. }
  77. folly::doNotOptimizeAway(s);
  78. }
  79. BENCHMARK_DRAW_LINE();
  80. BENCHMARK(Member, iters) {
  81. int s = 0;
  82. while (iters--) {
  83. // clang-format off
  84. s += from(strings)
  85. | member(&fbstring::size)
  86. | sum;
  87. // clang-format on
  88. }
  89. folly::doNotOptimizeAway(s);
  90. }
  91. BENCHMARK_RELATIVE(MapMember, iters) {
  92. int s = 0;
  93. while (iters--) {
  94. // clang-format off
  95. s += from(strings)
  96. | map([](const fbstring& x) { return x.size(); })
  97. | sum;
  98. // clang-format on
  99. }
  100. folly::doNotOptimizeAway(s);
  101. }
  102. BENCHMARK_DRAW_LINE();
  103. BENCHMARK(Count_Vector_NoGen, iters) {
  104. int s = 0;
  105. while (iters--) {
  106. for (auto& i : testVector) {
  107. if (i * 2 < rand()) {
  108. ++s;
  109. }
  110. }
  111. }
  112. folly::doNotOptimizeAway(s);
  113. }
  114. BENCHMARK_RELATIVE(Count_Vector_Gen, iters) {
  115. int s = 0;
  116. while (iters--) {
  117. // clang-format off
  118. s += from(testVector)
  119. | filter([](int i) {
  120. return i * 2 < rand();
  121. })
  122. | count;
  123. // clang-format on
  124. }
  125. folly::doNotOptimizeAway(s);
  126. }
  127. BENCHMARK_DRAW_LINE();
  128. BENCHMARK(Fib_Sum_NoGen, iters) {
  129. int s = 0;
  130. while (iters--) {
  131. auto fib = [](size_t limit) -> vector<int> {
  132. vector<int> ret;
  133. int a = 0;
  134. int b = 1;
  135. for (size_t i = 0; i < limit; i += 2) {
  136. ret.push_back(a += b);
  137. ret.push_back(b += a);
  138. }
  139. return ret;
  140. };
  141. for (auto& v : fib(testSize.load())) {
  142. s += v;
  143. }
  144. }
  145. folly::doNotOptimizeAway(s);
  146. }
  147. BENCHMARK_RELATIVE(Fib_Sum_Gen, iters) {
  148. int s = 0;
  149. while (iters--) {
  150. auto fib = GENERATOR(int) {
  151. int a = 0;
  152. int b = 1;
  153. for (;;) {
  154. yield(a += b);
  155. yield(b += a);
  156. }
  157. };
  158. // Early stopping implemented with exceptions.
  159. s += fib | take(testSize.load()) | sum;
  160. }
  161. folly::doNotOptimizeAway(s);
  162. }
  163. BENCHMARK_RELATIVE(Fib_Sum_Gen_Limit, iters) {
  164. int s = 0;
  165. while (iters--) {
  166. size_t limit = testSize.load();
  167. auto fib = GENERATOR(int) {
  168. int a = 0;
  169. int b = 1;
  170. for (size_t i = 0; i < limit; i += 2) {
  171. yield(a += b);
  172. yield(b += a);
  173. }
  174. };
  175. // No early stopping.
  176. s += fib | sum;
  177. }
  178. folly::doNotOptimizeAway(s);
  179. }
  180. struct FibYielder {
  181. template <class Yield>
  182. void operator()(Yield&& yield) const {
  183. int a = 0;
  184. int b = 1;
  185. for (;;) {
  186. yield(a += b);
  187. yield(b += a);
  188. }
  189. }
  190. };
  191. BENCHMARK_RELATIVE(Fib_Sum_Gen_Static, iters) {
  192. int s = 0;
  193. while (iters--) {
  194. auto fib = generator<int>(FibYielder());
  195. s += fib | take(testSize.load()) | sum;
  196. }
  197. folly::doNotOptimizeAway(s);
  198. }
  199. BENCHMARK_DRAW_LINE();
  200. BENCHMARK(VirtualGen_0Virtual, iters) {
  201. int s = 0;
  202. while (iters--) {
  203. auto numbers = seq(1, 10000);
  204. auto squares = numbers | map(square);
  205. auto quads = squares | map(square);
  206. s += quads | sum;
  207. }
  208. folly::doNotOptimizeAway(s);
  209. }
  210. BENCHMARK_RELATIVE(VirtualGen_1Virtual, iters) {
  211. int s = 0;
  212. while (iters--) {
  213. VirtualGen<int> numbers = seq(1, 10000);
  214. auto squares = numbers | map(square);
  215. auto quads = squares | map(square);
  216. s += quads | sum;
  217. }
  218. folly::doNotOptimizeAway(s);
  219. }
  220. BENCHMARK_RELATIVE(VirtualGen_2Virtual, iters) {
  221. int s = 0;
  222. while (iters--) {
  223. VirtualGen<int> numbers = seq(1, 10000);
  224. VirtualGen<int> squares = numbers | map(square);
  225. auto quads = squares | map(square);
  226. s += quads | sum;
  227. }
  228. folly::doNotOptimizeAway(s);
  229. }
  230. BENCHMARK_RELATIVE(VirtualGen_3Virtual, iters) {
  231. int s = 0;
  232. while (iters--) {
  233. VirtualGen<int> numbers = seq(1, 10000);
  234. VirtualGen<int> squares = numbers | map(square);
  235. VirtualGen<int> quads = squares | map(square);
  236. s += quads | sum;
  237. }
  238. folly::doNotOptimizeAway(s);
  239. }
  240. BENCHMARK_DRAW_LINE();
  241. BENCHMARK(Concat_NoGen, iters) {
  242. int s = 0;
  243. while (iters--) {
  244. for (auto& v : testVectorVector) {
  245. for (auto& i : v) {
  246. s += i;
  247. }
  248. }
  249. }
  250. folly::doNotOptimizeAway(s);
  251. }
  252. BENCHMARK_RELATIVE(Concat_Gen, iters) {
  253. int s = 0;
  254. while (iters--) {
  255. s += from(testVectorVector) | rconcat | sum;
  256. }
  257. folly::doNotOptimizeAway(s);
  258. }
  259. BENCHMARK_DRAW_LINE();
  260. BENCHMARK(Composed_NoGen, iters) {
  261. int s = 0;
  262. while (iters--) {
  263. for (auto& i : testVector) {
  264. s += i * i;
  265. }
  266. }
  267. folly::doNotOptimizeAway(s);
  268. }
  269. BENCHMARK_RELATIVE(Composed_Gen, iters) {
  270. int s = 0;
  271. auto sumSq = map(square) | sum;
  272. while (iters--) {
  273. s += from(testVector) | sumSq;
  274. }
  275. folly::doNotOptimizeAway(s);
  276. }
  277. BENCHMARK_RELATIVE(Composed_GenRegular, iters) {
  278. int s = 0;
  279. while (iters--) {
  280. s += from(testVector) | map(square) | sum;
  281. }
  282. folly::doNotOptimizeAway(s);
  283. }
  284. BENCHMARK_DRAW_LINE();
  285. BENCHMARK(Sample, iters) {
  286. size_t s = 0;
  287. while (iters--) {
  288. auto sampler = seq(1, 10 * 1000 * 1000) | sample(1000);
  289. s += (sampler | sum);
  290. }
  291. folly::doNotOptimizeAway(s);
  292. }
  293. // Results from an Intel(R) Xeon(R) CPU E5-2660 0 @ 2.20GHz
  294. // ============================================================================
  295. // folly/gen/test/BaseBenchmark.cpp relative time/iter iters/s
  296. // ============================================================================
  297. // Sum_Basic_NoGen 372.39ns 2.69M
  298. // Sum_Basic_Gen 195.96% 190.03ns 5.26M
  299. // ----------------------------------------------------------------------------
  300. // Sum_Vector_NoGen 200.41ns 4.99M
  301. // Sum_Vector_Gen 77.14% 259.81ns 3.85M
  302. // ----------------------------------------------------------------------------
  303. // Member 4.56us 219.42K
  304. // MapMember 400.47% 1.14us 878.73K
  305. // ----------------------------------------------------------------------------
  306. // Count_Vector_NoGen 13.96us 71.64K
  307. // Count_Vector_Gen 86.05% 16.22us 61.65K
  308. // ----------------------------------------------------------------------------
  309. // Fib_Sum_NoGen 2.21us 452.63K
  310. // Fib_Sum_Gen 23.94% 9.23us 108.36K
  311. // Fib_Sum_Gen_Static 48.77% 4.53us 220.73K
  312. // ----------------------------------------------------------------------------
  313. // VirtualGen_0Virtual 9.60us 104.13K
  314. // VirtualGen_1Virtual 28.00% 34.30us 29.15K
  315. // VirtualGen_2Virtual 22.62% 42.46us 23.55K
  316. // VirtualGen_3Virtual 16.96% 56.64us 17.66K
  317. // ----------------------------------------------------------------------------
  318. // Concat_NoGen 2.20us 453.66K
  319. // Concat_Gen 109.49% 2.01us 496.70K
  320. // ----------------------------------------------------------------------------
  321. // Composed_NoGen 545.32ns 1.83M
  322. // Composed_Gen 87.94% 620.07ns 1.61M
  323. // Composed_GenRegular 88.13% 618.74ns 1.62M
  324. // ----------------------------------------------------------------------------
  325. // Sample 176.48ms 5.67
  326. // ============================================================================
  327. int main(int argc, char* argv[]) {
  328. gflags::ParseCommandLineFlags(&argc, &argv, true);
  329. folly::runBenchmarks();
  330. return 0;
  331. }