ForeachBenchmark.cpp 9.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408
  1. /*
  2. * Copyright 2016-present Facebook, Inc.
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include <algorithm>
  17. #include <map>
  18. #include <folly/Benchmark.h>
  19. #include <folly/Random.h>
  20. #include <folly/container/Enumerate.h>
  21. #include <folly/container/Foreach.h>
  22. #include <folly/init/Init.h>
  23. using namespace folly;
  24. using namespace folly::detail;
  25. // Benchmarks:
  26. // 1. Benchmark iterating through the man with FOR_EACH, and also assign
  27. // iter->first and iter->second to local vars inside the FOR_EACH loop.
  28. // 2. Benchmark iterating through the man with FOR_EACH, but use iter->first and
  29. // iter->second as is, without assigning to local variables.
  30. // 3. Use FOR_EACH_KV loop to iterate through the map.
  31. // For use in benchmarks below.
  32. std::map<int, std::string> bmMap;
  33. std::vector<int> vec_one;
  34. std::vector<int> vec_two;
  35. // Smallest type to isolate iteration overhead.
  36. std::vector<char> vec_char;
  37. void setupBenchmark(size_t iters) {
  38. bmMap.clear();
  39. for (size_t i = 0; i < iters; ++i) {
  40. bmMap[i] = "teststring";
  41. }
  42. vec_one.clear();
  43. vec_two.clear();
  44. vec_one.resize(iters);
  45. vec_two.resize(iters);
  46. }
  47. void setupCharVecBenchmark(size_t iters) {
  48. vec_char.resize(iters);
  49. std::generate(
  50. vec_char.begin(), vec_char.end(), [] { return Random::rand32(128); });
  51. }
  52. BENCHMARK(ForEachFunctionNoAssign, iters) {
  53. BenchmarkSuspender suspender;
  54. int sumKeys = 0;
  55. std::string sumValues;
  56. setupBenchmark(iters);
  57. suspender.dismissing([&]() {
  58. folly::for_each(bmMap, [&](auto& key_val_pair) {
  59. sumKeys += key_val_pair.first;
  60. sumValues += key_val_pair.second;
  61. });
  62. doNotOptimizeAway(sumKeys);
  63. });
  64. }
  65. BENCHMARK(StdForEachFunctionNoAssign, iters) {
  66. BenchmarkSuspender suspender;
  67. int sumKeys = 0;
  68. std::string sumValues;
  69. setupBenchmark(iters);
  70. suspender.dismissing([&]() {
  71. std::for_each(bmMap.begin(), bmMap.end(), [&](auto& key_val_pair) {
  72. sumKeys += key_val_pair.first;
  73. sumValues += key_val_pair.second;
  74. });
  75. doNotOptimizeAway(sumKeys);
  76. });
  77. }
  78. BENCHMARK(RangeBasedForLoopNoAssign, iters) {
  79. BenchmarkSuspender suspender;
  80. int sumKeys = 0;
  81. std::string sumValues;
  82. setupBenchmark(iters);
  83. suspender.dismissing([&]() {
  84. for (auto& key_val_pair : bmMap) {
  85. sumKeys += key_val_pair.first;
  86. sumValues += key_val_pair.second;
  87. }
  88. doNotOptimizeAway(sumKeys);
  89. });
  90. }
  91. BENCHMARK(ManualLoopNoAssign, iters) {
  92. BenchmarkSuspender suspender;
  93. int sumKeys = 0;
  94. std::string sumValues;
  95. setupBenchmark(iters);
  96. suspender.dismissing([&]() {
  97. for (auto iter = bmMap.begin(); iter != bmMap.end(); ++iter) {
  98. sumKeys += iter->first;
  99. sumValues += iter->second;
  100. }
  101. doNotOptimizeAway(sumKeys);
  102. });
  103. }
  104. BENCHMARK(ForEachFunctionAssign, iters) {
  105. BenchmarkSuspender suspender;
  106. int sumKeys = 0;
  107. std::string sumValues;
  108. setupBenchmark(iters);
  109. suspender.dismissing([&]() {
  110. folly::for_each(bmMap, [&](auto& key_val_pair) {
  111. const int k = key_val_pair.first;
  112. const std::string v = key_val_pair.second;
  113. sumKeys += k;
  114. sumValues += v;
  115. });
  116. });
  117. }
  118. BENCHMARK(StdForEachFunctionAssign, iters) {
  119. BenchmarkSuspender suspender;
  120. int sumKeys = 0;
  121. std::string sumValues;
  122. setupBenchmark(iters);
  123. suspender.dismissing([&]() {
  124. std::for_each(bmMap.begin(), bmMap.end(), [&](auto& key_val_pair) {
  125. const int k = key_val_pair.first;
  126. const std::string v = key_val_pair.second;
  127. sumKeys += k;
  128. sumValues += v;
  129. });
  130. });
  131. }
  132. BENCHMARK(RangeBasedForLoopAssign, iters) {
  133. BenchmarkSuspender suspender;
  134. int sumKeys = 0;
  135. std::string sumValues;
  136. setupBenchmark(iters);
  137. suspender.dismissing([&]() {
  138. for (auto& key_val_pair : bmMap) {
  139. const int k = key_val_pair.first;
  140. const std::string v = key_val_pair.second;
  141. sumKeys += k;
  142. sumValues += v;
  143. }
  144. });
  145. }
  146. BENCHMARK(ManualLoopAssign, iters) {
  147. BenchmarkSuspender suspender;
  148. int sumKeys = 0;
  149. std::string sumValues;
  150. setupBenchmark(iters);
  151. suspender.dismissing([&]() {
  152. for (auto iter = bmMap.begin(); iter != bmMap.end(); ++iter) {
  153. const int k = iter->first;
  154. const std::string v = iter->second;
  155. sumKeys += k;
  156. sumValues += v;
  157. }
  158. });
  159. }
  160. BENCHMARK(ForEachFunctionNoAssignWithIndexManipulation, iters) {
  161. BenchmarkSuspender suspender;
  162. int sumKeys = 0;
  163. std::string sumValues;
  164. setupBenchmark(iters);
  165. suspender.dismissing([&]() {
  166. folly::for_each(bmMap, [&](auto& key_val_pair, auto index) {
  167. sumKeys += key_val_pair.first;
  168. sumValues += key_val_pair.second;
  169. sumValues += index;
  170. });
  171. });
  172. }
  173. BENCHMARK(StdForEachFunctionNoAssignWithIndexManipulation, iters) {
  174. BenchmarkSuspender suspender;
  175. int sumKeys = 0;
  176. std::string sumValues;
  177. setupBenchmark(iters);
  178. suspender.dismissing([&]() {
  179. auto index = std::size_t{0};
  180. std::for_each(bmMap.begin(), bmMap.end(), [&](auto& key_val_pair) {
  181. sumKeys += key_val_pair.first;
  182. sumValues += key_val_pair.second;
  183. sumValues += index;
  184. ++index;
  185. });
  186. });
  187. }
  188. BENCHMARK(RangeBasedForLoopNoAssignWithIndexManipulation, iters) {
  189. BenchmarkSuspender suspender;
  190. int sumKeys = 0;
  191. std::string sumValues;
  192. setupBenchmark(iters);
  193. suspender.dismissing([&]() {
  194. auto index = std::size_t{0};
  195. for (auto& key_val_pair : bmMap) {
  196. sumKeys += key_val_pair.first;
  197. sumValues += key_val_pair.second;
  198. sumValues += index;
  199. }
  200. });
  201. }
  202. BENCHMARK(ForEachFunctionFetch, iters) {
  203. BenchmarkSuspender suspender;
  204. setupBenchmark(iters);
  205. suspender.dismissing([&]() {
  206. folly::for_each(bmMap, [&](auto& key_val_pair, auto index) {
  207. folly::fetch(vec_one, index) = key_val_pair.first;
  208. });
  209. });
  210. }
  211. BENCHMARK(StdForEachFunctionFetch, iters) {
  212. BenchmarkSuspender suspender;
  213. setupBenchmark(iters);
  214. suspender.dismissing([&]() {
  215. auto index = std::size_t{0};
  216. std::for_each(bmMap.begin(), bmMap.end(), [&](auto& key_val_pair) {
  217. *(vec_one.begin() + index++) = key_val_pair.first;
  218. });
  219. });
  220. }
  221. BENCHMARK(ForLoopFetch, iters) {
  222. BenchmarkSuspender suspender;
  223. setupBenchmark(iters);
  224. suspender.dismissing([&]() {
  225. auto index = std::size_t{0};
  226. for (auto& key_val_pair : bmMap) {
  227. *(vec_one.begin() + index++) = key_val_pair.first;
  228. }
  229. });
  230. }
  231. BENCHMARK(ForEachKVNoMacroAssign, iters) {
  232. int sumKeys = 0;
  233. std::string sumValues;
  234. BENCHMARK_SUSPEND {
  235. setupBenchmark(iters);
  236. }
  237. FOR_EACH (iter, bmMap) {
  238. const int k = iter->first;
  239. const std::string v = iter->second;
  240. sumKeys += k;
  241. sumValues += v;
  242. }
  243. }
  244. BENCHMARK(ForEachKVNoMacroNoAssign, iters) {
  245. int sumKeys = 0;
  246. std::string sumValues;
  247. BENCHMARK_SUSPEND {
  248. setupBenchmark(iters);
  249. }
  250. FOR_EACH (iter, bmMap) {
  251. sumKeys += iter->first;
  252. sumValues += iter->second;
  253. }
  254. }
  255. BENCHMARK(ForEachKVMacro, iters) {
  256. int sumKeys = 0;
  257. std::string sumValues;
  258. BENCHMARK_SUSPEND {
  259. setupBenchmark(iters);
  260. }
  261. FOR_EACH_KV (k, v, bmMap) {
  262. sumKeys += k;
  263. sumValues += v;
  264. }
  265. }
  266. BENCHMARK(ForEachManual, iters) {
  267. int sum = 1;
  268. for (size_t i = 1; i < iters; ++i) {
  269. sum *= i;
  270. }
  271. doNotOptimizeAway(sum);
  272. }
  273. BENCHMARK(ForEachRange, iters) {
  274. int sum = 1;
  275. FOR_EACH_RANGE (i, 1, iters) { sum *= i; }
  276. doNotOptimizeAway(sum);
  277. }
  278. BENCHMARK(ForEachDescendingManual, iters) {
  279. int sum = 1;
  280. for (size_t i = iters; i-- > 1;) {
  281. sum *= i;
  282. }
  283. doNotOptimizeAway(sum);
  284. }
  285. BENCHMARK(ForEachRangeR, iters) {
  286. int sum = 1;
  287. FOR_EACH_RANGE_R (i, 1U, iters) { sum *= i; }
  288. doNotOptimizeAway(sum);
  289. }
  290. BENCHMARK(CharVecForRange, iters) {
  291. BENCHMARK_SUSPEND {
  292. setupCharVecBenchmark(iters);
  293. }
  294. size_t sum = 0;
  295. for (auto& c : vec_char) {
  296. sum += c;
  297. }
  298. doNotOptimizeAway(sum);
  299. }
  300. BENCHMARK(CharVecForRangeExplicitIndex, iters) {
  301. BENCHMARK_SUSPEND {
  302. setupCharVecBenchmark(iters);
  303. }
  304. size_t sum = 0;
  305. size_t index = 0;
  306. for (auto& c : vec_char) {
  307. sum += c * index;
  308. ++index;
  309. }
  310. doNotOptimizeAway(sum);
  311. }
  312. BENCHMARK(CharVecForEach, iters) {
  313. BENCHMARK_SUSPEND {
  314. setupCharVecBenchmark(iters);
  315. }
  316. size_t sum = 0;
  317. folly::for_each(vec_char, [&](auto& c) { sum += c; });
  318. doNotOptimizeAway(sum);
  319. }
  320. BENCHMARK(CharVecForEachIndex, iters) {
  321. BENCHMARK_SUSPEND {
  322. setupCharVecBenchmark(iters);
  323. }
  324. size_t sum = 0;
  325. folly::for_each(vec_char, [&](auto& c, auto index) { sum += c * index; });
  326. doNotOptimizeAway(sum);
  327. }
  328. BENCHMARK(CharVecForRangeEnumerate, iters) {
  329. BENCHMARK_SUSPEND {
  330. setupCharVecBenchmark(iters);
  331. }
  332. size_t sum = 0;
  333. for (auto&& it : enumerate(vec_char)) {
  334. sum += *it * it.index;
  335. }
  336. doNotOptimizeAway(sum);
  337. }
  338. int main(int argc, char** argv) {
  339. folly::init(&argc, &argv);
  340. runBenchmarks();
  341. return 0;
  342. }