tbb_profiling.h 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355
  1. /*
  2. Copyright (c) 2005-2020 Intel Corporation
  3. Licensed under the Apache License, Version 2.0 (the "License");
  4. you may not use this file except in compliance with the License.
  5. You may obtain a copy of the License at
  6. http://www.apache.org/licenses/LICENSE-2.0
  7. Unless required by applicable law or agreed to in writing, software
  8. distributed under the License is distributed on an "AS IS" BASIS,
  9. WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. See the License for the specific language governing permissions and
  11. limitations under the License.
  12. */
  13. #ifndef __TBB_profiling_H
  14. #define __TBB_profiling_H
  15. #define __TBB_tbb_profiling_H_include_area
  16. #include "internal/_warning_suppress_enable_notice.h"
  17. namespace tbb {
  18. namespace internal {
  19. // include list of index names
  // X-macro pattern: TBB_STRING_RESOURCE(index_name,str) is defined to expand to "index_name,"
  // only for the duration of the #include below, so each TBB_STRING_RESOURCE entry supplied by
  // internal/_tbb_strings.h (contents not visible here) becomes one enumerator of string_index.
  20. #define TBB_STRING_RESOURCE(index_name,str) index_name,
  21. enum string_index {
  22. #include "internal/_tbb_strings.h"
  // Declared after the included entries, so its value follows the last of them.
  23. NUM_STRINGS
  24. };
  // The helper macro is removed again so it does not leak to code that includes this header.
  25. #undef TBB_STRING_RESOURCE
  //! Kinds of relation between two objects "A" and "B", as accepted by itt_relation_add.
  /** The numeric values are spelled out; they are the same values the implicit
      numbering (starting at 0) would assign. **/
  enum itt_relation
  {
      __itt_relation_is_unknown         = 0,
      /** "A is dependent on B" means that A cannot start until B completes */
      __itt_relation_is_dependent_on    = 1,
      /** "A is sibling of B" means that A and B were created as a group */
      __itt_relation_is_sibling_of      = 2,
      /** "A is parent of B" means that A created B */
      __itt_relation_is_parent_of       = 3,
      /** "A is continuation of B" means that A assumes the dependencies of B */
      __itt_relation_is_continuation_of = 4,
      /** "A is child of B" means that A was created by B (inverse of is_parent_of) */
      __itt_relation_is_child_of        = 5,
      /** "A is continued by B" means that B assumes the dependencies of A (inverse of is_continuation_of) */
      __itt_relation_is_continued_by    = 6,
      /** "A is predecessor to B" means that B cannot start until A completes (inverse of is_dependent_on) */
      __itt_relation_is_predecessor_to  = 7
  };
  37. }
  38. }
  39. // Check if the tools support is enabled
  40. #if (_WIN32||_WIN64||__linux__) && !__MINGW32__ && TBB_USE_THREADING_TOOLS
  41. #if _WIN32||_WIN64
  42. #include <stdlib.h> /* mbstowcs_s */
  43. #endif
  44. #include "tbb_stddef.h"
  45. namespace tbb {
  46. namespace internal {
  47. #if _WIN32||_WIN64
  48. void __TBB_EXPORTED_FUNC itt_set_sync_name_v3( void *obj, const wchar_t* name );
  //! Converts the multibyte string mbs into wide characters.
  /** @param wcs     destination buffer, or NULL to only measure the required size
      @param mbs     null-terminated multibyte source string
      @param bufsize capacity of wcs in wide characters (ignored by the measuring call)
      @return number of wide characters including the null terminator, or 0 when the
              string cannot be converted or when wcs is non-NULL but has no capacity.
      A non-NULL wcs with bufsize>0 is always left null-terminated. **/
  inline size_t multibyte_to_widechar( wchar_t* wcs, const char* mbs, size_t bufsize) {
      // A real destination with zero capacity cannot even hold the terminator: never write to it.
      // (It would also trip the parameter validation of mbstowcs_s.)
      if( wcs && bufsize==0 )
          return 0;
  #if _MSC_VER>=1400
      size_t len = 0; // stays 0 if mbstowcs_s bails out before reporting a length
      mbstowcs_s( &len, wcs, bufsize, mbs, _TRUNCATE );
      return len; // mbstowcs_s counts null terminator
  #else
      size_t len = mbstowcs( wcs, mbs, bufsize );
      if( len==size_t(-1) ) {
          // Invalid multibyte sequence: hand back an empty string rather than unterminated data.
          if( wcs )
              wcs[0] = wchar_t('\0');
          return 0;
      }
      if( wcs )
          wcs[len<bufsize-1? len: bufsize-1] = wchar_t('\0'); // terminate, truncating if the buffer is full
      return len+1; // mbstowcs does not count null terminator
  #endif
  }
  61. #else
  62. void __TBB_EXPORTED_FUNC itt_set_sync_name_v3( void *obj, const char* name );
  63. #endif
  64. } // namespace internal
  65. } // namespace tbb
  66. //! Macro __TBB_DEFINE_PROFILING_SET_NAME(T) defines "set_name" methods for sync objects of type T
  67. /** Should be used in the "tbb" namespace only.
  68. Don't place semicolon after it to avoid compiler warnings. **/
  69. #if _WIN32||_WIN64
  /* Windows variant with tools support: defines profiling::set_name for wide and for
     multibyte names. The multibyte overload converts the name to wide characters first;
     a name that cannot be converted (reported length 0) is ignored instead of handing an
     empty, unterminated buffer to the tools. */
  #define __TBB_DEFINE_PROFILING_SET_NAME(sync_object_type) \
      namespace profiling { \
          inline void set_name( sync_object_type& obj, const wchar_t* name ) { \
              tbb::internal::itt_set_sync_name_v3( &obj, name ); \
          } \
          inline void set_name( sync_object_type& obj, const char* name ) { \
              /* First call only measures: the result includes the null terminator. */ \
              size_t len = tbb::internal::multibyte_to_widechar(NULL, name, 0); \
              /* Zero means the conversion failed; there is nothing valid to pass on. */ \
              if( len == 0 ) return; \
              wchar_t *wname = new wchar_t[len]; \
              tbb::internal::multibyte_to_widechar(wname, name, len); \
              set_name( obj, wname ); \
              delete[] wname; \
          } \
      }
  83. #else /* !WIN */
  // Non-Windows variant with tools support: defines profiling::set_name( obj, name ), which
  // passes the address of obj and the name pointer unchanged to
  // tbb::internal::itt_set_sync_name_v3. Only a const char* overload exists in this variant.
  84. #define __TBB_DEFINE_PROFILING_SET_NAME(sync_object_type) \
  85. namespace profiling { \
  86. inline void set_name( sync_object_type& obj, const char* name ) { \
  87. tbb::internal::itt_set_sync_name_v3( &obj, name ); \
  88. } \
  89. }
  90. #endif /* !WIN */
  91. #else /* no tools support */
  92. #if _WIN32||_WIN64
  // Windows variant without tools support: both set_name overloads (wide and multibyte name)
  // are defined with empty bodies, so code calling profiling::set_name still compiles.
  93. #define __TBB_DEFINE_PROFILING_SET_NAME(sync_object_type) \
  94. namespace profiling { \
  95. inline void set_name( sync_object_type&, const wchar_t* ) {} \
  96. inline void set_name( sync_object_type&, const char* ) {} \
  97. }
  98. #else /* !WIN */
  // Non-Windows variant without tools support: set_name is defined with an empty body,
  // so code calling profiling::set_name still compiles.
  99. #define __TBB_DEFINE_PROFILING_SET_NAME(sync_object_type) \
  100. namespace profiling { \
  101. inline void set_name( sync_object_type&, const char* ) {} \
  102. }
  103. #endif /* !WIN */
  104. #endif /* no tools support */
  105. #include "atomic.h"
  106. // Need these to work regardless of tools support
  107. namespace tbb {
  108. namespace internal {
  //! Notification kinds; the call_itt_notify wrapper in this header converts them to int for call_itt_notify_v5.
  109. enum notify_type {prepare=0, cancel, acquired, releasing};
  110. const uintptr_t NUM_NOTIFY_TYPES = 4; // set to # elements in enum above
  // Exported entry points. Only the declarations appear in this header; the version
  // suffixes (_v3, _v5, _v7, _v9, _v11) are part of the exported names.
  111. void __TBB_EXPORTED_FUNC call_itt_notify_v5(int t, void *ptr);
  112. void __TBB_EXPORTED_FUNC itt_store_pointer_with_release_v3(void *dst, void *src);
  113. void* __TBB_EXPORTED_FUNC itt_load_pointer_with_acquire_v3(const void *src);
  114. void* __TBB_EXPORTED_FUNC itt_load_pointer_v3( const void* src );
  //! Domain selector taken by the itt_* functions below; ITT_NUM_DOMAINS evaluates to 3, the number of domains listed before it.
  115. enum itt_domain_enum { ITT_DOMAIN_FLOW=0, ITT_DOMAIN_MAIN=1, ITT_DOMAIN_ALGO=2, ITT_NUM_DOMAINS };
  // In the declarations below objects are identified by a (pointer, unsigned long long "extra") pair
  // and names/keys by a string_index value.
  116. void __TBB_EXPORTED_FUNC itt_make_task_group_v7( itt_domain_enum domain, void *group, unsigned long long group_extra,
  117. void *parent, unsigned long long parent_extra, string_index name_index );
  118. void __TBB_EXPORTED_FUNC itt_metadata_str_add_v7( itt_domain_enum domain, void *addr, unsigned long long addr_extra,
  119. string_index key, const char *value );
  120. void __TBB_EXPORTED_FUNC itt_metadata_ptr_add_v11( itt_domain_enum domain, void *addr, unsigned long long addr_extra,
  121. string_index key, void* value );
  122. void __TBB_EXPORTED_FUNC itt_relation_add_v7( itt_domain_enum domain, void *addr0, unsigned long long addr0_extra,
  123. itt_relation relation, void *addr1, unsigned long long addr1_extra );
  124. void __TBB_EXPORTED_FUNC itt_task_begin_v7( itt_domain_enum domain, void *task, unsigned long long task_extra,
  125. void *parent, unsigned long long parent_extra, string_index name_index );
  126. void __TBB_EXPORTED_FUNC itt_task_end_v7( itt_domain_enum domain );
  127. void __TBB_EXPORTED_FUNC itt_region_begin_v9( itt_domain_enum domain, void *region, unsigned long long region_extra,
  128. void *parent, unsigned long long parent_extra, string_index name_index );
  129. void __TBB_EXPORTED_FUNC itt_region_end_v9( itt_domain_enum domain, void *region, unsigned long long region_extra );
  130. // two template arguments are to workaround /Wp64 warning with tbb::atomic specialized for unsigned type
  131. template <typename T, typename U>
  132. inline void itt_store_word_with_release(tbb::atomic<T>& dst, U src) {
  133. #if TBB_USE_THREADING_TOOLS
  134. // This assertion should be replaced with static_assert
  135. __TBB_ASSERT(sizeof(T) == sizeof(void *), "Type must be word-sized.");
  136. itt_store_pointer_with_release_v3(&dst, (void *)uintptr_t(src));
  137. #else
  138. dst = src;
  139. #endif // TBB_USE_THREADING_TOOLS
  140. }
  141. template <typename T>
  142. inline T itt_load_word_with_acquire(const tbb::atomic<T>& src) {
  143. #if TBB_USE_THREADING_TOOLS
  144. // This assertion should be replaced with static_assert
  145. __TBB_ASSERT(sizeof(T) == sizeof(void *), "Type must be word-sized.");
  146. #if defined(_MSC_VER) && !defined(__INTEL_COMPILER)
  147. // Workaround for overzealous compiler warnings
  148. #pragma warning (push)
  149. #pragma warning (disable: 4311)
  150. #endif
  151. T result = (T)itt_load_pointer_with_acquire_v3(&src);
  152. #if defined(_MSC_VER) && !defined(__INTEL_COMPILER)
  153. #pragma warning (pop)
  154. #endif
  155. return result;
  156. #else
  157. return src;
  158. #endif // TBB_USE_THREADING_TOOLS
  159. }
  //! Stores the word-sized value src into dst.
  /** Without tools support the store is done by __TBB_store_with_release; with tools support
      it is routed through itt_store_pointer_with_release_v3. **/
  template <typename T>
  inline void itt_store_word_with_release(T& dst, T src) {
  #if !TBB_USE_THREADING_TOOLS
      __TBB_store_with_release(dst, src);
  #else
      // This assertion should be replaced with static_assert
      __TBB_ASSERT(sizeof(T) == sizeof(void *), "Type must be word-sized.");
      void* const word = (void *)src;
      itt_store_pointer_with_release_v3(&dst, word);
  #endif // !TBB_USE_THREADING_TOOLS
  }
  //! Reads the word-sized value stored in src.
  /** Without tools support the read is done by __TBB_load_with_acquire; with tools support
      it is routed through itt_load_pointer_with_acquire_v3 and cast back to T. **/
  template <typename T>
  inline T itt_load_word_with_acquire(const T& src) {
  #if !TBB_USE_THREADING_TOOLS
      return __TBB_load_with_acquire(src);
  #else
      // This assertion should be replaced with static_assert
      __TBB_ASSERT(sizeof(T) == sizeof(void *), "Type must be word-sized");
      return (T)itt_load_pointer_with_acquire_v3(&src);
  #endif // !TBB_USE_THREADING_TOOLS
  }
  //! Stores the word-sized value src into dst.
  /** Without tools support this is a plain assignment; with tools support the store is
      routed through itt_store_pointer_with_release_v3. **/
  template <typename T>
  inline void itt_hide_store_word(T& dst, T src) {
  #if !TBB_USE_THREADING_TOOLS
      dst = src;
  #else
      //TODO: This assertion should be replaced with static_assert
      __TBB_ASSERT(sizeof(T) == sizeof(void *), "Type must be word-sized");
      void* const word = (void *)src;
      itt_store_pointer_with_release_v3(&dst, word);
  #endif
  }
  //TODO: rename to itt_hide_load_word_relaxed
  //! Reads the word-sized value stored in src.
  /** Without tools support the value is returned directly; with tools support the read is
      routed through itt_load_pointer_v3 and cast back to T. **/
  template <typename T>
  inline T itt_hide_load_word(const T& src) {
  #if !TBB_USE_THREADING_TOOLS
      return src;
  #else
      //TODO: This assertion should be replaced with static_assert
      __TBB_ASSERT(sizeof(T) == sizeof(void *), "Type must be word-sized.");
      return (T)itt_load_pointer_v3(&src);
  #endif
  }
  201. #if TBB_USE_THREADING_TOOLS
  // Tools-enabled inline wrappers. Each one forwards its arguments, in the same order,
  // to the versioned exported function declared earlier in this header.
  //! Forwards to call_itt_notify_v5, passing the notify_type as int.
  202. inline void call_itt_notify(notify_type t, void *ptr) {
  203. call_itt_notify_v5((int)t, ptr);
  204. }
  //! Forwards to itt_make_task_group_v7.
  205. inline void itt_make_task_group( itt_domain_enum domain, void *group, unsigned long long group_extra,
  206. void *parent, unsigned long long parent_extra, string_index name_index ) {
  207. itt_make_task_group_v7( domain, group, group_extra, parent, parent_extra, name_index );
  208. }
  //! Forwards to itt_metadata_str_add_v7.
  209. inline void itt_metadata_str_add( itt_domain_enum domain, void *addr, unsigned long long addr_extra,
  210. string_index key, const char *value ) {
  211. itt_metadata_str_add_v7( domain, addr, addr_extra, key, value );
  212. }
  //! Forwards to itt_metadata_ptr_add_v11 (note that the wrapper's name differs from the exported one).
  213. inline void register_node_addr(itt_domain_enum domain, void *addr, unsigned long long addr_extra,
  214. string_index key, void *value) {
  215. itt_metadata_ptr_add_v11(domain, addr, addr_extra, key, value);
  216. }
  //! Forwards to itt_relation_add_v7.
  217. inline void itt_relation_add( itt_domain_enum domain, void *addr0, unsigned long long addr0_extra,
  218. itt_relation relation, void *addr1, unsigned long long addr1_extra ) {
  219. itt_relation_add_v7( domain, addr0, addr0_extra, relation, addr1, addr1_extra );
  220. }
  //! Forwards to itt_task_begin_v7.
  221. inline void itt_task_begin( itt_domain_enum domain, void *task, unsigned long long task_extra,
  222. void *parent, unsigned long long parent_extra, string_index name_index ) {
  223. itt_task_begin_v7( domain, task, task_extra, parent, parent_extra, name_index );
  224. }
  //! Forwards to itt_task_end_v7.
  225. inline void itt_task_end( itt_domain_enum domain ) {
  226. itt_task_end_v7( domain );
  227. }
  //! Forwards to itt_region_begin_v9.
  228. inline void itt_region_begin( itt_domain_enum domain, void *region, unsigned long long region_extra,
  229. void *parent, unsigned long long parent_extra, string_index name_index ) {
  230. itt_region_begin_v9( domain, region, region_extra, parent, parent_extra, name_index );
  231. }
  //! Forwards to itt_region_end_v9.
  232. inline void itt_region_end( itt_domain_enum domain, void *region, unsigned long long region_extra ) {
  233. itt_region_end_v9( domain, region, region_extra );
  234. }
  235. #else
  // Counterparts used when TBB_USE_THREADING_TOOLS is not enabled: same names and parameter
  // lists as the tools-enabled wrappers, but with empty bodies. Parameter names are kept
  // only as comments (presumably to avoid unused-parameter warnings).
  236. inline void register_node_addr( itt_domain_enum /*domain*/, void* /*addr*/, unsigned long long /*addr_extra*/, string_index /*key*/, void* /*value*/ ) {}
  237. inline void call_itt_notify(notify_type /*t*/, void* /*ptr*/) {}
  238. inline void itt_make_task_group( itt_domain_enum /*domain*/, void* /*group*/, unsigned long long /*group_extra*/,
  239. void* /*parent*/, unsigned long long /*parent_extra*/, string_index /*name_index*/ ) {}
  240. inline void itt_metadata_str_add( itt_domain_enum /*domain*/, void* /*addr*/, unsigned long long /*addr_extra*/,
  241. string_index /*key*/, const char* /*value*/ ) {}
  242. inline void itt_relation_add( itt_domain_enum /*domain*/, void* /*addr0*/, unsigned long long /*addr0_extra*/,
  243. itt_relation /*relation*/, void* /*addr1*/, unsigned long long /*addr1_extra*/ ) {}
  244. inline void itt_task_begin( itt_domain_enum /*domain*/, void* /*task*/, unsigned long long /*task_extra*/,
  245. void* /*parent*/, unsigned long long /*parent_extra*/, string_index /*name_index*/ ) {}
  246. inline void itt_task_end( itt_domain_enum /*domain*/ ) {}
  247. inline void itt_region_begin( itt_domain_enum /*domain*/, void* /*region*/, unsigned long long /*region_extra*/,
  248. void* /*parent*/, unsigned long long /*parent_extra*/, string_index /*name_index*/ ) {}
  249. inline void itt_region_end( itt_domain_enum /*domain*/, void* /*region*/, unsigned long long /*region_extra*/ ) {}
  250. #endif // TBB_USE_THREADING_TOOLS
  251. } // namespace internal
  252. } // namespace tbb
  253. #if TBB_PREVIEW_FLOW_GRAPH_TRACE
  254. #include <string>
  255. namespace tbb {
  256. namespace profiling {
  257. namespace interface10 {
  258. #if TBB_USE_THREADING_TOOLS && !(TBB_USE_THREADING_TOOLS == 2)
  259. class event {
  260. /** This class supports user event traces through itt.
  261. Common use-case is tagging data flow graph tasks (data-id)
  262. and visualization by Intel Advisor Flow Graph Analyzer (FGA) **/
  263. // TODO: Replace implementation by itt user event api.
  264. const std::string my_name;
  265. static void emit_trace(const std::string &input) {
  266. itt_metadata_str_add( tbb::internal::ITT_DOMAIN_FLOW, NULL, tbb::internal::FLOW_NULL, tbb::internal::USER_EVENT, ( "FGA::DATAID::" + input ).c_str() );
  267. }
  268. public:
  269. event(const std::string &input)
  270. : my_name( input )
  271. { }
  272. void emit() {
  273. emit_trace(my_name);
  274. }
  275. static void emit(const std::string &description) {
  276. emit_trace(description);
  277. }
  278. };
  279. #else // TBB_USE_THREADING_TOOLS && !(TBB_USE_THREADING_TOOLS == 2)
  280. // Using empty struct if user event tracing is disabled:
  // It offers the same three members as the tracing class event (constructor from a string,
  // emit(), and static emit(string)), all with empty bodies, so user code compiles unchanged.
  281. struct event {
  282. event(const std::string &) { }
  283. void emit() { }
  284. static void emit(const std::string &) { }
  285. };
  286. #endif // TBB_USE_THREADING_TOOLS && !(TBB_USE_THREADING_TOOLS == 2)
  287. } // interfaceX
  288. using interface10::event;
  289. } // namespace profiling
  290. } // namespace tbb
  291. #endif // TBB_PREVIEW_FLOW_GRAPH_TRACE
  292. #include "internal/_warning_suppress_disable_notice.h"
  293. #undef __TBB_tbb_profiling_H_include_area
  294. #endif /* __TBB_profiling_H */