-
Notifications
You must be signed in to change notification settings - Fork 59
Expand file tree
/
Copy pathtbb_main.cpp
More file actions
565 lines (481 loc) · 20.4 KB
/
tbb_main.cpp
File metadata and controls
565 lines (481 loc) · 20.4 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
/*
Copyright (c) 2005-2019 Intel Corporation
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
#include "tbb/tbb_config.h"
#include "tbb/global_control.h"
#include "tbb_main.h"
#include "governor.h"
#include "market.h"
#include "tbb_misc.h"
#include "itt_notify.h"
namespace tbb {
namespace internal {
//------------------------------------------------------------------------
// Begin shared data layout.
// The following global data items are mostly read-only after initialization.
//------------------------------------------------------------------------
//! Padding in order to prevent false sharing.
// Its contents are never read; DoOneTimeInitializations() only passes it to
// suppress_unused_warning() so that the otherwise unused array does not trigger a warning.
static const char _pad[NFS_MaxLineSize - sizeof(int)] = {};
//------------------------------------------------------------------------
// governor data
// Out-of-class definitions of governor's static data members.
basic_tls<uintptr_t> governor::theTLS;
unsigned governor::DefaultNumberOfThreads;
rml::tbb_factory governor::theRMLServerFactory;
bool governor::UsePrivateRML;
bool governor::is_speculation_enabled;
bool governor::is_rethrow_broken;
//------------------------------------------------------------------------
// market data
// Out-of-class definitions of market's static data members.
market* market::theMarket;
market::global_market_mutex_type market::theMarketMutex;
//------------------------------------------------------------------------
// One time initialization data
//! Counter of references to global shared resources such as TLS.
// Incremented by add_ref() and decremented by remove_ref(); the 0->1 and 1->0
// transitions acquire and release the governor resources respectively.
atomic<int> __TBB_InitOnce::count;
__TBB_atomic_flag __TBB_InitOnce::InitializationLock;
//! Flag that is set to true after one-time initializations are done.
// Written at the end of DoOneTimeInitializations() while the __TBB_InitOnce lock is held.
bool __TBB_InitOnce::InitializationDone;
#if DO_ITT_NOTIFY
// True when __TBB_load_ittnotify() returned non-zero; set by ITT_DoUnsafeOneTimeInitialization().
static bool ITT_Present;
// Becomes true once ITT_DoUnsafeOneTimeInitialization() has run, whether or not ITT was found.
static atomic<bool> ITT_InitializationDone;
#endif
// This condition is the exact complement of the one guarding DllMain below, so the
// instance exists in every build that does not get DllMain.
// NOTE(review): presumably its constructor/destructor perform the add_ref()/remove_ref()
// that DllMain does on Windows - confirm against tbb_main.h.
#if !(_WIN32||_WIN64) || __TBB_SOURCE_DIRECTLY_INCLUDED
static __TBB_InitOnce __TBB_InitOnceHiddenInstance;
#endif
//------------------------------------------------------------------------
// generic_scheduler data
//! Pointer to the scheduler factory function
// Takes the market by reference and returns a generic_scheduler pointer.
// It is not assigned anywhere in this file.
generic_scheduler* (*AllocateSchedulerPtr)( market& );
#if __TBB_OLD_PRIMES_RNG
//! Table of primes used by fast random-number generator (FastRandom).
/** Also serves to keep anything else from being placed in the same
    cache line as the global data items preceding it. */
static const unsigned Primes[] = {
    0x9e3779b1, 0xffe6cc59, 0x2109f6dd, 0x43977ab5,
    0xba5703f5, 0xb495a877, 0xe1626741, 0x79695e6b,
    0xbc98c09f, 0xd5bee2b3, 0x287488f9, 0x3af18231,
    0x9677cd4d, 0xbe3a6929, 0xadc6a877, 0xdcf0674b,
    0xbe4d6fe9, 0x5f15e201, 0x99afc3fd, 0xf3f16801,
    0xe222cfff, 0x24ba5fdb, 0x0620452d, 0x79f149e3,
    0xc8b93f49, 0x972702cd, 0xb07dd827, 0x6c97d5ed,
    0x085a3d61, 0x46eb5ea7, 0x3d9910ed, 0x2e687b5b,
    0x29609227, 0x6eb081f1, 0x0954c4e1, 0x9d114db9,
    0x542acfa9, 0xb3e6bd7b, 0x0742d917, 0xe9f3ffa7,
    0x54581edb, 0xf2480f45, 0x0bb9288f, 0xef1affc7,
    0x85fa0ca7, 0x3ccc14db, 0xe6baf34b, 0x343377f7,
    0x5ca19031, 0xe6d9293b, 0xf0a9f391, 0x5d2e980b,
    0xfc411073, 0xc3749363, 0xb892d829, 0x3549366b,
    0x629750ad, 0xb98294e5, 0x892d9483, 0xc235baf3,
    0x3d2402a3, 0x6bdef3c9, 0xbec333cd, 0x40c9520f
};
//------------------------------------------------------------------------
// End of shared data layout
//------------------------------------------------------------------------
//------------------------------------------------------------------------
// Shared data accessors
//------------------------------------------------------------------------
//! Selects an entry of the Primes table for the given seed.
/** The seed is reduced modulo the number of table entries, so every
    unsigned value is a valid argument and equal seeds give equal results. */
unsigned GetPrime ( unsigned seed ) {
    const unsigned table_size = sizeof(Primes)/sizeof(Primes[0]);
    const unsigned slot = seed % table_size;
    return Primes[slot];
}
#endif //__TBB_OLD_PRIMES_RNG
//------------------------------------------------------------------------
// __TBB_InitOnce
//------------------------------------------------------------------------
//! Registers one more user of the global shared resources.
/** The caller that moves the counter from 0 to 1 acquires the governor resources. */
void __TBB_InitOnce::add_ref() {
    const int refs_after = ++count;
    if( refs_after==1 )
        governor::acquire_resources();
}
//! Drops one reference to the global shared resources.
/** The caller that brings the counter down to 0 releases the governor resources
    and then invokes ITT_FINI_ITTLIB(). */
void __TBB_InitOnce::remove_ref() {
    const int k = --count;
    __TBB_ASSERT(k>=0,"removed __TBB_InitOnce ref that was not added?");
    if( k!=0 )
        return; // other references are still outstanding
    governor::release_resources();
    ITT_FINI_ITTLIB();
}
//------------------------------------------------------------------------
// One-time Initializations
//------------------------------------------------------------------------
//! Defined in cache_aligned_allocator.cpp
void initialize_cache_aligned_allocator();
//! Defined in scheduler.cpp
void Scheduler_OneTimeInitialization ( bool itt_present );
#if DO_ITT_NOTIFY
//! ITT domain handles, indexed by domain id.
// All entries start as NULL; ITT_init_domains() fills them in and get_itt_domain() reads them.
static __itt_domain *tbb_domains[ITT_NUM_DOMAINS] = {};
//! Pairs a resource string with the ITT string handle created for it.
struct resource_string {
// Text of the resource string.
const char *str;
// Handle for str; NULL until ITT_init_strings() has run.
__itt_string_handle *itt_str_handle;
};
//
// populate resource strings
//
// Every TBB_STRING_RESOURCE(index_name, str) entry pulled in from the header below expands
// to one { str, NULL } initializer; index_name is not used by this expansion.
#define TBB_STRING_RESOURCE( index_name, str ) { str, NULL },
static resource_string strings_for_itt[] = {
#include "tbb/internal/_tbb_strings.h"
// Extra trailing entry that follows all entries generated from the header.
// NOTE(review): presumably located at index NUM_STRINGS, which the accessors below
// treat as out of range - confirm against the string_index enum.
{ "num_resource_strings", NULL }
};
#undef TBB_STRING_RESOURCE
//! Looks up the ITT string handle stored for resource string number idx.
/** Asserts that idx lies in [0, NUM_STRINGS); when assertions are compiled out,
    an out-of-range idx yields NULL instead of reading outside the table. */
static __itt_string_handle *ITT_get_string_handle(int idx) {
    __TBB_ASSERT( idx >= 0 && idx < NUM_STRINGS, "string handle out of valid range");
    if ( idx < 0 || idx >= NUM_STRINGS )
        return NULL;
    return strings_for_itt[idx].itt_str_handle;
}
static void ITT_init_domains() {
tbb_domains[ITT_DOMAIN_MAIN] = __itt_domain_create( _T("tbb") );
tbb_domains[ITT_DOMAIN_MAIN]->flags = 1;
tbb_domains[ITT_DOMAIN_FLOW] = __itt_domain_create( _T("tbb.flow") );
tbb_domains[ITT_DOMAIN_FLOW]->flags = 1;
tbb_domains[ITT_DOMAIN_ALGO] = __itt_domain_create( _T("tbb.algorithm") );
tbb_domains[ITT_DOMAIN_ALGO]->flags = 1;
}
static void ITT_init_strings() {
for ( int i = 0; i < NUM_STRINGS; ++i ) {
#if _WIN32||_WIN64
strings_for_itt[i].itt_str_handle = __itt_string_handle_createA( strings_for_itt[i].str );
#else
strings_for_itt[i].itt_str_handle = __itt_string_handle_create( strings_for_itt[i].str );
#endif
}
}
//! Sets up all ITT objects this file reports through: the domains first, then the string handles.
/** Called by ITT_DoUnsafeOneTimeInitialization() only when the ITT library was loaded. */
static void ITT_init() {
    ITT_init_domains();
    ITT_init_strings();
}
/** Lazy one-time initialization of tools interop; performs no locking of its own.
    Called from ITT_DoOneTimeInitialization() and from the general TBB one-time
    initialization routine, both of which hold the __TBB_InitOnce lock. **/
void ITT_DoUnsafeOneTimeInitialization () {
    // The flag has to be re-tested here: the test in ITT_DoOneTimeInitialization
    // happens before the __TBB_InitOnce lock is taken.
    if ( ITT_InitializationDone )
        return;
    const bool library_loaded = (__TBB_load_ittnotify()!=0);
    ITT_Present = library_loaded;
    if ( library_loaded )
        ITT_init();
    ITT_InitializationDone = true;
    ITT_SYNC_CREATE(&market::theMarketMutex, SyncType_GlobalLock, SyncObj_SchedulerInitialization);
}
/** Thread-safe lazy one-time initialization of tools interop.
    Used by dummy handlers only. Skips the lock entirely once initialization is done;
    otherwise runs the unsafe variant while holding the __TBB_InitOnce lock. **/
extern "C"
void ITT_DoOneTimeInitialization() {
    if ( ITT_InitializationDone )
        return;
    __TBB_InitOnce::lock();
    ITT_DoUnsafeOneTimeInitialization();
    __TBB_InitOnce::unlock();
}
#endif /* DO_ITT_NOTIFY */
//! Performs thread-safe lazy one-time general TBB initialization.
/** The whole body runs under the __TBB_InitOnce lock. The first caller performs the
    initialization steps in the order written below and sets InitializationDone;
    later callers only take and release the lock. */
void DoOneTimeInitializations() {
// _pad is otherwise unreferenced; this only silences the unused-variable warning.
suppress_unused_warning(_pad);
__TBB_InitOnce::lock();
// No fence required for load of InitializationDone, because we are inside a critical section.
if( !__TBB_InitOnce::InitializationDone ) {
// This reference is not dropped in this function; on Windows, DllMain removes it at
// DLL_PROCESS_DETACH when initialization_done() is true.
__TBB_InitOnce::add_ref();
if( GetBoolEnvironmentVariable("TBB_VERSION") )
PrintVersion();
// Stays false when ITT support is compiled out.
bool itt_present = false;
#if DO_ITT_NOTIFY
// The unsafe variant is appropriate here because the __TBB_InitOnce lock is already held.
ITT_DoUnsafeOneTimeInitialization();
itt_present = ITT_Present;
#endif /* DO_ITT_NOTIFY */
initialize_cache_aligned_allocator();
governor::initialize_rml_factory();
Scheduler_OneTimeInitialization( itt_present );
// Force processor groups support detection
governor::default_num_threads();
// Dump version data
governor::print_version_info();
PrintExtraVersionInfo( "Tools support", itt_present ? "enabled" : "disabled" );
// Set last, after every initialization step above has completed.
__TBB_InitOnce::InitializationDone = true;
}
__TBB_InitOnce::unlock();
}
#if (_WIN32||_WIN64) && !__TBB_SOURCE_DIRECTLY_INCLUDED
//! Windows "DllMain" that handles startup and shutdown of dynamic library.
/** Handles DLL_PROCESS_ATTACH, DLL_PROCESS_DETACH and DLL_THREAD_DETACH; any other
    reason value is ignored. Always returns true.
    lpvReserved is consulted only for DLL_PROCESS_DETACH, where NULL is treated as a
    library unload rather than process shutdown. */
extern "C" bool WINAPI DllMain( HANDLE /*hinstDLL*/, DWORD reason, LPVOID lpvReserved ) {
switch( reason ) {
case DLL_PROCESS_ATTACH:
// Reference held for as long as the library stays loaded; released at DLL_PROCESS_DETACH.
__TBB_InitOnce::add_ref();
break;
case DLL_PROCESS_DETACH:
// Since THREAD_DETACH is not called for the main thread, call auto-termination
// here as well - but not during process shutdown (due to risk of a deadlock).
if( lpvReserved==NULL ) // library unload
governor::terminate_auto_initialized_scheduler();
// Matches the add_ref() made at DLL_PROCESS_ATTACH.
__TBB_InitOnce::remove_ref();
// It is assumed that InitializationDone is not set after DLL_PROCESS_DETACH,
// and thus no race on InitializationDone is possible.
if( __TBB_InitOnce::initialization_done() ) {
// Remove reference that we added in DoOneTimeInitializations.
__TBB_InitOnce::remove_ref();
}
break;
case DLL_THREAD_DETACH:
// Runs for any detaching thread, whether or not it auto-initialized a scheduler.
governor::terminate_auto_initialized_scheduler();
break;
}
return true;
}
#endif /* (_WIN32||_WIN64) && !__TBB_SOURCE_DIRECTLY_INCLUDED */
//! Stores src into the pointer-sized location dst with release semantics.
/** The sync_releasing notification for dst is issued before the store itself. */
void itt_store_pointer_with_release_v3( void* dst, void* src ) {
    void** const slot = static_cast<void**>(dst);
    ITT_NOTIFY(sync_releasing, dst);
    __TBB_store_with_release(*slot, src);
}
//! Loads a pointer from the location src with acquire semantics and returns it.
/** The sync_acquired notification for src is issued after the load has completed. */
void* itt_load_pointer_with_acquire_v3( const void* src ) {
    void* const* const slot = static_cast<void*const*>(src);
    void* loaded = __TBB_load_with_acquire(*slot);
    ITT_NOTIFY(sync_acquired, const_cast<void*>(src));
    return loaded;
}
#if DO_ITT_NOTIFY
//! Forwards one synchronization event about ptr to ITT.
/** t selects the event: 0 = sync_prepare, 1 = sync_cancel, 2 = sync_acquired,
    3 = sync_releasing. Any other value is ignored. */
void call_itt_notify_v5(int t, void *ptr) {
    if ( t == 0 ) {
        ITT_NOTIFY(sync_prepare, ptr);
    } else if ( t == 1 ) {
        ITT_NOTIFY(sync_cancel, ptr);
    } else if ( t == 2 ) {
        ITT_NOTIFY(sync_acquired, ptr);
    } else if ( t == 3 ) {
        ITT_NOTIFY(sync_releasing, ptr);
    }
}
#else
//! No-op variant used when ITT notification support is compiled out.
void call_itt_notify_v5(int /*t*/, void* /*ptr*/) {}
#endif
#if DO_ITT_NOTIFY
//! All-zero ITT id.
// The reporting functions below use it as the initial value of every __itt_id and leave
// a parent id at this value when the caller passes a null parent pointer.
const __itt_id itt_null_id = {0, 0, 0};
//! Returns the ITT domain registered for idx, triggering tools initialization if it is still unset.
/** The result may still be NULL after initialization has been attempted; callers
    check for that before reporting anything. */
static inline __itt_domain* get_itt_domain( itt_domain_enum idx ) {
    if ( !tbb_domains[idx] )
        ITT_DoOneTimeInitialization();
    return tbb_domains[idx];
}
//! Fills *id with the ITT id that __itt_id_make() builds from addr and extra.
static inline void itt_id_make(__itt_id *id, void* addr, unsigned long long extra) {
    const __itt_id made = __itt_id_make(addr, extra);
    *id = made;
}
//! Issues the ITT id_create notification for id within the given domain.
static inline void itt_id_create(const __itt_domain *domain, __itt_id id) {
    ITTNOTIFY_VOID_D1(id_create, domain, id);
}
//! Reports a task group to ITT.
/** The group id is built from (group, group_extra) and announced with id_create.
    The parent id is built from (parent, parent_extra) only when parent is non-null and
    is the null id otherwise. name_index selects the string handle used as the group name.
    Nothing is reported when no ITT domain is available for the requested domain. */
void itt_make_task_group_v7( itt_domain_enum domain, void *group, unsigned long long group_extra,
                             void *parent, unsigned long long parent_extra, string_index name_index ) {
    __itt_domain *dom = get_itt_domain( domain );
    if ( !dom )
        return;
    __itt_id group_id = itt_null_id;
    itt_id_make( &group_id, group, group_extra );
    itt_id_create( dom, group_id );
    __itt_id parent_id = itt_null_id;
    if ( parent )
        itt_id_make( &parent_id, parent, parent_extra );
    __itt_string_handle *name_handle = ITT_get_string_handle(name_index);
    ITTNOTIFY_VOID_D3(task_group, dom, group_id, parent_id, name_handle);
}
//! Attaches a string metadata item to the ITT object identified by (addr, addr_extra).
/** key selects the string handle used as the metadata key. value is measured with
    strlen(), so it must point to a NUL-terminated string. Windows builds use the
    narrow-character (A) entry point. Nothing is reported when no ITT domain is
    available for the requested domain. */
void itt_metadata_str_add_v7( itt_domain_enum domain, void *addr, unsigned long long addr_extra,
                              string_index key, const char *value ) {
    __itt_domain *dom = get_itt_domain( domain );
    if ( !dom )
        return;
    __itt_id id = itt_null_id;
    itt_id_make( &id, addr, addr_extra );
    __itt_string_handle *key_handle = ITT_get_string_handle(key);
    size_t value_length = strlen( value );
#if _WIN32||_WIN64
    ITTNOTIFY_VOID_D4(metadata_str_addA, dom, id, key_handle, value, value_length);
#else
    ITTNOTIFY_VOID_D4(metadata_str_add, dom, id, key_handle, value, value_length);
#endif
}
//! Reports a relation between two ITT objects.
/** The first object is identified by (addr0, addr0_extra) and the second by
    (addr1, addr1_extra); relation is converted to the ITT relation type as is.
    Nothing is reported when no ITT domain is available for the requested domain. */
void itt_relation_add_v7( itt_domain_enum domain, void *addr0, unsigned long long addr0_extra,
                          itt_relation relation, void *addr1, unsigned long long addr1_extra ) {
    __itt_domain *dom = get_itt_domain( domain );
    if ( !dom )
        return;
    __itt_id head_id = itt_null_id;
    __itt_id tail_id = itt_null_id;
    itt_id_make( &head_id, addr0, addr0_extra );
    itt_id_make( &tail_id, addr1, addr1_extra );
    ITTNOTIFY_VOID_D3(relation_add, dom, head_id, static_cast<__itt_relation>(relation), tail_id);
}
//! Reports the beginning of a task to ITT.
/** The task and parent ids are each built only when the corresponding pointer is
    non-null; otherwise the null id is reported in their place. name_index selects the
    string handle used as the task name. Nothing is reported when no ITT domain is
    available for the requested domain. */
void itt_task_begin_v7( itt_domain_enum domain, void *task, unsigned long long task_extra,
                        void *parent, unsigned long long parent_extra, string_index name_index ) {
    __itt_domain *dom = get_itt_domain( domain );
    if ( !dom )
        return;
    __itt_id task_id = itt_null_id;
    if ( task )
        itt_id_make( &task_id, task, task_extra );
    __itt_id parent_id = itt_null_id;
    if ( parent )
        itt_id_make( &parent_id, parent, parent_extra );
    __itt_string_handle *name_handle = ITT_get_string_handle(name_index);
    ITTNOTIFY_VOID_D3(task_begin, dom, task_id, parent_id, name_handle );
}
//! Reports the end of a task in the given domain to ITT.
/** Nothing is reported when no ITT domain is available for the requested domain. */
void itt_task_end_v7( itt_domain_enum domain ) {
    __itt_domain *dom = get_itt_domain( domain );
    if ( !dom )
        return;
    ITTNOTIFY_VOID_D0(task_end, dom);
}
//! Reports the beginning of a region to ITT.
/** The region id is built from (region, region_extra). The parent id is built from
    (parent, parent_extra) only when parent is non-null and is the null id otherwise.
    The name index argument is accepted but ignored: NULL is always passed as the
    region name. Nothing is reported when no ITT domain is available for the
    requested domain. */
void itt_region_begin_v9( itt_domain_enum domain, void *region, unsigned long long region_extra,
                          void *parent, unsigned long long parent_extra, string_index /* name_index */ ) {
    if ( __itt_domain *d = get_itt_domain( domain ) ) {
        __itt_id region_id = itt_null_id;
        __itt_id parent_id = itt_null_id;
        // Address-of restored here: the text had been corrupted into a (R) symbol.
        itt_id_make( &region_id, region, region_extra );
        if ( parent ) {
            itt_id_make( &parent_id, parent, parent_extra );
        }
        ITTNOTIFY_VOID_D3(region_begin, d, region_id, parent_id, NULL );
    }
}
//! Reports the end of the region identified by (region, region_extra) to ITT.
/** Nothing is reported when no ITT domain is available for the requested domain. */
void itt_region_end_v9( itt_domain_enum domain, void *region, unsigned long long region_extra ) {
    if ( __itt_domain *d = get_itt_domain( domain ) ) {
        __itt_id region_id = itt_null_id;
        // Address-of restored here: the text had been corrupted into a (R) symbol.
        itt_id_make( &region_id, region, region_extra );
        ITTNOTIFY_VOID_D1( region_end, d, region_id );
    }
}
#else // DO_ITT_NOTIFY
// No-op versions of the ITT reporting entry points, compiled when DO_ITT_NOTIFY is off.
// Each has the same parameter list as its DO_ITT_NOTIFY counterpart above, with the
// parameter names commented out because nothing is used, and an empty body.
void itt_make_task_group_v7( itt_domain_enum /*domain*/, void* /*group*/, unsigned long long /*group_extra*/,
void* /*parent*/, unsigned long long /*parent_extra*/, string_index /*name_index*/ ) { }
void itt_metadata_str_add_v7( itt_domain_enum /*domain*/, void* /*addr*/, unsigned long long /*addr_extra*/,
string_index /*key*/, const char* /*value*/ ) { }
void itt_relation_add_v7( itt_domain_enum /*domain*/, void* /*addr0*/, unsigned long long /*addr0_extra*/,
itt_relation /*relation*/, void* /*addr1*/, unsigned long long /*addr1_extra*/ ) { }
void itt_task_begin_v7( itt_domain_enum /*domain*/, void* /*task*/, unsigned long long /*task_extra*/,
void* /*parent*/, unsigned long long /*parent_extra*/, string_index /*name_index*/ ) { }
void itt_task_end_v7( itt_domain_enum /*domain*/ ) { }
void itt_region_begin_v9( itt_domain_enum /*domain*/, void* /*region*/, unsigned long long /*region_extra*/,
void* /*parent*/, unsigned long long /*parent_extra*/, string_index /*name_index*/ ) { }
void itt_region_end_v9( itt_domain_enum /*domain*/, void* /*region*/, unsigned long long /*region_extra*/ ) { }
#endif // DO_ITT_NOTIFY
//! Reads and returns the pointer stored at src using a plain load.
/** Unlike itt_load_pointer_with_acquire_v3, no ITT notification is issued and no
    acquire operation is requested. */
void* itt_load_pointer_v3( const void* src ) {
    //TODO: replace this with __TBB_load_relaxed
    return *static_cast<void*const*>(src);
}
//! Passes obj and name to ITT_SYNC_RENAME.
/** Both arguments are also handed to suppress_unused_warning(), which keeps the
    compiler quiet in configurations where the macro does not use them. */
void itt_set_sync_name_v3( void* obj, const tchar* name) {
    ITT_SYNC_RENAME(obj, name);
    suppress_unused_warning(obj, name);
}
//! State and policy shared by all global_control parameters.
/** Holds the list of live global_control objects for one parameter together with the
    value currently in effect. Derived classes supply the default value and may override
    how two requested values are ranked and what happens when the active value changes. */
class control_storage {
    friend class tbb::interface9::global_control;
protected:
    //! Value currently in effect; meaningful only while my_head is non-null.
    size_t my_active_value;
    //! Head of the list of global_control objects for this parameter.
    atomic<global_control*> my_head;
    //! Held by global_control while it edits the list and the active value.
    spin_mutex my_list_mutex;

    //! Value reported when no global_control object exists for this parameter.
    virtual size_t default_value() const = 0;
    //! Hook invoked after my_active_value has been changed; does nothing by default.
    virtual void apply_active() const {}
    //! Returns true when a should win over b; the default policy prefers the larger value.
    virtual bool is_first_arg_preferred(size_t a, size_t b) const {
        return b<a;
    }
    //! Value in effect now: the active value if any control exists, else the default.
    virtual size_t active_value() const {
        if ( !my_head )
            return default_value();
        return my_active_value;
    }
};
//! Storage and policy for the allowed-parallelism control.
/** Prefers the smallest requested value and pushes changes of the active value
    to the market as a worker count. */
class allowed_parallelism_control : public padded<control_storage> {
    //! Default is governor's default thread count, but never less than 1.
    virtual size_t default_value() const __TBB_override {
        return max(1U, governor::default_num_threads());
    }
    //! The smaller of two requested limits wins.
    virtual bool is_first_arg_preferred(size_t a, size_t b) const __TBB_override {
        return b>a;
    }
    //! Tells the market how many workers may be active under the current limit.
    virtual void apply_active() const __TBB_override {
        __TBB_ASSERT( my_active_value>=1, NULL );
        // The master thread counts towards the limit, so workers get one less.
        market::set_active_num_workers( my_active_value-1 );
    }
    //! Limit currently in effect, capped by what the market can provide.
    virtual size_t active_value() const __TBB_override {
        /* my_active_value is read without synchronizing with another thread that may be
           updating my_head. That is acceptable: the value read is still a valid one,
           at worst an outdated one. */
        if (!my_head)
            return default_value();
        // Zero unless the market is active.
        const size_t workers = market::max_num_workers();
        if ( !workers )
            return my_active_value;
        // The market's maximal number of workers cannot be exceeded;
        // +1 accounts for the master thread.
        return min(workers+1, my_active_value);
    }
public:
    //! Active value if at least one control object exists, otherwise 0.
    size_t active_value_if_present() const {
        if ( !my_head )
            return 0;
        return my_active_value;
    }
};
//! Storage and policy for the thread stack size control.
/** Uses the base-class ranking, i.e. the largest requested value wins. */
class stack_size_control : public padded<control_storage> {
    //! Default is the library-wide ThreadStackSize.
    virtual size_t default_value() const __TBB_override {
        const size_t fallback = tbb::internal::ThreadStackSize;
        return fallback;
    }
    //! Nothing to apply; only asserts in the one configuration where setting a stack size is not allowed.
    virtual void apply_active() const __TBB_override {
#if __TBB_WIN8UI_SUPPORT && (_WIN32_WINNT < 0x0A00)
        __TBB_ASSERT( false, "For Windows 8 Store* apps we must not set stack size" );
#endif
    }
};
// One storage object per global_control parameter.
static allowed_parallelism_control allowed_parallelism_ctl;
static stack_size_control stack_size_ctl;
// Lookup table indexed by the parameter id (my_param / param) in the global_control
// member functions below.
// NOTE(review): the entry order presumably has to match the order of the
// global_control::parameter enumerators - confirm against tbb/global_control.h.
static control_storage *controls[] = {&allowed_parallelism_ctl, &stack_size_ctl};
unsigned market::app_parallelism_limit() {
return allowed_parallelism_ctl.active_value_if_present();
}
} // namespace internal
namespace interface9 {
using namespace internal;
using namespace tbb::internal;
void global_control::internal_create() {
__TBB_ASSERT_RELEASE( my_param < global_control::parameter_max, NULL );
control_storage *const c = controls[my_param];
spin_mutex::scoped_lock lock(c->my_list_mutex);
if (!c->my_head || c->is_first_arg_preferred(my_value, c->my_active_value)) {
c->my_active_value = my_value;
// to guarantee that apply_active() is called with current active value,
// calls it here and in internal_destroy() under my_list_mutex
c->apply_active();
}
my_next = c->my_head;
// publish my_head, at this point my_active_value must be valid
c->my_head = this;
}
//! Unregisters this control object and re-selects the active value for its parameter.
/** Under the list mutex, a single pass over the list both unlinks this object and finds
    the preferred value among the remaining ones. If the list becomes empty, the default
    value is used. apply_active() is called only when the active value actually changed. */
void global_control::internal_destroy() {
// Node preceding curr during the list walk; stays 0 while curr is the head.
global_control *prev = 0;
__TBB_ASSERT_RELEASE( my_param < global_control::parameter_max, NULL );
control_storage *const c = controls[my_param];
__TBB_ASSERT( c->my_head, NULL );
// Concurrent reading and changing global parameter is possible.
// In this case, my_active_value may not match current state of parameters.
// This is OK because:
// 1) my_active_value is either current or previous
// 2) my_active_value is current on internal_destroy leave
spin_mutex::scoped_lock lock(c->my_list_mutex);
// (size_t)-1 marks "no candidate yet"; it survives only when this object is the sole element.
size_t new_active = (size_t)-1, old_active = c->my_active_value;
// Seed the candidate with the value of some element other than this one.
if ( c->my_head != this )
new_active = c->my_head->my_value;
else if ( c->my_head->my_next )
new_active = c->my_head->my_next->my_value;
// if there is only one element, new_active will be set later
for ( global_control *curr = c->my_head; curr; prev = curr, curr = curr->my_next )
if ( curr == this ) {
// Unlink this object; its own my_next is left untouched, so the walk continues from it.
if ( prev )
prev->my_next = my_next;
else
c->my_head = my_next;
} else
// Every remaining element competes for the active value.
if (c->is_first_arg_preferred(curr->my_value, new_active))
new_active = curr->my_value;
if ( !c->my_head ) {
// The list is now empty, so no candidate may have been picked.
__TBB_ASSERT( new_active==(size_t)-1, NULL );
new_active = c->default_value();
}
if ( new_active != old_active ) {
c->my_active_value = new_active;
c->apply_active();
}
}
//! Returns the value currently in effect for the given parameter.
/** param must be a valid parameter id, i.e. in [0, parameter_max). The check is a
    release assertion and covers both ends of the range: param is a signed int, so
    without the lower bound a negative value would index controls[] out of bounds. */
size_t global_control::active_value( int param ) {
    __TBB_ASSERT_RELEASE( param >= 0 && param < global_control::parameter_max, NULL );
    return controls[param]->active_value();
}
} // tbb::interface9
} // namespace tbb