2 This file is part of drd, a thread error detector.
4 Copyright (C) 2006-2013 Bart Van Assche <bvanassche@acm.org>.
6 This program is free software; you can redistribute it and/or
7 modify it under the terms of the GNU General Public License as
8 published by the Free Software Foundation; either version 2 of the
9 License, or (at your option) any later version.
11 This program is distributed in the hope that it will be useful, but
12 WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with this program; if not, write to the Free Software
18 Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
21 The GNU General Public License is contained in the file COPYING.
25 #include "drd_barrier.h"
26 #include "drd_clientobj.h"
27 #include "drd_error.h"
28 #include "drd_suppression.h"
29 #include "pub_tool_errormgr.h" // VG_(maybe_record_error)()
30 #include "pub_tool_libcassert.h" // tl_assert()
31 #include "pub_tool_libcprint.h" // VG_(printf)()
32 #include "pub_tool_machine.h" // VG_(get_IP)()
33 #include "pub_tool_mallocfree.h" // VG_(malloc)(), VG_(free)()
34 #include "pub_tool_oset.h"
35 #include "pub_tool_threadstate.h" // VG_(get_running_tid)()
38 /* Type definitions. */
40 /** Information associated with one thread participating in a barrier. */
41 struct barrier_thread_info
43 UWord tid
; // A DrdThreadId declared as UWord because
44 // this member variable is the key of an OSet.
45 Segment
* sg
; // Segment of the last pthread_barrier() call
47 Segment
* post_wait_sg
; // Segment created after *_barrier_wait() finished
48 ExeContext
* wait_call_ctxt
;// call stack for *_barrier_wait() call.
49 Bool thread_finished
;// Whether thread 'tid' has finished.
53 /* Local functions. */
55 static void barrier_cleanup(struct barrier_info
* p
);
56 static void barrier_delete_thread(struct barrier_info
* const p
,
57 const DrdThreadId tid
);
58 static const HChar
* barrier_get_typename(struct barrier_info
* const p
);
59 static const HChar
* barrier_type_name(const BarrierT bt
);
61 void barrier_report_wait_delete_race(const struct barrier_info
* const p
,
62 const struct barrier_thread_info
* const q
);
65 /* Local variables. */
67 static Bool s_trace_barrier
= False
;
68 static ULong s_barrier_segment_creation_count
;
71 /* Function definitions. */
73 void DRD_(barrier_set_trace
)(const Bool trace_barrier
)
75 s_trace_barrier
= trace_barrier
;
79 * Initialize the structure *p for the thread with the specified thread ID.
83 void DRD_(barrier_thread_initialize
)(struct barrier_thread_info
* const p
,
84 const DrdThreadId tid
)
89 p
->wait_call_ctxt
= 0;
90 p
->thread_finished
= False
;
94 * Deallocate the memory that is owned by members of
95 * struct barrier_thread_info.
97 static void DRD_(barrier_thread_destroy
)(struct barrier_thread_info
* const p
)
101 DRD_(sg_put
)(p
->post_wait_sg
);
105 * Initialize the structure *p with the specified client-side barrier address,
106 * barrier type and number of participants in each barrier.
109 void DRD_(barrier_initialize
)(struct barrier_info
* const p
,
111 const BarrierT barrier_type
,
116 tl_assert(barrier
!= 0);
117 tl_assert(barrier_type
== pthread_barrier
|| barrier_type
== gomp_barrier
);
118 tl_assert(p
->a1
== barrier
);
120 p
->cleanup
= (void(*)(DrdClientobj
*))barrier_cleanup
;
122 = (void(*)(DrdClientobj
*, DrdThreadId
))barrier_delete_thread
;
123 p
->barrier_type
= barrier_type
;
125 p
->pre_iteration
= 0;
126 p
->post_iteration
= 0;
127 p
->pre_waiters_left
= count
;
128 p
->post_waiters_left
= count
;
130 tl_assert(sizeof(((struct barrier_thread_info
*)0)->tid
) == sizeof(Word
));
131 tl_assert(sizeof(((struct barrier_thread_info
*)0)->tid
)
132 >= sizeof(DrdThreadId
));
133 for (i
= 0; i
< 2; i
++) {
134 p
->oset
[i
] = VG_(OSetGen_Create
)(0, 0, VG_(malloc
), "drd.barrier.bi.1",
140 * Deallocate the memory owned by the struct barrier_info object and also
141 * all the nodes in the OSet p->oset.
143 * Called by clientobj_destroy().
145 static void barrier_cleanup(struct barrier_info
* p
)
147 struct barrier_thread_info
* q
;
148 Segment
* latest_sg
= 0;
154 DRD_(thread_get_latest_segment
)(&latest_sg
, DRD_(thread_get_running_tid
)());
155 tl_assert(latest_sg
);
157 if (p
->pre_waiters_left
!= p
->count
) {
158 BarrierErrInfo bei
= { DRD_(thread_get_running_tid
)(), p
->a1
, 0, 0 };
159 VG_(maybe_record_error
)(VG_(get_running_tid
)(),
161 VG_(get_IP
)(VG_(get_running_tid
)()),
162 "Destruction of barrier that is being waited"
166 oset
= p
->oset
[1 - (p
->pre_iteration
& 1)];
167 VG_(OSetGen_ResetIter
)(oset
);
168 for ( ; (q
= VG_(OSetGen_Next
)(oset
)) != 0; ) {
169 if (q
->post_wait_sg
&& !DRD_(vc_lte
)(&q
->post_wait_sg
->vc
,
172 barrier_report_wait_delete_race(p
, q
);
174 DRD_(barrier_thread_destroy
)(q
);
178 for (i
= 0; i
< 2; i
++) {
179 VG_(OSetGen_Destroy
)(p
->oset
[i
]);
183 DRD_(sg_put
)(latest_sg
);
187 * Look up the client-side barrier object at address 'barrier' among the registered client objects. If not found, add and initialize it.
192 DRD_(barrier_get_or_allocate
)(const Addr barrier
,
193 const BarrierT barrier_type
, const Word count
)
195 struct barrier_info
*p
;
197 tl_assert(barrier_type
== pthread_barrier
|| barrier_type
== gomp_barrier
);
199 tl_assert(offsetof(DrdClientobj
, barrier
) == 0);
200 p
= &(DRD_(clientobj_get
)(barrier
, ClientBarrier
)->barrier
);
203 p
= &(DRD_(clientobj_add
)(barrier
, ClientBarrier
)->barrier
);
204 DRD_(barrier_initialize
)(p
, barrier
, barrier_type
, count
);
210 * Look up the address of the struct barrier_info associated with the
211 * client-side barrier object.
213 static struct barrier_info
* DRD_(barrier_get
)(const Addr barrier
)
215 tl_assert(offsetof(DrdClientobj
, barrier
) == 0);
216 return &(DRD_(clientobj_get
)(barrier
, ClientBarrier
)->barrier
);
220 * Initialize a barrier with given client address, barrier type and number of
221 * participants. The 'reinitialization' argument indicates whether a barrier
222 * object is being initialized or reinitialized.
224 * Called before pthread_barrier_init().
226 void DRD_(barrier_init
)(const Addr barrier
,
227 const BarrierT barrier_type
, const Word count
,
228 const Bool reinitialization
)
230 struct barrier_info
* p
;
232 tl_assert(barrier_type
== pthread_barrier
|| barrier_type
== gomp_barrier
);
236 BarrierErrInfo bei
= { DRD_(thread_get_running_tid
)(), barrier
, 0, 0 };
237 VG_(maybe_record_error
)(VG_(get_running_tid
)(),
239 VG_(get_IP
)(VG_(get_running_tid
)()),
240 "pthread_barrier_init: 'count' argument is zero",
244 if (! reinitialization
&& barrier_type
== pthread_barrier
)
246 p
= DRD_(barrier_get
)(barrier
);
249 BarrierErrInfo bei
= { DRD_(thread_get_running_tid
)(), barrier
, 0, 0 };
250 VG_(maybe_record_error
)(VG_(get_running_tid
)(),
252 VG_(get_IP
)(VG_(get_running_tid
)()),
253 "Barrier reinitialization",
258 p
= DRD_(barrier_get_or_allocate
)(barrier
, barrier_type
, count
);
260 if (s_trace_barrier
) {
261 if (reinitialization
)
262 DRD_(trace_msg
)("[%d] barrier_reinit %s 0x%lx count %ld -> %ld",
263 DRD_(thread_get_running_tid
)(),
264 barrier_get_typename(p
), barrier
, p
->count
, count
);
266 DRD_(trace_msg
)("[%d] barrier_init %s 0x%lx",
267 DRD_(thread_get_running_tid
)(),
268 barrier_get_typename(p
),
272 if (reinitialization
&& p
->count
!= count
)
274 if (p
->pre_waiters_left
!= p
->count
|| p
->post_waiters_left
!= p
->count
)
276 BarrierErrInfo bei
= { DRD_(thread_get_running_tid
)(), p
->a1
, 0, 0 };
277 VG_(maybe_record_error
)(VG_(get_running_tid
)(),
279 VG_(get_IP
)(VG_(get_running_tid
)()),
280 "Reinitialization of barrier with active"
288 /** Called after pthread_barrier_destroy() / gomp_barrier_destroy(). */
289 void DRD_(barrier_destroy
)(const Addr barrier
, const BarrierT barrier_type
)
291 struct barrier_info
* p
;
293 p
= DRD_(barrier_get
)(barrier
);
296 DRD_(trace_msg
)("[%d] barrier_destroy %s 0x%lx",
297 DRD_(thread_get_running_tid
)(),
298 barrier_get_typename(p
), barrier
);
302 GenericErrInfo GEI
= {
303 .tid
= DRD_(thread_get_running_tid
)(),
306 VG_(maybe_record_error
)(VG_(get_running_tid
)(),
308 VG_(get_IP
)(VG_(get_running_tid
)()),
314 if (p
->pre_waiters_left
!= p
->count
|| p
->post_waiters_left
!= p
->count
)
316 BarrierErrInfo bei
= { DRD_(thread_get_running_tid
)(), p
->a1
, 0, 0 };
317 VG_(maybe_record_error
)(VG_(get_running_tid
)(),
319 VG_(get_IP
)(VG_(get_running_tid
)()),
320 "Destruction of a barrier with active waiters",
324 DRD_(clientobj_remove
)(p
->a1
, ClientBarrier
);
327 /** Called before pthread_barrier_wait() / gomp_barrier_wait(). */
328 void DRD_(barrier_pre_wait
)(const DrdThreadId tid
, const Addr barrier
,
329 const BarrierT barrier_type
)
331 struct barrier_info
* p
;
332 struct barrier_thread_info
* q
;
333 const UWord word_tid
= tid
;
336 p
= DRD_(barrier_get
)(barrier
);
337 if (p
== 0 && barrier_type
== gomp_barrier
) {
339 * A gomp_barrier_wait() call has been intercepted but the corresponding
340 * gomp_barrier_init() call has not. The only cause I know of that can
341 * trigger this is that libgomp.so has been compiled with --enable-linux-futex.
343 BarrierErrInfo bei
= { DRD_(thread_get_running_tid
)(), 0, 0, 0 };
344 VG_(maybe_record_error
)(VG_(get_running_tid
)(),
346 VG_(get_IP
)(VG_(get_running_tid
)()),
347 "Please verify whether gcc has been configured"
348 " with option --disable-linux-futex. See also"
349 " the section about OpenMP in the DRD manual.",
355 DRD_(trace_msg
)("[%d] barrier_pre_wait %s 0x%lx iteration %ld",
356 DRD_(thread_get_running_tid
)(),
357 barrier_get_typename(p
), barrier
, p
->pre_iteration
);
359 /* Clean up nodes associated with finished threads. */
360 oset
= p
->oset
[p
->pre_iteration
& 1];
362 VG_(OSetGen_ResetIter
)(oset
);
363 for ( ; (q
= VG_(OSetGen_Next
)(oset
)) != 0; ) {
364 if (q
->thread_finished
) {
365 void* r
= VG_(OSetGen_Remove
)(oset
, &q
->tid
);
367 DRD_(barrier_thread_destroy
)(q
);
368 VG_(OSetGen_FreeNode
)(oset
, q
);
369 VG_(OSetGen_ResetIterAt
)(oset
, &word_tid
);
372 /* Allocate the per-thread data structure if necessary. */
373 q
= VG_(OSetGen_Lookup
)(oset
, &word_tid
);
375 q
= VG_(OSetGen_AllocNode
)(oset
, sizeof(*q
));
376 DRD_(barrier_thread_initialize
)(q
, tid
);
377 VG_(OSetGen_Insert
)(oset
, q
);
378 tl_assert(VG_(OSetGen_Lookup
)(oset
, &word_tid
) == q
);
381 /* Record *_barrier_wait() call context. */
382 q
->wait_call_ctxt
= VG_(record_ExeContext
)(VG_(get_running_tid
)(), 0);
385 * Store a pointer to the latest segment of the current thread in the
386 * per-thread data structure.
388 DRD_(thread_get_latest_segment
)(&q
->sg
, tid
);
391 * If the same number of threads as the barrier count indicates have
392 * called the pre *_barrier_wait() wrapper, toggle p->pre_iteration and
393 * reset the p->pre_waiters_left counter.
395 if (--p
->pre_waiters_left
<= 0)
398 p
->pre_waiters_left
= p
->count
;
402 /** Called after pthread_barrier_wait() / gomp_barrier_wait(). */
403 void DRD_(barrier_post_wait
)(const DrdThreadId tid
, const Addr barrier
,
404 const BarrierT barrier_type
, const Bool waited
,
405 const Bool serializing
)
407 struct barrier_info
* p
;
408 const UWord word_tid
= tid
;
409 struct barrier_thread_info
* q
;
410 struct barrier_thread_info
* r
;
413 p
= DRD_(barrier_get
)(barrier
);
416 DRD_(trace_msg
)("[%d] barrier_post_wait %s 0x%lx iteration %ld%s",
417 tid
, p
? barrier_get_typename(p
) : "(?)",
418 barrier
, p
? p
->post_iteration
: -1,
419 serializing
? " (serializing)" : "");
422 * If p == 0, this means that the barrier has been destroyed after
423 * *_barrier_wait() returned and before this function was called. Just
424 * return in that case -- race conditions between *_barrier_wait()
425 * and *_barrier_destroy() are detected by the *_barrier_destroy() wrapper.
430 /* If the *_barrier_wait() call returned an error code, exit. */
434 oset
= p
->oset
[p
->post_iteration
& 1];
435 q
= VG_(OSetGen_Lookup
)(oset
, &word_tid
);
436 if (p
->pre_iteration
- p
->post_iteration
> 1) {
437 BarrierErrInfo bei
= { DRD_(thread_get_running_tid
)(), p
->a1
, 0, 0 };
438 VG_(maybe_record_error
)(VG_(get_running_tid
)(),
440 VG_(get_IP
)(VG_(get_running_tid
)()),
441 "Number of concurrent pthread_barrier_wait()"
442 " calls exceeds the barrier count",
444 } else if (q
== NULL
) {
445 BarrierErrInfo bei
= { DRD_(thread_get_running_tid
)(), p
->a1
, 0, 0 };
446 VG_(maybe_record_error
)(VG_(get_running_tid
)(),
448 VG_(get_IP
)(VG_(get_running_tid
)()),
449 "Error in barrier implementation"
450 " -- barrier_wait() started before"
451 " barrier_destroy() and finished after"
452 " barrier_destroy()",
456 q
= VG_(OSetGen_AllocNode
)(oset
, sizeof(*q
));
457 DRD_(barrier_thread_initialize
)(q
, tid
);
458 VG_(OSetGen_Insert
)(oset
, q
);
459 tl_assert(VG_(OSetGen_Lookup
)(oset
, &word_tid
) == q
);
460 DRD_(thread_get_latest_segment
)(&q
->sg
, tid
);
463 /* Create a new segment and store a pointer to that segment. */
464 DRD_(thread_new_segment
)(tid
);
465 DRD_(thread_get_latest_segment
)(&q
->post_wait_sg
, tid
);
466 s_barrier_segment_creation_count
++;
469 * Combine all vector clocks that were stored in the pre_barrier_wait
470 * wrapper with the vector clock of the current thread.
475 DRD_(vc_copy
)(&old_vc
, DRD_(thread_get_vc
)(tid
));
476 VG_(OSetGen_ResetIter
)(oset
);
477 for ( ; (r
= VG_(OSetGen_Next
)(oset
)) != 0; )
482 DRD_(vc_combine
)(DRD_(thread_get_vc
)(tid
), &r
->sg
->vc
);
485 DRD_(thread_update_conflict_set
)(tid
, &old_vc
);
486 DRD_(vc_cleanup
)(&old_vc
);
490 * If the same number of threads as the barrier count indicates have
491 * called the post *_barrier_wait() wrapper, toggle p->post_iteration and
492 * reset the p->post_waiters_left counter.
494 if (--p
->post_waiters_left
<= 0)
497 p
->post_waiters_left
= p
->count
;
501 /** Called when thread tid ceases to exist. */
502 static void barrier_delete_thread(struct barrier_info
* const p
,
503 const DrdThreadId tid
)
505 struct barrier_thread_info
* q
;
506 const UWord word_tid
= tid
;
509 for (i
= 0; i
< 2; i
++) {
510 q
= VG_(OSetGen_Lookup
)(p
->oset
[i
], &word_tid
);
512 q
->thread_finished
= True
;
517 * Report that *_barrier_destroy() has been called but that this call was
518 * not synchronized with the last *_barrier_wait() call on the same barrier.
520 * This topic has been discussed extensively on comp.programming.threads
521 * (February 3, 2009). See also
522 * <a href="http://groups.google.com/group/comp.programming.threads/browse_thread/thread/4f65535d6192aa50/a5f4bf1e3b437c4d">Immediately destroying pthread barriers</a>.
525 void barrier_report_wait_delete_race(const struct barrier_info
* const p
,
526 const struct barrier_thread_info
* const q
)
533 = { DRD_(thread_get_running_tid
)(), p
->a1
, q
->tid
, q
->wait_call_ctxt
};
534 VG_(maybe_record_error
)(VG_(get_running_tid
)(),
536 VG_(get_IP
)(VG_(get_running_tid
)()),
537 "Destruction of barrier not synchronized with"
538 " barrier wait call",
543 static const HChar
* barrier_get_typename(struct barrier_info
* const p
)
547 return barrier_type_name(p
->barrier_type
);
550 static const HChar
* barrier_type_name(const BarrierT bt
)
554 case pthread_barrier
:
555 return "pthread barrier";
557 return "gomp barrier";
562 ULong
DRD_(get_barrier_segment_creation_count
)(void)
564 return s_barrier_segment_creation_count
;