summaryrefslogtreecommitdiffstats
path: root/cpukit/score/include/rtems/score/smplock.h
diff options
context:
space:
mode:
authorSebastian Huber <sebastian.huber@embedded-brains.de>2014-03-07 14:36:22 +0100
committerSebastian Huber <sebastian.huber@embedded-brains.de>2014-03-14 08:46:49 +0100
commit53ad908a646eb6fd67f9b4586f4b484e8255b9d3 (patch)
tree7dd408879d01a507e6052f375ec6e14ab3f8965d /cpukit/score/include/rtems/score/smplock.h
parentscore: Add per-CPU profiling (diff)
downloadrtems-53ad908a646eb6fd67f9b4586f4b484e8255b9d3.tar.bz2
score: Add SMP lock profiling support
Diffstat (limited to 'cpukit/score/include/rtems/score/smplock.h')
-rw-r--r--cpukit/score/include/rtems/score/smplock.h409
1 files changed, 392 insertions, 17 deletions
diff --git a/cpukit/score/include/rtems/score/smplock.h b/cpukit/score/include/rtems/score/smplock.h
index 288fd454da..fc92f285fe 100644
--- a/cpukit/score/include/rtems/score/smplock.h
+++ b/cpukit/score/include/rtems/score/smplock.h
@@ -27,6 +27,11 @@
#include <rtems/score/atomic.h>
#include <rtems/score/isrlevel.h>
+#if defined( RTEMS_PROFILING )
+#include <rtems/score/chainimpl.h>
+#include <string.h>
+#endif
+
#ifdef __cplusplus
extern "C" {
#endif /* __cplusplus */
@@ -50,18 +55,170 @@ extern "C" {
*/
/**
+ * @brief Count of lock contention counters for lock statistics.
+ */
+#define SMP_LOCK_STATS_CONTENTION_COUNTS 4
+
+/**
+ * @brief SMP lock statistics.
+ *
+ * The lock acquire attempt instant is the point in time right after the
+ * interrupt disable action in the lock acquire sequence.
+ *
+ * The lock acquire instant is the point in time right after the lock
+ * acquisition. This is the begin of the critical section code execution.
+ *
+ * The lock release instant is the point in time right before the interrupt
+ * enable action in the lock release sequence.
+ *
+ * The lock section time is the time elapsed between the lock acquire instant
+ * and the lock release instant.
+ *
+ * The lock acquire time is the time elapsed between the lock acquire attempt
+ * instant and the lock acquire instant.
+ */
+typedef struct {
+#if defined( RTEMS_PROFILING )
+ /**
+ * @brief Node for SMP lock statistics chain.
+ */
+ Chain_Node Node;
+
+ /**
+ * @brief The maximum lock acquire time in CPU counter ticks.
+ */
+ CPU_Counter_ticks max_acquire_time;
+
+ /**
+ * @brief The maximum lock section time in CPU counter ticks.
+ */
+ CPU_Counter_ticks max_section_time;
+
+ /**
+ * @brief The count of lock uses.
+ *
+ * This value may overflow.
+ */
+ uint64_t usage_count;
+
+ /**
+ * @brief Total lock acquire time in nanoseconds.
+ *
+ * The average lock acquire time is the total acquire time divided by the
+ * lock usage count. The ration of the total section and total acquire times
+ * gives a measure for the lock contention.
+ *
+ * This value may overflow.
+ */
+ uint64_t total_acquire_time;
+
+ /**
+ * @brief The counts of lock acquire operations by contention.
+ *
+ * The contention count for index N corresponds to a lock acquire attempt
+ * with an initial queue length of N. The last index corresponds to all
+ * lock acquire attempts with an initial queue length greater than or equal
+ * to SMP_LOCK_STATS_CONTENTION_COUNTS minus one.
+ *
+ * The values may overflow.
+ */
+ uint64_t contention_counts[SMP_LOCK_STATS_CONTENTION_COUNTS];
+
+ /**
+ * @brief Total lock section time in CPU counter ticks.
+ *
+ * The average lock section time is the total section time divided by the
+ * lock usage count.
+ *
+ * This value may overflow.
+ */
+ uint64_t total_section_time;
+
+ /**
+ * @brief The lock name.
+ */
+ const char *name;
+#endif /* defined( RTEMS_PROFILING ) */
+} SMP_lock_Stats;
+
+/**
+ * @brief Local context for SMP lock statistics.
+ */
+typedef struct {
+#if defined( RTEMS_PROFILING )
+ /**
+ * @brief The last lock acquire instant in CPU counter ticks.
+ *
+ * This value is used to measure the lock section time.
+ */
+ CPU_Counter_ticks acquire_instant;
+#endif
+} SMP_lock_Stats_context;
+
+/**
+ * @brief SMP lock statistics initializer for static initialization.
+ */
+#if defined( RTEMS_PROFILING )
+#define SMP_LOCK_STATS_INITIALIZER( name ) \
+ { { NULL, NULL }, 0, 0, 0, 0, { 0, 0, 0, 0 }, 0, name }
+#else
+#define SMP_LOCK_STATS_INITIALIZER( name ) \
+ { }
+#endif
+
+/**
+ * @brief Initializes an SMP lock statistics block.
+ *
+ * @param[in, out] stats The SMP lock statistics block.
+ * @param[in] name The name for the SMP lock statistics. This name must be
+ * persistent throughout the life time of this statistics block.
+ */
+static inline void _SMP_lock_Stats_initialize(
+ SMP_lock_Stats *stats,
+ const char *name
+)
+{
+ SMP_lock_Stats init = SMP_LOCK_STATS_INITIALIZER( name );
+
+ *stats = init;
+}
+
+/**
+ * @brief Destroys an SMP lock statistics block.
+ *
+ * @param[in,out] stats The SMP lock statistics block.
+ */
+static inline void _SMP_lock_Stats_destroy( SMP_lock_Stats *stats );
+
+/**
+ * @brief Destroys an SMP lock statistics block.
+ *
+ * @param[in,out] stats The SMP lock statistics block.
+ * @param[in] stats_context The SMP lock statistics context.
+ */
+static inline void _SMP_lock_Stats_release_update(
+ SMP_lock_Stats *stats,
+ const SMP_lock_Stats_context *stats_context
+);
+
+/**
* @brief SMP ticket lock control.
*/
typedef struct {
Atomic_Uint next_ticket;
Atomic_Uint now_serving;
+ SMP_lock_Stats Stats;
} SMP_ticket_lock_Control;
/**
* @brief SMP ticket lock control initializer for static initialization.
*/
-#define SMP_TICKET_LOCK_INITIALIZER \
- { ATOMIC_INITIALIZER_UINT( 0U ), ATOMIC_INITIALIZER_UINT( 0U ) }
+#define SMP_TICKET_LOCK_INITIALIZER( name ) \
+ { \
+ ATOMIC_INITIALIZER_UINT( 0U ), \
+ ATOMIC_INITIALIZER_UINT( 0U ), \
+ SMP_LOCK_STATS_INITIALIZER( name ) \
+ }
/**
* @brief Initializes an SMP ticket lock.
@@ -69,11 +226,17 @@ typedef struct {
* Concurrent initialization leads to unpredictable results.
*
* @param[in,out] lock The SMP ticket lock control.
+ * @param[in] name The name for the SMP ticket lock. This name must be
+ * persistent throughout the life time of this lock.
*/
-static inline void _SMP_ticket_lock_Initialize( SMP_ticket_lock_Control *lock )
+static inline void _SMP_ticket_lock_Initialize(
+ SMP_ticket_lock_Control *lock,
+ const char *name
+)
{
_Atomic_Init_uint( &lock->next_ticket, 0U );
_Atomic_Init_uint( &lock->now_serving, 0U );
+ _SMP_lock_Stats_initialize( &lock->Stats, name );
}
/**
@@ -85,7 +248,7 @@ static inline void _SMP_ticket_lock_Initialize( SMP_ticket_lock_Control *lock )
*/
static inline void _SMP_ticket_lock_Destroy( SMP_ticket_lock_Control *lock )
{
- (void) lock;
+ _SMP_lock_Stats_destroy( &lock->Stats );
}
/**
@@ -96,30 +259,83 @@ static inline void _SMP_ticket_lock_Destroy( SMP_ticket_lock_Control *lock )
* the SMP ticket lock.
*
* @param[in,out] lock The SMP ticket lock control.
+ * @param[out] stats_context The SMP lock statistics context.
*/
-static inline void _SMP_ticket_lock_Acquire( SMP_ticket_lock_Control *lock )
+static inline void _SMP_ticket_lock_Acquire(
+ SMP_ticket_lock_Control *lock,
+ SMP_lock_Stats_context *stats_context
+)
{
- unsigned int my_ticket =
- _Atomic_Fetch_add_uint( &lock->next_ticket, 1U, ATOMIC_ORDER_RELAXED );
+ unsigned int my_ticket;
unsigned int now_serving;
- do {
- now_serving =
- _Atomic_Load_uint( &lock->now_serving, ATOMIC_ORDER_ACQUIRE );
- } while ( now_serving != my_ticket );
+#if defined( RTEMS_PROFILING )
+ SMP_lock_Stats *stats = &lock->Stats;
+ CPU_Counter_ticks first;
+ CPU_Counter_ticks second;
+ CPU_Counter_ticks delta;
+ unsigned int initial_queue_length;
+
+ first = _CPU_Counter_read();
+#endif
+
+ my_ticket =
+ _Atomic_Fetch_add_uint( &lock->next_ticket, 1U, ATOMIC_ORDER_RELAXED );
+
+#if defined( RTEMS_PROFILING )
+ now_serving =
+ _Atomic_Load_uint( &lock->now_serving, ATOMIC_ORDER_ACQUIRE );
+ initial_queue_length = my_ticket - now_serving;
+
+ if ( initial_queue_length > 0 ) {
+#endif
+
+ do {
+ now_serving =
+ _Atomic_Load_uint( &lock->now_serving, ATOMIC_ORDER_ACQUIRE );
+ } while ( now_serving != my_ticket );
+
+#if defined( RTEMS_PROFILING )
+ }
+
+ second = _CPU_Counter_read();
+ stats_context->acquire_instant = second;
+ delta = _CPU_Counter_difference( second, first );
+
+ ++stats->usage_count;
+
+ stats->total_acquire_time += delta;
+
+ if ( stats->max_acquire_time < delta ) {
+ stats->max_acquire_time = delta;
+ }
+
+ if ( initial_queue_length >= SMP_LOCK_STATS_CONTENTION_COUNTS ) {
+ initial_queue_length = SMP_LOCK_STATS_CONTENTION_COUNTS - 1;
+ }
+ ++stats->contention_counts[initial_queue_length];
+#else
+ (void) stats_context;
+#endif
}
/**
* @brief Releases an SMP ticket lock.
*
* @param[in,out] lock The SMP ticket lock control.
+ * @param[in] stats_context The SMP lock statistics context.
*/
-static inline void _SMP_ticket_lock_Release( SMP_ticket_lock_Control *lock )
+static inline void _SMP_ticket_lock_Release(
+ SMP_ticket_lock_Control *lock,
+ const SMP_lock_Stats_context *stats_context
+)
{
unsigned int current_ticket =
_Atomic_Load_uint( &lock->now_serving, ATOMIC_ORDER_RELAXED );
unsigned int next_ticket = current_ticket + 1U;
+ _SMP_lock_Stats_release_update( &lock->Stats, stats_context );
+
_Atomic_Store_uint( &lock->now_serving, next_ticket, ATOMIC_ORDER_RELEASE );
}
@@ -135,12 +351,13 @@ typedef struct {
*/
typedef struct {
ISR_Level isr_level;
+ SMP_lock_Stats_context Stats_context;
} SMP_lock_Context;
/**
* @brief SMP lock control initializer for static initialization.
*/
-#define SMP_LOCK_INITIALIZER { SMP_TICKET_LOCK_INITIALIZER }
+#define SMP_LOCK_INITIALIZER( name ) { SMP_TICKET_LOCK_INITIALIZER( name ) }
/**
* @brief Initializes an SMP lock.
@@ -148,10 +365,15 @@ typedef struct {
* Concurrent initialization leads to unpredictable results.
*
* @param[in,out] lock The SMP lock control.
+ * @param[in] name The name for the SMP lock statistics. This name must be
+ * persistent throughout the life time of this statistics block.
*/
-static inline void _SMP_lock_Initialize( SMP_lock_Control *lock )
+static inline void _SMP_lock_Initialize(
+ SMP_lock_Control *lock,
+ const char *name
+)
{
- _SMP_ticket_lock_Initialize( &lock->ticket_lock );
+ _SMP_ticket_lock_Initialize( &lock->ticket_lock, name );
}
/**
@@ -183,7 +405,7 @@ static inline void _SMP_lock_Acquire(
)
{
(void) context;
- _SMP_ticket_lock_Acquire( &lock->ticket_lock );
+ _SMP_ticket_lock_Acquire( &lock->ticket_lock, &context->Stats_context );
}
/**
@@ -199,7 +421,7 @@ static inline void _SMP_lock_Release(
)
{
(void) context;
- _SMP_ticket_lock_Release( &lock->ticket_lock );
+ _SMP_ticket_lock_Release( &lock->ticket_lock, &context->Stats_context );
}
/**
@@ -234,6 +456,159 @@ static inline void _SMP_lock_Release_and_ISR_enable(
_ISR_Enable_without_giant( context->isr_level );
}
+#if defined( RTEMS_PROFILING )
+typedef struct {
+ SMP_lock_Control Lock;
+ Chain_Control Stats_chain;
+ Chain_Control Iterator_chain;
+} SMP_lock_Stats_control;
+
+typedef struct {
+ Chain_Node Node;
+ SMP_lock_Stats *current;
+} SMP_lock_Stats_iteration_context;
+
+extern SMP_lock_Stats_control _SMP_lock_Stats_control;
+
+static inline void _SMP_lock_Stats_iteration_start(
+ SMP_lock_Stats_iteration_context *iteration_context
+)
+{
+ SMP_lock_Stats_control *control = &_SMP_lock_Stats_control;
+ SMP_lock_Context lock_context;
+
+ _SMP_lock_ISR_disable_and_acquire( &control->Lock, &lock_context );
+
+ _Chain_Append_unprotected(
+ &control->Iterator_chain,
+ &iteration_context->Node
+ );
+ iteration_context->current =
+ (SMP_lock_Stats *) _Chain_First( &control->Stats_chain );
+
+ _SMP_lock_Release_and_ISR_enable( &control->Lock, &lock_context );
+}
+
+static inline bool _SMP_lock_Stats_iteration_next(
+ SMP_lock_Stats_iteration_context *iteration_context,
+ SMP_lock_Stats *snapshot,
+ char *name,
+ size_t name_size
+)
+{
+ SMP_lock_Stats_control *control = &_SMP_lock_Stats_control;
+ SMP_lock_Context lock_context;
+ SMP_lock_Stats *current;
+ bool valid;
+
+ _SMP_lock_ISR_disable_and_acquire( &control->Lock, &lock_context );
+
+ current = iteration_context->current;
+ if ( !_Chain_Is_tail( &control->Stats_chain, &current->Node ) ) {
+ size_t name_len = strlen(current->name);
+
+ valid = true;
+
+ iteration_context->current = (SMP_lock_Stats *)
+ _Chain_Next( &current->Node );
+
+ *snapshot = *current;
+ snapshot->name = name;
+
+ if ( name_len >= name_size ) {
+ name_len = name_size - 1;
+ }
+
+ name[name_len] = '\0';
+ memcpy(name, current->name, name_len);
+ } else {
+ valid = false;
+ }
+
+ _SMP_lock_Release_and_ISR_enable( &control->Lock, &lock_context );
+
+ return valid;
+}
+
+static inline void _SMP_lock_Stats_iteration_stop(
+ SMP_lock_Stats_iteration_context *iteration_context
+)
+{
+ SMP_lock_Stats_control *control = &_SMP_lock_Stats_control;
+ SMP_lock_Context lock_context;
+
+ _SMP_lock_ISR_disable_and_acquire( &control->Lock, &lock_context );
+ _Chain_Extract_unprotected( &iteration_context->Node );
+ _SMP_lock_Release_and_ISR_enable( &control->Lock, &lock_context );
+}
+#endif
+
+static inline void _SMP_lock_Stats_destroy( SMP_lock_Stats *stats )
+{
+#if defined( RTEMS_PROFILING )
+ if ( !_Chain_Is_node_off_chain( &stats->Node ) ) {
+ SMP_lock_Stats_control *control = &_SMP_lock_Stats_control;
+ SMP_lock_Context lock_context;
+ SMP_lock_Stats_iteration_context *iteration_context;
+ SMP_lock_Stats_iteration_context *iteration_context_tail;
+ SMP_lock_Stats *next_stats;
+
+ _SMP_lock_ISR_disable_and_acquire( &control->Lock, &lock_context );
+
+ next_stats = (SMP_lock_Stats *) _Chain_Next( &stats->Node );
+ _Chain_Extract_unprotected( &stats->Node );
+
+ iteration_context = (SMP_lock_Stats_iteration_context *)
+ _Chain_First( &control->Iterator_chain );
+ iteration_context_tail = (SMP_lock_Stats_iteration_context *)
+ _Chain_Tail( &control->Iterator_chain );
+
+ while ( iteration_context != iteration_context_tail ) {
+ if ( iteration_context->current == stats ) {
+ iteration_context->current = next_stats;
+ }
+
+ iteration_context = (SMP_lock_Stats_iteration_context *)
+ _Chain_Next( &iteration_context->Node );
+ }
+
+ _SMP_lock_Release_and_ISR_enable( &control->Lock, &lock_context );
+ }
+#else
+ (void) stats;
+#endif
+}
+
+static inline void _SMP_lock_Stats_release_update(
+ SMP_lock_Stats *stats,
+ const SMP_lock_Stats_context *stats_context
+)
+{
+#if defined( RTEMS_PROFILING )
+ CPU_Counter_ticks first = stats_context->acquire_instant;
+ CPU_Counter_ticks second = _CPU_Counter_read();
+ CPU_Counter_ticks delta = _CPU_Counter_difference( second, first );
+
+ stats->total_section_time += delta;
+
+ if ( stats->max_section_time < delta ) {
+ stats->max_section_time = delta;
+
+ if ( _Chain_Is_node_off_chain( &stats->Node ) ) {
+ SMP_lock_Stats_control *control = &_SMP_lock_Stats_control;
+ SMP_lock_Context lock_context;
+
+ _SMP_lock_ISR_disable_and_acquire( &control->Lock, &lock_context );
+ _Chain_Append_unprotected( &control->Stats_chain, &stats->Node );
+ _SMP_lock_Release_and_ISR_enable( &control->Lock, &lock_context );
+ }
+ }
+#else
+ (void) stats;
+ (void) stats_context;
+#endif
+}
+
/**@}*/
#ifdef __cplusplus