cachepc-linux

Fork of AMDESE/linux with modifications for CachePC side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-linux

builtin-lock.c (27782B)


      1// SPDX-License-Identifier: GPL-2.0
      2#include <errno.h>
      3#include <inttypes.h>
      4#include "builtin.h"
      5#include "perf.h"
      6
      7#include "util/evlist.h" // for struct evsel_str_handler
      8#include "util/evsel.h"
      9#include "util/symbol.h"
     10#include "util/thread.h"
     11#include "util/header.h"
     12
     13#include <subcmd/pager.h>
     14#include <subcmd/parse-options.h>
     15#include "util/trace-event.h"
     16
     17#include "util/debug.h"
     18#include "util/session.h"
     19#include "util/tool.h"
     20#include "util/data.h"
     21#include "util/string2.h"
     22
     23#include <sys/types.h>
     24#include <sys/prctl.h>
     25#include <semaphore.h>
     26#include <pthread.h>
     27#include <math.h>
     28#include <limits.h>
     29
     30#include <linux/list.h>
     31#include <linux/hash.h>
     32#include <linux/kernel.h>
     33#include <linux/zalloc.h>
     34#include <linux/err.h>
     35
     36static struct perf_session *session;
     37
     38/* based on kernel/lockdep.c */
     39#define LOCKHASH_BITS		12
     40#define LOCKHASH_SIZE		(1UL << LOCKHASH_BITS)
     41
     42static struct hlist_head lockhash_table[LOCKHASH_SIZE];
     43
     44#define __lockhashfn(key)	hash_long((unsigned long)key, LOCKHASH_BITS)
     45#define lockhashentry(key)	(lockhash_table + __lockhashfn((key)))
     46
     47struct lock_stat {
     48	struct hlist_node	hash_entry;
     49	struct rb_node		rb;		/* used for sorting */
     50
     51	u64			addr;		/* address of lockdep_map, used as ID */
     52	char			*name;		/* for strcpy(), we cannot use const */
     53
     54	unsigned int		nr_acquire;
     55	unsigned int		nr_acquired;
     56	unsigned int		nr_contended;
     57	unsigned int		nr_release;
     58
     59	unsigned int		nr_readlock;
     60	unsigned int		nr_trylock;
     61
      62	/* these times are in nanoseconds */
     63	u64                     avg_wait_time;
     64	u64			wait_time_total;
     65	u64			wait_time_min;
     66	u64			wait_time_max;
     67
      68	int			broken; /* set when a broken (blacklisted) lock sequence is seen */
     69	int			combined;
     70};
     71
     72/*
     73 * States of lock_seq_stat
     74 *
      75 * UNINITIALIZED is required for detecting the first event of a lock.
      76 * By the nature of lock events there is no guarantee
      77 * that the first event seen for a lock is acquire;
      78 * it can be acquired, contended or release.
     79 */
     80#define SEQ_STATE_UNINITIALIZED      0	       /* initial state */
     81#define SEQ_STATE_RELEASED	1
     82#define SEQ_STATE_ACQUIRING	2
     83#define SEQ_STATE_ACQUIRED	3
     84#define SEQ_STATE_READ_ACQUIRED	4
     85#define SEQ_STATE_CONTENDED	5
     86
     87/*
     88 * MAX_LOCK_DEPTH
     89 * Imported from include/linux/sched.h.
     90 * Should this be synchronized?
     91 */
     92#define MAX_LOCK_DEPTH 48
     93
     94/*
     95 * struct lock_seq_stat:
      96 * Holds the state of one lock sequence
     97 * 1) acquire -> acquired -> release
     98 * 2) acquire -> contended -> acquired -> release
     99 * 3) acquire (with read or try) -> release
    100 * 4) Are there other patterns?
    101 */
    102struct lock_seq_stat {
    103	struct list_head        list;
    104	int			state;
    105	u64			prev_event_time;
    106	u64                     addr;
    107
    108	int                     read_count;
    109};
    110
    111struct thread_stat {
    112	struct rb_node		rb;
    113
    114	u32                     tid;
    115	struct list_head        seq_list;
    116};
    117
    118static struct rb_root		thread_stats;
    119
    120static bool combine_locks;
    121static bool show_thread_stats;
    122
    123static struct thread_stat *thread_stat_find(u32 tid)
    124{
    125	struct rb_node *node;
    126	struct thread_stat *st;
    127
    128	node = thread_stats.rb_node;
    129	while (node) {
    130		st = container_of(node, struct thread_stat, rb);
    131		if (st->tid == tid)
    132			return st;
    133		else if (tid < st->tid)
    134			node = node->rb_left;
    135		else
    136			node = node->rb_right;
    137	}
    138
    139	return NULL;
    140}
    141
    142static void thread_stat_insert(struct thread_stat *new)
    143{
    144	struct rb_node **rb = &thread_stats.rb_node;
    145	struct rb_node *parent = NULL;
    146	struct thread_stat *p;
    147
    148	while (*rb) {
    149		p = container_of(*rb, struct thread_stat, rb);
    150		parent = *rb;
    151
    152		if (new->tid < p->tid)
    153			rb = &(*rb)->rb_left;
    154		else if (new->tid > p->tid)
    155			rb = &(*rb)->rb_right;
    156		else
    157			BUG_ON("inserting invalid thread_stat\n");
    158	}
    159
    160	rb_link_node(&new->rb, parent, rb);
    161	rb_insert_color(&new->rb, &thread_stats);
    162}
    163
    164static struct thread_stat *thread_stat_findnew_after_first(u32 tid)
    165{
    166	struct thread_stat *st;
    167
    168	st = thread_stat_find(tid);
    169	if (st)
    170		return st;
    171
    172	st = zalloc(sizeof(struct thread_stat));
    173	if (!st) {
    174		pr_err("memory allocation failed\n");
    175		return NULL;
    176	}
    177
    178	st->tid = tid;
    179	INIT_LIST_HEAD(&st->seq_list);
    180
    181	thread_stat_insert(st);
    182
    183	return st;
    184}
    185
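        /*
         * thread_stat_findnew starts out pointing at the "first" variant
         * below, which skips the rbtree search while thread_stats is still
         * empty; the first call then switches the pointer to the searching
         * variant above.
         */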
    186static struct thread_stat *thread_stat_findnew_first(u32 tid);
    187static struct thread_stat *(*thread_stat_findnew)(u32 tid) =
    188	thread_stat_findnew_first;
    189
    190static struct thread_stat *thread_stat_findnew_first(u32 tid)
    191{
    192	struct thread_stat *st;
    193
    194	st = zalloc(sizeof(struct thread_stat));
    195	if (!st) {
    196		pr_err("memory allocation failed\n");
    197		return NULL;
    198	}
    199	st->tid = tid;
    200	INIT_LIST_HEAD(&st->seq_list);
    201
    202	rb_link_node(&st->rb, NULL, &thread_stats.rb_node);
    203	rb_insert_color(&st->rb, &thread_stats);
    204
    205	thread_stat_findnew = thread_stat_findnew_after_first;
    206	return st;
    207}
    208
     209/* build a simple key function: returns whether one is bigger than two */
    210#define SINGLE_KEY(member)						\
    211	static int lock_stat_key_ ## member(struct lock_stat *one,	\
    212					 struct lock_stat *two)		\
    213	{								\
    214		return one->member > two->member;			\
    215	}
    216
    217SINGLE_KEY(nr_acquired)
    218SINGLE_KEY(nr_contended)
    219SINGLE_KEY(avg_wait_time)
    220SINGLE_KEY(wait_time_total)
    221SINGLE_KEY(wait_time_max)
    222
    223static int lock_stat_key_wait_time_min(struct lock_stat *one,
    224					struct lock_stat *two)
    225{
    226	u64 s1 = one->wait_time_min;
    227	u64 s2 = two->wait_time_min;
    228	if (s1 == ULLONG_MAX)
    229		s1 = 0;
    230	if (s2 == ULLONG_MAX)
    231		s2 = 0;
    232	return s1 > s2;
    233}
    234
    235struct lock_key {
    236	/*
     237	 * name: the value specified by the user;
     238	 * it should be simpler than the raw member name,
    239	 * e.g. nr_acquired -> acquired, wait_time_total -> wait_total
    240	 */
    241	const char		*name;
    242	/* header: the string printed on the header line */
    243	const char		*header;
    244	/* len: the printing width of the field */
    245	int			len;
     246	/* key: a pointer to a function that compares two lock stats for sorting */
    247	int			(*key)(struct lock_stat*, struct lock_stat*);
     248	/* print: a pointer to a function that prints a given lock stat */
    249	void			(*print)(struct lock_key*, struct lock_stat*);
    250	/* list: list entry to link this */
    251	struct list_head	list;
    252};
    253
    254#define PRINT_KEY(member)						\
    255static void lock_stat_key_print_ ## member(struct lock_key *key,	\
    256					   struct lock_stat *ls)	\
    257{									\
    258	pr_info("%*llu", key->len, (unsigned long long)ls->member);	\
    259}
    260
    261PRINT_KEY(nr_acquired)
    262PRINT_KEY(nr_contended)
    263PRINT_KEY(avg_wait_time)
    264PRINT_KEY(wait_time_total)
    265PRINT_KEY(wait_time_max)
    266
    267static void lock_stat_key_print_wait_time_min(struct lock_key *key,
    268					      struct lock_stat *ls)
    269{
    270	u64 wait_time = ls->wait_time_min;
    271
    272	if (wait_time == ULLONG_MAX)
    273		wait_time = 0;
    274
    275	pr_info("%*"PRIu64, key->len, wait_time);
    276}
    277
    278
    279static const char		*sort_key = "acquired";
    280
    281static int			(*compare)(struct lock_stat *, struct lock_stat *);
    282
    283static struct rb_root		sorted; /* place to store intermediate data */
    284static struct rb_root		result;	/* place to store sorted data */
    285
    286static LIST_HEAD(lock_keys);
    287static const char		*output_fields;
    288
    289#define DEF_KEY_LOCK(name, header, fn_suffix, len)			\
    290	{ #name, header, len, lock_stat_key_ ## fn_suffix, lock_stat_key_print_ ## fn_suffix, {} }
    291struct lock_key keys[] = {
    292	DEF_KEY_LOCK(acquired, "acquired", nr_acquired, 10),
    293	DEF_KEY_LOCK(contended, "contended", nr_contended, 10),
    294	DEF_KEY_LOCK(avg_wait, "avg wait (ns)", avg_wait_time, 15),
    295	DEF_KEY_LOCK(wait_total, "total wait (ns)", wait_time_total, 15),
    296	DEF_KEY_LOCK(wait_max, "max wait (ns)", wait_time_max, 15),
    297	DEF_KEY_LOCK(wait_min, "min wait (ns)", wait_time_min, 15),
    298
     299	/* more complicated extra comparisons should go here */
    300	{ }
    301};
    302
    303static int select_key(void)
    304{
    305	int i;
    306
    307	for (i = 0; keys[i].name; i++) {
    308		if (!strcmp(keys[i].name, sort_key)) {
    309			compare = keys[i].key;
    310
    311			/* selected key should be in the output fields */
    312			if (list_empty(&keys[i].list))
    313				list_add_tail(&keys[i].list, &lock_keys);
    314
    315			return 0;
    316		}
    317	}
    318
    319	pr_err("Unknown compare key: %s\n", sort_key);
    320	return -1;
    321}
    322
    323static int add_output_field(struct list_head *head, char *name)
    324{
    325	int i;
    326
    327	for (i = 0; keys[i].name; i++) {
    328		if (strcmp(keys[i].name, name))
    329			continue;
    330
    331		/* prevent double link */
    332		if (list_empty(&keys[i].list))
    333			list_add_tail(&keys[i].list, head);
    334
    335		return 0;
    336	}
    337
    338	pr_err("Unknown output field: %s\n", name);
    339	return -1;
    340}
    341
    342static int setup_output_field(const char *str)
    343{
    344	char *tok, *tmp, *orig;
    345	int i, ret = 0;
    346
    347	/* no output field given: use all of them */
    348	if (str == NULL) {
    349		for (i = 0; keys[i].name; i++)
    350			list_add_tail(&keys[i].list, &lock_keys);
    351		return 0;
    352	}
    353
    354	for (i = 0; keys[i].name; i++)
    355		INIT_LIST_HEAD(&keys[i].list);
    356
    357	orig = tmp = strdup(str);
    358	if (orig == NULL)
    359		return -ENOMEM;
    360
    361	while ((tok = strsep(&tmp, ",")) != NULL){
    362		ret = add_output_field(&lock_keys, tok);
    363		if (ret < 0)
    364			break;
    365	}
    366	free(orig);
    367
    368	return ret;
    369}
    370
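        /*
         * Merge stats of locks that share the same name into a single node
         * in the 'sorted' tree; entries folded into an existing node are
         * marked ->combined so that insert_to_result() skips them later.
         */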
    371static void combine_lock_stats(struct lock_stat *st)
    372{
    373	struct rb_node **rb = &sorted.rb_node;
    374	struct rb_node *parent = NULL;
    375	struct lock_stat *p;
    376	int ret;
    377
    378	while (*rb) {
    379		p = container_of(*rb, struct lock_stat, rb);
    380		parent = *rb;
    381
    382		if (st->name && p->name)
    383			ret = strcmp(st->name, p->name);
    384		else
    385			ret = !!st->name - !!p->name;
    386
    387		if (ret == 0) {
    388			p->nr_acquired += st->nr_acquired;
    389			p->nr_contended += st->nr_contended;
    390			p->wait_time_total += st->wait_time_total;
    391
    392			if (p->nr_contended)
    393				p->avg_wait_time = p->wait_time_total / p->nr_contended;
    394
    395			if (p->wait_time_min > st->wait_time_min)
    396				p->wait_time_min = st->wait_time_min;
    397			if (p->wait_time_max < st->wait_time_max)
    398				p->wait_time_max = st->wait_time_max;
    399
    400			p->broken |= st->broken;
    401			st->combined = 1;
    402			return;
    403		}
    404
    405		if (ret < 0)
    406			rb = &(*rb)->rb_left;
    407		else
    408			rb = &(*rb)->rb_right;
    409	}
    410
    411	rb_link_node(&st->rb, parent, rb);
    412	rb_insert_color(&st->rb, &sorted);
    413}
    414
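        /*
         * Insert into the 'result' tree ordered by the given comparator:
         * "bigger" entries go to the left, so pop_from_result() returns
         * them in descending order.
         */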
    415static void insert_to_result(struct lock_stat *st,
    416			     int (*bigger)(struct lock_stat *, struct lock_stat *))
    417{
    418	struct rb_node **rb = &result.rb_node;
    419	struct rb_node *parent = NULL;
    420	struct lock_stat *p;
    421
    422	if (combine_locks && st->combined)
    423		return;
    424
    425	while (*rb) {
    426		p = container_of(*rb, struct lock_stat, rb);
    427		parent = *rb;
    428
    429		if (bigger(st, p))
    430			rb = &(*rb)->rb_left;
    431		else
    432			rb = &(*rb)->rb_right;
    433	}
    434
    435	rb_link_node(&st->rb, parent, rb);
    436	rb_insert_color(&st->rb, &result);
    437}
    438
     439/* returns the leftmost element of result and erases it */
    440static struct lock_stat *pop_from_result(void)
    441{
    442	struct rb_node *node = result.rb_node;
    443
    444	if (!node)
    445		return NULL;
    446
    447	while (node->rb_left)
    448		node = node->rb_left;
    449
    450	rb_erase(node, &result);
    451	return container_of(node, struct lock_stat, rb);
    452}
    453
    454static struct lock_stat *lock_stat_findnew(u64 addr, const char *name)
    455{
    456	struct hlist_head *entry = lockhashentry(addr);
    457	struct lock_stat *ret, *new;
    458
    459	hlist_for_each_entry(ret, entry, hash_entry) {
    460		if (ret->addr == addr)
    461			return ret;
    462	}
    463
    464	new = zalloc(sizeof(struct lock_stat));
    465	if (!new)
    466		goto alloc_failed;
    467
    468	new->addr = addr;
     469	new->name = zalloc(strlen(name) + 1);
    470	if (!new->name) {
    471		free(new);
    472		goto alloc_failed;
    473	}
    474
    475	strcpy(new->name, name);
    476	new->wait_time_min = ULLONG_MAX;
    477
    478	hlist_add_head(&new->hash_entry, entry);
    479	return new;
    480
    481alloc_failed:
    482	pr_err("memory allocation failed\n");
    483	return NULL;
    484}
    485
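        /*
         * Per-tracepoint callbacks; the evsel__process_lock_* wrappers below
         * dispatch through the currently selected trace_handler.
         */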
    486struct trace_lock_handler {
    487	int (*acquire_event)(struct evsel *evsel,
    488			     struct perf_sample *sample);
    489
    490	int (*acquired_event)(struct evsel *evsel,
    491			      struct perf_sample *sample);
    492
    493	int (*contended_event)(struct evsel *evsel,
    494			       struct perf_sample *sample);
    495
    496	int (*release_event)(struct evsel *evsel,
    497			     struct perf_sample *sample);
    498};
    499
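        /*
         * Find the per-thread sequence tracker for the lock at @addr,
         * allocating a fresh one in SEQ_STATE_UNINITIALIZED if none exists.
         */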
    500static struct lock_seq_stat *get_seq(struct thread_stat *ts, u64 addr)
    501{
    502	struct lock_seq_stat *seq;
    503
    504	list_for_each_entry(seq, &ts->seq_list, list) {
    505		if (seq->addr == addr)
    506			return seq;
    507	}
    508
    509	seq = zalloc(sizeof(struct lock_seq_stat));
    510	if (!seq) {
    511		pr_err("memory allocation failed\n");
    512		return NULL;
    513	}
    514	seq->state = SEQ_STATE_UNINITIALIZED;
    515	seq->addr = addr;
    516
    517	list_add(&seq->list, &ts->seq_list);
    518	return seq;
    519}
    520
    521enum broken_state {
    522	BROKEN_ACQUIRE,
    523	BROKEN_ACQUIRED,
    524	BROKEN_CONTENDED,
    525	BROKEN_RELEASE,
    526	BROKEN_MAX,
    527};
    528
    529static int bad_hist[BROKEN_MAX];
    530
    531enum acquire_flags {
    532	TRY_LOCK = 1,
    533	READ_LOCK = 2,
    534};
    535
    536static int report_lock_acquire_event(struct evsel *evsel,
    537				     struct perf_sample *sample)
    538{
    539	struct lock_stat *ls;
    540	struct thread_stat *ts;
    541	struct lock_seq_stat *seq;
    542	const char *name = evsel__strval(evsel, sample, "name");
    543	u64 addr = evsel__intval(evsel, sample, "lockdep_addr");
    544	int flag = evsel__intval(evsel, sample, "flags");
    545
    546	/* abuse ls->addr for tid */
    547	if (show_thread_stats)
    548		addr = sample->tid;
    549
    550	ls = lock_stat_findnew(addr, name);
    551	if (!ls)
    552		return -ENOMEM;
    553
    554	ts = thread_stat_findnew(sample->tid);
    555	if (!ts)
    556		return -ENOMEM;
    557
    558	seq = get_seq(ts, addr);
    559	if (!seq)
    560		return -ENOMEM;
    561
    562	switch (seq->state) {
    563	case SEQ_STATE_UNINITIALIZED:
    564	case SEQ_STATE_RELEASED:
    565		if (!flag) {
    566			seq->state = SEQ_STATE_ACQUIRING;
    567		} else {
    568			if (flag & TRY_LOCK)
    569				ls->nr_trylock++;
    570			if (flag & READ_LOCK)
    571				ls->nr_readlock++;
    572			seq->state = SEQ_STATE_READ_ACQUIRED;
    573			seq->read_count = 1;
    574			ls->nr_acquired++;
    575		}
    576		break;
    577	case SEQ_STATE_READ_ACQUIRED:
    578		if (flag & READ_LOCK) {
    579			seq->read_count++;
    580			ls->nr_acquired++;
    581			goto end;
    582		} else {
    583			goto broken;
    584		}
    585		break;
    586	case SEQ_STATE_ACQUIRED:
    587	case SEQ_STATE_ACQUIRING:
    588	case SEQ_STATE_CONTENDED:
    589broken:
    590		/* broken lock sequence */
    591		if (!ls->broken) {
    592			ls->broken = 1;
    593			bad_hist[BROKEN_ACQUIRE]++;
    594		}
    595		list_del_init(&seq->list);
    596		free(seq);
    597		goto end;
    598	default:
    599		BUG_ON("Unknown state of lock sequence found!\n");
    600		break;
    601	}
    602
    603	ls->nr_acquire++;
    604	seq->prev_event_time = sample->time;
    605end:
    606	return 0;
    607}
    608
    609static int report_lock_acquired_event(struct evsel *evsel,
    610				      struct perf_sample *sample)
    611{
    612	struct lock_stat *ls;
    613	struct thread_stat *ts;
    614	struct lock_seq_stat *seq;
    615	u64 contended_term;
    616	const char *name = evsel__strval(evsel, sample, "name");
    617	u64 addr = evsel__intval(evsel, sample, "lockdep_addr");
    618
    619	if (show_thread_stats)
    620		addr = sample->tid;
    621
    622	ls = lock_stat_findnew(addr, name);
    623	if (!ls)
    624		return -ENOMEM;
    625
    626	ts = thread_stat_findnew(sample->tid);
    627	if (!ts)
    628		return -ENOMEM;
    629
    630	seq = get_seq(ts, addr);
    631	if (!seq)
    632		return -ENOMEM;
    633
    634	switch (seq->state) {
    635	case SEQ_STATE_UNINITIALIZED:
    636		/* orphan event, do nothing */
    637		return 0;
    638	case SEQ_STATE_ACQUIRING:
    639		break;
    640	case SEQ_STATE_CONTENDED:
    641		contended_term = sample->time - seq->prev_event_time;
    642		ls->wait_time_total += contended_term;
    643		if (contended_term < ls->wait_time_min)
    644			ls->wait_time_min = contended_term;
    645		if (ls->wait_time_max < contended_term)
    646			ls->wait_time_max = contended_term;
    647		break;
    648	case SEQ_STATE_RELEASED:
    649	case SEQ_STATE_ACQUIRED:
    650	case SEQ_STATE_READ_ACQUIRED:
    651		/* broken lock sequence */
    652		if (!ls->broken) {
    653			ls->broken = 1;
    654			bad_hist[BROKEN_ACQUIRED]++;
    655		}
    656		list_del_init(&seq->list);
    657		free(seq);
    658		goto end;
    659	default:
    660		BUG_ON("Unknown state of lock sequence found!\n");
    661		break;
    662	}
    663
    664	seq->state = SEQ_STATE_ACQUIRED;
    665	ls->nr_acquired++;
    666	ls->avg_wait_time = ls->nr_contended ? ls->wait_time_total/ls->nr_contended : 0;
    667	seq->prev_event_time = sample->time;
    668end:
    669	return 0;
    670}
    671
    672static int report_lock_contended_event(struct evsel *evsel,
    673				       struct perf_sample *sample)
    674{
    675	struct lock_stat *ls;
    676	struct thread_stat *ts;
    677	struct lock_seq_stat *seq;
    678	const char *name = evsel__strval(evsel, sample, "name");
    679	u64 addr = evsel__intval(evsel, sample, "lockdep_addr");
    680
    681	if (show_thread_stats)
    682		addr = sample->tid;
    683
    684	ls = lock_stat_findnew(addr, name);
    685	if (!ls)
    686		return -ENOMEM;
    687
    688	ts = thread_stat_findnew(sample->tid);
    689	if (!ts)
    690		return -ENOMEM;
    691
    692	seq = get_seq(ts, addr);
    693	if (!seq)
    694		return -ENOMEM;
    695
    696	switch (seq->state) {
    697	case SEQ_STATE_UNINITIALIZED:
    698		/* orphan event, do nothing */
    699		return 0;
    700	case SEQ_STATE_ACQUIRING:
    701		break;
    702	case SEQ_STATE_RELEASED:
    703	case SEQ_STATE_ACQUIRED:
    704	case SEQ_STATE_READ_ACQUIRED:
    705	case SEQ_STATE_CONTENDED:
    706		/* broken lock sequence */
    707		if (!ls->broken) {
    708			ls->broken = 1;
    709			bad_hist[BROKEN_CONTENDED]++;
    710		}
    711		list_del_init(&seq->list);
    712		free(seq);
    713		goto end;
    714	default:
    715		BUG_ON("Unknown state of lock sequence found!\n");
    716		break;
    717	}
    718
    719	seq->state = SEQ_STATE_CONTENDED;
    720	ls->nr_contended++;
    721	ls->avg_wait_time = ls->wait_time_total/ls->nr_contended;
    722	seq->prev_event_time = sample->time;
    723end:
    724	return 0;
    725}
    726
    727static int report_lock_release_event(struct evsel *evsel,
    728				     struct perf_sample *sample)
    729{
    730	struct lock_stat *ls;
    731	struct thread_stat *ts;
    732	struct lock_seq_stat *seq;
    733	const char *name = evsel__strval(evsel, sample, "name");
    734	u64 addr = evsel__intval(evsel, sample, "lockdep_addr");
    735
    736	if (show_thread_stats)
    737		addr = sample->tid;
    738
    739	ls = lock_stat_findnew(addr, name);
    740	if (!ls)
    741		return -ENOMEM;
    742
    743	ts = thread_stat_findnew(sample->tid);
    744	if (!ts)
    745		return -ENOMEM;
    746
    747	seq = get_seq(ts, addr);
    748	if (!seq)
    749		return -ENOMEM;
    750
    751	switch (seq->state) {
    752	case SEQ_STATE_UNINITIALIZED:
    753		goto end;
    754	case SEQ_STATE_ACQUIRED:
    755		break;
    756	case SEQ_STATE_READ_ACQUIRED:
    757		seq->read_count--;
    758		BUG_ON(seq->read_count < 0);
    759		if (seq->read_count) {
    760			ls->nr_release++;
    761			goto end;
    762		}
    763		break;
    764	case SEQ_STATE_ACQUIRING:
    765	case SEQ_STATE_CONTENDED:
    766	case SEQ_STATE_RELEASED:
    767		/* broken lock sequence */
    768		if (!ls->broken) {
    769			ls->broken = 1;
    770			bad_hist[BROKEN_RELEASE]++;
    771		}
    772		goto free_seq;
    773	default:
    774		BUG_ON("Unknown state of lock sequence found!\n");
    775		break;
    776	}
    777
    778	ls->nr_release++;
    779free_seq:
    780	list_del_init(&seq->list);
    781	free(seq);
    782end:
    783	return 0;
    784}
    785
    786/* lock oriented handlers */
    787/* TODO: handlers for CPU oriented, thread oriented */
    788static struct trace_lock_handler report_lock_ops  = {
    789	.acquire_event		= report_lock_acquire_event,
    790	.acquired_event		= report_lock_acquired_event,
    791	.contended_event	= report_lock_contended_event,
    792	.release_event		= report_lock_release_event,
    793};
    794
    795static struct trace_lock_handler *trace_handler;
    796
    797static int evsel__process_lock_acquire(struct evsel *evsel, struct perf_sample *sample)
    798{
    799	if (trace_handler->acquire_event)
    800		return trace_handler->acquire_event(evsel, sample);
    801	return 0;
    802}
    803
    804static int evsel__process_lock_acquired(struct evsel *evsel, struct perf_sample *sample)
    805{
    806	if (trace_handler->acquired_event)
    807		return trace_handler->acquired_event(evsel, sample);
    808	return 0;
    809}
    810
    811static int evsel__process_lock_contended(struct evsel *evsel, struct perf_sample *sample)
    812{
    813	if (trace_handler->contended_event)
    814		return trace_handler->contended_event(evsel, sample);
    815	return 0;
    816}
    817
    818static int evsel__process_lock_release(struct evsel *evsel, struct perf_sample *sample)
    819{
    820	if (trace_handler->release_event)
    821		return trace_handler->release_event(evsel, sample);
    822	return 0;
    823}
    824
    825static void print_bad_events(int bad, int total)
    826{
     827	/* Output for debugging; this has to be removed eventually */
    828	int i;
    829	const char *name[4] =
    830		{ "acquire", "acquired", "contended", "release" };
    831
    832	pr_info("\n=== output for debug===\n\n");
    833	pr_info("bad: %d, total: %d\n", bad, total);
     834	pr_info("bad rate: %.2f %%\n", total ? (double)bad / (double)total * 100 : 0.0); /* avoid 0/0 */
     835	pr_info("histogram of events that caused bad sequences\n");
    836	for (i = 0; i < BROKEN_MAX; i++)
    837		pr_info(" %10s: %d\n", name[i], bad_hist[i]);
    838}
    839
     840/* TODO: various ways to print, coloring, nano or milli sec */
    841static void print_result(void)
    842{
    843	struct lock_stat *st;
    844	struct lock_key *key;
    845	char cut_name[20];
    846	int bad, total;
    847
    848	pr_info("%20s ", "Name");
    849	list_for_each_entry(key, &lock_keys, list)
    850		pr_info("%*s ", key->len, key->header);
    851	pr_info("\n\n");
    852
    853	bad = total = 0;
    854	while ((st = pop_from_result())) {
    855		total++;
    856		if (st->broken)
    857			bad++;
    858		if (!st->nr_acquired)
    859			continue;
    860
    861		bzero(cut_name, 20);
    862
    863		if (strlen(st->name) < 20) {
    864			/* output raw name */
    865			const char *name = st->name;
    866
    867			if (show_thread_stats) {
    868				struct thread *t;
    869
    870				/* st->addr contains tid of thread */
    871				t = perf_session__findnew(session, st->addr);
    872				name = thread__comm_str(t);
    873			}
    874
    875			pr_info("%20s ", name);
    876		} else {
    877			strncpy(cut_name, st->name, 16);
    878			cut_name[16] = '.';
    879			cut_name[17] = '.';
    880			cut_name[18] = '.';
    881			cut_name[19] = '\0';
     882			/* truncate the name to keep the output aligned */
    883			pr_info("%20s ", cut_name);
    884		}
    885
    886		list_for_each_entry(key, &lock_keys, list) {
    887			key->print(key, st);
    888			pr_info(" ");
    889		}
    890		pr_info("\n");
    891	}
    892
    893	print_bad_events(bad, total);
    894}
    895
    896static bool info_threads, info_map;
    897
    898static void dump_threads(void)
    899{
    900	struct thread_stat *st;
    901	struct rb_node *node;
    902	struct thread *t;
    903
    904	pr_info("%10s: comm\n", "Thread ID");
    905
    906	node = rb_first(&thread_stats);
    907	while (node) {
    908		st = container_of(node, struct thread_stat, rb);
    909		t = perf_session__findnew(session, st->tid);
    910		pr_info("%10d: %s\n", st->tid, thread__comm_str(t));
    911		node = rb_next(node);
    912		thread__put(t);
    913	}
    914}
    915
    916static int compare_maps(struct lock_stat *a, struct lock_stat *b)
    917{
    918	int ret;
    919
    920	if (a->name && b->name)
    921		ret = strcmp(a->name, b->name);
    922	else
    923		ret = !!a->name - !!b->name;
    924
    925	if (!ret)
    926		return a->addr < b->addr;
    927	else
    928		return ret < 0;
    929}
    930
    931static void dump_map(void)
    932{
    933	unsigned int i;
    934	struct lock_stat *st;
    935
    936	pr_info("Address of instance: name of class\n");
    937	for (i = 0; i < LOCKHASH_SIZE; i++) {
    938		hlist_for_each_entry(st, &lockhash_table[i], hash_entry) {
    939			insert_to_result(st, compare_maps);
    940		}
    941	}
    942
    943	while ((st = pop_from_result()))
    944		pr_info(" %#llx: %s\n", (unsigned long long)st->addr, st->name);
    945}
    946
    947static int dump_info(void)
    948{
    949	int rc = 0;
    950
    951	if (info_threads)
    952		dump_threads();
    953	else if (info_map)
    954		dump_map();
    955	else {
    956		rc = -1;
    957		pr_err("Unknown type of information\n");
    958	}
    959
    960	return rc;
    961}
    962
    963typedef int (*tracepoint_handler)(struct evsel *evsel,
    964				  struct perf_sample *sample);
    965
    966static int process_sample_event(struct perf_tool *tool __maybe_unused,
    967				union perf_event *event,
    968				struct perf_sample *sample,
    969				struct evsel *evsel,
    970				struct machine *machine)
    971{
    972	int err = 0;
    973	struct thread *thread = machine__findnew_thread(machine, sample->pid,
    974							sample->tid);
    975
    976	if (thread == NULL) {
    977		pr_debug("problem processing %d event, skipping it.\n",
    978			event->header.type);
    979		return -1;
    980	}
    981
    982	if (evsel->handler != NULL) {
    983		tracepoint_handler f = evsel->handler;
    984		err = f(evsel, sample);
    985	}
    986
    987	thread__put(thread);
    988
    989	return err;
    990}
    991
    992static void combine_result(void)
    993{
    994	unsigned int i;
    995	struct lock_stat *st;
    996
    997	if (!combine_locks)
    998		return;
    999
   1000	for (i = 0; i < LOCKHASH_SIZE; i++) {
   1001		hlist_for_each_entry(st, &lockhash_table[i], hash_entry) {
   1002			combine_lock_stats(st);
   1003		}
   1004	}
   1005}
   1006
   1007static void sort_result(void)
   1008{
   1009	unsigned int i;
   1010	struct lock_stat *st;
   1011
   1012	for (i = 0; i < LOCKHASH_SIZE; i++) {
   1013		hlist_for_each_entry(st, &lockhash_table[i], hash_entry) {
   1014			insert_to_result(st, compare);
   1015		}
   1016	}
   1017}
   1018
   1019static const struct evsel_str_handler lock_tracepoints[] = {
   1020	{ "lock:lock_acquire",	 evsel__process_lock_acquire,   }, /* CONFIG_LOCKDEP */
   1021	{ "lock:lock_acquired",	 evsel__process_lock_acquired,  }, /* CONFIG_LOCKDEP, CONFIG_LOCK_STAT */
   1022	{ "lock:lock_contended", evsel__process_lock_contended, }, /* CONFIG_LOCKDEP, CONFIG_LOCK_STAT */
   1023	{ "lock:lock_release",	 evsel__process_lock_release,   }, /* CONFIG_LOCKDEP */
   1024};
   1025
   1026static bool force;
   1027
   1028static int __cmd_report(bool display_info)
   1029{
   1030	int err = -EINVAL;
   1031	struct perf_tool eops = {
   1032		.sample		 = process_sample_event,
   1033		.comm		 = perf_event__process_comm,
   1034		.namespaces	 = perf_event__process_namespaces,
   1035		.ordered_events	 = true,
   1036	};
   1037	struct perf_data data = {
   1038		.path  = input_name,
   1039		.mode  = PERF_DATA_MODE_READ,
   1040		.force = force,
   1041	};
   1042
   1043	session = perf_session__new(&data, &eops);
   1044	if (IS_ERR(session)) {
   1045		pr_err("Initializing perf session failed\n");
   1046		return PTR_ERR(session);
   1047	}
   1048
   1049	symbol__init(&session->header.env);
   1050
   1051	if (!perf_session__has_traces(session, "lock record"))
   1052		goto out_delete;
   1053
   1054	if (perf_session__set_tracepoints_handlers(session, lock_tracepoints)) {
   1055		pr_err("Initializing perf session tracepoint handlers failed\n");
   1056		goto out_delete;
   1057	}
   1058
   1059	if (setup_output_field(output_fields))
   1060		goto out_delete;
   1061
   1062	if (select_key())
   1063		goto out_delete;
   1064
   1065	err = perf_session__process_events(session);
   1066	if (err)
   1067		goto out_delete;
   1068
   1069	setup_pager();
   1070	if (display_info) /* used for info subcommand */
   1071		err = dump_info();
   1072	else {
   1073		combine_result();
   1074		sort_result();
   1075		print_result();
   1076	}
   1077
   1078out_delete:
   1079	perf_session__delete(session);
   1080	return err;
   1081}
   1082
   1083static int __cmd_record(int argc, const char **argv)
   1084{
   1085	const char *record_args[] = {
   1086		"record", "-R", "-m", "1024", "-c", "1", "--synth", "task",
   1087	};
   1088	unsigned int rec_argc, i, j, ret;
   1089	const char **rec_argv;
   1090
   1091	for (i = 0; i < ARRAY_SIZE(lock_tracepoints); i++) {
   1092		if (!is_valid_tracepoint(lock_tracepoints[i].name)) {
   1093				pr_err("tracepoint %s is not enabled. "
   1094				       "Are CONFIG_LOCKDEP and CONFIG_LOCK_STAT enabled?\n",
   1095				       lock_tracepoints[i].name);
   1096				return 1;
   1097		}
   1098	}
   1099
   1100	rec_argc = ARRAY_SIZE(record_args) + argc - 1;
   1101	/* factor of 2 is for -e in front of each tracepoint */
   1102	rec_argc += 2 * ARRAY_SIZE(lock_tracepoints);
   1103
   1104	rec_argv = calloc(rec_argc + 1, sizeof(char *));
   1105	if (!rec_argv)
   1106		return -ENOMEM;
   1107
   1108	for (i = 0; i < ARRAY_SIZE(record_args); i++)
   1109		rec_argv[i] = strdup(record_args[i]);
   1110
   1111	for (j = 0; j < ARRAY_SIZE(lock_tracepoints); j++) {
   1112		rec_argv[i++] = "-e";
   1113		rec_argv[i++] = strdup(lock_tracepoints[j].name);
   1114	}
   1115
   1116	for (j = 1; j < (unsigned int)argc; j++, i++)
   1117		rec_argv[i] = argv[j];
   1118
   1119	BUG_ON(i != rec_argc);
   1120
   1121	ret = cmd_record(i, rec_argv);
   1122	free(rec_argv);
   1123	return ret;
   1124}
   1125
   1126int cmd_lock(int argc, const char **argv)
   1127{
   1128	const struct option lock_options[] = {
   1129	OPT_STRING('i', "input", &input_name, "file", "input file name"),
   1130	OPT_INCR('v', "verbose", &verbose, "be more verbose (show symbol address, etc)"),
   1131	OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace, "dump raw trace in ASCII"),
   1132	OPT_BOOLEAN('f', "force", &force, "don't complain, do it"),
   1133	OPT_END()
   1134	};
   1135
   1136	const struct option info_options[] = {
   1137	OPT_BOOLEAN('t', "threads", &info_threads,
   1138		    "dump thread list in perf.data"),
   1139	OPT_BOOLEAN('m', "map", &info_map,
   1140		    "map of lock instances (address:name table)"),
   1141	OPT_PARENT(lock_options)
   1142	};
   1143
   1144	const struct option report_options[] = {
   1145	OPT_STRING('k', "key", &sort_key, "acquired",
   1146		    "key for sorting (acquired / contended / avg_wait / wait_total / wait_max / wait_min)"),
   1147	OPT_STRING('F', "field", &output_fields, NULL,
   1148		    "output fields (acquired / contended / avg_wait / wait_total / wait_max / wait_min)"),
   1149	/* TODO: type */
   1150	OPT_BOOLEAN('c', "combine-locks", &combine_locks,
   1151		    "combine locks in the same class"),
   1152	OPT_BOOLEAN('t', "threads", &show_thread_stats,
   1153		    "show per-thread lock stats"),
   1154	OPT_PARENT(lock_options)
   1155	};
   1156
   1157	const char * const info_usage[] = {
   1158		"perf lock info [<options>]",
   1159		NULL
   1160	};
   1161	const char *const lock_subcommands[] = { "record", "report", "script",
   1162						 "info", NULL };
   1163	const char *lock_usage[] = {
   1164		NULL,
   1165		NULL
   1166	};
   1167	const char * const report_usage[] = {
   1168		"perf lock report [<options>]",
   1169		NULL
   1170	};
   1171	unsigned int i;
   1172	int rc = 0;
   1173
   1174	for (i = 0; i < LOCKHASH_SIZE; i++)
   1175		INIT_HLIST_HEAD(lockhash_table + i);
   1176
   1177	argc = parse_options_subcommand(argc, argv, lock_options, lock_subcommands,
   1178					lock_usage, PARSE_OPT_STOP_AT_NON_OPTION);
   1179	if (!argc)
   1180		usage_with_options(lock_usage, lock_options);
   1181
   1182	if (strlen(argv[0]) > 2 && strstarts("record", argv[0])) {
   1183		return __cmd_record(argc, argv);
   1184	} else if (strlen(argv[0]) > 2 && strstarts("report", argv[0])) {
   1185		trace_handler = &report_lock_ops;
   1186		if (argc) {
   1187			argc = parse_options(argc, argv,
   1188					     report_options, report_usage, 0);
   1189			if (argc)
   1190				usage_with_options(report_usage, report_options);
   1191		}
   1192		rc = __cmd_report(false);
   1193	} else if (!strcmp(argv[0], "script")) {
   1194		/* Aliased to 'perf script' */
   1195		return cmd_script(argc, argv);
   1196	} else if (!strcmp(argv[0], "info")) {
   1197		if (argc) {
   1198			argc = parse_options(argc, argv,
   1199					     info_options, info_usage, 0);
   1200			if (argc)
   1201				usage_with_options(info_usage, info_options);
   1202		}
   1203		/* recycling report_lock_ops */
   1204		trace_handler = &report_lock_ops;
   1205		rc = __cmd_report(true);
   1206	} else {
   1207		usage_with_options(lock_usage, lock_options);
   1208	}
   1209
   1210	return rc;
   1211}