• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright (C) 2011, Red Hat Inc, Arnaldo Carvalho de Melo <acme@redhat.com>
3  *
4  * Parts came from builtin-{top,stat,record}.c, see those files for further
5  * copyright notes.
6  *
7  * Released under the GPL v2. (and only v2, not any later version)
8  */
9 #include "util.h"
10 #include <lk/debugfs.h>
11 #include <poll.h>
12 #include "cpumap.h"
13 #include "thread_map.h"
14 #include "target.h"
15 #include "evlist.h"
16 #include "evsel.h"
17 #include "debug.h"
18 #include <unistd.h>
19 
20 #include "parse-events.h"
21 
22 #include <sys/mman.h>
23 
24 #include <linux/bitops.h>
25 #include <linux/hash.h>
26 
27 #define FD(e, x, y) (*(int *)xyarray__entry(e->fd, x, y))
28 #define SID(e, x, y) xyarray__entry(e->sample_id, x, y)
29 
perf_evlist__init(struct perf_evlist * evlist,struct cpu_map * cpus,struct thread_map * threads)30 void perf_evlist__init(struct perf_evlist *evlist, struct cpu_map *cpus,
31 		       struct thread_map *threads)
32 {
33 	int i;
34 
35 	for (i = 0; i < PERF_EVLIST__HLIST_SIZE; ++i)
36 		INIT_HLIST_HEAD(&evlist->heads[i]);
37 	INIT_LIST_HEAD(&evlist->entries);
38 	perf_evlist__set_maps(evlist, cpus, threads);
39 	evlist->workload.pid = -1;
40 }
41 
perf_evlist__new(void)42 struct perf_evlist *perf_evlist__new(void)
43 {
44 	struct perf_evlist *evlist = zalloc(sizeof(*evlist));
45 
46 	if (evlist != NULL)
47 		perf_evlist__init(evlist, NULL, NULL);
48 
49 	return evlist;
50 }
51 
52 /**
53  * perf_evlist__set_id_pos - set the positions of event ids.
54  * @evlist: selected event list
55  *
56  * Events with compatible sample types all have the same id_pos
57  * and is_pos.  For convenience, put a copy on evlist.
58  */
perf_evlist__set_id_pos(struct perf_evlist * evlist)59 void perf_evlist__set_id_pos(struct perf_evlist *evlist)
60 {
61 	struct perf_evsel *first = perf_evlist__first(evlist);
62 
63 	evlist->id_pos = first->id_pos;
64 	evlist->is_pos = first->is_pos;
65 }
66 
perf_evlist__update_id_pos(struct perf_evlist * evlist)67 static void perf_evlist__update_id_pos(struct perf_evlist *evlist)
68 {
69 	struct perf_evsel *evsel;
70 
71 	list_for_each_entry(evsel, &evlist->entries, node)
72 		perf_evsel__calc_id_pos(evsel);
73 
74 	perf_evlist__set_id_pos(evlist);
75 }
76 
perf_evlist__purge(struct perf_evlist * evlist)77 static void perf_evlist__purge(struct perf_evlist *evlist)
78 {
79 	struct perf_evsel *pos, *n;
80 
81 	list_for_each_entry_safe(pos, n, &evlist->entries, node) {
82 		list_del_init(&pos->node);
83 		perf_evsel__delete(pos);
84 	}
85 
86 	evlist->nr_entries = 0;
87 }
88 
perf_evlist__exit(struct perf_evlist * evlist)89 void perf_evlist__exit(struct perf_evlist *evlist)
90 {
91 	free(evlist->mmap);
92 	free(evlist->pollfd);
93 	evlist->mmap = NULL;
94 	evlist->pollfd = NULL;
95 }
96 
perf_evlist__delete(struct perf_evlist * evlist)97 void perf_evlist__delete(struct perf_evlist *evlist)
98 {
99 	perf_evlist__purge(evlist);
100 	perf_evlist__exit(evlist);
101 	free(evlist);
102 }
103 
perf_evlist__add(struct perf_evlist * evlist,struct perf_evsel * entry)104 void perf_evlist__add(struct perf_evlist *evlist, struct perf_evsel *entry)
105 {
106 	list_add_tail(&entry->node, &evlist->entries);
107 	if (!evlist->nr_entries++)
108 		perf_evlist__set_id_pos(evlist);
109 }
110 
perf_evlist__splice_list_tail(struct perf_evlist * evlist,struct list_head * list,int nr_entries)111 void perf_evlist__splice_list_tail(struct perf_evlist *evlist,
112 				   struct list_head *list,
113 				   int nr_entries)
114 {
115 	bool set_id_pos = !evlist->nr_entries;
116 
117 	list_splice_tail(list, &evlist->entries);
118 	evlist->nr_entries += nr_entries;
119 	if (set_id_pos)
120 		perf_evlist__set_id_pos(evlist);
121 }
122 
__perf_evlist__set_leader(struct list_head * list)123 void __perf_evlist__set_leader(struct list_head *list)
124 {
125 	struct perf_evsel *evsel, *leader;
126 
127 	leader = list_entry(list->next, struct perf_evsel, node);
128 	evsel = list_entry(list->prev, struct perf_evsel, node);
129 
130 	leader->nr_members = evsel->idx - leader->idx + 1;
131 
132 	list_for_each_entry(evsel, list, node) {
133 		evsel->leader = leader;
134 	}
135 }
136 
perf_evlist__set_leader(struct perf_evlist * evlist)137 void perf_evlist__set_leader(struct perf_evlist *evlist)
138 {
139 	if (evlist->nr_entries) {
140 		evlist->nr_groups = evlist->nr_entries > 1 ? 1 : 0;
141 		__perf_evlist__set_leader(&evlist->entries);
142 	}
143 }
144 
perf_evlist__add_default(struct perf_evlist * evlist)145 int perf_evlist__add_default(struct perf_evlist *evlist)
146 {
147 	struct perf_event_attr attr = {
148 		.type = PERF_TYPE_HARDWARE,
149 		.config = PERF_COUNT_HW_CPU_CYCLES,
150 	};
151 	struct perf_evsel *evsel;
152 
153 	event_attr_init(&attr);
154 
155 	evsel = perf_evsel__new(&attr, 0);
156 	if (evsel == NULL)
157 		goto error;
158 
159 	/* use strdup() because free(evsel) assumes name is allocated */
160 	evsel->name = strdup("cycles");
161 	if (!evsel->name)
162 		goto error_free;
163 
164 	perf_evlist__add(evlist, evsel);
165 	return 0;
166 error_free:
167 	perf_evsel__delete(evsel);
168 error:
169 	return -ENOMEM;
170 }
171 
perf_evlist__add_attrs(struct perf_evlist * evlist,struct perf_event_attr * attrs,size_t nr_attrs)172 static int perf_evlist__add_attrs(struct perf_evlist *evlist,
173 				  struct perf_event_attr *attrs, size_t nr_attrs)
174 {
175 	struct perf_evsel *evsel, *n;
176 	LIST_HEAD(head);
177 	size_t i;
178 
179 	for (i = 0; i < nr_attrs; i++) {
180 		evsel = perf_evsel__new(attrs + i, evlist->nr_entries + i);
181 		if (evsel == NULL)
182 			goto out_delete_partial_list;
183 		list_add_tail(&evsel->node, &head);
184 	}
185 
186 	perf_evlist__splice_list_tail(evlist, &head, nr_attrs);
187 
188 	return 0;
189 
190 out_delete_partial_list:
191 	list_for_each_entry_safe(evsel, n, &head, node)
192 		perf_evsel__delete(evsel);
193 	return -1;
194 }
195 
__perf_evlist__add_default_attrs(struct perf_evlist * evlist,struct perf_event_attr * attrs,size_t nr_attrs)196 int __perf_evlist__add_default_attrs(struct perf_evlist *evlist,
197 				     struct perf_event_attr *attrs, size_t nr_attrs)
198 {
199 	size_t i;
200 
201 	for (i = 0; i < nr_attrs; i++)
202 		event_attr_init(attrs + i);
203 
204 	return perf_evlist__add_attrs(evlist, attrs, nr_attrs);
205 }
206 
207 struct perf_evsel *
perf_evlist__find_tracepoint_by_id(struct perf_evlist * evlist,int id)208 perf_evlist__find_tracepoint_by_id(struct perf_evlist *evlist, int id)
209 {
210 	struct perf_evsel *evsel;
211 
212 	list_for_each_entry(evsel, &evlist->entries, node) {
213 		if (evsel->attr.type   == PERF_TYPE_TRACEPOINT &&
214 		    (int)evsel->attr.config == id)
215 			return evsel;
216 	}
217 
218 	return NULL;
219 }
220 
221 struct perf_evsel *
perf_evlist__find_tracepoint_by_name(struct perf_evlist * evlist,const char * name)222 perf_evlist__find_tracepoint_by_name(struct perf_evlist *evlist,
223 				     const char *name)
224 {
225 	struct perf_evsel *evsel;
226 
227 	list_for_each_entry(evsel, &evlist->entries, node) {
228 		if ((evsel->attr.type == PERF_TYPE_TRACEPOINT) &&
229 		    (strcmp(evsel->name, name) == 0))
230 			return evsel;
231 	}
232 
233 	return NULL;
234 }
235 
perf_evlist__add_newtp(struct perf_evlist * evlist,const char * sys,const char * name,void * handler)236 int perf_evlist__add_newtp(struct perf_evlist *evlist,
237 			   const char *sys, const char *name, void *handler)
238 {
239 	struct perf_evsel *evsel;
240 
241 	evsel = perf_evsel__newtp(sys, name, evlist->nr_entries);
242 	if (evsel == NULL)
243 		return -1;
244 
245 	evsel->handler.func = handler;
246 	perf_evlist__add(evlist, evsel);
247 	return 0;
248 }
249 
perf_evlist__disable(struct perf_evlist * evlist)250 void perf_evlist__disable(struct perf_evlist *evlist)
251 {
252 	int cpu, thread;
253 	struct perf_evsel *pos;
254 	int nr_cpus = cpu_map__nr(evlist->cpus);
255 	int nr_threads = thread_map__nr(evlist->threads);
256 
257 	for (cpu = 0; cpu < nr_cpus; cpu++) {
258 		list_for_each_entry(pos, &evlist->entries, node) {
259 			if (!perf_evsel__is_group_leader(pos) || !pos->fd)
260 				continue;
261 			for (thread = 0; thread < nr_threads; thread++)
262 				ioctl(FD(pos, cpu, thread),
263 				      PERF_EVENT_IOC_DISABLE, 0);
264 		}
265 	}
266 }
267 
perf_evlist__enable(struct perf_evlist * evlist)268 void perf_evlist__enable(struct perf_evlist *evlist)
269 {
270 	int cpu, thread;
271 	struct perf_evsel *pos;
272 	int nr_cpus = cpu_map__nr(evlist->cpus);
273 	int nr_threads = thread_map__nr(evlist->threads);
274 
275 	for (cpu = 0; cpu < nr_cpus; cpu++) {
276 		list_for_each_entry(pos, &evlist->entries, node) {
277 			if (!perf_evsel__is_group_leader(pos) || !pos->fd)
278 				continue;
279 			for (thread = 0; thread < nr_threads; thread++)
280 				ioctl(FD(pos, cpu, thread),
281 				      PERF_EVENT_IOC_ENABLE, 0);
282 		}
283 	}
284 }
285 
perf_evlist__disable_event(struct perf_evlist * evlist,struct perf_evsel * evsel)286 int perf_evlist__disable_event(struct perf_evlist *evlist,
287 			       struct perf_evsel *evsel)
288 {
289 	int cpu, thread, err;
290 
291 	if (!evsel->fd)
292 		return 0;
293 
294 	for (cpu = 0; cpu < evlist->cpus->nr; cpu++) {
295 		for (thread = 0; thread < evlist->threads->nr; thread++) {
296 			err = ioctl(FD(evsel, cpu, thread),
297 				    PERF_EVENT_IOC_DISABLE, 0);
298 			if (err)
299 				return err;
300 		}
301 	}
302 	return 0;
303 }
304 
perf_evlist__enable_event(struct perf_evlist * evlist,struct perf_evsel * evsel)305 int perf_evlist__enable_event(struct perf_evlist *evlist,
306 			      struct perf_evsel *evsel)
307 {
308 	int cpu, thread, err;
309 
310 	if (!evsel->fd)
311 		return -EINVAL;
312 
313 	for (cpu = 0; cpu < evlist->cpus->nr; cpu++) {
314 		for (thread = 0; thread < evlist->threads->nr; thread++) {
315 			err = ioctl(FD(evsel, cpu, thread),
316 				    PERF_EVENT_IOC_ENABLE, 0);
317 			if (err)
318 				return err;
319 		}
320 	}
321 	return 0;
322 }
323 
perf_evlist__alloc_pollfd(struct perf_evlist * evlist)324 static int perf_evlist__alloc_pollfd(struct perf_evlist *evlist)
325 {
326 	int nr_cpus = cpu_map__nr(evlist->cpus);
327 	int nr_threads = thread_map__nr(evlist->threads);
328 	int nfds = nr_cpus * nr_threads * evlist->nr_entries;
329 	evlist->pollfd = malloc(sizeof(struct pollfd) * nfds);
330 	return evlist->pollfd != NULL ? 0 : -ENOMEM;
331 }
332 
perf_evlist__add_pollfd(struct perf_evlist * evlist,int fd)333 void perf_evlist__add_pollfd(struct perf_evlist *evlist, int fd)
334 {
335 	fcntl(fd, F_SETFL, O_NONBLOCK);
336 	evlist->pollfd[evlist->nr_fds].fd = fd;
337 	evlist->pollfd[evlist->nr_fds].events = POLLIN;
338 	evlist->nr_fds++;
339 }
340 
perf_evlist__id_hash(struct perf_evlist * evlist,struct perf_evsel * evsel,int cpu,int thread,u64 id)341 static void perf_evlist__id_hash(struct perf_evlist *evlist,
342 				 struct perf_evsel *evsel,
343 				 int cpu, int thread, u64 id)
344 {
345 	int hash;
346 	struct perf_sample_id *sid = SID(evsel, cpu, thread);
347 
348 	sid->id = id;
349 	sid->evsel = evsel;
350 	hash = hash_64(sid->id, PERF_EVLIST__HLIST_BITS);
351 	hlist_add_head(&sid->node, &evlist->heads[hash]);
352 }
353 
perf_evlist__id_add(struct perf_evlist * evlist,struct perf_evsel * evsel,int cpu,int thread,u64 id)354 void perf_evlist__id_add(struct perf_evlist *evlist, struct perf_evsel *evsel,
355 			 int cpu, int thread, u64 id)
356 {
357 	perf_evlist__id_hash(evlist, evsel, cpu, thread, id);
358 	evsel->id[evsel->ids++] = id;
359 }
360 
perf_evlist__id_add_fd(struct perf_evlist * evlist,struct perf_evsel * evsel,int cpu,int thread,int fd)361 static int perf_evlist__id_add_fd(struct perf_evlist *evlist,
362 				  struct perf_evsel *evsel,
363 				  int cpu, int thread, int fd)
364 {
365 	u64 read_data[4] = { 0, };
366 	int id_idx = 1; /* The first entry is the counter value */
367 	u64 id;
368 	int ret;
369 
370 	ret = ioctl(fd, PERF_EVENT_IOC_ID, &id);
371 	if (!ret)
372 		goto add;
373 
374 	if (errno != ENOTTY)
375 		return -1;
376 
377 	/* Legacy way to get event id.. All hail to old kernels! */
378 
379 	/*
380 	 * This way does not work with group format read, so bail
381 	 * out in that case.
382 	 */
383 	if (perf_evlist__read_format(evlist) & PERF_FORMAT_GROUP)
384 		return -1;
385 
386 	if (!(evsel->attr.read_format & PERF_FORMAT_ID) ||
387 	    read(fd, &read_data, sizeof(read_data)) == -1)
388 		return -1;
389 
390 	if (evsel->attr.read_format & PERF_FORMAT_TOTAL_TIME_ENABLED)
391 		++id_idx;
392 	if (evsel->attr.read_format & PERF_FORMAT_TOTAL_TIME_RUNNING)
393 		++id_idx;
394 
395 	id = read_data[id_idx];
396 
397  add:
398 	perf_evlist__id_add(evlist, evsel, cpu, thread, id);
399 	return 0;
400 }
401 
perf_evlist__id2sid(struct perf_evlist * evlist,u64 id)402 struct perf_sample_id *perf_evlist__id2sid(struct perf_evlist *evlist, u64 id)
403 {
404 	struct hlist_head *head;
405 	struct perf_sample_id *sid;
406 	int hash;
407 
408 	hash = hash_64(id, PERF_EVLIST__HLIST_BITS);
409 	head = &evlist->heads[hash];
410 
411 	hlist_for_each_entry(sid, head, node)
412 		if (sid->id == id)
413 			return sid;
414 
415 	return NULL;
416 }
417 
perf_evlist__id2evsel(struct perf_evlist * evlist,u64 id)418 struct perf_evsel *perf_evlist__id2evsel(struct perf_evlist *evlist, u64 id)
419 {
420 	struct perf_sample_id *sid;
421 
422 	if (evlist->nr_entries == 1)
423 		return perf_evlist__first(evlist);
424 
425 	sid = perf_evlist__id2sid(evlist, id);
426 	if (sid)
427 		return sid->evsel;
428 
429 	if (!perf_evlist__sample_id_all(evlist))
430 		return perf_evlist__first(evlist);
431 
432 	return NULL;
433 }
434 
perf_evlist__event2id(struct perf_evlist * evlist,union perf_event * event,u64 * id)435 static int perf_evlist__event2id(struct perf_evlist *evlist,
436 				 union perf_event *event, u64 *id)
437 {
438 	const u64 *array = event->sample.array;
439 	ssize_t n;
440 
441 	n = (event->header.size - sizeof(event->header)) >> 3;
442 
443 	if (event->header.type == PERF_RECORD_SAMPLE) {
444 		if (evlist->id_pos >= n)
445 			return -1;
446 		*id = array[evlist->id_pos];
447 	} else {
448 		if (evlist->is_pos > n)
449 			return -1;
450 		n -= evlist->is_pos;
451 		*id = array[n];
452 	}
453 	return 0;
454 }
455 
perf_evlist__event2evsel(struct perf_evlist * evlist,union perf_event * event)456 static struct perf_evsel *perf_evlist__event2evsel(struct perf_evlist *evlist,
457 						   union perf_event *event)
458 {
459 	struct perf_evsel *first = perf_evlist__first(evlist);
460 	struct hlist_head *head;
461 	struct perf_sample_id *sid;
462 	int hash;
463 	u64 id;
464 
465 	if (evlist->nr_entries == 1)
466 		return first;
467 
468 	if (!first->attr.sample_id_all &&
469 	    event->header.type != PERF_RECORD_SAMPLE)
470 		return first;
471 
472 	if (perf_evlist__event2id(evlist, event, &id))
473 		return NULL;
474 
475 	/* Synthesized events have an id of zero */
476 	if (!id)
477 		return first;
478 
479 	hash = hash_64(id, PERF_EVLIST__HLIST_BITS);
480 	head = &evlist->heads[hash];
481 
482 	hlist_for_each_entry(sid, head, node) {
483 		if (sid->id == id)
484 			return sid->evsel;
485 	}
486 	return NULL;
487 }
488 
perf_evlist__mmap_read(struct perf_evlist * evlist,int idx)489 union perf_event *perf_evlist__mmap_read(struct perf_evlist *evlist, int idx)
490 {
491 	struct perf_mmap *md = &evlist->mmap[idx];
492 	unsigned int head = perf_mmap__read_head(md);
493 	unsigned int old = md->prev;
494 	unsigned char *data = md->base + page_size;
495 	union perf_event *event = NULL;
496 
497 	if (evlist->overwrite) {
498 		/*
499 		 * If we're further behind than half the buffer, there's a chance
500 		 * the writer will bite our tail and mess up the samples under us.
501 		 *
502 		 * If we somehow ended up ahead of the head, we got messed up.
503 		 *
504 		 * In either case, truncate and restart at head.
505 		 */
506 		int diff = head - old;
507 		if (diff > md->mask / 2 || diff < 0) {
508 			fprintf(stderr, "WARNING: failed to keep up with mmap data.\n");
509 
510 			/*
511 			 * head points to a known good entry, start there.
512 			 */
513 			old = head;
514 		}
515 	}
516 
517 	if (old != head) {
518 		size_t size;
519 
520 		event = (union perf_event *)&data[old & md->mask];
521 		size = event->header.size;
522 
523 		/*
524 		 * Event straddles the mmap boundary -- header should always
525 		 * be inside due to u64 alignment of output.
526 		 */
527 		if ((old & md->mask) + size != ((old + size) & md->mask)) {
528 			unsigned int offset = old;
529 			unsigned int len = min(sizeof(*event), size), cpy;
530 			void *dst = &md->event_copy;
531 
532 			do {
533 				cpy = min(md->mask + 1 - (offset & md->mask), len);
534 				memcpy(dst, &data[offset & md->mask], cpy);
535 				offset += cpy;
536 				dst += cpy;
537 				len -= cpy;
538 			} while (len);
539 
540 			event = &md->event_copy;
541 		}
542 
543 		old += size;
544 	}
545 
546 	md->prev = old;
547 
548 	return event;
549 }
550 
perf_evlist__mmap_consume(struct perf_evlist * evlist,int idx)551 void perf_evlist__mmap_consume(struct perf_evlist *evlist, int idx)
552 {
553 	if (!evlist->overwrite) {
554 		struct perf_mmap *md = &evlist->mmap[idx];
555 		unsigned int old = md->prev;
556 
557 		perf_mmap__write_tail(md, old);
558 	}
559 }
560 
__perf_evlist__munmap(struct perf_evlist * evlist,int idx)561 static void __perf_evlist__munmap(struct perf_evlist *evlist, int idx)
562 {
563 	if (evlist->mmap[idx].base != NULL) {
564 		munmap(evlist->mmap[idx].base, evlist->mmap_len);
565 		evlist->mmap[idx].base = NULL;
566 	}
567 }
568 
perf_evlist__munmap(struct perf_evlist * evlist)569 void perf_evlist__munmap(struct perf_evlist *evlist)
570 {
571 	int i;
572 
573 	for (i = 0; i < evlist->nr_mmaps; i++)
574 		__perf_evlist__munmap(evlist, i);
575 
576 	free(evlist->mmap);
577 	evlist->mmap = NULL;
578 }
579 
perf_evlist__alloc_mmap(struct perf_evlist * evlist)580 static int perf_evlist__alloc_mmap(struct perf_evlist *evlist)
581 {
582 	evlist->nr_mmaps = cpu_map__nr(evlist->cpus);
583 	if (cpu_map__empty(evlist->cpus))
584 		evlist->nr_mmaps = thread_map__nr(evlist->threads);
585 	evlist->mmap = zalloc(evlist->nr_mmaps * sizeof(struct perf_mmap));
586 	return evlist->mmap != NULL ? 0 : -ENOMEM;
587 }
588 
__perf_evlist__mmap(struct perf_evlist * evlist,int idx,int prot,int mask,int fd)589 static int __perf_evlist__mmap(struct perf_evlist *evlist,
590 			       int idx, int prot, int mask, int fd)
591 {
592 	evlist->mmap[idx].prev = 0;
593 	evlist->mmap[idx].mask = mask;
594 	evlist->mmap[idx].base = mmap(NULL, evlist->mmap_len, prot,
595 				      MAP_SHARED, fd, 0);
596 	if (evlist->mmap[idx].base == MAP_FAILED) {
597 		evlist->mmap[idx].base = NULL;
598 		return -1;
599 	}
600 
601 	perf_evlist__add_pollfd(evlist, fd);
602 	return 0;
603 }
604 
perf_evlist__mmap_per_cpu(struct perf_evlist * evlist,int prot,int mask)605 static int perf_evlist__mmap_per_cpu(struct perf_evlist *evlist, int prot, int mask)
606 {
607 	struct perf_evsel *evsel;
608 	int cpu, thread;
609 	int nr_cpus = cpu_map__nr(evlist->cpus);
610 	int nr_threads = thread_map__nr(evlist->threads);
611 
612 	pr_debug2("perf event ring buffer mmapped per cpu\n");
613 	for (cpu = 0; cpu < nr_cpus; cpu++) {
614 		int output = -1;
615 
616 		for (thread = 0; thread < nr_threads; thread++) {
617 			list_for_each_entry(evsel, &evlist->entries, node) {
618 				int fd = FD(evsel, cpu, thread);
619 
620 				if (output == -1) {
621 					output = fd;
622 					if (__perf_evlist__mmap(evlist, cpu,
623 								prot, mask, output) < 0)
624 						goto out_unmap;
625 				} else {
626 					if (ioctl(fd, PERF_EVENT_IOC_SET_OUTPUT, output) != 0)
627 						goto out_unmap;
628 				}
629 
630 				if ((evsel->attr.read_format & PERF_FORMAT_ID) &&
631 				    perf_evlist__id_add_fd(evlist, evsel, cpu, thread, fd) < 0)
632 					goto out_unmap;
633 			}
634 		}
635 	}
636 
637 	return 0;
638 
639 out_unmap:
640 	for (cpu = 0; cpu < nr_cpus; cpu++)
641 		__perf_evlist__munmap(evlist, cpu);
642 	return -1;
643 }
644 
perf_evlist__mmap_per_thread(struct perf_evlist * evlist,int prot,int mask)645 static int perf_evlist__mmap_per_thread(struct perf_evlist *evlist, int prot, int mask)
646 {
647 	struct perf_evsel *evsel;
648 	int thread;
649 	int nr_threads = thread_map__nr(evlist->threads);
650 
651 	pr_debug2("perf event ring buffer mmapped per thread\n");
652 	for (thread = 0; thread < nr_threads; thread++) {
653 		int output = -1;
654 
655 		list_for_each_entry(evsel, &evlist->entries, node) {
656 			int fd = FD(evsel, 0, thread);
657 
658 			if (output == -1) {
659 				output = fd;
660 				if (__perf_evlist__mmap(evlist, thread,
661 							prot, mask, output) < 0)
662 					goto out_unmap;
663 			} else {
664 				if (ioctl(fd, PERF_EVENT_IOC_SET_OUTPUT, output) != 0)
665 					goto out_unmap;
666 			}
667 
668 			if ((evsel->attr.read_format & PERF_FORMAT_ID) &&
669 			    perf_evlist__id_add_fd(evlist, evsel, 0, thread, fd) < 0)
670 				goto out_unmap;
671 		}
672 	}
673 
674 	return 0;
675 
676 out_unmap:
677 	for (thread = 0; thread < nr_threads; thread++)
678 		__perf_evlist__munmap(evlist, thread);
679 	return -1;
680 }
681 
682 /** perf_evlist__mmap - Create per cpu maps to receive events
683  *
684  * @evlist - list of events
685  * @pages - map length in pages
686  * @overwrite - overwrite older events?
687  *
688  * If overwrite is false the user needs to signal event consuption using:
689  *
690  *	struct perf_mmap *m = &evlist->mmap[cpu];
691  *	unsigned int head = perf_mmap__read_head(m);
692  *
693  *	perf_mmap__write_tail(m, head)
694  *
695  * Using perf_evlist__read_on_cpu does this automatically.
696  */
perf_evlist__mmap(struct perf_evlist * evlist,unsigned int pages,bool overwrite)697 int perf_evlist__mmap(struct perf_evlist *evlist, unsigned int pages,
698 		      bool overwrite)
699 {
700 	struct perf_evsel *evsel;
701 	const struct cpu_map *cpus = evlist->cpus;
702 	const struct thread_map *threads = evlist->threads;
703 	int prot = PROT_READ | (overwrite ? 0 : PROT_WRITE), mask;
704 
705         /* 512 kiB: default amount of unprivileged mlocked memory */
706         if (pages == UINT_MAX)
707                 pages = (512 * 1024) / page_size;
708 	else if (!is_power_of_2(pages))
709 		return -EINVAL;
710 
711 	mask = pages * page_size - 1;
712 
713 	if (evlist->mmap == NULL && perf_evlist__alloc_mmap(evlist) < 0)
714 		return -ENOMEM;
715 
716 	if (evlist->pollfd == NULL && perf_evlist__alloc_pollfd(evlist) < 0)
717 		return -ENOMEM;
718 
719 	evlist->overwrite = overwrite;
720 	evlist->mmap_len = (pages + 1) * page_size;
721 
722 	list_for_each_entry(evsel, &evlist->entries, node) {
723 		if ((evsel->attr.read_format & PERF_FORMAT_ID) &&
724 		    evsel->sample_id == NULL &&
725 		    perf_evsel__alloc_id(evsel, cpu_map__nr(cpus), threads->nr) < 0)
726 			return -ENOMEM;
727 	}
728 
729 	if (cpu_map__empty(cpus))
730 		return perf_evlist__mmap_per_thread(evlist, prot, mask);
731 
732 	return perf_evlist__mmap_per_cpu(evlist, prot, mask);
733 }
734 
perf_evlist__create_maps(struct perf_evlist * evlist,struct perf_target * target)735 int perf_evlist__create_maps(struct perf_evlist *evlist,
736 			     struct perf_target *target)
737 {
738 	evlist->threads = thread_map__new_str(target->pid, target->tid,
739 					      target->uid);
740 
741 	if (evlist->threads == NULL)
742 		return -1;
743 
744 	if (perf_target__has_task(target))
745 		evlist->cpus = cpu_map__dummy_new();
746 	else if (!perf_target__has_cpu(target) && !target->uses_mmap)
747 		evlist->cpus = cpu_map__dummy_new();
748 	else
749 		evlist->cpus = cpu_map__new(target->cpu_list);
750 
751 	if (evlist->cpus == NULL)
752 		goto out_delete_threads;
753 
754 	return 0;
755 
756 out_delete_threads:
757 	thread_map__delete(evlist->threads);
758 	return -1;
759 }
760 
perf_evlist__delete_maps(struct perf_evlist * evlist)761 void perf_evlist__delete_maps(struct perf_evlist *evlist)
762 {
763 	cpu_map__delete(evlist->cpus);
764 	thread_map__delete(evlist->threads);
765 	evlist->cpus	= NULL;
766 	evlist->threads = NULL;
767 }
768 
perf_evlist__apply_filters(struct perf_evlist * evlist)769 int perf_evlist__apply_filters(struct perf_evlist *evlist)
770 {
771 	struct perf_evsel *evsel;
772 	int err = 0;
773 	const int ncpus = cpu_map__nr(evlist->cpus),
774 		  nthreads = thread_map__nr(evlist->threads);
775 
776 	list_for_each_entry(evsel, &evlist->entries, node) {
777 		if (evsel->filter == NULL)
778 			continue;
779 
780 		err = perf_evsel__set_filter(evsel, ncpus, nthreads, evsel->filter);
781 		if (err)
782 			break;
783 	}
784 
785 	return err;
786 }
787 
perf_evlist__set_filter(struct perf_evlist * evlist,const char * filter)788 int perf_evlist__set_filter(struct perf_evlist *evlist, const char *filter)
789 {
790 	struct perf_evsel *evsel;
791 	int err = 0;
792 	const int ncpus = cpu_map__nr(evlist->cpus),
793 		  nthreads = thread_map__nr(evlist->threads);
794 
795 	list_for_each_entry(evsel, &evlist->entries, node) {
796 		err = perf_evsel__set_filter(evsel, ncpus, nthreads, filter);
797 		if (err)
798 			break;
799 	}
800 
801 	return err;
802 }
803 
perf_evlist__valid_sample_type(struct perf_evlist * evlist)804 bool perf_evlist__valid_sample_type(struct perf_evlist *evlist)
805 {
806 	struct perf_evsel *pos;
807 
808 	if (evlist->nr_entries == 1)
809 		return true;
810 
811 	if (evlist->id_pos < 0 || evlist->is_pos < 0)
812 		return false;
813 
814 	list_for_each_entry(pos, &evlist->entries, node) {
815 		if (pos->id_pos != evlist->id_pos ||
816 		    pos->is_pos != evlist->is_pos)
817 			return false;
818 	}
819 
820 	return true;
821 }
822 
__perf_evlist__combined_sample_type(struct perf_evlist * evlist)823 u64 __perf_evlist__combined_sample_type(struct perf_evlist *evlist)
824 {
825 	struct perf_evsel *evsel;
826 
827 	if (evlist->combined_sample_type)
828 		return evlist->combined_sample_type;
829 
830 	list_for_each_entry(evsel, &evlist->entries, node)
831 		evlist->combined_sample_type |= evsel->attr.sample_type;
832 
833 	return evlist->combined_sample_type;
834 }
835 
perf_evlist__combined_sample_type(struct perf_evlist * evlist)836 u64 perf_evlist__combined_sample_type(struct perf_evlist *evlist)
837 {
838 	evlist->combined_sample_type = 0;
839 	return __perf_evlist__combined_sample_type(evlist);
840 }
841 
perf_evlist__valid_read_format(struct perf_evlist * evlist)842 bool perf_evlist__valid_read_format(struct perf_evlist *evlist)
843 {
844 	struct perf_evsel *first = perf_evlist__first(evlist), *pos = first;
845 	u64 read_format = first->attr.read_format;
846 	u64 sample_type = first->attr.sample_type;
847 
848 	list_for_each_entry_continue(pos, &evlist->entries, node) {
849 		if (read_format != pos->attr.read_format)
850 			return false;
851 	}
852 
853 	/* PERF_SAMPLE_READ imples PERF_FORMAT_ID. */
854 	if ((sample_type & PERF_SAMPLE_READ) &&
855 	    !(read_format & PERF_FORMAT_ID)) {
856 		return false;
857 	}
858 
859 	return true;
860 }
861 
perf_evlist__read_format(struct perf_evlist * evlist)862 u64 perf_evlist__read_format(struct perf_evlist *evlist)
863 {
864 	struct perf_evsel *first = perf_evlist__first(evlist);
865 	return first->attr.read_format;
866 }
867 
perf_evlist__id_hdr_size(struct perf_evlist * evlist)868 u16 perf_evlist__id_hdr_size(struct perf_evlist *evlist)
869 {
870 	struct perf_evsel *first = perf_evlist__first(evlist);
871 	struct perf_sample *data;
872 	u64 sample_type;
873 	u16 size = 0;
874 
875 	if (!first->attr.sample_id_all)
876 		goto out;
877 
878 	sample_type = first->attr.sample_type;
879 
880 	if (sample_type & PERF_SAMPLE_TID)
881 		size += sizeof(data->tid) * 2;
882 
883        if (sample_type & PERF_SAMPLE_TIME)
884 		size += sizeof(data->time);
885 
886 	if (sample_type & PERF_SAMPLE_ID)
887 		size += sizeof(data->id);
888 
889 	if (sample_type & PERF_SAMPLE_STREAM_ID)
890 		size += sizeof(data->stream_id);
891 
892 	if (sample_type & PERF_SAMPLE_CPU)
893 		size += sizeof(data->cpu) * 2;
894 
895 	if (sample_type & PERF_SAMPLE_IDENTIFIER)
896 		size += sizeof(data->id);
897 out:
898 	return size;
899 }
900 
perf_evlist__valid_sample_id_all(struct perf_evlist * evlist)901 bool perf_evlist__valid_sample_id_all(struct perf_evlist *evlist)
902 {
903 	struct perf_evsel *first = perf_evlist__first(evlist), *pos = first;
904 
905 	list_for_each_entry_continue(pos, &evlist->entries, node) {
906 		if (first->attr.sample_id_all != pos->attr.sample_id_all)
907 			return false;
908 	}
909 
910 	return true;
911 }
912 
perf_evlist__sample_id_all(struct perf_evlist * evlist)913 bool perf_evlist__sample_id_all(struct perf_evlist *evlist)
914 {
915 	struct perf_evsel *first = perf_evlist__first(evlist);
916 	return first->attr.sample_id_all;
917 }
918 
perf_evlist__set_selected(struct perf_evlist * evlist,struct perf_evsel * evsel)919 void perf_evlist__set_selected(struct perf_evlist *evlist,
920 			       struct perf_evsel *evsel)
921 {
922 	evlist->selected = evsel;
923 }
924 
perf_evlist__close(struct perf_evlist * evlist)925 void perf_evlist__close(struct perf_evlist *evlist)
926 {
927 	struct perf_evsel *evsel;
928 	int ncpus = cpu_map__nr(evlist->cpus);
929 	int nthreads = thread_map__nr(evlist->threads);
930 
931 	list_for_each_entry_reverse(evsel, &evlist->entries, node)
932 		perf_evsel__close(evsel, ncpus, nthreads);
933 }
934 
perf_evlist__open(struct perf_evlist * evlist)935 int perf_evlist__open(struct perf_evlist *evlist)
936 {
937 	struct perf_evsel *evsel;
938 	int err;
939 
940 	perf_evlist__update_id_pos(evlist);
941 
942 	list_for_each_entry(evsel, &evlist->entries, node) {
943 		err = perf_evsel__open(evsel, evlist->cpus, evlist->threads);
944 		if (err < 0)
945 			goto out_err;
946 	}
947 
948 	return 0;
949 out_err:
950 	perf_evlist__close(evlist);
951 	errno = -err;
952 	return err;
953 }
954 
perf_evlist__prepare_workload(struct perf_evlist * evlist,struct perf_target * target,const char * argv[],bool pipe_output,bool want_signal)955 int perf_evlist__prepare_workload(struct perf_evlist *evlist,
956 				  struct perf_target *target,
957 				  const char *argv[], bool pipe_output,
958 				  bool want_signal)
959 {
960 	int child_ready_pipe[2], go_pipe[2];
961 	char bf;
962 
963 	if (pipe(child_ready_pipe) < 0) {
964 		perror("failed to create 'ready' pipe");
965 		return -1;
966 	}
967 
968 	if (pipe(go_pipe) < 0) {
969 		perror("failed to create 'go' pipe");
970 		goto out_close_ready_pipe;
971 	}
972 
973 	evlist->workload.pid = fork();
974 	if (evlist->workload.pid < 0) {
975 		perror("failed to fork");
976 		goto out_close_pipes;
977 	}
978 
979 	if (!evlist->workload.pid) {
980 		if (pipe_output)
981 			dup2(2, 1);
982 
983 		signal(SIGTERM, SIG_DFL);
984 
985 		close(child_ready_pipe[0]);
986 		close(go_pipe[1]);
987 		fcntl(go_pipe[0], F_SETFD, FD_CLOEXEC);
988 
989 		/*
990 		 * Tell the parent we're ready to go
991 		 */
992 		close(child_ready_pipe[1]);
993 
994 		/*
995 		 * Wait until the parent tells us to go.
996 		 */
997 		if (read(go_pipe[0], &bf, 1) == -1)
998 			perror("unable to read pipe");
999 
1000 		execvp(argv[0], (char **)argv);
1001 
1002 		perror(argv[0]);
1003 		if (want_signal)
1004 			kill(getppid(), SIGUSR1);
1005 		exit(-1);
1006 	}
1007 
1008 	if (perf_target__none(target))
1009 		evlist->threads->map[0] = evlist->workload.pid;
1010 
1011 	close(child_ready_pipe[1]);
1012 	close(go_pipe[0]);
1013 	/*
1014 	 * wait for child to settle
1015 	 */
1016 	if (read(child_ready_pipe[0], &bf, 1) == -1) {
1017 		perror("unable to read pipe");
1018 		goto out_close_pipes;
1019 	}
1020 
1021 	fcntl(go_pipe[1], F_SETFD, FD_CLOEXEC);
1022 	evlist->workload.cork_fd = go_pipe[1];
1023 	close(child_ready_pipe[0]);
1024 	return 0;
1025 
1026 out_close_pipes:
1027 	close(go_pipe[0]);
1028 	close(go_pipe[1]);
1029 out_close_ready_pipe:
1030 	close(child_ready_pipe[0]);
1031 	close(child_ready_pipe[1]);
1032 	return -1;
1033 }
1034 
perf_evlist__start_workload(struct perf_evlist * evlist)1035 int perf_evlist__start_workload(struct perf_evlist *evlist)
1036 {
1037 	if (evlist->workload.cork_fd > 0) {
1038 		char bf = 0;
1039 		int ret;
1040 		/*
1041 		 * Remove the cork, let it rip!
1042 		 */
1043 		ret = write(evlist->workload.cork_fd, &bf, 1);
1044 		if (ret < 0)
1045 			perror("enable to write to pipe");
1046 
1047 		close(evlist->workload.cork_fd);
1048 		return ret;
1049 	}
1050 
1051 	return 0;
1052 }
1053 
perf_evlist__parse_sample(struct perf_evlist * evlist,union perf_event * event,struct perf_sample * sample)1054 int perf_evlist__parse_sample(struct perf_evlist *evlist, union perf_event *event,
1055 			      struct perf_sample *sample)
1056 {
1057 	struct perf_evsel *evsel = perf_evlist__event2evsel(evlist, event);
1058 
1059 	if (!evsel)
1060 		return -EFAULT;
1061 	return perf_evsel__parse_sample(evsel, event, sample);
1062 }
1063 
perf_evlist__fprintf(struct perf_evlist * evlist,FILE * fp)1064 size_t perf_evlist__fprintf(struct perf_evlist *evlist, FILE *fp)
1065 {
1066 	struct perf_evsel *evsel;
1067 	size_t printed = 0;
1068 
1069 	list_for_each_entry(evsel, &evlist->entries, node) {
1070 		printed += fprintf(fp, "%s%s", evsel->idx ? ", " : "",
1071 				   perf_evsel__name(evsel));
1072 	}
1073 
1074 	return printed + fprintf(fp, "\n");;
1075 }
1076