Lines Matching +full:top +full:- +full:level
1 // SPDX-License-Identifier: GPL-2.0
57 #define LEVEL(x) P(LVLNUM, x) macro
63 P(OP, LOAD) | P(LVL, MISS) | LEVEL(L3) | P(SNOOP, NA),/* 0x00:ukn L3 */
64 OP_LH | P(LVL, L1) | LEVEL(L1) | P(SNOOP, NONE), /* 0x01: L1 local */
65 OP_LH | P(LVL, LFB) | LEVEL(LFB) | P(SNOOP, NONE), /* 0x02: LFB hit */
66 OP_LH | P(LVL, L2) | LEVEL(L2) | P(SNOOP, NONE), /* 0x03: L2 hit */
67 OP_LH | P(LVL, L3) | LEVEL(L3) | P(SNOOP, NONE), /* 0x04: L3 hit */
68 OP_LH | P(LVL, L3) | LEVEL(L3) | P(SNOOP, MISS), /* 0x05: L3 hit, snoop miss */
69 OP_LH | P(LVL, L3) | LEVEL(L3) | P(SNOOP, HIT), /* 0x06: L3 hit, snoop hit */
70 OP_LH | P(LVL, L3) | LEVEL(L3) | P(SNOOP, HITM), /* 0x07: L3 hit, snoop hitm */
71 OP_LH | P(LVL, REM_CCE1) | REM | LEVEL(L3) | P(SNOOP, HIT), /* 0x08: L3 miss snoop hit */
72 OP_LH | P(LVL, REM_CCE1) | REM | LEVEL(L3) | P(SNOOP, HITM), /* 0x09: L3 miss snoop hitm*/
73 OP_LH | P(LVL, LOC_RAM) | LEVEL(RAM) | P(SNOOP, HIT), /* 0x0a: L3 miss, shared */
74 OP_LH | P(LVL, REM_RAM1) | REM | LEVEL(L3) | P(SNOOP, HIT), /* 0x0b: L3 miss, shared */
75 OP_LH | P(LVL, LOC_RAM) | LEVEL(RAM) | SNOOP_NONE_MISS, /* 0x0c: L3 miss, excl */
76 OP_LH | P(LVL, REM_RAM1) | LEVEL(RAM) | REM | SNOOP_NONE_MISS, /* 0x0d: L3 miss, excl */
77 OP_LH | P(LVL, IO) | LEVEL(NA) | P(SNOOP, NONE), /* 0x0e: I/O */
78 OP_LH | P(LVL, UNC) | LEVEL(NA) | P(SNOOP, NONE), /* 0x0f: uncached */
84 pebs_data_source[0x05] = OP_LH | P(LVL, L3) | LEVEL(L3) | P(SNOOP, HIT); in intel_pmu_pebs_data_source_nhm()
85 pebs_data_source[0x06] = OP_LH | P(LVL, L3) | LEVEL(L3) | P(SNOOP, HITM); in intel_pmu_pebs_data_source_nhm()
86 pebs_data_source[0x07] = OP_LH | P(LVL, L3) | LEVEL(L3) | P(SNOOP, HITM); in intel_pmu_pebs_data_source_nhm()
91 u64 pmem_or_l4 = pmem ? LEVEL(PMEM) : LEVEL(L4); in intel_pmu_pebs_data_source_skl()
95 pebs_data_source[0x0b] = OP_LH | LEVEL(RAM) | REM | P(SNOOP, NONE); in intel_pmu_pebs_data_source_skl()
96 pebs_data_source[0x0c] = OP_LH | LEVEL(ANY_CACHE) | REM | P(SNOOPX, FWD); in intel_pmu_pebs_data_source_skl()
97 pebs_data_source[0x0d] = OP_LH | LEVEL(ANY_CACHE) | REM | P(SNOOP, HITM); in intel_pmu_pebs_data_source_skl()
109 * 1 = stored missed 2nd level TLB in precise_store_data()
112 * otherwise hit 2nd level TLB in precise_store_data()
144 if (event->hw.flags & PERF_X86_EVENT_PEBS_ST_HSW) in precise_datala_hsw()
146 else if (event->hw.flags & PERF_X86_EVENT_PEBS_LD_HSW) in precise_datala_hsw()
157 if (event->hw.flags & PERF_X86_EVENT_PEBS_ST_HSW) { in precise_datala_hsw()
174 * use the mapping table for bit 0-3 in load_latency_data()
187 * 0 = did not miss 2nd level TLB in load_latency_data()
188 * 1 = missed 2nd level TLB in load_latency_data()
299 * This is a cross-CPU update of the cpu_entry_area, we must shoot down in ds_update_cea()
338 struct debug_store *ds = hwev->ds; in alloc_pebs_buffer()
348 return -ENOMEM; in alloc_pebs_buffer()
358 return -ENOMEM; in alloc_pebs_buffer()
362 hwev->ds_pebs_vaddr = buffer; in alloc_pebs_buffer()
364 cea = &get_cpu_entry_area(cpu)->cpu_debug_buffers.pebs_buffer; in alloc_pebs_buffer()
365 ds->pebs_buffer_base = (unsigned long) cea; in alloc_pebs_buffer()
367 ds->pebs_index = ds->pebs_buffer_base; in alloc_pebs_buffer()
369 ds->pebs_absolute_maximum = ds->pebs_buffer_base + max; in alloc_pebs_buffer()
385 cea = &get_cpu_entry_area(cpu)->cpu_debug_buffers.pebs_buffer; in release_pebs_buffer()
387 dsfree_pages(hwev->ds_pebs_vaddr, x86_pmu.pebs_buffer_size); in release_pebs_buffer()
388 hwev->ds_pebs_vaddr = NULL; in release_pebs_buffer()
394 struct debug_store *ds = hwev->ds; in alloc_bts_buffer()
404 return -ENOMEM; in alloc_bts_buffer()
406 hwev->ds_bts_vaddr = buffer; in alloc_bts_buffer()
408 cea = &get_cpu_entry_area(cpu)->cpu_debug_buffers.bts_buffer; in alloc_bts_buffer()
409 ds->bts_buffer_base = (unsigned long) cea; in alloc_bts_buffer()
411 ds->bts_index = ds->bts_buffer_base; in alloc_bts_buffer()
413 ds->bts_absolute_maximum = ds->bts_buffer_base + in alloc_bts_buffer()
415 ds->bts_interrupt_threshold = ds->bts_absolute_maximum - in alloc_bts_buffer()
429 cea = &get_cpu_entry_area(cpu)->cpu_debug_buffers.bts_buffer; in release_bts_buffer()
431 dsfree_pages(hwev->ds_bts_vaddr, BTS_BUFFER_SIZE); in release_bts_buffer()
432 hwev->ds_bts_vaddr = NULL; in release_bts_buffer()
437 struct debug_store *ds = &get_cpu_entry_area(cpu)->cpu_debug_store; in alloc_ds_buffer()
569 if (!cpuc->ds) in intel_pmu_disable_bts()
584 struct debug_store *ds = cpuc->ds; in intel_pmu_drain_bts_buffer()
590 struct perf_event *event = cpuc->events[INTEL_PMC_IDX_FIXED_BTS]; in intel_pmu_drain_bts_buffer()
591 struct bts_record *at, *base, *top; in intel_pmu_drain_bts_buffer() local
604 base = (struct bts_record *)(unsigned long)ds->bts_buffer_base; in intel_pmu_drain_bts_buffer()
605 top = (struct bts_record *)(unsigned long)ds->bts_index; in intel_pmu_drain_bts_buffer()
607 if (top <= base) in intel_pmu_drain_bts_buffer()
612 ds->bts_index = ds->bts_buffer_base; in intel_pmu_drain_bts_buffer()
614 perf_sample_data_init(&data, 0, event->hw.last_period); in intel_pmu_drain_bts_buffer()
626 for (at = base; at < top; at++) { in intel_pmu_drain_bts_buffer()
632 if (event->attr.exclude_kernel && in intel_pmu_drain_bts_buffer()
633 (kernel_ip(at->from) || kernel_ip(at->to))) in intel_pmu_drain_bts_buffer()
646 header.size * (top - base - skip))) in intel_pmu_drain_bts_buffer()
649 for (at = base; at < top; at++) { in intel_pmu_drain_bts_buffer()
651 if (event->attr.exclude_kernel && in intel_pmu_drain_bts_buffer()
652 (kernel_ip(at->from) || kernel_ip(at->to))) in intel_pmu_drain_bts_buffer()
655 data.ip = at->from; in intel_pmu_drain_bts_buffer()
656 data.addr = at->to; in intel_pmu_drain_bts_buffer()
664 event->hw.interrupts++; in intel_pmu_drain_bts_buffer()
665 event->pending_kill = POLL_IN; in intel_pmu_drain_bts_buffer()
882 if (!event->attr.precise_ip) in intel_pebs_constraints()
887 if (constraint_match(c, event->hw.config)) { in intel_pebs_constraints()
888 event->hw.flags |= c->flags; in intel_pebs_constraints()
905 * We need the sched_task callback even for per-cpu events when we use
911 if (cpuc->n_pebs == cpuc->n_pebs_via_pt) in pebs_needs_sched_cb()
914 return cpuc->n_pebs && (cpuc->n_pebs == cpuc->n_large_pebs); in pebs_needs_sched_cb()
927 struct debug_store *ds = cpuc->ds; in pebs_update_threshold()
931 if (cpuc->n_pebs_via_pt) in pebs_update_threshold()
939 if (cpuc->n_pebs == cpuc->n_large_pebs) { in pebs_update_threshold()
940 threshold = ds->pebs_absolute_maximum - in pebs_update_threshold()
941 reserved * cpuc->pebs_record_size; in pebs_update_threshold()
943 threshold = ds->pebs_buffer_base + cpuc->pebs_record_size; in pebs_update_threshold()
946 ds->pebs_interrupt_threshold = threshold; in pebs_update_threshold()
952 u64 pebs_data_cfg = cpuc->pebs_data_cfg; in adaptive_pebs_record_size_update()
964 cpuc->pebs_record_size = sz; in adaptive_pebs_record_size_update()
973 struct perf_event_attr *attr = &event->attr; in pebs_update_adaptive_cfg()
974 u64 sample_type = attr->sample_type; in pebs_update_adaptive_cfg()
979 attr->precise_ip > 1) in pebs_update_adaptive_cfg()
992 (attr->sample_regs_intr & PEBS_GP_REGS); in pebs_update_adaptive_cfg()
995 ((attr->config & INTEL_ARCH_EVENT_MASK) == in pebs_update_adaptive_cfg()
998 if (gprs || (attr->precise_ip < 2) || tsx_weight) in pebs_update_adaptive_cfg()
1002 (attr->sample_regs_intr & PERF_REG_EXTENDED_MASK)) in pebs_update_adaptive_cfg()
1011 ((x86_pmu.lbr_nr-1) << PEBS_DATACFG_LBR_SHIFT); in pebs_update_adaptive_cfg()
1021 struct pmu *pmu = event->ctx->pmu; in pebs_update_state()
1027 bool update = cpuc->n_pebs == 1; in pebs_update_state()
1046 if (cpuc->n_pebs == 1) { in pebs_update_state()
1047 cpuc->pebs_data_cfg = 0; in pebs_update_state()
1048 cpuc->pebs_record_size = sizeof(struct pebs_basic); in pebs_update_state()
1054 if (pebs_data_cfg & ~cpuc->pebs_data_cfg) { in pebs_update_state()
1055 cpuc->pebs_data_cfg |= pebs_data_cfg; in pebs_update_state()
1068 struct hw_perf_event *hwc = &event->hw; in intel_pmu_pebs_add()
1071 cpuc->n_pebs++; in intel_pmu_pebs_add()
1072 if (hwc->flags & PERF_X86_EVENT_LARGE_PEBS) in intel_pmu_pebs_add()
1073 cpuc->n_large_pebs++; in intel_pmu_pebs_add()
1074 if (hwc->flags & PERF_X86_EVENT_PEBS_VIA_PT) in intel_pmu_pebs_add()
1075 cpuc->n_pebs_via_pt++; in intel_pmu_pebs_add()
1087 if (!(cpuc->pebs_enabled & ~PEBS_VIA_PT_MASK)) in intel_pmu_pebs_via_pt_disable()
1088 cpuc->pebs_enabled &= ~PEBS_VIA_PT_MASK; in intel_pmu_pebs_via_pt_disable()
1094 struct hw_perf_event *hwc = &event->hw; in intel_pmu_pebs_via_pt_enable()
1095 struct debug_store *ds = cpuc->ds; in intel_pmu_pebs_via_pt_enable()
1100 if (!(event->hw.flags & PERF_X86_EVENT_LARGE_PEBS)) in intel_pmu_pebs_via_pt_enable()
1101 cpuc->pebs_enabled |= PEBS_PMI_AFTER_EACH_RECORD; in intel_pmu_pebs_via_pt_enable()
1103 cpuc->pebs_enabled |= PEBS_OUTPUT_PT; in intel_pmu_pebs_via_pt_enable()
1105 wrmsrl(MSR_RELOAD_PMC0 + hwc->idx, ds->pebs_event_reset[hwc->idx]); in intel_pmu_pebs_via_pt_enable()
1111 struct hw_perf_event *hwc = &event->hw; in intel_pmu_pebs_enable()
1112 struct debug_store *ds = cpuc->ds; in intel_pmu_pebs_enable()
1114 hwc->config &= ~ARCH_PERFMON_EVENTSEL_INT; in intel_pmu_pebs_enable()
1116 cpuc->pebs_enabled |= 1ULL << hwc->idx; in intel_pmu_pebs_enable()
1118 if ((event->hw.flags & PERF_X86_EVENT_PEBS_LDLAT) && (x86_pmu.version < 5)) in intel_pmu_pebs_enable()
1119 cpuc->pebs_enabled |= 1ULL << (hwc->idx + 32); in intel_pmu_pebs_enable()
1120 else if (event->hw.flags & PERF_X86_EVENT_PEBS_ST) in intel_pmu_pebs_enable()
1121 cpuc->pebs_enabled |= 1ULL << 63; in intel_pmu_pebs_enable()
1124 hwc->config |= ICL_EVENTSEL_ADAPTIVE; in intel_pmu_pebs_enable()
1125 if (cpuc->pebs_data_cfg != cpuc->active_pebs_data_cfg) { in intel_pmu_pebs_enable()
1126 wrmsrl(MSR_PEBS_DATA_CFG, cpuc->pebs_data_cfg); in intel_pmu_pebs_enable()
1127 cpuc->active_pebs_data_cfg = cpuc->pebs_data_cfg; in intel_pmu_pebs_enable()
1132 * Use auto-reload if possible to save a MSR write in the PMI. in intel_pmu_pebs_enable()
1135 if (hwc->flags & PERF_X86_EVENT_AUTO_RELOAD) { in intel_pmu_pebs_enable()
1136 unsigned int idx = hwc->idx; in intel_pmu_pebs_enable()
1139 idx = MAX_PEBS_EVENTS + (idx - INTEL_PMC_IDX_FIXED); in intel_pmu_pebs_enable()
1140 ds->pebs_event_reset[idx] = in intel_pmu_pebs_enable()
1141 (u64)(-hwc->sample_period) & x86_pmu.cntval_mask; in intel_pmu_pebs_enable()
1143 ds->pebs_event_reset[hwc->idx] = 0; in intel_pmu_pebs_enable()
1152 struct hw_perf_event *hwc = &event->hw; in intel_pmu_pebs_del()
1155 cpuc->n_pebs--; in intel_pmu_pebs_del()
1156 if (hwc->flags & PERF_X86_EVENT_LARGE_PEBS) in intel_pmu_pebs_del()
1157 cpuc->n_large_pebs--; in intel_pmu_pebs_del()
1158 if (hwc->flags & PERF_X86_EVENT_PEBS_VIA_PT) in intel_pmu_pebs_del()
1159 cpuc->n_pebs_via_pt--; in intel_pmu_pebs_del()
1167 struct hw_perf_event *hwc = &event->hw; in intel_pmu_pebs_disable()
1169 if (cpuc->n_pebs == cpuc->n_large_pebs && in intel_pmu_pebs_disable()
1170 cpuc->n_pebs != cpuc->n_pebs_via_pt) in intel_pmu_pebs_disable()
1173 cpuc->pebs_enabled &= ~(1ULL << hwc->idx); in intel_pmu_pebs_disable()
1175 if ((event->hw.flags & PERF_X86_EVENT_PEBS_LDLAT) && in intel_pmu_pebs_disable()
1177 cpuc->pebs_enabled &= ~(1ULL << (hwc->idx + 32)); in intel_pmu_pebs_disable()
1178 else if (event->hw.flags & PERF_X86_EVENT_PEBS_ST) in intel_pmu_pebs_disable()
1179 cpuc->pebs_enabled &= ~(1ULL << 63); in intel_pmu_pebs_disable()
1183 if (cpuc->enabled) in intel_pmu_pebs_disable()
1184 wrmsrl(MSR_IA32_PEBS_ENABLE, cpuc->pebs_enabled); in intel_pmu_pebs_disable()
1186 hwc->config |= ARCH_PERFMON_EVENTSEL_INT; in intel_pmu_pebs_disable()
1193 if (cpuc->pebs_enabled) in intel_pmu_pebs_enable_all()
1194 wrmsrl(MSR_IA32_PEBS_ENABLE, cpuc->pebs_enabled); in intel_pmu_pebs_enable_all()
1201 if (cpuc->pebs_enabled) in intel_pmu_pebs_disable_all()
1208 unsigned long from = cpuc->lbr_entries[0].from; in intel_pmu_pebs_fixup_ip()
1209 unsigned long old_to, to = cpuc->lbr_entries[0].to; in intel_pmu_pebs_fixup_ip()
1210 unsigned long ip = regs->ip; in intel_pmu_pebs_fixup_ip()
1224 if (!cpuc->lbr_stack.nr || !from || !to) in intel_pmu_pebs_fixup_ip()
1237 if ((ip - to) > PEBS_FIXUP_SIZE) in intel_pmu_pebs_fixup_ip()
1248 size = ip - to; in intel_pmu_pebs_fixup_ip()
1284 size -= insn.length; in intel_pmu_pebs_fixup_ip()
1321 return ((struct pebs_record_nhm *)n)->status; in get_pebs_status()
1322 return ((struct pebs_basic *)n)->applicable_counters; in get_pebs_status()
1333 int fl = event->hw.flags; in get_data_src()
1362 sample_type = event->attr.sample_type; in setup_pebs_fixed_sample_data()
1363 fll = event->hw.flags & PERF_X86_EVENT_PEBS_LDLAT; in setup_pebs_fixed_sample_data()
1365 perf_sample_data_init(data, 0, event->hw.last_period); in setup_pebs_fixed_sample_data()
1367 data->period = event->hw.last_period; in setup_pebs_fixed_sample_data()
1370 * Use latency for weight (only avail with PEBS-LL) in setup_pebs_fixed_sample_data()
1373 data->weight = pebs->lat; in setup_pebs_fixed_sample_data()
1379 data->data_src.val = get_data_src(event, pebs->dse); in setup_pebs_fixed_sample_data()
1388 data->callchain = perf_callchain(event, iregs); in setup_pebs_fixed_sample_data()
1404 regs->flags = pebs->flags & ~PERF_EFLAGS_EXACT; in setup_pebs_fixed_sample_data()
1407 regs->ax = pebs->ax; in setup_pebs_fixed_sample_data()
1408 regs->bx = pebs->bx; in setup_pebs_fixed_sample_data()
1409 regs->cx = pebs->cx; in setup_pebs_fixed_sample_data()
1410 regs->dx = pebs->dx; in setup_pebs_fixed_sample_data()
1411 regs->si = pebs->si; in setup_pebs_fixed_sample_data()
1412 regs->di = pebs->di; in setup_pebs_fixed_sample_data()
1414 regs->bp = pebs->bp; in setup_pebs_fixed_sample_data()
1415 regs->sp = pebs->sp; in setup_pebs_fixed_sample_data()
1418 regs->r8 = pebs->r8; in setup_pebs_fixed_sample_data()
1419 regs->r9 = pebs->r9; in setup_pebs_fixed_sample_data()
1420 regs->r10 = pebs->r10; in setup_pebs_fixed_sample_data()
1421 regs->r11 = pebs->r11; in setup_pebs_fixed_sample_data()
1422 regs->r12 = pebs->r12; in setup_pebs_fixed_sample_data()
1423 regs->r13 = pebs->r13; in setup_pebs_fixed_sample_data()
1424 regs->r14 = pebs->r14; in setup_pebs_fixed_sample_data()
1425 regs->r15 = pebs->r15; in setup_pebs_fixed_sample_data()
1429 if (event->attr.precise_ip > 1) { in setup_pebs_fixed_sample_data()
1432 * (real IP) which fixes the off-by-1 skid in hardware. in setup_pebs_fixed_sample_data()
1436 set_linear_ip(regs, pebs->real_ip); in setup_pebs_fixed_sample_data()
1437 regs->flags |= PERF_EFLAGS_EXACT; in setup_pebs_fixed_sample_data()
1439 /* Otherwise, use PEBS off-by-1 IP: */ in setup_pebs_fixed_sample_data()
1440 set_linear_ip(regs, pebs->ip); in setup_pebs_fixed_sample_data()
1443 * With precise_ip >= 2, try to fix up the off-by-1 IP in setup_pebs_fixed_sample_data()
1445 * corrects regs->ip and calls set_linear_ip() on regs: in setup_pebs_fixed_sample_data()
1448 regs->flags |= PERF_EFLAGS_EXACT; in setup_pebs_fixed_sample_data()
1452 * When precise_ip == 1, return the PEBS off-by-1 IP, in setup_pebs_fixed_sample_data()
1455 set_linear_ip(regs, pebs->ip); in setup_pebs_fixed_sample_data()
1461 data->addr = pebs->dla; in setup_pebs_fixed_sample_data()
1466 data->weight = intel_get_tsx_weight(pebs->tsx_tuning); in setup_pebs_fixed_sample_data()
1469 data->txn = intel_get_tsx_transaction(pebs->tsx_tuning, in setup_pebs_fixed_sample_data()
1470 pebs->ax); in setup_pebs_fixed_sample_data()
1480 event->attr.use_clockid == 0) in setup_pebs_fixed_sample_data()
1481 data->time = native_sched_clock_from_tsc(pebs->tsc); in setup_pebs_fixed_sample_data()
1484 data->br_stack = &cpuc->lbr_stack; in setup_pebs_fixed_sample_data()
1490 regs->ax = gprs->ax; in adaptive_pebs_save_regs()
1491 regs->bx = gprs->bx; in adaptive_pebs_save_regs()
1492 regs->cx = gprs->cx; in adaptive_pebs_save_regs()
1493 regs->dx = gprs->dx; in adaptive_pebs_save_regs()
1494 regs->si = gprs->si; in adaptive_pebs_save_regs()
1495 regs->di = gprs->di; in adaptive_pebs_save_regs()
1496 regs->bp = gprs->bp; in adaptive_pebs_save_regs()
1497 regs->sp = gprs->sp; in adaptive_pebs_save_regs()
1499 regs->r8 = gprs->r8; in adaptive_pebs_save_regs()
1500 regs->r9 = gprs->r9; in adaptive_pebs_save_regs()
1501 regs->r10 = gprs->r10; in adaptive_pebs_save_regs()
1502 regs->r11 = gprs->r11; in adaptive_pebs_save_regs()
1503 regs->r12 = gprs->r12; in adaptive_pebs_save_regs()
1504 regs->r13 = gprs->r13; in adaptive_pebs_save_regs()
1505 regs->r14 = gprs->r14; in adaptive_pebs_save_regs()
1506 regs->r15 = gprs->r15; in adaptive_pebs_save_regs()
1532 perf_regs->xmm_regs = NULL; in setup_pebs_adaptive_sample_data()
1534 sample_type = event->attr.sample_type; in setup_pebs_adaptive_sample_data()
1535 format_size = basic->format_size; in setup_pebs_adaptive_sample_data()
1536 perf_sample_data_init(data, 0, event->hw.last_period); in setup_pebs_adaptive_sample_data()
1537 data->period = event->hw.last_period; in setup_pebs_adaptive_sample_data()
1539 if (event->attr.use_clockid == 0) in setup_pebs_adaptive_sample_data()
1540 data->time = native_sched_clock_from_tsc(basic->tsc); in setup_pebs_adaptive_sample_data()
1549 data->callchain = perf_callchain(event, iregs); in setup_pebs_adaptive_sample_data()
1553 set_linear_ip(regs, basic->ip); in setup_pebs_adaptive_sample_data()
1554 regs->flags = PERF_EFLAGS_EXACT; in setup_pebs_adaptive_sample_data()
1558 * But PERF_SAMPLE_TRANSACTION needs gprs->ax. in setup_pebs_adaptive_sample_data()
1570 if (event->attr.precise_ip < 2) { in setup_pebs_adaptive_sample_data()
1571 set_linear_ip(regs, gprs->ip); in setup_pebs_adaptive_sample_data()
1572 regs->flags &= ~PERF_EFLAGS_EXACT; in setup_pebs_adaptive_sample_data()
1581 data->weight = meminfo->latency ?: in setup_pebs_adaptive_sample_data()
1582 intel_get_tsx_weight(meminfo->tsx_tuning); in setup_pebs_adaptive_sample_data()
1585 data->data_src.val = get_data_src(event, meminfo->aux); in setup_pebs_adaptive_sample_data()
1588 data->addr = meminfo->address; in setup_pebs_adaptive_sample_data()
1591 data->txn = intel_get_tsx_transaction(meminfo->tsx_tuning, in setup_pebs_adaptive_sample_data()
1592 gprs ? gprs->ax : 0); in setup_pebs_adaptive_sample_data()
1599 perf_regs->xmm_regs = xmm->xmm; in setup_pebs_adaptive_sample_data()
1610 data->br_stack = &cpuc->lbr_stack; in setup_pebs_adaptive_sample_data()
1617 (u64)(next_record - __pebs), in setup_pebs_adaptive_sample_data()
1618 basic->format_size); in setup_pebs_adaptive_sample_data()
1622 get_next_pebs_record_by_bit(void *base, void *top, int bit) in get_next_pebs_record_by_bit() argument
1638 for (at = base; at < top; at += cpuc->pebs_record_size) { in get_next_pebs_record_by_bit()
1649 /* clear non-PEBS bit and re-check */ in get_next_pebs_record_by_bit()
1650 pebs_status = status & cpuc->pebs_enabled; in get_next_pebs_record_by_bit()
1661 WARN_ON(!(event->hw.flags & PERF_X86_EVENT_AUTO_RELOAD)); in intel_pmu_auto_reload_read()
1663 perf_pmu_disable(event->pmu); in intel_pmu_auto_reload_read()
1665 perf_pmu_enable(event->pmu); in intel_pmu_auto_reload_read()
1669 * Special variant of intel_pmu_save_and_restart() for auto-reload.
1674 struct hw_perf_event *hwc = &event->hw; in intel_pmu_save_and_restart_reload()
1675 int shift = 64 - x86_pmu.cntval_bits; in intel_pmu_save_and_restart_reload()
1676 u64 period = hwc->sample_period; in intel_pmu_save_and_restart_reload()
1687 prev_raw_count = local64_read(&hwc->prev_count); in intel_pmu_save_and_restart_reload()
1688 rdpmcl(hwc->event_base_rdpmc, new_raw_count); in intel_pmu_save_and_restart_reload()
1689 local64_set(&hwc->prev_count, new_raw_count); in intel_pmu_save_and_restart_reload()
1695 * [-period, 0] in intel_pmu_save_and_restart_reload()
1699 * A) value2 - value1; in intel_pmu_save_and_restart_reload()
1702 * B) (0 - value1) + (value2 - (-period)); in intel_pmu_save_and_restart_reload()
1705 * C) (0 - value1) + (n - 1) * (period) + (value2 - (-period)); in intel_pmu_save_and_restart_reload()
1709 * discrete interval, where the first term is to the top of the in intel_pmu_save_and_restart_reload()
1716 * value2 - value1 + n * period in intel_pmu_save_and_restart_reload()
1720 local64_add(new - old + count * period, &event->count); in intel_pmu_save_and_restart_reload()
1722 local64_set(&hwc->period_left, -new); in intel_pmu_save_and_restart_reload()
1733 void *base, void *top, in __intel_pmu_pebs_event() argument
1742 struct hw_perf_event *hwc = &event->hw; in __intel_pmu_pebs_event()
1745 void *at = get_next_pebs_record_by_bit(base, top, bit); in __intel_pmu_pebs_event()
1748 if (hwc->flags & PERF_X86_EVENT_AUTO_RELOAD) { in __intel_pmu_pebs_event()
1750 * Now, auto-reload is only enabled in fixed period mode. in __intel_pmu_pebs_event()
1751 * The reload value is always hwc->sample_period. in __intel_pmu_pebs_event()
1752 * May need to change it, if auto-reload is enabled in in __intel_pmu_pebs_event()
1765 at += cpuc->pebs_record_size; in __intel_pmu_pebs_event()
1766 at = get_next_pebs_record_by_bit(at, top, bit); in __intel_pmu_pebs_event()
1767 count--; in __intel_pmu_pebs_event()
1773 * The PEBS records may be drained in the non-overflow context, in __intel_pmu_pebs_event()
1792 struct debug_store *ds = cpuc->ds; in intel_pmu_drain_pebs_core()
1793 struct perf_event *event = cpuc->events[0]; /* PMC0 only */ in intel_pmu_drain_pebs_core()
1794 struct pebs_record_core *at, *top; in intel_pmu_drain_pebs_core() local
1800 at = (struct pebs_record_core *)(unsigned long)ds->pebs_buffer_base; in intel_pmu_drain_pebs_core()
1801 top = (struct pebs_record_core *)(unsigned long)ds->pebs_index; in intel_pmu_drain_pebs_core()
1806 ds->pebs_index = ds->pebs_buffer_base; in intel_pmu_drain_pebs_core()
1808 if (!test_bit(0, cpuc->active_mask)) in intel_pmu_drain_pebs_core()
1813 if (!event->attr.precise_ip) in intel_pmu_drain_pebs_core()
1816 n = top - at; in intel_pmu_drain_pebs_core()
1818 if (event->hw.flags & PERF_X86_EVENT_AUTO_RELOAD) in intel_pmu_drain_pebs_core()
1823 __intel_pmu_pebs_event(event, iregs, data, at, top, 0, n, in intel_pmu_drain_pebs_core()
1834 * for auto-reload event in pmu::read(). There are no in intel_pmu_pebs_event_update_no_drain()
1837 * update the event->count for this case. in intel_pmu_pebs_event_update_no_drain()
1839 for_each_set_bit(bit, (unsigned long *)&cpuc->pebs_enabled, size) { in intel_pmu_pebs_event_update_no_drain()
1840 event = cpuc->events[bit]; in intel_pmu_pebs_event_update_no_drain()
1841 if (event->hw.flags & PERF_X86_EVENT_AUTO_RELOAD) in intel_pmu_pebs_event_update_no_drain()
1849 struct debug_store *ds = cpuc->ds; in intel_pmu_drain_pebs_nhm()
1851 void *base, *at, *top; in intel_pmu_drain_pebs_nhm() local
1860 base = (struct pebs_record_nhm *)(unsigned long)ds->pebs_buffer_base; in intel_pmu_drain_pebs_nhm()
1861 top = (struct pebs_record_nhm *)(unsigned long)ds->pebs_index; in intel_pmu_drain_pebs_nhm()
1863 ds->pebs_index = ds->pebs_buffer_base; in intel_pmu_drain_pebs_nhm()
1865 mask = (1ULL << x86_pmu.max_pebs_events) - 1; in intel_pmu_drain_pebs_nhm()
1868 mask |= ((1ULL << x86_pmu.num_counters_fixed) - 1) << INTEL_PMC_IDX_FIXED; in intel_pmu_drain_pebs_nhm()
1872 if (unlikely(base >= top)) { in intel_pmu_drain_pebs_nhm()
1877 for (at = base; at < top; at += x86_pmu.pebs_record_size) { in intel_pmu_drain_pebs_nhm()
1881 pebs_status = p->status & cpuc->pebs_enabled; in intel_pmu_drain_pebs_nhm()
1900 if (!pebs_status && cpuc->pebs_enabled && in intel_pmu_drain_pebs_nhm()
1901 !(cpuc->pebs_enabled & (cpuc->pebs_enabled-1))) in intel_pmu_drain_pebs_nhm()
1902 pebs_status = p->status = cpuc->pebs_enabled; in intel_pmu_drain_pebs_nhm()
1914 * If these events include one PEBS and multiple non-PEBS in intel_pmu_drain_pebs_nhm()
1937 event = cpuc->events[bit]; in intel_pmu_drain_pebs_nhm()
1941 if (WARN_ON_ONCE(!event->attr.precise_ip)) in intel_pmu_drain_pebs_nhm()
1954 top, bit, counts[bit], in intel_pmu_drain_pebs_nhm()
1964 struct debug_store *ds = cpuc->ds; in intel_pmu_drain_pebs_icl()
1966 void *base, *at, *top; in intel_pmu_drain_pebs_icl() local
1973 base = (struct pebs_basic *)(unsigned long)ds->pebs_buffer_base; in intel_pmu_drain_pebs_icl()
1974 top = (struct pebs_basic *)(unsigned long)ds->pebs_index; in intel_pmu_drain_pebs_icl()
1976 ds->pebs_index = ds->pebs_buffer_base; in intel_pmu_drain_pebs_icl()
1978 mask = ((1ULL << x86_pmu.max_pebs_events) - 1) | in intel_pmu_drain_pebs_icl()
1979 (((1ULL << x86_pmu.num_counters_fixed) - 1) << INTEL_PMC_IDX_FIXED); in intel_pmu_drain_pebs_icl()
1982 if (unlikely(base >= top)) { in intel_pmu_drain_pebs_icl()
1987 for (at = base; at < top; at += cpuc->pebs_record_size) { in intel_pmu_drain_pebs_icl()
1990 pebs_status = get_pebs_status(at) & cpuc->pebs_enabled; in intel_pmu_drain_pebs_icl()
2001 event = cpuc->events[bit]; in intel_pmu_drain_pebs_icl()
2005 if (WARN_ON_ONCE(!event->attr.precise_ip)) in intel_pmu_drain_pebs_icl()
2009 top, bit, counts[bit], in intel_pmu_drain_pebs_icl()
2033 char pebs_type = x86_pmu.intel_cap.pebs_trap ? '+' : '-'; in intel_ds_init()
2083 pebs_qual = "-baseline"; in intel_ds_init()
2084 x86_get_pmu(smp_processor_id())->capabilities |= PERF_PMU_CAP_EXTENDED_REGS; in intel_ds_init()
2098 pr_cont("PEBS-via-PT, "); in intel_ds_init()
2099 x86_get_pmu(smp_processor_id())->capabilities |= PERF_PMU_CAP_AUX_OUTPUT; in intel_ds_init()