Commit 465a7e29 authored by Linus Torvalds

Merge branch 'perf-urgent-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/tip

Pull perf fixes from Ingo Molnar:
 "Mostly tooling fixes, but also a couple of updates for new Intel
  models (which are technically hw-enablement, but to users it's a fix
  to perf behavior on those new CPUs - hope this is fine), an AUX
  inheritance fix, event time-sharing fix, and a fix for lost non-perf
  NMI events on AMD systems"

* 'perf-urgent-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/tip: (36 commits)
  perf/x86/cstate: Add Tiger Lake CPU support
  perf/x86/msr: Add Tiger Lake CPU support
  perf/x86/intel: Add Tiger Lake CPU support
  perf/x86/cstate: Update C-state counters for Ice Lake
  perf/x86/msr: Add new CPU model numbers for Ice Lake
  perf/x86/cstate: Add Comet Lake CPU support
  perf/x86/msr: Add Comet Lake CPU support
  perf/x86/intel: Add Comet Lake CPU support
  perf/x86/amd: Change/fix NMI latency mitigation to use a timestamp
  perf/core: Fix corner case in perf_rotate_context()
  perf/core: Rework memory accounting in perf_mmap()
  perf/core: Fix inheritance of aux_output groups
  perf annotate: Don't return -1 for error when doing BPF disassembly
  perf annotate: Return appropriate error code for allocation failures
  perf annotate: Fix arch specific ->init() failure errors
  perf annotate: Propagate the symbol__annotate() error return
  perf annotate: Fix the signedness of failure returns
  perf annotate: Propagate perf_env__arch() error
  perf evsel: Fall back to global 'perf_env' in perf_evsel__env()
  perf tools: Propagate get_cpuid() error
  ...
parents 9b4e40c8 52e92f40
arch/x86/events/amd/core.c  +17 −13
@@ -5,12 +5,14 @@
#include <linux/init.h>
#include <linux/slab.h>
#include <linux/delay.h>
+#include <linux/jiffies.h>
#include <asm/apicdef.h>
#include <asm/nmi.h>

#include "../perf_event.h"

-static DEFINE_PER_CPU(unsigned int, perf_nmi_counter);
+static DEFINE_PER_CPU(unsigned long, perf_nmi_tstamp);
+static unsigned long perf_nmi_window;

static __initconst const u64 amd_hw_cache_event_ids
				[PERF_COUNT_HW_CACHE_MAX]
@@ -641,11 +643,12 @@ static void amd_pmu_disable_event(struct perf_event *event)
 * handler when multiple PMCs are active or PMC overflow while handling some
 * other source of an NMI.
 *
- * Attempt to mitigate this by using the number of active PMCs to determine
- * whether to return NMI_HANDLED if the perf NMI handler did not handle/reset
- * any PMCs. The per-CPU perf_nmi_counter variable is set to a minimum of the
- * number of active PMCs or 2. The value of 2 is used in case an NMI does not
- * arrive at the LAPIC in time to be collapsed into an already pending NMI.
+ * Attempt to mitigate this by creating an NMI window in which un-handled NMIs
+ * received during this window will be claimed. This prevents extending the
+ * window past when it is possible that latent NMIs should be received. The
+ * per-CPU perf_nmi_tstamp will be set to the window end time whenever perf has
+ * handled a counter. When an un-handled NMI is received, it will be claimed
+ * only if arriving within that window.
 */
static int amd_pmu_handle_irq(struct pt_regs *regs)
{
@@ -663,21 +666,19 @@ static int amd_pmu_handle_irq(struct pt_regs *regs)
	handled = x86_pmu_handle_irq(regs);

	/*
-	 * If a counter was handled, record the number of possible remaining
-	 * NMIs that can occur.
+	 * If a counter was handled, record a timestamp such that un-handled
+	 * NMIs will be claimed if arriving within that window.
	 */
	if (handled) {
-		this_cpu_write(perf_nmi_counter,
-			       min_t(unsigned int, 2, active));
+		this_cpu_write(perf_nmi_tstamp,
+			       jiffies + perf_nmi_window);

		return handled;
	}

-	if (!this_cpu_read(perf_nmi_counter))
+	if (time_after(jiffies, this_cpu_read(perf_nmi_tstamp)))
		return NMI_DONE;

-	this_cpu_dec(perf_nmi_counter);
-
	return NMI_HANDLED;
}

@@ -909,6 +910,9 @@ static int __init amd_core_pmu_init(void)
	if (!boot_cpu_has(X86_FEATURE_PERFCTR_CORE))
		return 0;

+	/* Avoid calculating the value each time in the NMI handler */
+	perf_nmi_window = msecs_to_jiffies(100);
+
	switch (boot_cpu_data.x86) {
	case 0x15:
		pr_cont("Fam15h ");
arch/x86/events/intel/core.c  +4 −0
@@ -4983,6 +4983,8 @@ __init int intel_pmu_init(void)
	case INTEL_FAM6_SKYLAKE:
	case INTEL_FAM6_KABYLAKE_L:
	case INTEL_FAM6_KABYLAKE:
+	case INTEL_FAM6_COMETLAKE_L:
+	case INTEL_FAM6_COMETLAKE:
		x86_add_quirk(intel_pebs_isolation_quirk);
		x86_pmu.late_ack = true;
		memcpy(hw_cache_event_ids, skl_hw_cache_event_ids, sizeof(hw_cache_event_ids));
@@ -5031,6 +5033,8 @@ __init int intel_pmu_init(void)
		/* fall through */
	case INTEL_FAM6_ICELAKE_L:
	case INTEL_FAM6_ICELAKE:
+	case INTEL_FAM6_TIGERLAKE_L:
+	case INTEL_FAM6_TIGERLAKE:
		x86_pmu.late_ack = true;
		memcpy(hw_cache_event_ids, skl_hw_cache_event_ids, sizeof(hw_cache_event_ids));
		memcpy(hw_cache_extra_regs, skl_hw_cache_extra_regs, sizeof(hw_cache_extra_regs));
arch/x86/events/intel/cstate.c  +32 −12
@@ -45,46 +45,49 @@
 *	MSR_CORE_C3_RESIDENCY: CORE C3 Residency Counter
 *			       perf code: 0x01
 *			       Available model: NHM,WSM,SNB,IVB,HSW,BDW,SKL,GLM,
-						CNL
+ *						CNL,KBL,CML
 *			       Scope: Core
 *	MSR_CORE_C6_RESIDENCY: CORE C6 Residency Counter
 *			       perf code: 0x02
 *			       Available model: SLM,AMT,NHM,WSM,SNB,IVB,HSW,BDW,
- *						SKL,KNL,GLM,CNL
+ *						SKL,KNL,GLM,CNL,KBL,CML,ICL,TGL
 *			       Scope: Core
 *	MSR_CORE_C7_RESIDENCY: CORE C7 Residency Counter
 *			       perf code: 0x03
- *			       Available model: SNB,IVB,HSW,BDW,SKL,CNL
+ *			       Available model: SNB,IVB,HSW,BDW,SKL,CNL,KBL,CML,
+ *						ICL,TGL
 *			       Scope: Core
 *	MSR_PKG_C2_RESIDENCY:  Package C2 Residency Counter.
 *			       perf code: 0x00
- *			       Available model: SNB,IVB,HSW,BDW,SKL,KNL,GLM,CNL
+ *			       Available model: SNB,IVB,HSW,BDW,SKL,KNL,GLM,CNL,
+ *						KBL,CML,ICL,TGL
 *			       Scope: Package (physical package)
 *	MSR_PKG_C3_RESIDENCY:  Package C3 Residency Counter.
 *			       perf code: 0x01
 *			       Available model: NHM,WSM,SNB,IVB,HSW,BDW,SKL,KNL,
- *						GLM,CNL
+ *						GLM,CNL,KBL,CML,ICL,TGL
 *			       Scope: Package (physical package)
 *	MSR_PKG_C6_RESIDENCY:  Package C6 Residency Counter.
 *			       perf code: 0x02
 *			       Available model: SLM,AMT,NHM,WSM,SNB,IVB,HSW,BDW
- *						SKL,KNL,GLM,CNL
+ *						SKL,KNL,GLM,CNL,KBL,CML,ICL,TGL
 *			       Scope: Package (physical package)
 *	MSR_PKG_C7_RESIDENCY:  Package C7 Residency Counter.
 *			       perf code: 0x03
- *			       Available model: NHM,WSM,SNB,IVB,HSW,BDW,SKL,CNL
+ *			       Available model: NHM,WSM,SNB,IVB,HSW,BDW,SKL,CNL,
+ *						KBL,CML,ICL,TGL
 *			       Scope: Package (physical package)
 *	MSR_PKG_C8_RESIDENCY:  Package C8 Residency Counter.
 *			       perf code: 0x04
- *			       Available model: HSW ULT,KBL,CNL
+ *			       Available model: HSW ULT,KBL,CNL,CML,ICL,TGL
 *			       Scope: Package (physical package)
 *	MSR_PKG_C9_RESIDENCY:  Package C9 Residency Counter.
 *			       perf code: 0x05
- *			       Available model: HSW ULT,KBL,CNL
+ *			       Available model: HSW ULT,KBL,CNL,CML,ICL,TGL
 *			       Scope: Package (physical package)
 *	MSR_PKG_C10_RESIDENCY: Package C10 Residency Counter.
 *			       perf code: 0x06
- *			       Available model: HSW ULT,KBL,GLM,CNL
+ *			       Available model: HSW ULT,KBL,GLM,CNL,CML,ICL,TGL
 *			       Scope: Package (physical package)
 *
 */
@@ -544,6 +547,19 @@ static const struct cstate_model cnl_cstates __initconst = {
				  BIT(PERF_CSTATE_PKG_C10_RES),
};

+static const struct cstate_model icl_cstates __initconst = {
+	.core_events		= BIT(PERF_CSTATE_CORE_C6_RES) |
+				  BIT(PERF_CSTATE_CORE_C7_RES),
+
+	.pkg_events		= BIT(PERF_CSTATE_PKG_C2_RES) |
+				  BIT(PERF_CSTATE_PKG_C3_RES) |
+				  BIT(PERF_CSTATE_PKG_C6_RES) |
+				  BIT(PERF_CSTATE_PKG_C7_RES) |
+				  BIT(PERF_CSTATE_PKG_C8_RES) |
+				  BIT(PERF_CSTATE_PKG_C9_RES) |
+				  BIT(PERF_CSTATE_PKG_C10_RES),
+};
+
static const struct cstate_model slm_cstates __initconst = {
	.core_events		= BIT(PERF_CSTATE_CORE_C1_RES) |
				  BIT(PERF_CSTATE_CORE_C6_RES),
@@ -614,6 +630,8 @@ static const struct x86_cpu_id intel_cstates_match[] __initconst = {

	X86_CSTATES_MODEL(INTEL_FAM6_KABYLAKE_L, hswult_cstates),
	X86_CSTATES_MODEL(INTEL_FAM6_KABYLAKE,   hswult_cstates),
+	X86_CSTATES_MODEL(INTEL_FAM6_COMETLAKE_L, hswult_cstates),
+	X86_CSTATES_MODEL(INTEL_FAM6_COMETLAKE, hswult_cstates),

	X86_CSTATES_MODEL(INTEL_FAM6_CANNONLAKE_L, cnl_cstates),

@@ -625,8 +643,10 @@ static const struct x86_cpu_id intel_cstates_match[] __initconst = {

	X86_CSTATES_MODEL(INTEL_FAM6_ATOM_GOLDMONT_PLUS, glm_cstates),

-	X86_CSTATES_MODEL(INTEL_FAM6_ICELAKE_L, snb_cstates),
-	X86_CSTATES_MODEL(INTEL_FAM6_ICELAKE,   snb_cstates),
+	X86_CSTATES_MODEL(INTEL_FAM6_ICELAKE_L, icl_cstates),
+	X86_CSTATES_MODEL(INTEL_FAM6_ICELAKE,   icl_cstates),
+	X86_CSTATES_MODEL(INTEL_FAM6_TIGERLAKE_L, icl_cstates),
+	X86_CSTATES_MODEL(INTEL_FAM6_TIGERLAKE, icl_cstates),
	{ },
};
MODULE_DEVICE_TABLE(x86cpu, intel_cstates_match);
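The new icl_cstates model above is just a pair of bit masks: one bit per core C-state counter and one per package C-state counter that the driver should expose on that CPU model. A small stand-alone sketch of how such masks gate event registration follows; the enum and names are invented for the example and are not the driver's own.

#include <stdio.h>

#define BIT(n) (1UL << (n))

/* illustrative counter indices, loosely modelled on PERF_CSTATE_CORE_* */
enum { CORE_C1, CORE_C3, CORE_C6, CORE_C7, CORE_MAX };

static const char * const core_names[CORE_MAX] = {
	"c1-residency", "c3-residency", "c6-residency", "c7-residency",
};

int main(void)
{
	/* same shape as the .core_events mask in icl_cstates above */
	unsigned long core_events = BIT(CORE_C6) | BIT(CORE_C7);

	for (int i = 0; i < CORE_MAX; i++)
		if (core_events & BIT(i))
			printf("register core event: %s\n", core_names[i]);
	return 0;
}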
arch/x86/events/msr.c  +7 −0
@@ -89,7 +89,14 @@ static bool test_intel(int idx, void *data)
	case INTEL_FAM6_SKYLAKE_X:
	case INTEL_FAM6_KABYLAKE_L:
	case INTEL_FAM6_KABYLAKE:
+	case INTEL_FAM6_COMETLAKE_L:
+	case INTEL_FAM6_COMETLAKE:
	case INTEL_FAM6_ICELAKE_L:
+	case INTEL_FAM6_ICELAKE:
+	case INTEL_FAM6_ICELAKE_X:
+	case INTEL_FAM6_ICELAKE_D:
+	case INTEL_FAM6_TIGERLAKE_L:
+	case INTEL_FAM6_TIGERLAKE:
		if (idx == PERF_MSR_SMI || idx == PERF_MSR_PPERF)
			return true;
		break;
kernel/events/core.c  +36 −7
@@ -3779,11 +3779,23 @@ static void rotate_ctx(struct perf_event_context *ctx, struct perf_event *event)
	perf_event_groups_insert(&ctx->flexible_groups, event);
}

+/* pick an event from the flexible_groups to rotate */
static inline struct perf_event *
-ctx_first_active(struct perf_event_context *ctx)
+ctx_event_to_rotate(struct perf_event_context *ctx)
{
-	return list_first_entry_or_null(&ctx->flexible_active,
+	struct perf_event *event;
+
+	/* pick the first active flexible event */
+	event = list_first_entry_or_null(&ctx->flexible_active,
					 struct perf_event, active_list);
+
+	/* if no active flexible event, pick the first event */
+	if (!event) {
+		event = rb_entry_safe(rb_first(&ctx->flexible_groups.tree),
+				      typeof(*event), group_node);
+	}
+
+	return event;
}

static bool perf_rotate_context(struct perf_cpu_context *cpuctx)
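The rename above also changes behaviour: the old ctx_first_active() returned NULL when no flexible event was currently active, so a context whose flexible events had never been scheduled was never rotated. The new helper falls back to the first event in the flexible_groups tree. A stand-alone sketch of that selection order follows; a plain array stands in for the active list and the rb-tree, and all names are illustrative.

#include <stddef.h>
#include <stdio.h>

struct event { const char *name; int active; };

/* prefer the first active event; otherwise fall back to the first event
 * overall, so never-scheduled groups still get a chance to rotate in */
static const struct event *pick_event_to_rotate(const struct event *ev, size_t n)
{
	for (size_t i = 0; i < n; i++)
		if (ev[i].active)
			return &ev[i];
	return n ? &ev[0] : NULL;
}

int main(void)
{
	const struct event evs[] = {
		{ "cycles",       0 },
		{ "instructions", 0 },
	};

	/* with no active events the old logic picked nothing; now the
	 * first event ("cycles") is still chosen for rotation */
	printf("rotate: %s\n", pick_event_to_rotate(evs, 2)->name);
	return 0;
}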
@@ -3808,9 +3820,9 @@ static bool perf_rotate_context(struct perf_cpu_context *cpuctx)
	perf_pmu_disable(cpuctx->ctx.pmu);

	if (task_rotate)
-		task_event = ctx_first_active(task_ctx);
+		task_event = ctx_event_to_rotate(task_ctx);
	if (cpu_rotate)
-		cpu_event = ctx_first_active(&cpuctx->ctx);
+		cpu_event = ctx_event_to_rotate(&cpuctx->ctx);

	/*
	 * As per the order given at ctx_resched() first 'pop' task flexible
@@ -5668,7 +5680,8 @@ again:
	 * undo the VM accounting.
	 */

-	atomic_long_sub((size >> PAGE_SHIFT) + 1, &mmap_user->locked_vm);
+	atomic_long_sub((size >> PAGE_SHIFT) + 1 - mmap_locked,
+			&mmap_user->locked_vm);
	atomic64_sub(mmap_locked, &vma->vm_mm->pinned_vm);
	free_uid(mmap_user);

@@ -5812,8 +5825,20 @@ accounting:

	user_locked = atomic_long_read(&user->locked_vm) + user_extra;

-	if (user_locked > user_lock_limit)
+	if (user_locked <= user_lock_limit) {
+		/* charge all to locked_vm */
+	} else if (atomic_long_read(&user->locked_vm) >= user_lock_limit) {
+		/* charge all to pinned_vm */
+		extra = user_extra;
+		user_extra = 0;
+	} else {
+		/*
+		 * charge locked_vm until it hits user_lock_limit;
+		 * charge the rest from pinned_vm
+		 */
		extra = user_locked - user_lock_limit;
+		user_extra -= extra;
+	}

	lock_limit = rlimit(RLIMIT_MEMLOCK);
	lock_limit >>= PAGE_SHIFT;
@@ -11862,6 +11887,10 @@ static int inherit_group(struct perf_event *parent_event,
					    child, leader, child_ctx);
		if (IS_ERR(child_ctr))
			return PTR_ERR(child_ctr);
+
+		if (sub->aux_event == parent_event &&
+		    !perf_get_aux_event(child_ctr, leader))
+			return -EINVAL;
	}
	return 0;
}
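The perf_mmap() hunks above make the accounting charge each newly mapped ring-buffer page exactly once: locked_vm is filled up to the per-user user_lock_limit and only the remainder goes to the mm's pinned_vm, where the old code charged everything to locked_vm and additionally counted the overage in pinned_vm; the earlier hunk makes the undo path subtract the same split. A stand-alone sketch of the three branches with worked numbers follows; values are in pages, the variable names match the hunk, but the charge() function itself is invented for illustration.

#include <stdio.h>

static void charge(unsigned long locked_vm, unsigned long user_lock_limit,
		   unsigned long user_extra)
{
	unsigned long user_locked = locked_vm + user_extra;
	unsigned long extra = 0;

	if (user_locked <= user_lock_limit) {
		/* charge all to locked_vm */
	} else if (locked_vm >= user_lock_limit) {
		/* already at the limit: charge all to pinned_vm */
		extra = user_extra;
		user_extra = 0;
	} else {
		/* fill locked_vm up to the limit, charge the rest to pinned_vm */
		extra = user_locked - user_lock_limit;
		user_extra -= extra;
	}

	printf("locked_vm += %lu, pinned_vm += %lu\n", user_extra, extra);
}

int main(void)
{
	charge(100, 128, 20);	/* fits entirely: 20 pages to locked_vm       */
	charge(120, 128, 20);	/* split: 8 to locked_vm, 12 to pinned_vm     */
	charge(130, 128, 20);	/* limit already exceeded: 20 to pinned_vm    */
	return 0;
}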