diff options
| author | Sage Weil <sage@inktank.com> | 2013-08-15 11:11:45 -0700 | 
|---|---|---|
| committer | Sage Weil <sage@inktank.com> | 2013-08-15 11:11:45 -0700 | 
| commit | ee3e542fec6e69bc9fb668698889a37d93950ddf (patch) | |
| tree | e74ee766a4764769ef1d3d45d266b4dea64101d3 /arch/x86/kernel/cpu | |
| parent | fe2a801b50c0bb8039d627e5ae1fec249d10ff39 (diff) | |
| parent | f1d6e17f540af37bb1891480143669ba7636c4cf (diff) | |
Merge remote-tracking branch 'linus/master' into testing
Diffstat (limited to 'arch/x86/kernel/cpu')
39 files changed, 1460 insertions, 420 deletions
| diff --git a/arch/x86/kernel/cpu/Makefile b/arch/x86/kernel/cpu/Makefile index b0684e4a73a..47b56a7e99c 100644 --- a/arch/x86/kernel/cpu/Makefile +++ b/arch/x86/kernel/cpu/Makefile @@ -31,11 +31,15 @@ obj-$(CONFIG_PERF_EVENTS)		+= perf_event.o  ifdef CONFIG_PERF_EVENTS  obj-$(CONFIG_CPU_SUP_AMD)		+= perf_event_amd.o perf_event_amd_uncore.o +ifdef CONFIG_AMD_IOMMU +obj-$(CONFIG_CPU_SUP_AMD)		+= perf_event_amd_iommu.o +endif  obj-$(CONFIG_CPU_SUP_INTEL)		+= perf_event_p6.o perf_event_knc.o perf_event_p4.o  obj-$(CONFIG_CPU_SUP_INTEL)		+= perf_event_intel_lbr.o perf_event_intel_ds.o perf_event_intel.o  obj-$(CONFIG_CPU_SUP_INTEL)		+= perf_event_intel_uncore.o  endif +  obj-$(CONFIG_X86_MCE)			+= mcheck/  obj-$(CONFIG_MTRR)			+= mtrr/ diff --git a/arch/x86/kernel/cpu/amd.c b/arch/x86/kernel/cpu/amd.c index 5013a48d1af..f654ecefea5 100644 --- a/arch/x86/kernel/cpu/amd.c +++ b/arch/x86/kernel/cpu/amd.c @@ -69,7 +69,7 @@ static inline int wrmsrl_amd_safe(unsigned msr, unsigned long long val)  extern void vide(void);  __asm__(".align 4\nvide: ret"); -static void __cpuinit init_amd_k5(struct cpuinfo_x86 *c) +static void init_amd_k5(struct cpuinfo_x86 *c)  {  /*   * General Systems BIOSen alias the cpu frequency registers @@ -87,10 +87,10 @@ static void __cpuinit init_amd_k5(struct cpuinfo_x86 *c)  } -static void __cpuinit init_amd_k6(struct cpuinfo_x86 *c) +static void init_amd_k6(struct cpuinfo_x86 *c)  {  	u32 l, h; -	int mbytes = num_physpages >> (20-PAGE_SHIFT); +	int mbytes = get_num_physpages() >> (20-PAGE_SHIFT);  	if (c->x86_model < 6) {  		/* Based on AMD doc 20734R - June 2000 */ @@ -179,7 +179,7 @@ static void __cpuinit init_amd_k6(struct cpuinfo_x86 *c)  	}  } -static void __cpuinit amd_k7_smp_check(struct cpuinfo_x86 *c) +static void amd_k7_smp_check(struct cpuinfo_x86 *c)  {  	/* calling is from identify_secondary_cpu() ? */  	if (!c->cpu_index) @@ -222,7 +222,7 @@ static void __cpuinit amd_k7_smp_check(struct cpuinfo_x86 *c)  	add_taint(TAINT_UNSAFE_SMP, LOCKDEP_NOW_UNRELIABLE);  } -static void __cpuinit init_amd_k7(struct cpuinfo_x86 *c) +static void init_amd_k7(struct cpuinfo_x86 *c)  {  	u32 l, h; @@ -267,7 +267,7 @@ static void __cpuinit init_amd_k7(struct cpuinfo_x86 *c)   * To workaround broken NUMA config.  Read the comment in   * srat_detect_node().   */ -static int __cpuinit nearby_node(int apicid) +static int nearby_node(int apicid)  {  	int i, node; @@ -292,7 +292,7 @@ static int __cpuinit nearby_node(int apicid)   * (2) AMD processors supporting compute units   */  #ifdef CONFIG_X86_HT -static void __cpuinit amd_get_topology(struct cpuinfo_x86 *c) +static void amd_get_topology(struct cpuinfo_x86 *c)  {  	u32 nodes, cores_per_cu = 1;  	u8 node_id; @@ -342,7 +342,7 @@ static void __cpuinit amd_get_topology(struct cpuinfo_x86 *c)   * On a AMD dual core setup the lower bits of the APIC id distingush the cores.   * Assumes number of cores is a power of two.   */ -static void __cpuinit amd_detect_cmp(struct cpuinfo_x86 *c) +static void amd_detect_cmp(struct cpuinfo_x86 *c)  {  #ifdef CONFIG_X86_HT  	unsigned bits; @@ -369,7 +369,7 @@ u16 amd_get_nb_id(int cpu)  }  EXPORT_SYMBOL_GPL(amd_get_nb_id); -static void __cpuinit srat_detect_node(struct cpuinfo_x86 *c) +static void srat_detect_node(struct cpuinfo_x86 *c)  {  #ifdef CONFIG_NUMA  	int cpu = smp_processor_id(); @@ -421,7 +421,7 @@ static void __cpuinit srat_detect_node(struct cpuinfo_x86 *c)  #endif  } -static void __cpuinit early_init_amd_mc(struct cpuinfo_x86 *c) +static void early_init_amd_mc(struct cpuinfo_x86 *c)  {  #ifdef CONFIG_X86_HT  	unsigned bits, ecx; @@ -447,7 +447,7 @@ static void __cpuinit early_init_amd_mc(struct cpuinfo_x86 *c)  #endif  } -static void __cpuinit bsp_init_amd(struct cpuinfo_x86 *c) +static void bsp_init_amd(struct cpuinfo_x86 *c)  {  	if (cpu_has(c, X86_FEATURE_CONSTANT_TSC)) { @@ -475,7 +475,7 @@ static void __cpuinit bsp_init_amd(struct cpuinfo_x86 *c)  	}  } -static void __cpuinit early_init_amd(struct cpuinfo_x86 *c) +static void early_init_amd(struct cpuinfo_x86 *c)  {  	early_init_amd_mc(c); @@ -514,7 +514,7 @@ static const int amd_erratum_383[];  static const int amd_erratum_400[];  static bool cpu_has_amd_erratum(const int *erratum); -static void __cpuinit init_amd(struct cpuinfo_x86 *c) +static void init_amd(struct cpuinfo_x86 *c)  {  	u32 dummy;  	unsigned long long value; @@ -740,8 +740,7 @@ static void __cpuinit init_amd(struct cpuinfo_x86 *c)  }  #ifdef CONFIG_X86_32 -static unsigned int __cpuinit amd_size_cache(struct cpuinfo_x86 *c, -							unsigned int size) +static unsigned int amd_size_cache(struct cpuinfo_x86 *c, unsigned int size)  {  	/* AMD errata T13 (order #21922) */  	if ((c->x86 == 6)) { @@ -757,7 +756,7 @@ static unsigned int __cpuinit amd_size_cache(struct cpuinfo_x86 *c,  }  #endif -static void __cpuinit cpu_set_tlb_flushall_shift(struct cpuinfo_x86 *c) +static void cpu_set_tlb_flushall_shift(struct cpuinfo_x86 *c)  {  	tlb_flushall_shift = 5; @@ -765,7 +764,7 @@ static void __cpuinit cpu_set_tlb_flushall_shift(struct cpuinfo_x86 *c)  		tlb_flushall_shift = 4;  } -static void __cpuinit cpu_detect_tlb_amd(struct cpuinfo_x86 *c) +static void cpu_detect_tlb_amd(struct cpuinfo_x86 *c)  {  	u32 ebx, eax, ecx, edx;  	u16 mask = 0xfff; @@ -820,7 +819,7 @@ static void __cpuinit cpu_detect_tlb_amd(struct cpuinfo_x86 *c)  	cpu_set_tlb_flushall_shift(c);  } -static const struct cpu_dev __cpuinitconst amd_cpu_dev = { +static const struct cpu_dev amd_cpu_dev = {  	.c_vendor	= "AMD",  	.c_ident	= { "AuthenticAMD" },  #ifdef CONFIG_X86_32 diff --git a/arch/x86/kernel/cpu/bugs.c b/arch/x86/kernel/cpu/bugs.c index 4112be9a465..03445346ee0 100644 --- a/arch/x86/kernel/cpu/bugs.c +++ b/arch/x86/kernel/cpu/bugs.c @@ -17,15 +17,6 @@  #include <asm/paravirt.h>  #include <asm/alternative.h> -static int __init no_387(char *s) -{ -	boot_cpu_data.hard_math = 0; -	write_cr0(X86_CR0_TS | X86_CR0_EM | X86_CR0_MP | read_cr0()); -	return 1; -} - -__setup("no387", no_387); -  static double __initdata x = 4195835.0;  static double __initdata y = 3145727.0; @@ -44,15 +35,6 @@ static void __init check_fpu(void)  {  	s32 fdiv_bug; -	if (!boot_cpu_data.hard_math) { -#ifndef CONFIG_MATH_EMULATION -		pr_emerg("No coprocessor found and no math emulation present\n"); -		pr_emerg("Giving up\n"); -		for (;;) ; -#endif -		return; -	} -  	kernel_fpu_begin();  	/* @@ -107,5 +89,6 @@ void __init check_bugs(void)  	 * kernel_fpu_begin/end() in check_fpu() relies on the patched  	 * alternative instructions.  	 */ -	check_fpu(); +	if (cpu_has_fpu) +		check_fpu();  } diff --git a/arch/x86/kernel/cpu/centaur.c b/arch/x86/kernel/cpu/centaur.c index 159103c0b1f..fbf6c3bc240 100644 --- a/arch/x86/kernel/cpu/centaur.c +++ b/arch/x86/kernel/cpu/centaur.c @@ -11,7 +11,7 @@  #ifdef CONFIG_X86_OOSTORE -static u32 __cpuinit power2(u32 x) +static u32 power2(u32 x)  {  	u32 s = 1; @@ -25,7 +25,7 @@ static u32 __cpuinit power2(u32 x)  /*   * Set up an actual MCR   */ -static void __cpuinit centaur_mcr_insert(int reg, u32 base, u32 size, int key) +static void centaur_mcr_insert(int reg, u32 base, u32 size, int key)  {  	u32 lo, hi; @@ -42,7 +42,7 @@ static void __cpuinit centaur_mcr_insert(int reg, u32 base, u32 size, int key)   *   * Shortcut: We know you can't put 4Gig of RAM on a winchip   */ -static u32 __cpuinit ramtop(void) +static u32 ramtop(void)  {  	u32 clip = 0xFFFFFFFFUL;  	u32 top = 0; @@ -91,7 +91,7 @@ static u32 __cpuinit ramtop(void)  /*   * Compute a set of MCR's to give maximum coverage   */ -static int __cpuinit centaur_mcr_compute(int nr, int key) +static int centaur_mcr_compute(int nr, int key)  {  	u32 mem = ramtop();  	u32 root = power2(mem); @@ -157,7 +157,7 @@ static int __cpuinit centaur_mcr_compute(int nr, int key)  	return ct;  } -static void __cpuinit centaur_create_optimal_mcr(void) +static void centaur_create_optimal_mcr(void)  {  	int used;  	int i; @@ -181,7 +181,7 @@ static void __cpuinit centaur_create_optimal_mcr(void)  		wrmsr(MSR_IDT_MCR0+i, 0, 0);  } -static void __cpuinit winchip2_create_optimal_mcr(void) +static void winchip2_create_optimal_mcr(void)  {  	u32 lo, hi;  	int used; @@ -217,7 +217,7 @@ static void __cpuinit winchip2_create_optimal_mcr(void)  /*   * Handle the MCR key on the Winchip 2.   */ -static void __cpuinit winchip2_unprotect_mcr(void) +static void winchip2_unprotect_mcr(void)  {  	u32 lo, hi;  	u32 key; @@ -229,7 +229,7 @@ static void __cpuinit winchip2_unprotect_mcr(void)  	wrmsr(MSR_IDT_MCR_CTRL, lo, hi);  } -static void __cpuinit winchip2_protect_mcr(void) +static void winchip2_protect_mcr(void)  {  	u32 lo, hi; @@ -247,7 +247,7 @@ static void __cpuinit winchip2_protect_mcr(void)  #define RNG_ENABLED	(1 << 3)  #define RNG_ENABLE	(1 << 6)	/* MSR_VIA_RNG */ -static void __cpuinit init_c3(struct cpuinfo_x86 *c) +static void init_c3(struct cpuinfo_x86 *c)  {  	u32  lo, hi; @@ -318,7 +318,7 @@ enum {  		EAMD3D		= 1<<20,  }; -static void __cpuinit early_init_centaur(struct cpuinfo_x86 *c) +static void early_init_centaur(struct cpuinfo_x86 *c)  {  	switch (c->x86) {  #ifdef CONFIG_X86_32 @@ -337,7 +337,7 @@ static void __cpuinit early_init_centaur(struct cpuinfo_x86 *c)  #endif  } -static void __cpuinit init_centaur(struct cpuinfo_x86 *c) +static void init_centaur(struct cpuinfo_x86 *c)  {  #ifdef CONFIG_X86_32  	char *name; @@ -468,7 +468,7 @@ static void __cpuinit init_centaur(struct cpuinfo_x86 *c)  #endif  } -static unsigned int __cpuinit +static unsigned int  centaur_size_cache(struct cpuinfo_x86 *c, unsigned int size)  {  #ifdef CONFIG_X86_32 @@ -488,7 +488,7 @@ centaur_size_cache(struct cpuinfo_x86 *c, unsigned int size)  	return size;  } -static const struct cpu_dev __cpuinitconst centaur_cpu_dev = { +static const struct cpu_dev centaur_cpu_dev = {  	.c_vendor	= "Centaur",  	.c_ident	= { "CentaurHauls" },  	.c_early_init	= early_init_centaur, diff --git a/arch/x86/kernel/cpu/common.c b/arch/x86/kernel/cpu/common.c index 22018f70a67..25eb2747b06 100644 --- a/arch/x86/kernel/cpu/common.c +++ b/arch/x86/kernel/cpu/common.c @@ -63,7 +63,7 @@ void __init setup_cpu_local_masks(void)  	alloc_bootmem_cpumask_var(&cpu_sibling_setup_mask);  } -static void __cpuinit default_init(struct cpuinfo_x86 *c) +static void default_init(struct cpuinfo_x86 *c)  {  #ifdef CONFIG_X86_64  	cpu_detect_cache_sizes(c); @@ -80,13 +80,13 @@ static void __cpuinit default_init(struct cpuinfo_x86 *c)  #endif  } -static const struct cpu_dev __cpuinitconst default_cpu = { +static const struct cpu_dev default_cpu = {  	.c_init		= default_init,  	.c_vendor	= "Unknown",  	.c_x86_vendor	= X86_VENDOR_UNKNOWN,  }; -static const struct cpu_dev *this_cpu __cpuinitdata = &default_cpu; +static const struct cpu_dev *this_cpu = &default_cpu;  DEFINE_PER_CPU_PAGE_ALIGNED(struct gdt_page, gdt_page) = { .gdt = {  #ifdef CONFIG_X86_64 @@ -160,8 +160,8 @@ static int __init x86_xsaveopt_setup(char *s)  __setup("noxsaveopt", x86_xsaveopt_setup);  #ifdef CONFIG_X86_32 -static int cachesize_override __cpuinitdata = -1; -static int disable_x86_serial_nr __cpuinitdata = 1; +static int cachesize_override = -1; +static int disable_x86_serial_nr = 1;  static int __init cachesize_setup(char *str)  { @@ -215,12 +215,12 @@ static inline int flag_is_changeable_p(u32 flag)  }  /* Probe for the CPUID instruction */ -int __cpuinit have_cpuid_p(void) +int have_cpuid_p(void)  {  	return flag_is_changeable_p(X86_EFLAGS_ID);  } -static void __cpuinit squash_the_stupid_serial_number(struct cpuinfo_x86 *c) +static void squash_the_stupid_serial_number(struct cpuinfo_x86 *c)  {  	unsigned long lo, hi; @@ -298,7 +298,7 @@ struct cpuid_dependent_feature {  	u32 level;  }; -static const struct cpuid_dependent_feature __cpuinitconst +static const struct cpuid_dependent_feature  cpuid_dependent_features[] = {  	{ X86_FEATURE_MWAIT,		0x00000005 },  	{ X86_FEATURE_DCA,		0x00000009 }, @@ -306,7 +306,7 @@ cpuid_dependent_features[] = {  	{ 0, 0 }  }; -static void __cpuinit filter_cpuid_features(struct cpuinfo_x86 *c, bool warn) +static void filter_cpuid_features(struct cpuinfo_x86 *c, bool warn)  {  	const struct cpuid_dependent_feature *df; @@ -344,7 +344,7 @@ static void __cpuinit filter_cpuid_features(struct cpuinfo_x86 *c, bool warn)   */  /* Look up CPU names by table lookup. */ -static const char *__cpuinit table_lookup_model(struct cpuinfo_x86 *c) +static const char *table_lookup_model(struct cpuinfo_x86 *c)  {  	const struct cpu_model_info *info; @@ -364,8 +364,8 @@ static const char *__cpuinit table_lookup_model(struct cpuinfo_x86 *c)  	return NULL;		/* Not found */  } -__u32 cpu_caps_cleared[NCAPINTS] __cpuinitdata; -__u32 cpu_caps_set[NCAPINTS] __cpuinitdata; +__u32 cpu_caps_cleared[NCAPINTS]; +__u32 cpu_caps_set[NCAPINTS];  void load_percpu_segment(int cpu)  { @@ -394,9 +394,9 @@ void switch_to_new_gdt(int cpu)  	load_percpu_segment(cpu);  } -static const struct cpu_dev *__cpuinitdata cpu_devs[X86_VENDOR_NUM] = {}; +static const struct cpu_dev *cpu_devs[X86_VENDOR_NUM] = {}; -static void __cpuinit get_model_name(struct cpuinfo_x86 *c) +static void get_model_name(struct cpuinfo_x86 *c)  {  	unsigned int *v;  	char *p, *q; @@ -425,7 +425,7 @@ static void __cpuinit get_model_name(struct cpuinfo_x86 *c)  	}  } -void __cpuinit cpu_detect_cache_sizes(struct cpuinfo_x86 *c) +void cpu_detect_cache_sizes(struct cpuinfo_x86 *c)  {  	unsigned int n, dummy, ebx, ecx, edx, l2size; @@ -479,7 +479,7 @@ u16 __read_mostly tlb_lld_4m[NR_INFO];   */  s8  __read_mostly tlb_flushall_shift = -1; -void __cpuinit cpu_detect_tlb(struct cpuinfo_x86 *c) +void cpu_detect_tlb(struct cpuinfo_x86 *c)  {  	if (this_cpu->c_detect_tlb)  		this_cpu->c_detect_tlb(c); @@ -493,7 +493,7 @@ void __cpuinit cpu_detect_tlb(struct cpuinfo_x86 *c)  		tlb_flushall_shift);  } -void __cpuinit detect_ht(struct cpuinfo_x86 *c) +void detect_ht(struct cpuinfo_x86 *c)  {  #ifdef CONFIG_X86_HT  	u32 eax, ebx, ecx, edx; @@ -544,7 +544,7 @@ out:  #endif  } -static void __cpuinit get_cpu_vendor(struct cpuinfo_x86 *c) +static void get_cpu_vendor(struct cpuinfo_x86 *c)  {  	char *v = c->x86_vendor_id;  	int i; @@ -571,7 +571,7 @@ static void __cpuinit get_cpu_vendor(struct cpuinfo_x86 *c)  	this_cpu = &default_cpu;  } -void __cpuinit cpu_detect(struct cpuinfo_x86 *c) +void cpu_detect(struct cpuinfo_x86 *c)  {  	/* Get vendor name */  	cpuid(0x00000000, (unsigned int *)&c->cpuid_level, @@ -601,7 +601,7 @@ void __cpuinit cpu_detect(struct cpuinfo_x86 *c)  	}  } -void __cpuinit get_cpu_cap(struct cpuinfo_x86 *c) +void get_cpu_cap(struct cpuinfo_x86 *c)  {  	u32 tfms, xlvl;  	u32 ebx; @@ -652,7 +652,7 @@ void __cpuinit get_cpu_cap(struct cpuinfo_x86 *c)  	init_scattered_cpuid_features(c);  } -static void __cpuinit identify_cpu_without_cpuid(struct cpuinfo_x86 *c) +static void identify_cpu_without_cpuid(struct cpuinfo_x86 *c)  {  #ifdef CONFIG_X86_32  	int i; @@ -711,10 +711,9 @@ static void __init early_identify_cpu(struct cpuinfo_x86 *c)  		return;  	cpu_detect(c); -  	get_cpu_vendor(c); -  	get_cpu_cap(c); +	fpu_detect(c);  	if (this_cpu->c_early_init)  		this_cpu->c_early_init(c); @@ -724,6 +723,8 @@ static void __init early_identify_cpu(struct cpuinfo_x86 *c)  	if (this_cpu->c_bsp_init)  		this_cpu->c_bsp_init(c); + +	setup_force_cpu_cap(X86_FEATURE_ALWAYS);  }  void __init early_cpu_init(void) @@ -768,7 +769,7 @@ void __init early_cpu_init(void)   * unless we can find a reliable way to detect all the broken cases.   * Enable it explicitly on 64-bit for non-constant inputs of cpu_has().   */ -static void __cpuinit detect_nopl(struct cpuinfo_x86 *c) +static void detect_nopl(struct cpuinfo_x86 *c)  {  #ifdef CONFIG_X86_32  	clear_cpu_cap(c, X86_FEATURE_NOPL); @@ -777,7 +778,7 @@ static void __cpuinit detect_nopl(struct cpuinfo_x86 *c)  #endif  } -static void __cpuinit generic_identify(struct cpuinfo_x86 *c) +static void generic_identify(struct cpuinfo_x86 *c)  {  	c->extended_cpuid_level = 0; @@ -814,7 +815,7 @@ static void __cpuinit generic_identify(struct cpuinfo_x86 *c)  /*   * This does the hard work of actually picking apart the CPU stuff...   */ -static void __cpuinit identify_cpu(struct cpuinfo_x86 *c) +static void identify_cpu(struct cpuinfo_x86 *c)  {  	int i; @@ -959,7 +960,7 @@ void __init identify_boot_cpu(void)  	cpu_detect_tlb(&boot_cpu_data);  } -void __cpuinit identify_secondary_cpu(struct cpuinfo_x86 *c) +void identify_secondary_cpu(struct cpuinfo_x86 *c)  {  	BUG_ON(c == &boot_cpu_data);  	identify_cpu(c); @@ -974,14 +975,14 @@ struct msr_range {  	unsigned	max;  }; -static const struct msr_range msr_range_array[] __cpuinitconst = { +static const struct msr_range msr_range_array[] = {  	{ 0x00000000, 0x00000418},  	{ 0xc0000000, 0xc000040b},  	{ 0xc0010000, 0xc0010142},  	{ 0xc0011000, 0xc001103b},  }; -static void __cpuinit __print_cpu_msr(void) +static void __print_cpu_msr(void)  {  	unsigned index_min, index_max;  	unsigned index; @@ -1000,7 +1001,7 @@ static void __cpuinit __print_cpu_msr(void)  	}  } -static int show_msr __cpuinitdata; +static int show_msr;  static __init int setup_show_msr(char *arg)  { @@ -1021,7 +1022,7 @@ static __init int setup_noclflush(char *arg)  }  __setup("noclflush", setup_noclflush); -void __cpuinit print_cpu_info(struct cpuinfo_x86 *c) +void print_cpu_info(struct cpuinfo_x86 *c)  {  	const char *vendor = NULL; @@ -1050,7 +1051,7 @@ void __cpuinit print_cpu_info(struct cpuinfo_x86 *c)  	print_cpu_msr(c);  } -void __cpuinit print_cpu_msr(struct cpuinfo_x86 *c) +void print_cpu_msr(struct cpuinfo_x86 *c)  {  	if (c->cpu_index < show_msr)  		__print_cpu_msr(); @@ -1071,8 +1072,8 @@ __setup("clearcpuid=", setup_disablecpuid);  #ifdef CONFIG_X86_64  struct desc_ptr idt_descr = { NR_VECTORS * 16 - 1, (unsigned long) idt_table }; -struct desc_ptr nmi_idt_descr = { NR_VECTORS * 16 - 1, -				    (unsigned long) nmi_idt_table }; +struct desc_ptr debug_idt_descr = { NR_VECTORS * 16 - 1, +				    (unsigned long) debug_idt_table };  DEFINE_PER_CPU_FIRST(union irq_stack_union,  		     irq_stack_union) __aligned(PAGE_SIZE); @@ -1148,20 +1149,20 @@ int is_debug_stack(unsigned long addr)  		 addr > (__get_cpu_var(debug_stack_addr) - DEBUG_STKSZ));  } -static DEFINE_PER_CPU(u32, debug_stack_use_ctr); +DEFINE_PER_CPU(u32, debug_idt_ctr);  void debug_stack_set_zero(void)  { -	this_cpu_inc(debug_stack_use_ctr); -	load_idt((const struct desc_ptr *)&nmi_idt_descr); +	this_cpu_inc(debug_idt_ctr); +	load_current_idt();  }  void debug_stack_reset(void)  { -	if (WARN_ON(!this_cpu_read(debug_stack_use_ctr))) +	if (WARN_ON(!this_cpu_read(debug_idt_ctr)))  		return; -	if (this_cpu_dec_return(debug_stack_use_ctr) == 0) -		load_idt((const struct desc_ptr *)&idt_descr); +	if (this_cpu_dec_return(debug_idt_ctr) == 0) +		load_current_idt();  }  #else	/* CONFIG_X86_64 */ @@ -1215,7 +1216,7 @@ static void dbg_restore_debug_regs(void)   */  #ifdef CONFIG_X86_64 -void __cpuinit cpu_init(void) +void cpu_init(void)  {  	struct orig_ist *oist;  	struct task_struct *me; @@ -1257,7 +1258,7 @@ void __cpuinit cpu_init(void)  	switch_to_new_gdt(cpu);  	loadsegment(fs, 0); -	load_idt((const struct desc_ptr *)&idt_descr); +	load_current_idt();  	memset(me->thread.tls_array, 0, GDT_ENTRY_TLS_ENTRIES * 8);  	syscall_init(); @@ -1314,7 +1315,7 @@ void __cpuinit cpu_init(void)  #else -void __cpuinit cpu_init(void) +void cpu_init(void)  {  	int cpu = smp_processor_id();  	struct task_struct *curr = current; @@ -1334,7 +1335,7 @@ void __cpuinit cpu_init(void)  	if (cpu_has_vme || cpu_has_tsc || cpu_has_de)  		clear_in_cr4(X86_CR4_VME|X86_CR4_PVI|X86_CR4_TSD|X86_CR4_DE); -	load_idt(&idt_descr); +	load_current_idt();  	switch_to_new_gdt(cpu);  	/* @@ -1363,3 +1364,17 @@ void __cpuinit cpu_init(void)  	fpu_init();  }  #endif + +#ifdef CONFIG_X86_DEBUG_STATIC_CPU_HAS +void warn_pre_alternatives(void) +{ +	WARN(1, "You're using static_cpu_has before alternatives have run!\n"); +} +EXPORT_SYMBOL_GPL(warn_pre_alternatives); +#endif + +inline bool __static_cpu_has_safe(u16 bit) +{ +	return boot_cpu_has(bit); +} +EXPORT_SYMBOL_GPL(__static_cpu_has_safe); diff --git a/arch/x86/kernel/cpu/cyrix.c b/arch/x86/kernel/cpu/cyrix.c index d048d5ca43c..d0969c75ab5 100644 --- a/arch/x86/kernel/cpu/cyrix.c +++ b/arch/x86/kernel/cpu/cyrix.c @@ -15,7 +15,7 @@  /*   * Read NSC/Cyrix DEVID registers (DIR) to get more detailed info. about the CPU   */ -static void __cpuinit __do_cyrix_devid(unsigned char *dir0, unsigned char *dir1) +static void __do_cyrix_devid(unsigned char *dir0, unsigned char *dir1)  {  	unsigned char ccr2, ccr3; @@ -44,7 +44,7 @@ static void __cpuinit __do_cyrix_devid(unsigned char *dir0, unsigned char *dir1)  	}  } -static void __cpuinit do_cyrix_devid(unsigned char *dir0, unsigned char *dir1) +static void do_cyrix_devid(unsigned char *dir0, unsigned char *dir1)  {  	unsigned long flags; @@ -59,25 +59,25 @@ static void __cpuinit do_cyrix_devid(unsigned char *dir0, unsigned char *dir1)   * Actually since bugs.h doesn't even reference this perhaps someone should   * fix the documentation ???   */ -static unsigned char Cx86_dir0_msb __cpuinitdata = 0; +static unsigned char Cx86_dir0_msb = 0; -static const char __cpuinitconst Cx86_model[][9] = { +static const char Cx86_model[][9] = {  	"Cx486", "Cx486", "5x86 ", "6x86", "MediaGX ", "6x86MX ",  	"M II ", "Unknown"  }; -static const char __cpuinitconst Cx486_name[][5] = { +static const char Cx486_name[][5] = {  	"SLC", "DLC", "SLC2", "DLC2", "SRx", "DRx",  	"SRx2", "DRx2"  }; -static const char __cpuinitconst Cx486S_name[][4] = { +static const char Cx486S_name[][4] = {  	"S", "S2", "Se", "S2e"  }; -static const char __cpuinitconst Cx486D_name[][4] = { +static const char Cx486D_name[][4] = {  	"DX", "DX2", "?", "?", "?", "DX4"  }; -static char Cx86_cb[] __cpuinitdata = "?.5x Core/Bus Clock"; -static const char __cpuinitconst cyrix_model_mult1[] = "12??43"; -static const char __cpuinitconst cyrix_model_mult2[] = "12233445"; +static char Cx86_cb[] = "?.5x Core/Bus Clock"; +static const char cyrix_model_mult1[] = "12??43"; +static const char cyrix_model_mult2[] = "12233445";  /*   * Reset the slow-loop (SLOP) bit on the 686(L) which is set by some old @@ -87,7 +87,7 @@ static const char __cpuinitconst cyrix_model_mult2[] = "12233445";   * FIXME: our newer udelay uses the tsc. We don't need to frob with SLOP   */ -static void __cpuinit check_cx686_slop(struct cpuinfo_x86 *c) +static void check_cx686_slop(struct cpuinfo_x86 *c)  {  	unsigned long flags; @@ -112,7 +112,7 @@ static void __cpuinit check_cx686_slop(struct cpuinfo_x86 *c)  } -static void __cpuinit set_cx86_reorder(void) +static void set_cx86_reorder(void)  {  	u8 ccr3; @@ -127,7 +127,7 @@ static void __cpuinit set_cx86_reorder(void)  	setCx86(CX86_CCR3, ccr3);  } -static void __cpuinit set_cx86_memwb(void) +static void set_cx86_memwb(void)  {  	printk(KERN_INFO "Enable Memory-Write-back mode on Cyrix/NSC processor.\n"); @@ -143,7 +143,7 @@ static void __cpuinit set_cx86_memwb(void)   *	Configure later MediaGX and/or Geode processor.   */ -static void __cpuinit geode_configure(void) +static void geode_configure(void)  {  	unsigned long flags;  	u8 ccr3; @@ -166,7 +166,7 @@ static void __cpuinit geode_configure(void)  	local_irq_restore(flags);  } -static void __cpuinit early_init_cyrix(struct cpuinfo_x86 *c) +static void early_init_cyrix(struct cpuinfo_x86 *c)  {  	unsigned char dir0, dir0_msn, dir1 = 0; @@ -185,7 +185,7 @@ static void __cpuinit early_init_cyrix(struct cpuinfo_x86 *c)  	}  } -static void __cpuinit init_cyrix(struct cpuinfo_x86 *c) +static void init_cyrix(struct cpuinfo_x86 *c)  {  	unsigned char dir0, dir0_msn, dir0_lsn, dir1 = 0;  	char *buf = c->x86_model_id; @@ -333,7 +333,7 @@ static void __cpuinit init_cyrix(struct cpuinfo_x86 *c)  		switch (dir0_lsn) {  		case 0xd:  /* either a 486SLC or DLC w/o DEVID */  			dir0_msn = 0; -			p = Cx486_name[(c->hard_math) ? 1 : 0]; +			p = Cx486_name[(cpu_has_fpu ? 1 : 0)];  			break;  		case 0xe:  /* a 486S A step */ @@ -356,7 +356,7 @@ static void __cpuinit init_cyrix(struct cpuinfo_x86 *c)  /*   * Handle National Semiconductor branded processors   */ -static void __cpuinit init_nsc(struct cpuinfo_x86 *c) +static void init_nsc(struct cpuinfo_x86 *c)  {  	/*  	 * There may be GX1 processors in the wild that are branded @@ -405,7 +405,7 @@ static inline int test_cyrix_52div(void)  	return (unsigned char) (test >> 8) == 0x02;  } -static void __cpuinit cyrix_identify(struct cpuinfo_x86 *c) +static void cyrix_identify(struct cpuinfo_x86 *c)  {  	/* Detect Cyrix with disabled CPUID */  	if (c->x86 == 4 && test_cyrix_52div()) { @@ -441,7 +441,7 @@ static void __cpuinit cyrix_identify(struct cpuinfo_x86 *c)  	}  } -static const struct cpu_dev __cpuinitconst cyrix_cpu_dev = { +static const struct cpu_dev cyrix_cpu_dev = {  	.c_vendor	= "Cyrix",  	.c_ident	= { "CyrixInstead" },  	.c_early_init	= early_init_cyrix, @@ -452,7 +452,7 @@ static const struct cpu_dev __cpuinitconst cyrix_cpu_dev = {  cpu_dev_register(cyrix_cpu_dev); -static const struct cpu_dev __cpuinitconst nsc_cpu_dev = { +static const struct cpu_dev nsc_cpu_dev = {  	.c_vendor	= "NSC",  	.c_ident	= { "Geode by NSC" },  	.c_init		= init_nsc, diff --git a/arch/x86/kernel/cpu/hypervisor.c b/arch/x86/kernel/cpu/hypervisor.c index 1e7e84a02eb..87279212d31 100644 --- a/arch/x86/kernel/cpu/hypervisor.c +++ b/arch/x86/kernel/cpu/hypervisor.c @@ -60,7 +60,7 @@ detect_hypervisor_vendor(void)  	}  } -void __cpuinit init_hypervisor(struct cpuinfo_x86 *c) +void init_hypervisor(struct cpuinfo_x86 *c)  {  	if (x86_hyper && x86_hyper->set_cpu_features)  		x86_hyper->set_cpu_features(c); diff --git a/arch/x86/kernel/cpu/intel.c b/arch/x86/kernel/cpu/intel.c index 9b0c441c03f..ec7299566f7 100644 --- a/arch/x86/kernel/cpu/intel.c +++ b/arch/x86/kernel/cpu/intel.c @@ -26,7 +26,7 @@  #include <asm/apic.h>  #endif -static void __cpuinit early_init_intel(struct cpuinfo_x86 *c) +static void early_init_intel(struct cpuinfo_x86 *c)  {  	u64 misc_enable; @@ -163,7 +163,7 @@ static void __cpuinit early_init_intel(struct cpuinfo_x86 *c)   *	This is called before we do cpu ident work   */ -int __cpuinit ppro_with_ram_bug(void) +int ppro_with_ram_bug(void)  {  	/* Uses data from early_cpu_detect now */  	if (boot_cpu_data.x86_vendor == X86_VENDOR_INTEL && @@ -176,7 +176,7 @@ int __cpuinit ppro_with_ram_bug(void)  	return 0;  } -static void __cpuinit intel_smp_check(struct cpuinfo_x86 *c) +static void intel_smp_check(struct cpuinfo_x86 *c)  {  	/* calling is from identify_secondary_cpu() ? */  	if (!c->cpu_index) @@ -196,7 +196,7 @@ static void __cpuinit intel_smp_check(struct cpuinfo_x86 *c)  	}  } -static void __cpuinit intel_workarounds(struct cpuinfo_x86 *c) +static void intel_workarounds(struct cpuinfo_x86 *c)  {  	unsigned long lo, hi; @@ -275,12 +275,12 @@ static void __cpuinit intel_workarounds(struct cpuinfo_x86 *c)  	intel_smp_check(c);  }  #else -static void __cpuinit intel_workarounds(struct cpuinfo_x86 *c) +static void intel_workarounds(struct cpuinfo_x86 *c)  {  }  #endif -static void __cpuinit srat_detect_node(struct cpuinfo_x86 *c) +static void srat_detect_node(struct cpuinfo_x86 *c)  {  #ifdef CONFIG_NUMA  	unsigned node; @@ -300,7 +300,7 @@ static void __cpuinit srat_detect_node(struct cpuinfo_x86 *c)  /*   * find out the number of processor cores on the die   */ -static int __cpuinit intel_num_cpu_cores(struct cpuinfo_x86 *c) +static int intel_num_cpu_cores(struct cpuinfo_x86 *c)  {  	unsigned int eax, ebx, ecx, edx; @@ -315,7 +315,7 @@ static int __cpuinit intel_num_cpu_cores(struct cpuinfo_x86 *c)  		return 1;  } -static void __cpuinit detect_vmx_virtcap(struct cpuinfo_x86 *c) +static void detect_vmx_virtcap(struct cpuinfo_x86 *c)  {  	/* Intel VMX MSR indicated features */  #define X86_VMX_FEATURE_PROC_CTLS_TPR_SHADOW	0x00200000 @@ -353,7 +353,7 @@ static void __cpuinit detect_vmx_virtcap(struct cpuinfo_x86 *c)  	}  } -static void __cpuinit init_intel(struct cpuinfo_x86 *c) +static void init_intel(struct cpuinfo_x86 *c)  {  	unsigned int l2 = 0; @@ -472,7 +472,7 @@ static void __cpuinit init_intel(struct cpuinfo_x86 *c)  }  #ifdef CONFIG_X86_32 -static unsigned int __cpuinit intel_size_cache(struct cpuinfo_x86 *c, unsigned int size) +static unsigned int intel_size_cache(struct cpuinfo_x86 *c, unsigned int size)  {  	/*  	 * Intel PIII Tualatin. This comes in two flavours. @@ -506,7 +506,7 @@ static unsigned int __cpuinit intel_size_cache(struct cpuinfo_x86 *c, unsigned i  #define STLB_4K		0x41 -static const struct _tlb_table intel_tlb_table[] __cpuinitconst = { +static const struct _tlb_table intel_tlb_table[] = {  	{ 0x01, TLB_INST_4K,		32,	" TLB_INST 4 KByte pages, 4-way set associative" },  	{ 0x02, TLB_INST_4M,		2,	" TLB_INST 4 MByte pages, full associative" },  	{ 0x03, TLB_DATA_4K,		64,	" TLB_DATA 4 KByte pages, 4-way set associative" }, @@ -536,7 +536,7 @@ static const struct _tlb_table intel_tlb_table[] __cpuinitconst = {  	{ 0x00, 0, 0 }  }; -static void __cpuinit intel_tlb_lookup(const unsigned char desc) +static void intel_tlb_lookup(const unsigned char desc)  {  	unsigned char k;  	if (desc == 0) @@ -605,7 +605,7 @@ static void __cpuinit intel_tlb_lookup(const unsigned char desc)  	}  } -static void __cpuinit intel_tlb_flushall_shift_set(struct cpuinfo_x86 *c) +static void intel_tlb_flushall_shift_set(struct cpuinfo_x86 *c)  {  	switch ((c->x86 << 8) + c->x86_model) {  	case 0x60f: /* original 65 nm celeron/pentium/core2/xeon, "Merom"/"Conroe" */ @@ -634,7 +634,7 @@ static void __cpuinit intel_tlb_flushall_shift_set(struct cpuinfo_x86 *c)  	}  } -static void __cpuinit intel_detect_tlb(struct cpuinfo_x86 *c) +static void intel_detect_tlb(struct cpuinfo_x86 *c)  {  	int i, j, n;  	unsigned int regs[4]; @@ -661,7 +661,7 @@ static void __cpuinit intel_detect_tlb(struct cpuinfo_x86 *c)  	intel_tlb_flushall_shift_set(c);  } -static const struct cpu_dev __cpuinitconst intel_cpu_dev = { +static const struct cpu_dev intel_cpu_dev = {  	.c_vendor	= "Intel",  	.c_ident	= { "GenuineIntel" },  #ifdef CONFIG_X86_32 diff --git a/arch/x86/kernel/cpu/intel_cacheinfo.c b/arch/x86/kernel/cpu/intel_cacheinfo.c index 7c6f7d548c0..1414c90feab 100644 --- a/arch/x86/kernel/cpu/intel_cacheinfo.c +++ b/arch/x86/kernel/cpu/intel_cacheinfo.c @@ -37,7 +37,7 @@ struct _cache_table {  /* All the cache descriptor types we care about (no TLB or     trace cache entries) */ -static const struct _cache_table __cpuinitconst cache_table[] = +static const struct _cache_table cache_table[] =  {  	{ 0x06, LVL_1_INST, 8 },	/* 4-way set assoc, 32 byte line size */  	{ 0x08, LVL_1_INST, 16 },	/* 4-way set assoc, 32 byte line size */ @@ -203,7 +203,7 @@ union l3_cache {  	unsigned val;  }; -static const unsigned short __cpuinitconst assocs[] = { +static const unsigned short assocs[] = {  	[1] = 1,  	[2] = 2,  	[4] = 4, @@ -217,10 +217,10 @@ static const unsigned short __cpuinitconst assocs[] = {  	[0xf] = 0xffff /* fully associative - no way to show this currently */  }; -static const unsigned char __cpuinitconst levels[] = { 1, 1, 2, 3 }; -static const unsigned char __cpuinitconst types[] = { 1, 2, 3, 3 }; +static const unsigned char levels[] = { 1, 1, 2, 3 }; +static const unsigned char types[] = { 1, 2, 3, 3 }; -static void __cpuinit +static void  amd_cpuid4(int leaf, union _cpuid4_leaf_eax *eax,  		     union _cpuid4_leaf_ebx *ebx,  		     union _cpuid4_leaf_ecx *ecx) @@ -302,7 +302,7 @@ struct _cache_attr {  /*   * L3 cache descriptors   */ -static void __cpuinit amd_calc_l3_indices(struct amd_northbridge *nb) +static void amd_calc_l3_indices(struct amd_northbridge *nb)  {  	struct amd_l3_cache *l3 = &nb->l3_cache;  	unsigned int sc0, sc1, sc2, sc3; @@ -325,7 +325,7 @@ static void __cpuinit amd_calc_l3_indices(struct amd_northbridge *nb)  	l3->indices = (max(max3(sc0, sc1, sc2), sc3) << 10) - 1;  } -static void __cpuinit amd_init_l3_cache(struct _cpuid4_info_regs *this_leaf, int index) +static void amd_init_l3_cache(struct _cpuid4_info_regs *this_leaf, int index)  {  	int node; @@ -528,8 +528,7 @@ static struct _cache_attr subcaches =  #endif  /* CONFIG_AMD_NB && CONFIG_SYSFS */  static int -__cpuinit cpuid4_cache_lookup_regs(int index, -				   struct _cpuid4_info_regs *this_leaf) +cpuid4_cache_lookup_regs(int index, struct _cpuid4_info_regs *this_leaf)  {  	union _cpuid4_leaf_eax	eax;  	union _cpuid4_leaf_ebx	ebx; @@ -560,7 +559,7 @@ __cpuinit cpuid4_cache_lookup_regs(int index,  	return 0;  } -static int __cpuinit find_num_cache_leaves(struct cpuinfo_x86 *c) +static int find_num_cache_leaves(struct cpuinfo_x86 *c)  {  	unsigned int		eax, ebx, ecx, edx, op;  	union _cpuid4_leaf_eax	cache_eax; @@ -580,7 +579,7 @@ static int __cpuinit find_num_cache_leaves(struct cpuinfo_x86 *c)  	return i;  } -void __cpuinit init_amd_cacheinfo(struct cpuinfo_x86 *c) +void init_amd_cacheinfo(struct cpuinfo_x86 *c)  {  	if (cpu_has_topoext) { @@ -593,7 +592,7 @@ void __cpuinit init_amd_cacheinfo(struct cpuinfo_x86 *c)  	}  } -unsigned int __cpuinit init_intel_cacheinfo(struct cpuinfo_x86 *c) +unsigned int init_intel_cacheinfo(struct cpuinfo_x86 *c)  {  	/* Cache sizes */  	unsigned int trace = 0, l1i = 0, l1d = 0, l2 = 0, l3 = 0; @@ -618,36 +617,34 @@ unsigned int __cpuinit init_intel_cacheinfo(struct cpuinfo_x86 *c)  		 * parameters cpuid leaf to find the cache details  		 */  		for (i = 0; i < num_cache_leaves; i++) { -			struct _cpuid4_info_regs this_leaf; +			struct _cpuid4_info_regs this_leaf = {};  			int retval;  			retval = cpuid4_cache_lookup_regs(i, &this_leaf); -			if (retval >= 0) { -				switch (this_leaf.eax.split.level) { -				case 1: -					if (this_leaf.eax.split.type == -							CACHE_TYPE_DATA) -						new_l1d = this_leaf.size/1024; -					else if (this_leaf.eax.split.type == -							CACHE_TYPE_INST) -						new_l1i = this_leaf.size/1024; -					break; -				case 2: -					new_l2 = this_leaf.size/1024; -					num_threads_sharing = 1 + this_leaf.eax.split.num_threads_sharing; -					index_msb = get_count_order(num_threads_sharing); -					l2_id = c->apicid & ~((1 << index_msb) - 1); -					break; -				case 3: -					new_l3 = this_leaf.size/1024; -					num_threads_sharing = 1 + this_leaf.eax.split.num_threads_sharing; -					index_msb = get_count_order( -							num_threads_sharing); -					l3_id = c->apicid & ~((1 << index_msb) - 1); -					break; -				default: -					break; -				} +			if (retval < 0) +				continue; + +			switch (this_leaf.eax.split.level) { +			case 1: +				if (this_leaf.eax.split.type == CACHE_TYPE_DATA) +					new_l1d = this_leaf.size/1024; +				else if (this_leaf.eax.split.type == CACHE_TYPE_INST) +					new_l1i = this_leaf.size/1024; +				break; +			case 2: +				new_l2 = this_leaf.size/1024; +				num_threads_sharing = 1 + this_leaf.eax.split.num_threads_sharing; +				index_msb = get_count_order(num_threads_sharing); +				l2_id = c->apicid & ~((1 << index_msb) - 1); +				break; +			case 3: +				new_l3 = this_leaf.size/1024; +				num_threads_sharing = 1 + this_leaf.eax.split.num_threads_sharing; +				index_msb = get_count_order(num_threads_sharing); +				l3_id = c->apicid & ~((1 << index_msb) - 1); +				break; +			default: +				break;  			}  		}  	} @@ -746,7 +743,7 @@ static DEFINE_PER_CPU(struct _cpuid4_info *, ici_cpuid4_info);  #ifdef CONFIG_SMP -static int __cpuinit cache_shared_amd_cpu_map_setup(unsigned int cpu, int index) +static int cache_shared_amd_cpu_map_setup(unsigned int cpu, int index)  {  	struct _cpuid4_info *this_leaf;  	int i, sibling; @@ -795,7 +792,7 @@ static int __cpuinit cache_shared_amd_cpu_map_setup(unsigned int cpu, int index)  	return 1;  } -static void __cpuinit cache_shared_cpu_map_setup(unsigned int cpu, int index) +static void cache_shared_cpu_map_setup(unsigned int cpu, int index)  {  	struct _cpuid4_info *this_leaf, *sibling_leaf;  	unsigned long num_threads_sharing; @@ -830,7 +827,7 @@ static void __cpuinit cache_shared_cpu_map_setup(unsigned int cpu, int index)  		}  	}  } -static void __cpuinit cache_remove_shared_cpu_map(unsigned int cpu, int index) +static void cache_remove_shared_cpu_map(unsigned int cpu, int index)  {  	struct _cpuid4_info	*this_leaf, *sibling_leaf;  	int sibling; @@ -843,16 +840,16 @@ static void __cpuinit cache_remove_shared_cpu_map(unsigned int cpu, int index)  	}  }  #else -static void __cpuinit cache_shared_cpu_map_setup(unsigned int cpu, int index) +static void cache_shared_cpu_map_setup(unsigned int cpu, int index)  {  } -static void __cpuinit cache_remove_shared_cpu_map(unsigned int cpu, int index) +static void cache_remove_shared_cpu_map(unsigned int cpu, int index)  {  }  #endif -static void __cpuinit free_cache_attributes(unsigned int cpu) +static void free_cache_attributes(unsigned int cpu)  {  	int i; @@ -863,7 +860,7 @@ static void __cpuinit free_cache_attributes(unsigned int cpu)  	per_cpu(ici_cpuid4_info, cpu) = NULL;  } -static void __cpuinit get_cpu_leaves(void *_retval) +static void get_cpu_leaves(void *_retval)  {  	int j, *retval = _retval, cpu = smp_processor_id(); @@ -883,7 +880,7 @@ static void __cpuinit get_cpu_leaves(void *_retval)  	}  } -static int __cpuinit detect_cache_attributes(unsigned int cpu) +static int detect_cache_attributes(unsigned int cpu)  {  	int			retval; @@ -1017,7 +1014,7 @@ static struct attribute *default_attrs[] = {  };  #ifdef CONFIG_AMD_NB -static struct attribute ** __cpuinit amd_l3_attrs(void) +static struct attribute **amd_l3_attrs(void)  {  	static struct attribute **attrs;  	int n; @@ -1093,7 +1090,7 @@ static struct kobj_type ktype_percpu_entry = {  	.sysfs_ops	= &sysfs_ops,  }; -static void __cpuinit cpuid4_cache_sysfs_exit(unsigned int cpu) +static void cpuid4_cache_sysfs_exit(unsigned int cpu)  {  	kfree(per_cpu(ici_cache_kobject, cpu));  	kfree(per_cpu(ici_index_kobject, cpu)); @@ -1102,7 +1099,7 @@ static void __cpuinit cpuid4_cache_sysfs_exit(unsigned int cpu)  	free_cache_attributes(cpu);  } -static int __cpuinit cpuid4_cache_sysfs_init(unsigned int cpu) +static int cpuid4_cache_sysfs_init(unsigned int cpu)  {  	int err; @@ -1134,7 +1131,7 @@ err_out:  static DECLARE_BITMAP(cache_dev_map, NR_CPUS);  /* Add/Remove cache interface for CPU device */ -static int __cpuinit cache_add_dev(struct device *dev) +static int cache_add_dev(struct device *dev)  {  	unsigned int cpu = dev->id;  	unsigned long i, j; @@ -1185,7 +1182,7 @@ static int __cpuinit cache_add_dev(struct device *dev)  	return 0;  } -static void __cpuinit cache_remove_dev(struct device *dev) +static void cache_remove_dev(struct device *dev)  {  	unsigned int cpu = dev->id;  	unsigned long i; @@ -1202,8 +1199,8 @@ static void __cpuinit cache_remove_dev(struct device *dev)  	cpuid4_cache_sysfs_exit(cpu);  } -static int __cpuinit cacheinfo_cpu_callback(struct notifier_block *nfb, -					unsigned long action, void *hcpu) +static int cacheinfo_cpu_callback(struct notifier_block *nfb, +				  unsigned long action, void *hcpu)  {  	unsigned int cpu = (unsigned long)hcpu;  	struct device *dev; @@ -1222,7 +1219,7 @@ static int __cpuinit cacheinfo_cpu_callback(struct notifier_block *nfb,  	return NOTIFY_OK;  } -static struct notifier_block __cpuinitdata cacheinfo_cpu_notifier = { +static struct notifier_block cacheinfo_cpu_notifier = {  	.notifier_call = cacheinfo_cpu_callback,  }; diff --git a/arch/x86/kernel/cpu/mcheck/mce-inject.c b/arch/x86/kernel/cpu/mcheck/mce-inject.c index ddc72f83933..5ac2d1fb28b 100644 --- a/arch/x86/kernel/cpu/mcheck/mce-inject.c +++ b/arch/x86/kernel/cpu/mcheck/mce-inject.c @@ -153,7 +153,7 @@ static void raise_mce(struct mce *m)  		return;  #ifdef CONFIG_X86_LOCAL_APIC -	if (m->inject_flags & (MCJ_IRQ_BRAODCAST | MCJ_NMI_BROADCAST)) { +	if (m->inject_flags & (MCJ_IRQ_BROADCAST | MCJ_NMI_BROADCAST)) {  		unsigned long start;  		int cpu; @@ -167,7 +167,7 @@ static void raise_mce(struct mce *m)  				cpumask_clear_cpu(cpu, mce_inject_cpumask);  		}  		if (!cpumask_empty(mce_inject_cpumask)) { -			if (m->inject_flags & MCJ_IRQ_BRAODCAST) { +			if (m->inject_flags & MCJ_IRQ_BROADCAST) {  				/*  				 * don't wait because mce_irq_ipi is necessary  				 * to be sync with following raise_local diff --git a/arch/x86/kernel/cpu/mcheck/mce-severity.c b/arch/x86/kernel/cpu/mcheck/mce-severity.c index beb1f1689e5..c370e1c4468 100644 --- a/arch/x86/kernel/cpu/mcheck/mce-severity.c +++ b/arch/x86/kernel/cpu/mcheck/mce-severity.c @@ -110,22 +110,17 @@ static struct severity {  	/* known AR MCACODs: */  #ifdef	CONFIG_MEMORY_FAILURE  	MCESEV( -		KEEP, "HT thread notices Action required: data load error", -		SER, MASK(MCI_STATUS_OVER|MCI_UC_SAR|MCI_ADDR|MCACOD, MCI_UC_SAR|MCI_ADDR|MCACOD_DATA), -		MCGMASK(MCG_STATUS_EIPV, 0) +		KEEP, "Action required but unaffected thread is continuable", +		SER, MASK(MCI_STATUS_OVER|MCI_UC_SAR|MCI_ADDR, MCI_UC_SAR|MCI_ADDR), +		MCGMASK(MCG_STATUS_RIPV|MCG_STATUS_EIPV, MCG_STATUS_RIPV)  		),  	MCESEV( -		AR, "Action required: data load error", +		AR, "Action required: data load error in a user process",  		SER, MASK(MCI_STATUS_OVER|MCI_UC_SAR|MCI_ADDR|MCACOD, MCI_UC_SAR|MCI_ADDR|MCACOD_DATA),  		USER  		),  	MCESEV( -		KEEP, "HT thread notices Action required: instruction fetch error", -		SER, MASK(MCI_STATUS_OVER|MCI_UC_SAR|MCI_ADDR|MCACOD, MCI_UC_SAR|MCI_ADDR|MCACOD_INSTR), -		MCGMASK(MCG_STATUS_EIPV, 0) -		), -	MCESEV( -		AR, "Action required: instruction fetch error", +		AR, "Action required: instruction fetch error in a user process",  		SER, MASK(MCI_STATUS_OVER|MCI_UC_SAR|MCI_ADDR|MCACOD, MCI_UC_SAR|MCI_ADDR|MCACOD_INSTR),  		USER  		), diff --git a/arch/x86/kernel/cpu/mcheck/mce.c b/arch/x86/kernel/cpu/mcheck/mce.c index 9239504b41c..87a65c939bc 100644 --- a/arch/x86/kernel/cpu/mcheck/mce.c +++ b/arch/x86/kernel/cpu/mcheck/mce.c @@ -89,7 +89,10 @@ static DECLARE_WAIT_QUEUE_HEAD(mce_chrdev_wait);  static DEFINE_PER_CPU(struct mce, mces_seen);  static int			cpu_missing; -/* MCA banks polled by the period polling timer for corrected events */ +/* + * MCA banks polled by the period polling timer for corrected events. + * With Intel CMCI, this only has MCA banks which do not support CMCI (if any). + */  DEFINE_PER_CPU(mce_banks_t, mce_poll_banks) = {  	[0 ... BITS_TO_LONGS(MAX_NR_BANKS)-1] = ~0UL  }; @@ -1360,7 +1363,7 @@ int mce_notify_irq(void)  }  EXPORT_SYMBOL_GPL(mce_notify_irq); -static int __cpuinit __mcheck_cpu_mce_banks_init(void) +static int __mcheck_cpu_mce_banks_init(void)  {  	int i;  	u8 num_banks = mca_cfg.banks; @@ -1381,7 +1384,7 @@ static int __cpuinit __mcheck_cpu_mce_banks_init(void)  /*   * Initialize Machine Checks for a CPU.   */ -static int __cpuinit __mcheck_cpu_cap_init(void) +static int __mcheck_cpu_cap_init(void)  {  	unsigned b;  	u64 cap; @@ -1480,7 +1483,7 @@ static void quirk_sandybridge_ifu(int bank, struct mce *m, struct pt_regs *regs)  }  /* Add per CPU specific workarounds here */ -static int __cpuinit __mcheck_cpu_apply_quirks(struct cpuinfo_x86 *c) +static int __mcheck_cpu_apply_quirks(struct cpuinfo_x86 *c)  {  	struct mca_config *cfg = &mca_cfg; @@ -1590,7 +1593,7 @@ static int __cpuinit __mcheck_cpu_apply_quirks(struct cpuinfo_x86 *c)  	return 0;  } -static int __cpuinit __mcheck_cpu_ancient_init(struct cpuinfo_x86 *c) +static int __mcheck_cpu_ancient_init(struct cpuinfo_x86 *c)  {  	if (c->x86 != 5)  		return 0; @@ -1661,7 +1664,7 @@ void (*machine_check_vector)(struct pt_regs *, long error_code) =   * Called for each booted CPU to set up machine checks.   * Must be called with preempt off:   */ -void __cpuinit mcheck_cpu_init(struct cpuinfo_x86 *c) +void mcheck_cpu_init(struct cpuinfo_x86 *c)  {  	if (mca_cfg.disabled)  		return; @@ -2079,7 +2082,6 @@ static struct bus_type mce_subsys = {  DEFINE_PER_CPU(struct device *, mce_device); -__cpuinitdata  void (*threshold_cpu_callback)(unsigned long action, unsigned int cpu);  static inline struct mce_bank *attr_to_bank(struct device_attribute *attr) @@ -2225,7 +2227,7 @@ static void mce_device_release(struct device *dev)  }  /* Per cpu device init. All of the cpus still share the same ctrl bank: */ -static __cpuinit int mce_device_create(unsigned int cpu) +static int mce_device_create(unsigned int cpu)  {  	struct device *dev;  	int err; @@ -2271,7 +2273,7 @@ error:  	return err;  } -static __cpuinit void mce_device_remove(unsigned int cpu) +static void mce_device_remove(unsigned int cpu)  {  	struct device *dev = per_cpu(mce_device, cpu);  	int i; @@ -2291,7 +2293,7 @@ static __cpuinit void mce_device_remove(unsigned int cpu)  }  /* Make sure there are no machine checks on offlined CPUs. */ -static void __cpuinit mce_disable_cpu(void *h) +static void mce_disable_cpu(void *h)  {  	unsigned long action = *(unsigned long *)h;  	int i; @@ -2309,7 +2311,7 @@ static void __cpuinit mce_disable_cpu(void *h)  	}  } -static void __cpuinit mce_reenable_cpu(void *h) +static void mce_reenable_cpu(void *h)  {  	unsigned long action = *(unsigned long *)h;  	int i; @@ -2328,7 +2330,7 @@ static void __cpuinit mce_reenable_cpu(void *h)  }  /* Get notified when a cpu comes on/off. Be hotplug friendly. */ -static int __cpuinit +static int  mce_cpu_callback(struct notifier_block *nfb, unsigned long action, void *hcpu)  {  	unsigned int cpu = (unsigned long)hcpu; @@ -2364,7 +2366,7 @@ mce_cpu_callback(struct notifier_block *nfb, unsigned long action, void *hcpu)  	return NOTIFY_OK;  } -static struct notifier_block mce_cpu_notifier __cpuinitdata = { +static struct notifier_block mce_cpu_notifier = {  	.notifier_call = mce_cpu_callback,  }; diff --git a/arch/x86/kernel/cpu/mcheck/mce_amd.c b/arch/x86/kernel/cpu/mcheck/mce_amd.c index 9cb52767999..603df4f7464 100644 --- a/arch/x86/kernel/cpu/mcheck/mce_amd.c +++ b/arch/x86/kernel/cpu/mcheck/mce_amd.c @@ -458,10 +458,8 @@ static struct kobj_type threshold_ktype = {  	.default_attrs		= default_attrs,  }; -static __cpuinit int allocate_threshold_blocks(unsigned int cpu, -					       unsigned int bank, -					       unsigned int block, -					       u32 address) +static int allocate_threshold_blocks(unsigned int cpu, unsigned int bank, +				     unsigned int block, u32 address)  {  	struct threshold_block *b = NULL;  	u32 low, high; @@ -543,7 +541,7 @@ out_free:  	return err;  } -static __cpuinit int __threshold_add_blocks(struct threshold_bank *b) +static int __threshold_add_blocks(struct threshold_bank *b)  {  	struct list_head *head = &b->blocks->miscj;  	struct threshold_block *pos = NULL; @@ -567,7 +565,7 @@ static __cpuinit int __threshold_add_blocks(struct threshold_bank *b)  	return err;  } -static __cpuinit int threshold_create_bank(unsigned int cpu, unsigned int bank) +static int threshold_create_bank(unsigned int cpu, unsigned int bank)  {  	struct device *dev = per_cpu(mce_device, cpu);  	struct amd_northbridge *nb = NULL; @@ -632,7 +630,7 @@ static __cpuinit int threshold_create_bank(unsigned int cpu, unsigned int bank)  }  /* create dir/files for all valid threshold banks */ -static __cpuinit int threshold_create_device(unsigned int cpu) +static int threshold_create_device(unsigned int cpu)  {  	unsigned int bank;  	struct threshold_bank **bp; @@ -736,7 +734,7 @@ static void threshold_remove_device(unsigned int cpu)  }  /* get notified when a cpu comes on/off */ -static void __cpuinit +static void  amd_64_threshold_cpu_callback(unsigned long action, unsigned int cpu)  {  	switch (action) { diff --git a/arch/x86/kernel/cpu/mcheck/mce_intel.c b/arch/x86/kernel/cpu/mcheck/mce_intel.c index ae1697c2afe..d56405309dc 100644 --- a/arch/x86/kernel/cpu/mcheck/mce_intel.c +++ b/arch/x86/kernel/cpu/mcheck/mce_intel.c @@ -24,6 +24,18 @@   * Also supports reliable discovery of shared banks.   */ +/* + * CMCI can be delivered to multiple cpus that share a machine check bank + * so we need to designate a single cpu to process errors logged in each bank + * in the interrupt handler (otherwise we would have many races and potential + * double reporting of the same error). + * Note that this can change when a cpu is offlined or brought online since + * some MCA banks are shared across cpus. When a cpu is offlined, cmci_clear() + * disables CMCI on all banks owned by the cpu and clears this bitfield. At + * this point, cmci_rediscover() kicks in and a different cpu may end up + * taking ownership of some of the shared MCA banks that were previously + * owned by the offlined cpu. + */  static DEFINE_PER_CPU(mce_banks_t, mce_banks_owned);  /* diff --git a/arch/x86/kernel/cpu/mcheck/therm_throt.c b/arch/x86/kernel/cpu/mcheck/therm_throt.c index 47a1870279a..3eec7de76ef 100644 --- a/arch/x86/kernel/cpu/mcheck/therm_throt.c +++ b/arch/x86/kernel/cpu/mcheck/therm_throt.c @@ -29,6 +29,7 @@  #include <asm/idle.h>  #include <asm/mce.h>  #include <asm/msr.h> +#include <asm/trace/irq_vectors.h>  /* How long to wait between reporting thermal events */  #define CHECK_INTERVAL		(300 * HZ) @@ -54,12 +55,24 @@ struct thermal_state {  	struct _thermal_state package_power_limit;  	struct _thermal_state core_thresh0;  	struct _thermal_state core_thresh1; +	struct _thermal_state pkg_thresh0; +	struct _thermal_state pkg_thresh1;  };  /* Callback to handle core threshold interrupts */  int (*platform_thermal_notify)(__u64 msr_val);  EXPORT_SYMBOL(platform_thermal_notify); +/* Callback to handle core package threshold_interrupts */ +int (*platform_thermal_package_notify)(__u64 msr_val); +EXPORT_SYMBOL_GPL(platform_thermal_package_notify); + +/* Callback support of rate control, return true, if + * callback has rate control */ +bool (*platform_thermal_package_rate_control)(void); +EXPORT_SYMBOL_GPL(platform_thermal_package_rate_control); + +  static DEFINE_PER_CPU(struct thermal_state, thermal_state);  static atomic_t therm_throt_en	= ATOMIC_INIT(0); @@ -181,11 +194,6 @@ static int therm_throt_process(bool new_event, int event, int level)  				this_cpu,  				level == CORE_LEVEL ? "Core" : "Package",  				state->count); -		else -			printk(KERN_CRIT "CPU%d: %s power limit notification (total events = %lu)\n", -				this_cpu, -				level == CORE_LEVEL ? "Core" : "Package", -				state->count);  		return 1;  	}  	if (old_event) { @@ -193,36 +201,46 @@ static int therm_throt_process(bool new_event, int event, int level)  			printk(KERN_INFO "CPU%d: %s temperature/speed normal\n",  				this_cpu,  				level == CORE_LEVEL ? "Core" : "Package"); -		else -			printk(KERN_INFO "CPU%d: %s power limit normal\n", -				this_cpu, -				level == CORE_LEVEL ? "Core" : "Package");  		return 1;  	}  	return 0;  } -static int thresh_event_valid(int event) +static int thresh_event_valid(int level, int event)  {  	struct _thermal_state *state;  	unsigned int this_cpu = smp_processor_id();  	struct thermal_state *pstate = &per_cpu(thermal_state, this_cpu);  	u64 now = get_jiffies_64(); -	state = (event == 0) ? &pstate->core_thresh0 : &pstate->core_thresh1; +	if (level == PACKAGE_LEVEL) +		state = (event == 0) ? &pstate->pkg_thresh0 : +						&pstate->pkg_thresh1; +	else +		state = (event == 0) ? &pstate->core_thresh0 : +						&pstate->core_thresh1;  	if (time_before64(now, state->next_check))  		return 0;  	state->next_check = now + CHECK_INTERVAL; + +	return 1; +} + +static bool int_pln_enable; +static int __init int_pln_enable_setup(char *s) +{ +	int_pln_enable = true; +  	return 1;  } +__setup("int_pln_enable", int_pln_enable_setup);  #ifdef CONFIG_SYSFS  /* Add/Remove thermal_throttle interface for CPU device: */ -static __cpuinit int thermal_throttle_add_dev(struct device *dev, -				unsigned int cpu) +static int thermal_throttle_add_dev(struct device *dev, unsigned int cpu)  {  	int err;  	struct cpuinfo_x86 *c = &cpu_data(cpu); @@ -231,7 +249,7 @@ static __cpuinit int thermal_throttle_add_dev(struct device *dev,  	if (err)  		return err; -	if (cpu_has(c, X86_FEATURE_PLN)) +	if (cpu_has(c, X86_FEATURE_PLN) && int_pln_enable)  		err = sysfs_add_file_to_group(&dev->kobj,  					      &dev_attr_core_power_limit_count.attr,  					      thermal_attr_group.name); @@ -239,7 +257,7 @@ static __cpuinit int thermal_throttle_add_dev(struct device *dev,  		err = sysfs_add_file_to_group(&dev->kobj,  					      &dev_attr_package_throttle_count.attr,  					      thermal_attr_group.name); -		if (cpu_has(c, X86_FEATURE_PLN)) +		if (cpu_has(c, X86_FEATURE_PLN) && int_pln_enable)  			err = sysfs_add_file_to_group(&dev->kobj,  					&dev_attr_package_power_limit_count.attr,  					thermal_attr_group.name); @@ -248,7 +266,7 @@ static __cpuinit int thermal_throttle_add_dev(struct device *dev,  	return err;  } -static __cpuinit void thermal_throttle_remove_dev(struct device *dev) +static void thermal_throttle_remove_dev(struct device *dev)  {  	sysfs_remove_group(&dev->kobj, &thermal_attr_group);  } @@ -257,7 +275,7 @@ static __cpuinit void thermal_throttle_remove_dev(struct device *dev)  static DEFINE_MUTEX(therm_cpu_lock);  /* Get notified when a cpu comes on/off. Be hotplug friendly. */ -static __cpuinit int +static int  thermal_throttle_cpu_callback(struct notifier_block *nfb,  			      unsigned long action,  			      void *hcpu) @@ -288,7 +306,7 @@ thermal_throttle_cpu_callback(struct notifier_block *nfb,  	return notifier_from_errno(err);  } -static struct notifier_block thermal_throttle_cpu_notifier __cpuinitdata = +static struct notifier_block thermal_throttle_cpu_notifier =  {  	.notifier_call = thermal_throttle_cpu_callback,  }; @@ -321,6 +339,39 @@ device_initcall(thermal_throttle_init_device);  #endif /* CONFIG_SYSFS */ +static void notify_package_thresholds(__u64 msr_val) +{ +	bool notify_thres_0 = false; +	bool notify_thres_1 = false; + +	if (!platform_thermal_package_notify) +		return; + +	/* lower threshold check */ +	if (msr_val & THERM_LOG_THRESHOLD0) +		notify_thres_0 = true; +	/* higher threshold check */ +	if (msr_val & THERM_LOG_THRESHOLD1) +		notify_thres_1 = true; + +	if (!notify_thres_0 && !notify_thres_1) +		return; + +	if (platform_thermal_package_rate_control && +		platform_thermal_package_rate_control()) { +		/* Rate control is implemented in callback */ +		platform_thermal_package_notify(msr_val); +		return; +	} + +	/* lower threshold reached */ +	if (notify_thres_0 && thresh_event_valid(PACKAGE_LEVEL, 0)) +		platform_thermal_package_notify(msr_val); +	/* higher threshold reached */ +	if (notify_thres_1 && thresh_event_valid(PACKAGE_LEVEL, 1)) +		platform_thermal_package_notify(msr_val); +} +  static void notify_thresholds(__u64 msr_val)  {  	/* check whether the interrupt handler is defined; @@ -330,10 +381,12 @@ static void notify_thresholds(__u64 msr_val)  		return;  	/* lower threshold reached */ -	if ((msr_val & THERM_LOG_THRESHOLD0) &&	thresh_event_valid(0)) +	if ((msr_val & THERM_LOG_THRESHOLD0) && +			thresh_event_valid(CORE_LEVEL, 0))  		platform_thermal_notify(msr_val);  	/* higher threshold reached */ -	if ((msr_val & THERM_LOG_THRESHOLD1) && thresh_event_valid(1)) +	if ((msr_val & THERM_LOG_THRESHOLD1) && +			thresh_event_valid(CORE_LEVEL, 1))  		platform_thermal_notify(msr_val);  } @@ -352,17 +405,19 @@ static void intel_thermal_interrupt(void)  				CORE_LEVEL) != 0)  		mce_log_therm_throt_event(msr_val); -	if (this_cpu_has(X86_FEATURE_PLN)) +	if (this_cpu_has(X86_FEATURE_PLN) && int_pln_enable)  		therm_throt_process(msr_val & THERM_STATUS_POWER_LIMIT,  					POWER_LIMIT_EVENT,  					CORE_LEVEL);  	if (this_cpu_has(X86_FEATURE_PTS)) {  		rdmsrl(MSR_IA32_PACKAGE_THERM_STATUS, msr_val); +		/* check violations of package thermal thresholds */ +		notify_package_thresholds(msr_val);  		therm_throt_process(msr_val & PACKAGE_THERM_STATUS_PROCHOT,  					THERMAL_THROTTLING_EVENT,  					PACKAGE_LEVEL); -		if (this_cpu_has(X86_FEATURE_PLN)) +		if (this_cpu_has(X86_FEATURE_PLN) && int_pln_enable)  			therm_throt_process(msr_val &  					PACKAGE_THERM_STATUS_POWER_LIMIT,  					POWER_LIMIT_EVENT, @@ -378,15 +433,26 @@ static void unexpected_thermal_interrupt(void)  static void (*smp_thermal_vector)(void) = unexpected_thermal_interrupt; -asmlinkage void smp_thermal_interrupt(struct pt_regs *regs) +static inline void __smp_thermal_interrupt(void)  { -	irq_enter(); -	exit_idle();  	inc_irq_stat(irq_thermal_count);  	smp_thermal_vector(); -	irq_exit(); -	/* Ack only at the end to avoid potential reentry */ -	ack_APIC_irq(); +} + +asmlinkage void smp_thermal_interrupt(struct pt_regs *regs) +{ +	entering_irq(); +	__smp_thermal_interrupt(); +	exiting_ack_irq(); +} + +asmlinkage void smp_trace_thermal_interrupt(struct pt_regs *regs) +{ +	entering_irq(); +	trace_thermal_apic_entry(THERMAL_APIC_VECTOR); +	__smp_thermal_interrupt(); +	trace_thermal_apic_exit(THERMAL_APIC_VECTOR); +	exiting_ack_irq();  }  /* Thermal monitoring depends on APIC, ACPI and clock modulation */ @@ -470,9 +536,13 @@ void intel_init_thermal(struct cpuinfo_x86 *c)  	apic_write(APIC_LVTTHMR, h);  	rdmsr(MSR_IA32_THERM_INTERRUPT, l, h); -	if (cpu_has(c, X86_FEATURE_PLN)) +	if (cpu_has(c, X86_FEATURE_PLN) && !int_pln_enable) +		wrmsr(MSR_IA32_THERM_INTERRUPT, +			(l | (THERM_INT_LOW_ENABLE +			| THERM_INT_HIGH_ENABLE)) & ~THERM_INT_PLN_ENABLE, h); +	else if (cpu_has(c, X86_FEATURE_PLN) && int_pln_enable)  		wrmsr(MSR_IA32_THERM_INTERRUPT, -		      l | (THERM_INT_LOW_ENABLE +			l | (THERM_INT_LOW_ENABLE  			| THERM_INT_HIGH_ENABLE | THERM_INT_PLN_ENABLE), h);  	else  		wrmsr(MSR_IA32_THERM_INTERRUPT, @@ -480,9 +550,14 @@ void intel_init_thermal(struct cpuinfo_x86 *c)  	if (cpu_has(c, X86_FEATURE_PTS)) {  		rdmsr(MSR_IA32_PACKAGE_THERM_INTERRUPT, l, h); -		if (cpu_has(c, X86_FEATURE_PLN)) +		if (cpu_has(c, X86_FEATURE_PLN) && !int_pln_enable)  			wrmsr(MSR_IA32_PACKAGE_THERM_INTERRUPT, -			      l | (PACKAGE_THERM_INT_LOW_ENABLE +				(l | (PACKAGE_THERM_INT_LOW_ENABLE +				| PACKAGE_THERM_INT_HIGH_ENABLE)) +				& ~PACKAGE_THERM_INT_PLN_ENABLE, h); +		else if (cpu_has(c, X86_FEATURE_PLN) && int_pln_enable) +			wrmsr(MSR_IA32_PACKAGE_THERM_INTERRUPT, +				l | (PACKAGE_THERM_INT_LOW_ENABLE  				| PACKAGE_THERM_INT_HIGH_ENABLE  				| PACKAGE_THERM_INT_PLN_ENABLE), h);  		else diff --git a/arch/x86/kernel/cpu/mcheck/threshold.c b/arch/x86/kernel/cpu/mcheck/threshold.c index aa578cadb94..fe6b1c86645 100644 --- a/arch/x86/kernel/cpu/mcheck/threshold.c +++ b/arch/x86/kernel/cpu/mcheck/threshold.c @@ -8,6 +8,7 @@  #include <asm/apic.h>  #include <asm/idle.h>  #include <asm/mce.h> +#include <asm/trace/irq_vectors.h>  static void default_threshold_interrupt(void)  { @@ -17,13 +18,24 @@ static void default_threshold_interrupt(void)  void (*mce_threshold_vector)(void) = default_threshold_interrupt; -asmlinkage void smp_threshold_interrupt(void) +static inline void __smp_threshold_interrupt(void)  { -	irq_enter(); -	exit_idle();  	inc_irq_stat(irq_threshold_count);  	mce_threshold_vector(); -	irq_exit(); -	/* Ack only at the end to avoid potential reentry */ -	ack_APIC_irq(); +} + +asmlinkage void smp_threshold_interrupt(void) +{ +	entering_irq(); +	__smp_threshold_interrupt(); +	exiting_ack_irq(); +} + +asmlinkage void smp_trace_threshold_interrupt(void) +{ +	entering_irq(); +	trace_threshold_apic_entry(THRESHOLD_APIC_VECTOR); +	__smp_threshold_interrupt(); +	trace_threshold_apic_exit(THRESHOLD_APIC_VECTOR); +	exiting_ack_irq();  } diff --git a/arch/x86/kernel/cpu/mtrr/cyrix.c b/arch/x86/kernel/cpu/mtrr/cyrix.c index 68a3343e579..9e451b0876b 100644 --- a/arch/x86/kernel/cpu/mtrr/cyrix.c +++ b/arch/x86/kernel/cpu/mtrr/cyrix.c @@ -167,7 +167,7 @@ static void post_set(void)  	setCx86(CX86_CCR3, ccr3);  	/* Enable caches */ -	write_cr0(read_cr0() & 0xbfffffff); +	write_cr0(read_cr0() & ~X86_CR0_CD);  	/* Restore value of CR4 */  	if (cpu_has_pge) diff --git a/arch/x86/kernel/cpu/mtrr/generic.c b/arch/x86/kernel/cpu/mtrr/generic.c index fa72a39e5d4..d4cdfa67509 100644 --- a/arch/x86/kernel/cpu/mtrr/generic.c +++ b/arch/x86/kernel/cpu/mtrr/generic.c @@ -510,8 +510,9 @@ generic_get_free_region(unsigned long base, unsigned long size, int replace_reg)  static void generic_get_mtrr(unsigned int reg, unsigned long *base,  			     unsigned long *size, mtrr_type *type)  { -	unsigned int mask_lo, mask_hi, base_lo, base_hi; -	unsigned int tmp, hi; +	u32 mask_lo, mask_hi, base_lo, base_hi; +	unsigned int hi; +	u64 tmp, mask;  	/*  	 * get_mtrr doesn't need to update mtrr_state, also it could be called @@ -532,18 +533,18 @@ static void generic_get_mtrr(unsigned int reg, unsigned long *base,  	rdmsr(MTRRphysBase_MSR(reg), base_lo, base_hi);  	/* Work out the shifted address mask: */ -	tmp = mask_hi << (32 - PAGE_SHIFT) | mask_lo >> PAGE_SHIFT; -	mask_lo = size_or_mask | tmp; +	tmp = (u64)mask_hi << (32 - PAGE_SHIFT) | mask_lo >> PAGE_SHIFT; +	mask = size_or_mask | tmp;  	/* Expand tmp with high bits to all 1s: */ -	hi = fls(tmp); +	hi = fls64(tmp);  	if (hi > 0) { -		tmp |= ~((1<<(hi - 1)) - 1); +		tmp |= ~((1ULL<<(hi - 1)) - 1); -		if (tmp != mask_lo) { +		if (tmp != mask) {  			printk(KERN_WARNING "mtrr: your BIOS has configured an incorrect mask, fixing it.\n");  			add_taint(TAINT_FIRMWARE_WORKAROUND, LOCKDEP_STILL_OK); -			mask_lo = tmp; +			mask = tmp;  		}  	} @@ -551,8 +552,8 @@ static void generic_get_mtrr(unsigned int reg, unsigned long *base,  	 * This works correctly if size is a power of two, i.e. a  	 * contiguous range:  	 */ -	*size = -mask_lo; -	*base = base_hi << (32 - PAGE_SHIFT) | base_lo >> PAGE_SHIFT; +	*size = -mask; +	*base = (u64)base_hi << (32 - PAGE_SHIFT) | base_lo >> PAGE_SHIFT;  	*type = base_lo & 0xff;  out_put_cpu: @@ -701,7 +702,7 @@ static void post_set(void) __releases(set_atomicity_lock)  	mtrr_wrmsr(MSR_MTRRdefType, deftype_lo, deftype_hi);  	/* Enable caches */ -	write_cr0(read_cr0() & 0xbfffffff); +	write_cr0(read_cr0() & ~X86_CR0_CD);  	/* Restore value of CR4 */  	if (cpu_has_pge) diff --git a/arch/x86/kernel/cpu/mtrr/main.c b/arch/x86/kernel/cpu/mtrr/main.c index 726bf963c22..f961de9964c 100644 --- a/arch/x86/kernel/cpu/mtrr/main.c +++ b/arch/x86/kernel/cpu/mtrr/main.c @@ -51,9 +51,13 @@  #include <asm/e820.h>  #include <asm/mtrr.h>  #include <asm/msr.h> +#include <asm/pat.h>  #include "mtrr.h" +/* arch_phys_wc_add returns an MTRR register index plus this offset. */ +#define MTRR_TO_PHYS_WC_OFFSET 1000 +  u32 num_var_ranges;  unsigned int mtrr_usage_table[MTRR_MAX_VAR_RANGES]; @@ -305,7 +309,8 @@ int mtrr_add_page(unsigned long base, unsigned long size,  		return -EINVAL;  	} -	if (base & size_or_mask || size & size_or_mask) { +	if ((base | (base + size - 1)) >> +	    (boot_cpu_data.x86_phys_bits - PAGE_SHIFT)) {  		pr_warning("mtrr: base or size exceeds the MTRR width\n");  		return -EINVAL;  	} @@ -524,6 +529,73 @@ int mtrr_del(int reg, unsigned long base, unsigned long size)  }  EXPORT_SYMBOL(mtrr_del); +/** + * arch_phys_wc_add - add a WC MTRR and handle errors if PAT is unavailable + * @base: Physical base address + * @size: Size of region + * + * If PAT is available, this does nothing.  If PAT is unavailable, it + * attempts to add a WC MTRR covering size bytes starting at base and + * logs an error if this fails. + * + * Drivers must store the return value to pass to mtrr_del_wc_if_needed, + * but drivers should not try to interpret that return value. + */ +int arch_phys_wc_add(unsigned long base, unsigned long size) +{ +	int ret; + +	if (pat_enabled) +		return 0;  /* Success!  (We don't need to do anything.) */ + +	ret = mtrr_add(base, size, MTRR_TYPE_WRCOMB, true); +	if (ret < 0) { +		pr_warn("Failed to add WC MTRR for [%p-%p]; performance may suffer.", +			(void *)base, (void *)(base + size - 1)); +		return ret; +	} +	return ret + MTRR_TO_PHYS_WC_OFFSET; +} +EXPORT_SYMBOL(arch_phys_wc_add); + +/* + * arch_phys_wc_del - undoes arch_phys_wc_add + * @handle: Return value from arch_phys_wc_add + * + * This cleans up after mtrr_add_wc_if_needed. + * + * The API guarantees that mtrr_del_wc_if_needed(error code) and + * mtrr_del_wc_if_needed(0) do nothing. + */ +void arch_phys_wc_del(int handle) +{ +	if (handle >= 1) { +		WARN_ON(handle < MTRR_TO_PHYS_WC_OFFSET); +		mtrr_del(handle - MTRR_TO_PHYS_WC_OFFSET, 0, 0); +	} +} +EXPORT_SYMBOL(arch_phys_wc_del); + +/* + * phys_wc_to_mtrr_index - translates arch_phys_wc_add's return value + * @handle: Return value from arch_phys_wc_add + * + * This will turn the return value from arch_phys_wc_add into an mtrr + * index suitable for debugging. + * + * Note: There is no legitimate use for this function, except possibly + * in printk line.  Alas there is an illegitimate use in some ancient + * drm ioctls. + */ +int phys_wc_to_mtrr_index(int handle) +{ +	if (handle < MTRR_TO_PHYS_WC_OFFSET) +		return -1; +	else +		return handle - MTRR_TO_PHYS_WC_OFFSET; +} +EXPORT_SYMBOL_GPL(phys_wc_to_mtrr_index); +  /*   * HACK ALERT!   * These should be called implicitly, but we can't yet until all the initcall @@ -583,6 +655,7 @@ static struct syscore_ops mtrr_syscore_ops = {  int __initdata changed_by_mtrr_cleanup; +#define SIZE_OR_MASK_BITS(n)  (~((1ULL << ((n) - PAGE_SHIFT)) - 1))  /**   * mtrr_bp_init - initialize mtrrs on the boot CPU   * @@ -600,7 +673,7 @@ void __init mtrr_bp_init(void)  	if (cpu_has_mtrr) {  		mtrr_if = &generic_mtrr_ops; -		size_or_mask = 0xff000000;			/* 36 bits */ +		size_or_mask = SIZE_OR_MASK_BITS(36);  		size_and_mask = 0x00f00000;  		phys_addr = 36; @@ -619,7 +692,7 @@ void __init mtrr_bp_init(void)  			     boot_cpu_data.x86_mask == 0x4))  				phys_addr = 36; -			size_or_mask = ~((1ULL << (phys_addr - PAGE_SHIFT)) - 1); +			size_or_mask = SIZE_OR_MASK_BITS(phys_addr);  			size_and_mask = ~size_or_mask & 0xfffff00000ULL;  		} else if (boot_cpu_data.x86_vendor == X86_VENDOR_CENTAUR &&  			   boot_cpu_data.x86 == 6) { @@ -627,7 +700,7 @@ void __init mtrr_bp_init(void)  			 * VIA C* family have Intel style MTRRs,  			 * but don't support PAE  			 */ -			size_or_mask = 0xfff00000;		/* 32 bits */ +			size_or_mask = SIZE_OR_MASK_BITS(32);  			size_and_mask = 0;  			phys_addr = 32;  		} @@ -637,21 +710,21 @@ void __init mtrr_bp_init(void)  			if (cpu_has_k6_mtrr) {  				/* Pre-Athlon (K6) AMD CPU MTRRs */  				mtrr_if = mtrr_ops[X86_VENDOR_AMD]; -				size_or_mask = 0xfff00000;	/* 32 bits */ +				size_or_mask = SIZE_OR_MASK_BITS(32);  				size_and_mask = 0;  			}  			break;  		case X86_VENDOR_CENTAUR:  			if (cpu_has_centaur_mcr) {  				mtrr_if = mtrr_ops[X86_VENDOR_CENTAUR]; -				size_or_mask = 0xfff00000;	/* 32 bits */ +				size_or_mask = SIZE_OR_MASK_BITS(32);  				size_and_mask = 0;  			}  			break;  		case X86_VENDOR_CYRIX:  			if (cpu_has_cyrix_arr) {  				mtrr_if = mtrr_ops[X86_VENDOR_CYRIX]; -				size_or_mask = 0xfff00000;	/* 32 bits */ +				size_or_mask = SIZE_OR_MASK_BITS(32);  				size_and_mask = 0;  			}  			break; diff --git a/arch/x86/kernel/cpu/perf_event.c b/arch/x86/kernel/cpu/perf_event.c index 1025f3c99d2..a7c7305030c 100644 --- a/arch/x86/kernel/cpu/perf_event.c +++ b/arch/x86/kernel/cpu/perf_event.c @@ -403,7 +403,8 @@ int x86_pmu_hw_config(struct perf_event *event)  		 * check that PEBS LBR correction does not conflict with  		 * whatever the user is asking with attr->branch_sample_type  		 */ -		if (event->attr.precise_ip > 1) { +		if (event->attr.precise_ip > 1 && +		    x86_pmu.intel_cap.pebs_format < 2) {  			u64 *br_type = &event->attr.branch_sample_type;  			if (has_branch_stack(event)) { @@ -568,7 +569,7 @@ struct sched_state {  struct perf_sched {  	int			max_weight;  	int			max_events; -	struct event_constraint	**constraints; +	struct perf_event	**events;  	struct sched_state	state;  	int			saved_states;  	struct sched_state	saved[SCHED_STATES_MAX]; @@ -577,7 +578,7 @@ struct perf_sched {  /*   * Initialize interator that runs through all events and counters.   */ -static void perf_sched_init(struct perf_sched *sched, struct event_constraint **c, +static void perf_sched_init(struct perf_sched *sched, struct perf_event **events,  			    int num, int wmin, int wmax)  {  	int idx; @@ -585,10 +586,10 @@ static void perf_sched_init(struct perf_sched *sched, struct event_constraint **  	memset(sched, 0, sizeof(*sched));  	sched->max_events	= num;  	sched->max_weight	= wmax; -	sched->constraints	= c; +	sched->events		= events;  	for (idx = 0; idx < num; idx++) { -		if (c[idx]->weight == wmin) +		if (events[idx]->hw.constraint->weight == wmin)  			break;  	} @@ -635,8 +636,7 @@ static bool __perf_sched_find_counter(struct perf_sched *sched)  	if (sched->state.event >= sched->max_events)  		return false; -	c = sched->constraints[sched->state.event]; - +	c = sched->events[sched->state.event]->hw.constraint;  	/* Prefer fixed purpose counters */  	if (c->idxmsk64 & (~0ULL << INTEL_PMC_IDX_FIXED)) {  		idx = INTEL_PMC_IDX_FIXED; @@ -694,7 +694,7 @@ static bool perf_sched_next_event(struct perf_sched *sched)  			if (sched->state.weight > sched->max_weight)  				return false;  		} -		c = sched->constraints[sched->state.event]; +		c = sched->events[sched->state.event]->hw.constraint;  	} while (c->weight != sched->state.weight);  	sched->state.counter = 0;	/* start with first counter */ @@ -705,12 +705,12 @@ static bool perf_sched_next_event(struct perf_sched *sched)  /*   * Assign a counter for each event.   */ -int perf_assign_events(struct event_constraint **constraints, int n, +int perf_assign_events(struct perf_event **events, int n,  			int wmin, int wmax, int *assign)  {  	struct perf_sched sched; -	perf_sched_init(&sched, constraints, n, wmin, wmax); +	perf_sched_init(&sched, events, n, wmin, wmax);  	do {  		if (!perf_sched_find_counter(&sched)) @@ -724,16 +724,19 @@ int perf_assign_events(struct event_constraint **constraints, int n,  int x86_schedule_events(struct cpu_hw_events *cpuc, int n, int *assign)  { -	struct event_constraint *c, *constraints[X86_PMC_IDX_MAX]; +	struct event_constraint *c;  	unsigned long used_mask[BITS_TO_LONGS(X86_PMC_IDX_MAX)]; +	struct perf_event *e;  	int i, wmin, wmax, num = 0;  	struct hw_perf_event *hwc;  	bitmap_zero(used_mask, X86_PMC_IDX_MAX);  	for (i = 0, wmin = X86_PMC_IDX_MAX, wmax = 0; i < n; i++) { +		hwc = &cpuc->event_list[i]->hw;  		c = x86_pmu.get_event_constraints(cpuc, cpuc->event_list[i]); -		constraints[i] = c; +		hwc->constraint = c; +  		wmin = min(wmin, c->weight);  		wmax = max(wmax, c->weight);  	} @@ -743,7 +746,7 @@ int x86_schedule_events(struct cpu_hw_events *cpuc, int n, int *assign)  	 */  	for (i = 0; i < n; i++) {  		hwc = &cpuc->event_list[i]->hw; -		c = constraints[i]; +		c = hwc->constraint;  		/* never assigned */  		if (hwc->idx == -1) @@ -764,16 +767,35 @@ int x86_schedule_events(struct cpu_hw_events *cpuc, int n, int *assign)  	/* slow path */  	if (i != n) -		num = perf_assign_events(constraints, n, wmin, wmax, assign); +		num = perf_assign_events(cpuc->event_list, n, wmin, +					 wmax, assign);  	/* +	 * Mark the event as committed, so we do not put_constraint() +	 * in case new events are added and fail scheduling. +	 */ +	if (!num && assign) { +		for (i = 0; i < n; i++) { +			e = cpuc->event_list[i]; +			e->hw.flags |= PERF_X86_EVENT_COMMITTED; +		} +	} +	/*  	 * scheduling failed or is just a simulation,  	 * free resources if necessary  	 */  	if (!assign || num) {  		for (i = 0; i < n; i++) { +			e = cpuc->event_list[i]; +			/* +			 * do not put_constraint() on comitted events, +			 * because they are good to go +			 */ +			if ((e->hw.flags & PERF_X86_EVENT_COMMITTED)) +				continue; +  			if (x86_pmu.put_event_constraints) -				x86_pmu.put_event_constraints(cpuc, cpuc->event_list[i]); +				x86_pmu.put_event_constraints(cpuc, e);  		}  	}  	return num ? -EINVAL : 0; @@ -1153,6 +1175,11 @@ static void x86_pmu_del(struct perf_event *event, int flags)  	int i;  	/* +	 * event is descheduled +	 */ +	event->hw.flags &= ~PERF_X86_EVENT_COMMITTED; + +	/*  	 * If we're called during a txn, we don't need to do anything.  	 * The events never got scheduled and ->cancel_txn will truncate  	 * the event_list. @@ -1249,16 +1276,26 @@ void perf_events_lapic_init(void)  static int __kprobes  perf_event_nmi_handler(unsigned int cmd, struct pt_regs *regs)  { +	int ret; +	u64 start_clock; +	u64 finish_clock; +  	if (!atomic_read(&active_events))  		return NMI_DONE; -	return x86_pmu.handle_irq(regs); +	start_clock = local_clock(); +	ret = x86_pmu.handle_irq(regs); +	finish_clock = local_clock(); + +	perf_sample_event_took(finish_clock - start_clock); + +	return ret;  }  struct event_constraint emptyconstraint;  struct event_constraint unconstrained; -static int __cpuinit +static int  x86_pmu_notifier(struct notifier_block *self, unsigned long action, void *hcpu)  {  	unsigned int cpu = (long)hcpu; diff --git a/arch/x86/kernel/cpu/perf_event.h b/arch/x86/kernel/cpu/perf_event.h index ba9aadfa683..97e557bc4c9 100644 --- a/arch/x86/kernel/cpu/perf_event.h +++ b/arch/x86/kernel/cpu/perf_event.h @@ -63,10 +63,12 @@ struct event_constraint {  	int	flags;  };  /* - * struct event_constraint flags + * struct hw_perf_event.flags flags   */  #define PERF_X86_EVENT_PEBS_LDLAT	0x1 /* ld+ldlat data address sampling */  #define PERF_X86_EVENT_PEBS_ST		0x2 /* st data address sampling */ +#define PERF_X86_EVENT_PEBS_ST_HSW	0x4 /* haswell style st data sampling */ +#define PERF_X86_EVENT_COMMITTED	0x8 /* event passed commit_txn */  struct amd_nb {  	int nb_id;  /* NorthBridge id */ @@ -227,11 +229,14 @@ struct cpu_hw_events {   *  - inv   *  - edge   *  - cnt-mask + *  - in_tx + *  - in_tx_checkpointed   *  The other filters are supported by fixed counters.   *  The any-thread option is supported starting with v3.   */ +#define FIXED_EVENT_FLAGS (X86_RAW_EVENT_MASK|HSW_IN_TX|HSW_IN_TX_CHECKPOINTED)  #define FIXED_EVENT_CONSTRAINT(c, n)	\ -	EVENT_CONSTRAINT(c, (1ULL << (32+n)), X86_RAW_EVENT_MASK) +	EVENT_CONSTRAINT(c, (1ULL << (32+n)), FIXED_EVENT_FLAGS)  /*   * Constraint on the Event code + UMask @@ -247,6 +252,11 @@ struct cpu_hw_events {  	__EVENT_CONSTRAINT(c, n, INTEL_ARCH_EVENT_MASK, \  			  HWEIGHT(n), 0, PERF_X86_EVENT_PEBS_ST) +/* DataLA version of store sampling without extra enable bit. */ +#define INTEL_PST_HSW_CONSTRAINT(c, n)	\ +	__EVENT_CONSTRAINT(c, n, INTEL_ARCH_EVENT_MASK, \ +			  HWEIGHT(n), 0, PERF_X86_EVENT_PEBS_ST_HSW) +  #define EVENT_CONSTRAINT_END		\  	EVENT_CONSTRAINT(0, 0, 0) @@ -301,6 +311,11 @@ union perf_capabilities {  		u64	pebs_arch_reg:1;  		u64	pebs_format:4;  		u64	smm_freeze:1; +		/* +		 * PMU supports separate counter range for writing +		 * values > 32bit. +		 */ +		u64	full_width_write:1;  	};  	u64	capabilities;  }; @@ -375,6 +390,7 @@ struct x86_pmu {  	struct event_constraint *event_constraints;  	struct x86_pmu_quirk *quirks;  	int		perfctr_second_write; +	bool		late_ack;  	/*  	 * sysfs attrs @@ -528,7 +544,7 @@ static inline void __x86_pmu_enable_event(struct hw_perf_event *hwc,  void x86_pmu_enable_all(int added); -int perf_assign_events(struct event_constraint **constraints, int n, +int perf_assign_events(struct perf_event **events, int n,  			int wmin, int wmax, int *assign);  int x86_schedule_events(struct cpu_hw_events *cpuc, int n, int *assign); @@ -633,6 +649,8 @@ extern struct event_constraint intel_snb_pebs_event_constraints[];  extern struct event_constraint intel_ivb_pebs_event_constraints[]; +extern struct event_constraint intel_hsw_pebs_event_constraints[]; +  struct event_constraint *intel_pebs_constraints(struct perf_event *event);  void intel_pmu_pebs_enable(struct perf_event *event); diff --git a/arch/x86/kernel/cpu/perf_event_amd.c b/arch/x86/kernel/cpu/perf_event_amd.c index 7e28d9467bb..4cbe03287b0 100644 --- a/arch/x86/kernel/cpu/perf_event_amd.c +++ b/arch/x86/kernel/cpu/perf_event_amd.c @@ -648,48 +648,48 @@ static __initconst const struct x86_pmu amd_pmu = {  	.cpu_dead		= amd_pmu_cpu_dead,  }; -static int setup_event_constraints(void) +static int __init amd_core_pmu_init(void)  { -	if (boot_cpu_data.x86 == 0x15) +	if (!cpu_has_perfctr_core) +		return 0; + +	switch (boot_cpu_data.x86) { +	case 0x15: +		pr_cont("Fam15h ");  		x86_pmu.get_event_constraints = amd_get_event_constraints_f15h; -	return 0; -} +		break; -static int setup_perfctr_core(void) -{ -	if (!cpu_has_perfctr_core) { -		WARN(x86_pmu.get_event_constraints == amd_get_event_constraints_f15h, -		     KERN_ERR "Odd, counter constraints enabled but no core perfctrs detected!"); +	default: +		pr_err("core perfctr but no constraints; unknown hardware!\n");  		return -ENODEV;  	} -	WARN(x86_pmu.get_event_constraints == amd_get_event_constraints, -	     KERN_ERR "hw perf events core counters need constraints handler!"); -  	/*  	 * If core performance counter extensions exists, we must use  	 * MSR_F15H_PERF_CTL/MSR_F15H_PERF_CTR msrs. See also -	 * x86_pmu_addr_offset(). +	 * amd_pmu_addr_offset().  	 */  	x86_pmu.eventsel	= MSR_F15H_PERF_CTL;  	x86_pmu.perfctr		= MSR_F15H_PERF_CTR;  	x86_pmu.num_counters	= AMD64_NUM_COUNTERS_CORE; -	printk(KERN_INFO "perf: AMD core performance counters detected\n"); - +	pr_cont("core perfctr, ");  	return 0;  }  __init int amd_pmu_init(void)  { +	int ret; +  	/* Performance-monitoring supported from K7 and later: */  	if (boot_cpu_data.x86 < 6)  		return -ENODEV;  	x86_pmu = amd_pmu; -	setup_event_constraints(); -	setup_perfctr_core(); +	ret = amd_core_pmu_init(); +	if (ret) +		return ret;  	/* Events are common for all AMDs */  	memcpy(hw_cache_event_ids, amd_hw_cache_event_ids, diff --git a/arch/x86/kernel/cpu/perf_event_amd_ibs.c b/arch/x86/kernel/cpu/perf_event_amd_ibs.c index 5f0581e713c..e09f0bfb7b8 100644 --- a/arch/x86/kernel/cpu/perf_event_amd_ibs.c +++ b/arch/x86/kernel/cpu/perf_event_amd_ibs.c @@ -851,7 +851,7 @@ static void clear_APIC_ibs(void *dummy)  		setup_APIC_eilvt(offset, 0, APIC_EILVT_MSG_FIX, 1);  } -static int __cpuinit +static int  perf_ibs_cpu_notifier(struct notifier_block *self, unsigned long action, void *hcpu)  {  	switch (action & ~CPU_TASKS_FROZEN) { diff --git a/arch/x86/kernel/cpu/perf_event_amd_iommu.c b/arch/x86/kernel/cpu/perf_event_amd_iommu.c new file mode 100644 index 00000000000..639d1289b1b --- /dev/null +++ b/arch/x86/kernel/cpu/perf_event_amd_iommu.c @@ -0,0 +1,502 @@ +/* + * Copyright (C) 2013 Advanced Micro Devices, Inc. + * + * Author: Steven Kinney <Steven.Kinney@amd.com> + * Author: Suravee Suthikulpanit <Suraveee.Suthikulpanit@amd.com> + * + * Perf: amd_iommu - AMD IOMMU Performance Counter PMU implementation + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License version 2 as + * published by the Free Software Foundation. + */ + +#include <linux/perf_event.h> +#include <linux/module.h> +#include <linux/cpumask.h> +#include <linux/slab.h> + +#include "perf_event.h" +#include "perf_event_amd_iommu.h" + +#define COUNTER_SHIFT		16 + +#define _GET_BANK(ev)       ((u8)(ev->hw.extra_reg.reg >> 8)) +#define _GET_CNTR(ev)       ((u8)(ev->hw.extra_reg.reg)) + +/* iommu pmu config masks */ +#define _GET_CSOURCE(ev)    ((ev->hw.config & 0xFFULL)) +#define _GET_DEVID(ev)      ((ev->hw.config >> 8)  & 0xFFFFULL) +#define _GET_PASID(ev)      ((ev->hw.config >> 24) & 0xFFFFULL) +#define _GET_DOMID(ev)      ((ev->hw.config >> 40) & 0xFFFFULL) +#define _GET_DEVID_MASK(ev) ((ev->hw.extra_reg.config)  & 0xFFFFULL) +#define _GET_PASID_MASK(ev) ((ev->hw.extra_reg.config >> 16) & 0xFFFFULL) +#define _GET_DOMID_MASK(ev) ((ev->hw.extra_reg.config >> 32) & 0xFFFFULL) + +static struct perf_amd_iommu __perf_iommu; + +struct perf_amd_iommu { +	struct pmu pmu; +	u8 max_banks; +	u8 max_counters; +	u64 cntr_assign_mask; +	raw_spinlock_t lock; +	const struct attribute_group *attr_groups[4]; +}; + +#define format_group	attr_groups[0] +#define cpumask_group	attr_groups[1] +#define events_group	attr_groups[2] +#define null_group	attr_groups[3] + +/*--------------------------------------------- + * sysfs format attributes + *---------------------------------------------*/ +PMU_FORMAT_ATTR(csource,    "config:0-7"); +PMU_FORMAT_ATTR(devid,      "config:8-23"); +PMU_FORMAT_ATTR(pasid,      "config:24-39"); +PMU_FORMAT_ATTR(domid,      "config:40-55"); +PMU_FORMAT_ATTR(devid_mask, "config1:0-15"); +PMU_FORMAT_ATTR(pasid_mask, "config1:16-31"); +PMU_FORMAT_ATTR(domid_mask, "config1:32-47"); + +static struct attribute *iommu_format_attrs[] = { +	&format_attr_csource.attr, +	&format_attr_devid.attr, +	&format_attr_pasid.attr, +	&format_attr_domid.attr, +	&format_attr_devid_mask.attr, +	&format_attr_pasid_mask.attr, +	&format_attr_domid_mask.attr, +	NULL, +}; + +static struct attribute_group amd_iommu_format_group = { +	.name = "format", +	.attrs = iommu_format_attrs, +}; + +/*--------------------------------------------- + * sysfs events attributes + *---------------------------------------------*/ +struct amd_iommu_event_desc { +	struct kobj_attribute attr; +	const char *event; +}; + +static ssize_t _iommu_event_show(struct kobject *kobj, +				struct kobj_attribute *attr, char *buf) +{ +	struct amd_iommu_event_desc *event = +		container_of(attr, struct amd_iommu_event_desc, attr); +	return sprintf(buf, "%s\n", event->event); +} + +#define AMD_IOMMU_EVENT_DESC(_name, _event)			\ +{								\ +	.attr  = __ATTR(_name, 0444, _iommu_event_show, NULL),	\ +	.event = _event,					\ +} + +static struct amd_iommu_event_desc amd_iommu_v2_event_descs[] = { +	AMD_IOMMU_EVENT_DESC(mem_pass_untrans,        "csource=0x01"), +	AMD_IOMMU_EVENT_DESC(mem_pass_pretrans,       "csource=0x02"), +	AMD_IOMMU_EVENT_DESC(mem_pass_excl,           "csource=0x03"), +	AMD_IOMMU_EVENT_DESC(mem_target_abort,        "csource=0x04"), +	AMD_IOMMU_EVENT_DESC(mem_trans_total,         "csource=0x05"), +	AMD_IOMMU_EVENT_DESC(mem_iommu_tlb_pte_hit,   "csource=0x06"), +	AMD_IOMMU_EVENT_DESC(mem_iommu_tlb_pte_mis,   "csource=0x07"), +	AMD_IOMMU_EVENT_DESC(mem_iommu_tlb_pde_hit,   "csource=0x08"), +	AMD_IOMMU_EVENT_DESC(mem_iommu_tlb_pde_mis,   "csource=0x09"), +	AMD_IOMMU_EVENT_DESC(mem_dte_hit,             "csource=0x0a"), +	AMD_IOMMU_EVENT_DESC(mem_dte_mis,             "csource=0x0b"), +	AMD_IOMMU_EVENT_DESC(page_tbl_read_tot,       "csource=0x0c"), +	AMD_IOMMU_EVENT_DESC(page_tbl_read_nst,       "csource=0x0d"), +	AMD_IOMMU_EVENT_DESC(page_tbl_read_gst,       "csource=0x0e"), +	AMD_IOMMU_EVENT_DESC(int_dte_hit,             "csource=0x0f"), +	AMD_IOMMU_EVENT_DESC(int_dte_mis,             "csource=0x10"), +	AMD_IOMMU_EVENT_DESC(cmd_processed,           "csource=0x11"), +	AMD_IOMMU_EVENT_DESC(cmd_processed_inv,       "csource=0x12"), +	AMD_IOMMU_EVENT_DESC(tlb_inv,                 "csource=0x13"), +	{ /* end: all zeroes */ }, +}; + +/*--------------------------------------------- + * sysfs cpumask attributes + *---------------------------------------------*/ +static cpumask_t iommu_cpumask; + +static ssize_t _iommu_cpumask_show(struct device *dev, +				   struct device_attribute *attr, +				   char *buf) +{ +	int n = cpulist_scnprintf(buf, PAGE_SIZE - 2, &iommu_cpumask); +	buf[n++] = '\n'; +	buf[n] = '\0'; +	return n; +} +static DEVICE_ATTR(cpumask, S_IRUGO, _iommu_cpumask_show, NULL); + +static struct attribute *iommu_cpumask_attrs[] = { +	&dev_attr_cpumask.attr, +	NULL, +}; + +static struct attribute_group amd_iommu_cpumask_group = { +	.attrs = iommu_cpumask_attrs, +}; + +/*---------------------------------------------*/ + +static int get_next_avail_iommu_bnk_cntr(struct perf_amd_iommu *perf_iommu) +{ +	unsigned long flags; +	int shift, bank, cntr, retval; +	int max_banks = perf_iommu->max_banks; +	int max_cntrs = perf_iommu->max_counters; + +	raw_spin_lock_irqsave(&perf_iommu->lock, flags); + +	for (bank = 0, shift = 0; bank < max_banks; bank++) { +		for (cntr = 0; cntr < max_cntrs; cntr++) { +			shift = bank + (bank*3) + cntr; +			if (perf_iommu->cntr_assign_mask & (1ULL<<shift)) { +				continue; +			} else { +				perf_iommu->cntr_assign_mask |= (1ULL<<shift); +				retval = ((u16)((u16)bank<<8) | (u8)(cntr)); +				goto out; +			} +		} +	} +	retval = -ENOSPC; +out: +	raw_spin_unlock_irqrestore(&perf_iommu->lock, flags); +	return retval; +} + +static int clear_avail_iommu_bnk_cntr(struct perf_amd_iommu *perf_iommu, +					u8 bank, u8 cntr) +{ +	unsigned long flags; +	int max_banks, max_cntrs; +	int shift = 0; + +	max_banks = perf_iommu->max_banks; +	max_cntrs = perf_iommu->max_counters; + +	if ((bank > max_banks) || (cntr > max_cntrs)) +		return -EINVAL; + +	shift = bank + cntr + (bank*3); + +	raw_spin_lock_irqsave(&perf_iommu->lock, flags); +	perf_iommu->cntr_assign_mask &= ~(1ULL<<shift); +	raw_spin_unlock_irqrestore(&perf_iommu->lock, flags); + +	return 0; +} + +static int perf_iommu_event_init(struct perf_event *event) +{ +	struct hw_perf_event *hwc = &event->hw; +	struct perf_amd_iommu *perf_iommu; +	u64 config, config1; + +	/* test the event attr type check for PMU enumeration */ +	if (event->attr.type != event->pmu->type) +		return -ENOENT; + +	/* +	 * IOMMU counters are shared across all cores. +	 * Therefore, it does not support per-process mode. +	 * Also, it does not support event sampling mode. +	 */ +	if (is_sampling_event(event) || event->attach_state & PERF_ATTACH_TASK) +		return -EINVAL; + +	/* IOMMU counters do not have usr/os/guest/host bits */ +	if (event->attr.exclude_user || event->attr.exclude_kernel || +	    event->attr.exclude_host || event->attr.exclude_guest) +		return -EINVAL; + +	if (event->cpu < 0) +		return -EINVAL; + +	perf_iommu = &__perf_iommu; + +	if (event->pmu != &perf_iommu->pmu) +		return -ENOENT; + +	if (perf_iommu) { +		config = event->attr.config; +		config1 = event->attr.config1; +	} else { +		return -EINVAL; +	} + +	/* integrate with iommu base devid (0000), assume one iommu */ +	perf_iommu->max_banks = +		amd_iommu_pc_get_max_banks(IOMMU_BASE_DEVID); +	perf_iommu->max_counters = +		amd_iommu_pc_get_max_counters(IOMMU_BASE_DEVID); +	if ((perf_iommu->max_banks == 0) || (perf_iommu->max_counters == 0)) +		return -EINVAL; + +	/* update the hw_perf_event struct with the iommu config data */ +	hwc->config = config; +	hwc->extra_reg.config = config1; + +	return 0; +} + +static void perf_iommu_enable_event(struct perf_event *ev) +{ +	u8 csource = _GET_CSOURCE(ev); +	u16 devid = _GET_DEVID(ev); +	u64 reg = 0ULL; + +	reg = csource; +	amd_iommu_pc_get_set_reg_val(devid, +			_GET_BANK(ev), _GET_CNTR(ev) , +			 IOMMU_PC_COUNTER_SRC_REG, ®, true); + +	reg = 0ULL | devid | (_GET_DEVID_MASK(ev) << 32); +	if (reg) +		reg |= (1UL << 31); +	amd_iommu_pc_get_set_reg_val(devid, +			_GET_BANK(ev), _GET_CNTR(ev) , +			 IOMMU_PC_DEVID_MATCH_REG, ®, true); + +	reg = 0ULL | _GET_PASID(ev) | (_GET_PASID_MASK(ev) << 32); +	if (reg) +		reg |= (1UL << 31); +	amd_iommu_pc_get_set_reg_val(devid, +			_GET_BANK(ev), _GET_CNTR(ev) , +			 IOMMU_PC_PASID_MATCH_REG, ®, true); + +	reg = 0ULL | _GET_DOMID(ev) | (_GET_DOMID_MASK(ev) << 32); +	if (reg) +		reg |= (1UL << 31); +	amd_iommu_pc_get_set_reg_val(devid, +			_GET_BANK(ev), _GET_CNTR(ev) , +			 IOMMU_PC_DOMID_MATCH_REG, ®, true); +} + +static void perf_iommu_disable_event(struct perf_event *event) +{ +	u64 reg = 0ULL; + +	amd_iommu_pc_get_set_reg_val(_GET_DEVID(event), +			_GET_BANK(event), _GET_CNTR(event), +			IOMMU_PC_COUNTER_SRC_REG, ®, true); +} + +static void perf_iommu_start(struct perf_event *event, int flags) +{ +	struct hw_perf_event *hwc = &event->hw; + +	pr_debug("perf: amd_iommu:perf_iommu_start\n"); +	if (WARN_ON_ONCE(!(hwc->state & PERF_HES_STOPPED))) +		return; + +	WARN_ON_ONCE(!(hwc->state & PERF_HES_UPTODATE)); +	hwc->state = 0; + +	if (flags & PERF_EF_RELOAD) { +		u64 prev_raw_count =  local64_read(&hwc->prev_count); +		amd_iommu_pc_get_set_reg_val(_GET_DEVID(event), +				_GET_BANK(event), _GET_CNTR(event), +				IOMMU_PC_COUNTER_REG, &prev_raw_count, true); +	} + +	perf_iommu_enable_event(event); +	perf_event_update_userpage(event); + +} + +static void perf_iommu_read(struct perf_event *event) +{ +	u64 count = 0ULL; +	u64 prev_raw_count = 0ULL; +	u64 delta = 0ULL; +	struct hw_perf_event *hwc = &event->hw; +	pr_debug("perf: amd_iommu:perf_iommu_read\n"); + +	amd_iommu_pc_get_set_reg_val(_GET_DEVID(event), +				_GET_BANK(event), _GET_CNTR(event), +				IOMMU_PC_COUNTER_REG, &count, false); + +	/* IOMMU pc counter register is only 48 bits */ +	count &= 0xFFFFFFFFFFFFULL; + +	prev_raw_count =  local64_read(&hwc->prev_count); +	if (local64_cmpxchg(&hwc->prev_count, prev_raw_count, +					count) != prev_raw_count) +		return; + +	/* Handling 48-bit counter overflowing */ +	delta = (count << COUNTER_SHIFT) - (prev_raw_count << COUNTER_SHIFT); +	delta >>= COUNTER_SHIFT; +	local64_add(delta, &event->count); + +} + +static void perf_iommu_stop(struct perf_event *event, int flags) +{ +	struct hw_perf_event *hwc = &event->hw; +	u64 config; + +	pr_debug("perf: amd_iommu:perf_iommu_stop\n"); + +	if (hwc->state & PERF_HES_UPTODATE) +		return; + +	perf_iommu_disable_event(event); +	WARN_ON_ONCE(hwc->state & PERF_HES_STOPPED); +	hwc->state |= PERF_HES_STOPPED; + +	if (hwc->state & PERF_HES_UPTODATE) +		return; + +	config = hwc->config; +	perf_iommu_read(event); +	hwc->state |= PERF_HES_UPTODATE; +} + +static int perf_iommu_add(struct perf_event *event, int flags) +{ +	int retval; +	struct perf_amd_iommu *perf_iommu = +			container_of(event->pmu, struct perf_amd_iommu, pmu); + +	pr_debug("perf: amd_iommu:perf_iommu_add\n"); +	event->hw.state = PERF_HES_UPTODATE | PERF_HES_STOPPED; + +	/* request an iommu bank/counter */ +	retval = get_next_avail_iommu_bnk_cntr(perf_iommu); +	if (retval != -ENOSPC) +		event->hw.extra_reg.reg = (u16)retval; +	else +		return retval; + +	if (flags & PERF_EF_START) +		perf_iommu_start(event, PERF_EF_RELOAD); + +	return 0; +} + +static void perf_iommu_del(struct perf_event *event, int flags) +{ +	struct perf_amd_iommu *perf_iommu = +			container_of(event->pmu, struct perf_amd_iommu, pmu); + +	pr_debug("perf: amd_iommu:perf_iommu_del\n"); +	perf_iommu_stop(event, PERF_EF_UPDATE); + +	/* clear the assigned iommu bank/counter */ +	clear_avail_iommu_bnk_cntr(perf_iommu, +				     _GET_BANK(event), +				     _GET_CNTR(event)); + +	perf_event_update_userpage(event); +} + +static __init int _init_events_attrs(struct perf_amd_iommu *perf_iommu) +{ +	struct attribute **attrs; +	struct attribute_group *attr_group; +	int i = 0, j; + +	while (amd_iommu_v2_event_descs[i].attr.attr.name) +		i++; + +	attr_group = kzalloc(sizeof(struct attribute *) +		* (i + 1) + sizeof(*attr_group), GFP_KERNEL); +	if (!attr_group) +		return -ENOMEM; + +	attrs = (struct attribute **)(attr_group + 1); +	for (j = 0; j < i; j++) +		attrs[j] = &amd_iommu_v2_event_descs[j].attr.attr; + +	attr_group->name = "events"; +	attr_group->attrs = attrs; +	perf_iommu->events_group = attr_group; + +	return 0; +} + +static __init void amd_iommu_pc_exit(void) +{ +	if (__perf_iommu.events_group != NULL) { +		kfree(__perf_iommu.events_group); +		__perf_iommu.events_group = NULL; +	} +} + +static __init int _init_perf_amd_iommu( +	struct perf_amd_iommu *perf_iommu, char *name) +{ +	int ret; + +	raw_spin_lock_init(&perf_iommu->lock); + +	/* Init format attributes */ +	perf_iommu->format_group = &amd_iommu_format_group; + +	/* Init cpumask attributes to only core 0 */ +	cpumask_set_cpu(0, &iommu_cpumask); +	perf_iommu->cpumask_group = &amd_iommu_cpumask_group; + +	/* Init events attributes */ +	if (_init_events_attrs(perf_iommu) != 0) +		pr_err("perf: amd_iommu: Only support raw events.\n"); + +	/* Init null attributes */ +	perf_iommu->null_group = NULL; +	perf_iommu->pmu.attr_groups = perf_iommu->attr_groups; + +	ret = perf_pmu_register(&perf_iommu->pmu, name, -1); +	if (ret) { +		pr_err("perf: amd_iommu: Failed to initialized.\n"); +		amd_iommu_pc_exit(); +	} else { +		pr_info("perf: amd_iommu: Detected. (%d banks, %d counters/bank)\n", +			amd_iommu_pc_get_max_banks(IOMMU_BASE_DEVID), +			amd_iommu_pc_get_max_counters(IOMMU_BASE_DEVID)); +	} + +	return ret; +} + +static struct perf_amd_iommu __perf_iommu = { +	.pmu = { +		.event_init	= perf_iommu_event_init, +		.add		= perf_iommu_add, +		.del		= perf_iommu_del, +		.start		= perf_iommu_start, +		.stop		= perf_iommu_stop, +		.read		= perf_iommu_read, +	}, +	.max_banks		= 0x00, +	.max_counters		= 0x00, +	.cntr_assign_mask	= 0ULL, +	.format_group		= NULL, +	.cpumask_group		= NULL, +	.events_group		= NULL, +	.null_group		= NULL, +}; + +static __init int amd_iommu_pc_init(void) +{ +	/* Make sure the IOMMU PC resource is available */ +	if (!amd_iommu_pc_supported()) +		return -ENODEV; + +	_init_perf_amd_iommu(&__perf_iommu, "amd_iommu"); + +	return 0; +} + +device_initcall(amd_iommu_pc_init); diff --git a/arch/x86/kernel/cpu/perf_event_amd_iommu.h b/arch/x86/kernel/cpu/perf_event_amd_iommu.h new file mode 100644 index 00000000000..845d173278e --- /dev/null +++ b/arch/x86/kernel/cpu/perf_event_amd_iommu.h @@ -0,0 +1,40 @@ +/* + * Copyright (C) 2013 Advanced Micro Devices, Inc. + * + * Author: Steven Kinney <Steven.Kinney@amd.com> + * Author: Suravee Suthikulpanit <Suraveee.Suthikulpanit@amd.com> + * + * This program is free software; you can redistribute it and/or modify + * it under the terms of the GNU General Public License version 2 as + * published by the Free Software Foundation. + */ + +#ifndef _PERF_EVENT_AMD_IOMMU_H_ +#define _PERF_EVENT_AMD_IOMMU_H_ + +/* iommu pc mmio region register indexes */ +#define IOMMU_PC_COUNTER_REG			0x00 +#define IOMMU_PC_COUNTER_SRC_REG		0x08 +#define IOMMU_PC_PASID_MATCH_REG		0x10 +#define IOMMU_PC_DOMID_MATCH_REG		0x18 +#define IOMMU_PC_DEVID_MATCH_REG		0x20 +#define IOMMU_PC_COUNTER_REPORT_REG		0x28 + +/* maximun specified bank/counters */ +#define PC_MAX_SPEC_BNKS			64 +#define PC_MAX_SPEC_CNTRS			16 + +/* iommu pc reg masks*/ +#define IOMMU_BASE_DEVID			0x0000 + +/* amd_iommu_init.c external support functions */ +extern bool amd_iommu_pc_supported(void); + +extern u8 amd_iommu_pc_get_max_banks(u16 devid); + +extern u8 amd_iommu_pc_get_max_counters(u16 devid); + +extern int amd_iommu_pc_get_set_reg_val(u16 devid, u8 bank, u8 cntr, +			u8 fxn, u64 *value, bool is_write); + +#endif /*_PERF_EVENT_AMD_IOMMU_H_*/ diff --git a/arch/x86/kernel/cpu/perf_event_amd_uncore.c b/arch/x86/kernel/cpu/perf_event_amd_uncore.c index c0c661adf03..754291adec3 100644 --- a/arch/x86/kernel/cpu/perf_event_amd_uncore.c +++ b/arch/x86/kernel/cpu/perf_event_amd_uncore.c @@ -288,13 +288,13 @@ static struct pmu amd_l2_pmu = {  	.read		= amd_uncore_read,  }; -static struct amd_uncore * __cpuinit amd_uncore_alloc(unsigned int cpu) +static struct amd_uncore *amd_uncore_alloc(unsigned int cpu)  {  	return kzalloc_node(sizeof(struct amd_uncore), GFP_KERNEL,  			cpu_to_node(cpu));  } -static void __cpuinit amd_uncore_cpu_up_prepare(unsigned int cpu) +static void amd_uncore_cpu_up_prepare(unsigned int cpu)  {  	struct amd_uncore *uncore; @@ -322,8 +322,8 @@ static void __cpuinit amd_uncore_cpu_up_prepare(unsigned int cpu)  }  static struct amd_uncore * -__cpuinit amd_uncore_find_online_sibling(struct amd_uncore *this, -					 struct amd_uncore * __percpu *uncores) +amd_uncore_find_online_sibling(struct amd_uncore *this, +			       struct amd_uncore * __percpu *uncores)  {  	unsigned int cpu;  	struct amd_uncore *that; @@ -348,7 +348,7 @@ __cpuinit amd_uncore_find_online_sibling(struct amd_uncore *this,  	return this;  } -static void __cpuinit amd_uncore_cpu_starting(unsigned int cpu) +static void amd_uncore_cpu_starting(unsigned int cpu)  {  	unsigned int eax, ebx, ecx, edx;  	struct amd_uncore *uncore; @@ -376,8 +376,8 @@ static void __cpuinit amd_uncore_cpu_starting(unsigned int cpu)  	}  } -static void __cpuinit uncore_online(unsigned int cpu, -				    struct amd_uncore * __percpu *uncores) +static void uncore_online(unsigned int cpu, +			  struct amd_uncore * __percpu *uncores)  {  	struct amd_uncore *uncore = *per_cpu_ptr(uncores, cpu); @@ -388,7 +388,7 @@ static void __cpuinit uncore_online(unsigned int cpu,  		cpumask_set_cpu(cpu, uncore->active_mask);  } -static void __cpuinit amd_uncore_cpu_online(unsigned int cpu) +static void amd_uncore_cpu_online(unsigned int cpu)  {  	if (amd_uncore_nb)  		uncore_online(cpu, amd_uncore_nb); @@ -397,8 +397,8 @@ static void __cpuinit amd_uncore_cpu_online(unsigned int cpu)  		uncore_online(cpu, amd_uncore_l2);  } -static void __cpuinit uncore_down_prepare(unsigned int cpu, -					  struct amd_uncore * __percpu *uncores) +static void uncore_down_prepare(unsigned int cpu, +				struct amd_uncore * __percpu *uncores)  {  	unsigned int i;  	struct amd_uncore *this = *per_cpu_ptr(uncores, cpu); @@ -423,7 +423,7 @@ static void __cpuinit uncore_down_prepare(unsigned int cpu,  	}  } -static void __cpuinit amd_uncore_cpu_down_prepare(unsigned int cpu) +static void amd_uncore_cpu_down_prepare(unsigned int cpu)  {  	if (amd_uncore_nb)  		uncore_down_prepare(cpu, amd_uncore_nb); @@ -432,8 +432,7 @@ static void __cpuinit amd_uncore_cpu_down_prepare(unsigned int cpu)  		uncore_down_prepare(cpu, amd_uncore_l2);  } -static void __cpuinit uncore_dead(unsigned int cpu, -				  struct amd_uncore * __percpu *uncores) +static void uncore_dead(unsigned int cpu, struct amd_uncore * __percpu *uncores)  {  	struct amd_uncore *uncore = *per_cpu_ptr(uncores, cpu); @@ -445,7 +444,7 @@ static void __cpuinit uncore_dead(unsigned int cpu,  	*per_cpu_ptr(amd_uncore_nb, cpu) = NULL;  } -static void __cpuinit amd_uncore_cpu_dead(unsigned int cpu) +static void amd_uncore_cpu_dead(unsigned int cpu)  {  	if (amd_uncore_nb)  		uncore_dead(cpu, amd_uncore_nb); @@ -454,7 +453,7 @@ static void __cpuinit amd_uncore_cpu_dead(unsigned int cpu)  		uncore_dead(cpu, amd_uncore_l2);  } -static int __cpuinit +static int  amd_uncore_cpu_notifier(struct notifier_block *self, unsigned long action,  			void *hcpu)  { @@ -489,7 +488,7 @@ amd_uncore_cpu_notifier(struct notifier_block *self, unsigned long action,  	return NOTIFY_OK;  } -static struct notifier_block amd_uncore_cpu_notifier_block __cpuinitdata = { +static struct notifier_block amd_uncore_cpu_notifier_block = {  	.notifier_call	= amd_uncore_cpu_notifier,  	.priority	= CPU_PRI_PERF + 1,  }; diff --git a/arch/x86/kernel/cpu/perf_event_intel.c b/arch/x86/kernel/cpu/perf_event_intel.c index a9e22073bd5..a45d8d4ace1 100644 --- a/arch/x86/kernel/cpu/perf_event_intel.c +++ b/arch/x86/kernel/cpu/perf_event_intel.c @@ -13,6 +13,7 @@  #include <linux/slab.h>  #include <linux/export.h> +#include <asm/cpufeature.h>  #include <asm/hardirq.h>  #include <asm/apic.h> @@ -190,6 +191,22 @@ struct attribute *snb_events_attrs[] = {  	NULL,  }; +static struct event_constraint intel_hsw_event_constraints[] = { +	FIXED_EVENT_CONSTRAINT(0x00c0, 0), /* INST_RETIRED.ANY */ +	FIXED_EVENT_CONSTRAINT(0x003c, 1), /* CPU_CLK_UNHALTED.CORE */ +	FIXED_EVENT_CONSTRAINT(0x0300, 2), /* CPU_CLK_UNHALTED.REF */ +	INTEL_EVENT_CONSTRAINT(0x48, 0x4), /* L1D_PEND_MISS.* */ +	INTEL_UEVENT_CONSTRAINT(0x01c0, 0x2), /* INST_RETIRED.PREC_DIST */ +	INTEL_EVENT_CONSTRAINT(0xcd, 0x8), /* MEM_TRANS_RETIRED.LOAD_LATENCY */ +	/* CYCLE_ACTIVITY.CYCLES_L1D_PENDING */ +	INTEL_EVENT_CONSTRAINT(0x08a3, 0x4), +	/* CYCLE_ACTIVITY.STALLS_L1D_PENDING */ +	INTEL_EVENT_CONSTRAINT(0x0ca3, 0x4), +	/* CYCLE_ACTIVITY.CYCLES_NO_EXECUTE */ +	INTEL_EVENT_CONSTRAINT(0x04a3, 0xf), +	EVENT_CONSTRAINT_END +}; +  static u64 intel_pmu_event_map(int hw_event)  {  	return intel_perfmon_event_map[hw_event]; @@ -872,7 +889,8 @@ static inline bool intel_pmu_needs_lbr_smpl(struct perf_event *event)  		return true;  	/* implicit branch sampling to correct PEBS skid */ -	if (x86_pmu.intel_cap.pebs_trap && event->attr.precise_ip > 1) +	if (x86_pmu.intel_cap.pebs_trap && event->attr.precise_ip > 1 && +	    x86_pmu.intel_cap.pebs_format < 2)  		return true;  	return false; @@ -1167,15 +1185,11 @@ static int intel_pmu_handle_irq(struct pt_regs *regs)  	cpuc = &__get_cpu_var(cpu_hw_events);  	/* -	 * Some chipsets need to unmask the LVTPC in a particular spot -	 * inside the nmi handler.  As a result, the unmasking was pushed -	 * into all the nmi handlers. -	 * -	 * This handler doesn't seem to have any issues with the unmasking -	 * so it was left at the top. +	 * No known reason to not always do late ACK, +	 * but just in case do it opt-in.  	 */ -	apic_write(APIC_LVTPC, APIC_DM_NMI); - +	if (!x86_pmu.late_ack) +		apic_write(APIC_LVTPC, APIC_DM_NMI);  	intel_pmu_disable_all();  	handled = intel_pmu_drain_bts_buffer();  	status = intel_pmu_get_status(); @@ -1188,8 +1202,12 @@ static int intel_pmu_handle_irq(struct pt_regs *regs)  again:  	intel_pmu_ack_status(status);  	if (++loops > 100) { -		WARN_ONCE(1, "perfevents: irq loop stuck!\n"); -		perf_event_print_debug(); +		static bool warned = false; +		if (!warned) { +			WARN(1, "perfevents: irq loop stuck!\n"); +			perf_event_print_debug(); +			warned = true; +		}  		intel_pmu_reset();  		goto done;  	} @@ -1235,6 +1253,13 @@ again:  done:  	intel_pmu_enable_all(0); +	/* +	 * Only unmask the NMI after the overflow counters +	 * have been reset. This avoids spurious NMIs on +	 * Haswell CPUs. +	 */ +	if (x86_pmu.late_ack) +		apic_write(APIC_LVTPC, APIC_DM_NMI);  	return handled;  } @@ -1425,7 +1450,6 @@ x86_get_event_constraints(struct cpu_hw_events *cpuc, struct perf_event *event)  	if (x86_pmu.event_constraints) {  		for_each_event_constraint(c, x86_pmu.event_constraints) {  			if ((event->hw.config & c->cmask) == c->code) { -				/* hw.flags zeroed at initialization */  				event->hw.flags |= c->flags;  				return c;  			} @@ -1473,7 +1497,6 @@ intel_put_shared_regs_event_constraints(struct cpu_hw_events *cpuc,  static void intel_put_event_constraints(struct cpu_hw_events *cpuc,  					struct perf_event *event)  { -	event->hw.flags = 0;  	intel_put_shared_regs_event_constraints(cpuc, event);  } @@ -1646,6 +1669,47 @@ static void core_pmu_enable_all(int added)  	}  } +static int hsw_hw_config(struct perf_event *event) +{ +	int ret = intel_pmu_hw_config(event); + +	if (ret) +		return ret; +	if (!boot_cpu_has(X86_FEATURE_RTM) && !boot_cpu_has(X86_FEATURE_HLE)) +		return 0; +	event->hw.config |= event->attr.config & (HSW_IN_TX|HSW_IN_TX_CHECKPOINTED); + +	/* +	 * IN_TX/IN_TX-CP filters are not supported by the Haswell PMU with +	 * PEBS or in ANY thread mode. Since the results are non-sensical forbid +	 * this combination. +	 */ +	if ((event->hw.config & (HSW_IN_TX|HSW_IN_TX_CHECKPOINTED)) && +	     ((event->hw.config & ARCH_PERFMON_EVENTSEL_ANY) || +	      event->attr.precise_ip > 0)) +		return -EOPNOTSUPP; + +	return 0; +} + +static struct event_constraint counter2_constraint = +			EVENT_CONSTRAINT(0, 0x4, 0); + +static struct event_constraint * +hsw_get_event_constraints(struct cpu_hw_events *cpuc, struct perf_event *event) +{ +	struct event_constraint *c = intel_get_event_constraints(cpuc, event); + +	/* Handle special quirk on in_tx_checkpointed only in counter 2 */ +	if (event->hw.config & HSW_IN_TX_CHECKPOINTED) { +		if (c->idxmsk64 & (1U << 2)) +			return &counter2_constraint; +		return &emptyconstraint; +	} + +	return c; +} +  PMU_FORMAT_ATTR(event,	"config:0-7"	);  PMU_FORMAT_ATTR(umask,	"config:8-15"	);  PMU_FORMAT_ATTR(edge,	"config:18"	); @@ -1653,6 +1717,8 @@ PMU_FORMAT_ATTR(pc,	"config:19"	);  PMU_FORMAT_ATTR(any,	"config:21"	); /* v3 + */  PMU_FORMAT_ATTR(inv,	"config:23"	);  PMU_FORMAT_ATTR(cmask,	"config:24-31"	); +PMU_FORMAT_ATTR(in_tx,  "config:32"); +PMU_FORMAT_ATTR(in_tx_cp, "config:33");  static struct attribute *intel_arch_formats_attr[] = {  	&format_attr_event.attr, @@ -1807,6 +1873,8 @@ static struct attribute *intel_arch3_formats_attr[] = {  	&format_attr_any.attr,  	&format_attr_inv.attr,  	&format_attr_cmask.attr, +	&format_attr_in_tx.attr, +	&format_attr_in_tx_cp.attr,  	&format_attr_offcore_rsp.attr, /* XXX do NHM/WSM + SNB breakout */  	&format_attr_ldlat.attr, /* PEBS load latency */ @@ -1966,6 +2034,15 @@ static __init void intel_nehalem_quirk(void)  	}  } +EVENT_ATTR_STR(mem-loads,      mem_ld_hsw,     "event=0xcd,umask=0x1,ldlat=3"); +EVENT_ATTR_STR(mem-stores,     mem_st_hsw,     "event=0xd0,umask=0x82") + +static struct attribute *hsw_events_attrs[] = { +	EVENT_PTR(mem_ld_hsw), +	EVENT_PTR(mem_st_hsw), +	NULL +}; +  __init int intel_pmu_init(void)  {  	union cpuid10_edx edx; @@ -2189,6 +2266,31 @@ __init int intel_pmu_init(void)  		break; +	case 60: /* Haswell Client */ +	case 70: +	case 71: +	case 63: +	case 69: +		x86_pmu.late_ack = true; +		memcpy(hw_cache_event_ids, snb_hw_cache_event_ids, sizeof(hw_cache_event_ids)); +		memcpy(hw_cache_extra_regs, snb_hw_cache_extra_regs, sizeof(hw_cache_extra_regs)); + +		intel_pmu_lbr_init_snb(); + +		x86_pmu.event_constraints = intel_hsw_event_constraints; +		x86_pmu.pebs_constraints = intel_hsw_pebs_event_constraints; +		x86_pmu.extra_regs = intel_snb_extra_regs; +		x86_pmu.pebs_aliases = intel_pebs_aliases_snb; +		/* all extra regs are per-cpu when HT is on */ +		x86_pmu.er_flags |= ERF_HAS_RSP_1; +		x86_pmu.er_flags |= ERF_NO_HT_SHARING; + +		x86_pmu.hw_config = hsw_hw_config; +		x86_pmu.get_event_constraints = hsw_get_event_constraints; +		x86_pmu.cpu_events = hsw_events_attrs; +		pr_cont("Haswell events, "); +		break; +  	default:  		switch (x86_pmu.version) {  		case 1: @@ -2227,7 +2329,7 @@ __init int intel_pmu_init(void)  		 * counter, so do not extend mask to generic counters  		 */  		for_each_event_constraint(c, x86_pmu.event_constraints) { -			if (c->cmask != X86_RAW_EVENT_MASK +			if (c->cmask != FIXED_EVENT_FLAGS  			    || c->idxmsk64 == INTEL_PMC_MSK_FIXED_REF_CYCLES) {  				continue;  			} @@ -2237,5 +2339,12 @@ __init int intel_pmu_init(void)  		}  	} +	/* Support full width counters using alternative MSR range */ +	if (x86_pmu.intel_cap.full_width_write) { +		x86_pmu.max_period = x86_pmu.cntval_mask; +		x86_pmu.perfctr = MSR_IA32_PMC0; +		pr_cont("full-width counters, "); +	} +  	return 0;  } diff --git a/arch/x86/kernel/cpu/perf_event_intel_ds.c b/arch/x86/kernel/cpu/perf_event_intel_ds.c index 60250f68705..3065c57a63c 100644 --- a/arch/x86/kernel/cpu/perf_event_intel_ds.c +++ b/arch/x86/kernel/cpu/perf_event_intel_ds.c @@ -107,6 +107,19 @@ static u64 precise_store_data(u64 status)  	return val;  } +static u64 precise_store_data_hsw(u64 status) +{ +	union perf_mem_data_src dse; + +	dse.val = 0; +	dse.mem_op = PERF_MEM_OP_STORE; +	dse.mem_lvl = PERF_MEM_LVL_NA; +	if (status & 1) +		dse.mem_lvl = PERF_MEM_LVL_L1; +	/* Nothing else supported. Sorry. */ +	return dse.val; +} +  static u64 load_latency_data(u64 status)  {  	union intel_x86_pebs_dse dse; @@ -165,6 +178,22 @@ struct pebs_record_nhm {  	u64 status, dla, dse, lat;  }; +/* + * Same as pebs_record_nhm, with two additional fields. + */ +struct pebs_record_hsw { +	struct pebs_record_nhm nhm; +	/* +	 * Real IP of the event. In the Intel documentation this +	 * is called eventingrip. +	 */ +	u64 real_ip; +	/* +	 * TSX tuning information field: abort cycles and abort flags. +	 */ +	u64 tsx_tuning; +}; +  void init_debug_store_on_cpu(int cpu)  {  	struct debug_store *ds = per_cpu(cpu_hw_events, cpu).ds; @@ -548,6 +577,42 @@ struct event_constraint intel_ivb_pebs_event_constraints[] = {          EVENT_CONSTRAINT_END  }; +struct event_constraint intel_hsw_pebs_event_constraints[] = { +	INTEL_UEVENT_CONSTRAINT(0x01c0, 0x2), /* INST_RETIRED.PRECDIST */ +	INTEL_PST_HSW_CONSTRAINT(0x01c2, 0xf), /* UOPS_RETIRED.ALL */ +	INTEL_UEVENT_CONSTRAINT(0x02c2, 0xf), /* UOPS_RETIRED.RETIRE_SLOTS */ +	INTEL_EVENT_CONSTRAINT(0xc4, 0xf),    /* BR_INST_RETIRED.* */ +	INTEL_UEVENT_CONSTRAINT(0x01c5, 0xf), /* BR_MISP_RETIRED.CONDITIONAL */ +	INTEL_UEVENT_CONSTRAINT(0x04c5, 0xf), /* BR_MISP_RETIRED.ALL_BRANCHES */ +	INTEL_UEVENT_CONSTRAINT(0x20c5, 0xf), /* BR_MISP_RETIRED.NEAR_TAKEN */ +	INTEL_PLD_CONSTRAINT(0x01cd, 0x8),    /* MEM_TRANS_RETIRED.* */ +	/* MEM_UOPS_RETIRED.STLB_MISS_LOADS */ +	INTEL_UEVENT_CONSTRAINT(0x11d0, 0xf), +	/* MEM_UOPS_RETIRED.STLB_MISS_STORES */ +	INTEL_UEVENT_CONSTRAINT(0x12d0, 0xf), +	INTEL_UEVENT_CONSTRAINT(0x21d0, 0xf), /* MEM_UOPS_RETIRED.LOCK_LOADS */ +	INTEL_UEVENT_CONSTRAINT(0x41d0, 0xf), /* MEM_UOPS_RETIRED.SPLIT_LOADS */ +	/* MEM_UOPS_RETIRED.SPLIT_STORES */ +	INTEL_UEVENT_CONSTRAINT(0x42d0, 0xf), +	INTEL_UEVENT_CONSTRAINT(0x81d0, 0xf), /* MEM_UOPS_RETIRED.ALL_LOADS */ +	INTEL_PST_HSW_CONSTRAINT(0x82d0, 0xf), /* MEM_UOPS_RETIRED.ALL_STORES */ +	INTEL_UEVENT_CONSTRAINT(0x01d1, 0xf), /* MEM_LOAD_UOPS_RETIRED.L1_HIT */ +	INTEL_UEVENT_CONSTRAINT(0x02d1, 0xf), /* MEM_LOAD_UOPS_RETIRED.L2_HIT */ +	INTEL_UEVENT_CONSTRAINT(0x04d1, 0xf), /* MEM_LOAD_UOPS_RETIRED.L3_HIT */ +	/* MEM_LOAD_UOPS_RETIRED.HIT_LFB */ +	INTEL_UEVENT_CONSTRAINT(0x40d1, 0xf), +	/* MEM_LOAD_UOPS_LLC_HIT_RETIRED.XSNP_MISS */ +	INTEL_UEVENT_CONSTRAINT(0x01d2, 0xf), +	/* MEM_LOAD_UOPS_LLC_HIT_RETIRED.XSNP_HIT */ +	INTEL_UEVENT_CONSTRAINT(0x02d2, 0xf), +	/* MEM_LOAD_UOPS_LLC_MISS_RETIRED.LOCAL_DRAM */ +	INTEL_UEVENT_CONSTRAINT(0x01d3, 0xf), +	INTEL_UEVENT_CONSTRAINT(0x04c8, 0xf), /* HLE_RETIRED.Abort */ +	INTEL_UEVENT_CONSTRAINT(0x04c9, 0xf), /* RTM_RETIRED.Abort */ + +	EVENT_CONSTRAINT_END +}; +  struct event_constraint *intel_pebs_constraints(struct perf_event *event)  {  	struct event_constraint *c; @@ -588,6 +653,12 @@ void intel_pmu_pebs_disable(struct perf_event *event)  	struct hw_perf_event *hwc = &event->hw;  	cpuc->pebs_enabled &= ~(1ULL << hwc->idx); + +	if (event->hw.constraint->flags & PERF_X86_EVENT_PEBS_LDLAT) +		cpuc->pebs_enabled &= ~(1ULL << (hwc->idx + 32)); +	else if (event->hw.constraint->flags & PERF_X86_EVENT_PEBS_ST) +		cpuc->pebs_enabled &= ~(1ULL << 63); +  	if (cpuc->enabled)  		wrmsrl(MSR_IA32_PEBS_ENABLE, cpuc->pebs_enabled); @@ -697,6 +768,7 @@ static void __intel_pmu_pebs_event(struct perf_event *event,  	 */  	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);  	struct pebs_record_nhm *pebs = __pebs; +	struct pebs_record_hsw *pebs_hsw = __pebs;  	struct perf_sample_data data;  	struct pt_regs regs;  	u64 sample_type; @@ -706,7 +778,8 @@ static void __intel_pmu_pebs_event(struct perf_event *event,  		return;  	fll = event->hw.flags & PERF_X86_EVENT_PEBS_LDLAT; -	fst = event->hw.flags & PERF_X86_EVENT_PEBS_ST; +	fst = event->hw.flags & (PERF_X86_EVENT_PEBS_ST | +				 PERF_X86_EVENT_PEBS_ST_HSW);  	perf_sample_data_init(&data, 0, event->hw.last_period); @@ -717,9 +790,6 @@ static void __intel_pmu_pebs_event(struct perf_event *event,  	 * if PEBS-LL or PreciseStore  	 */  	if (fll || fst) { -		if (sample_type & PERF_SAMPLE_ADDR) -			data.addr = pebs->dla; -  		/*  		 * Use latency for weight (only avail with PEBS-LL)  		 */ @@ -732,6 +802,9 @@ static void __intel_pmu_pebs_event(struct perf_event *event,  		if (sample_type & PERF_SAMPLE_DATA_SRC) {  			if (fll)  				data.data_src.val = load_latency_data(pebs->dse); +			else if (event->hw.flags & PERF_X86_EVENT_PEBS_ST_HSW) +				data.data_src.val = +					precise_store_data_hsw(pebs->dse);  			else  				data.data_src.val = precise_store_data(pebs->dse);  		} @@ -753,11 +826,18 @@ static void __intel_pmu_pebs_event(struct perf_event *event,  	regs.bp = pebs->bp;  	regs.sp = pebs->sp; -	if (event->attr.precise_ip > 1 && intel_pmu_pebs_fixup_ip(®s)) +	if (event->attr.precise_ip > 1 && x86_pmu.intel_cap.pebs_format >= 2) { +		regs.ip = pebs_hsw->real_ip; +		regs.flags |= PERF_EFLAGS_EXACT; +	} else if (event->attr.precise_ip > 1 && intel_pmu_pebs_fixup_ip(®s))  		regs.flags |= PERF_EFLAGS_EXACT;  	else  		regs.flags &= ~PERF_EFLAGS_EXACT; +	if ((event->attr.sample_type & PERF_SAMPLE_ADDR) && +		x86_pmu.intel_cap.pebs_format >= 1) +		data.addr = pebs->dla; +  	if (has_branch_stack(event))  		data.br_stack = &cpuc->lbr_stack; @@ -806,35 +886,22 @@ static void intel_pmu_drain_pebs_core(struct pt_regs *iregs)  	__intel_pmu_pebs_event(event, iregs, at);  } -static void intel_pmu_drain_pebs_nhm(struct pt_regs *iregs) +static void __intel_pmu_drain_pebs_nhm(struct pt_regs *iregs, void *at, +					void *top)  {  	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events);  	struct debug_store *ds = cpuc->ds; -	struct pebs_record_nhm *at, *top;  	struct perf_event *event = NULL;  	u64 status = 0; -	int bit, n; - -	if (!x86_pmu.pebs_active) -		return; - -	at  = (struct pebs_record_nhm *)(unsigned long)ds->pebs_buffer_base; -	top = (struct pebs_record_nhm *)(unsigned long)ds->pebs_index; +	int bit;  	ds->pebs_index = ds->pebs_buffer_base; -	n = top - at; -	if (n <= 0) -		return; - -	/* -	 * Should not happen, we program the threshold at 1 and do not -	 * set a reset value. -	 */ -	WARN_ONCE(n > x86_pmu.max_pebs_events, "Unexpected number of pebs records %d\n", n); +	for (; at < top; at += x86_pmu.pebs_record_size) { +		struct pebs_record_nhm *p = at; -	for ( ; at < top; at++) { -		for_each_set_bit(bit, (unsigned long *)&at->status, x86_pmu.max_pebs_events) { +		for_each_set_bit(bit, (unsigned long *)&p->status, +				 x86_pmu.max_pebs_events) {  			event = cpuc->events[bit];  			if (!test_bit(bit, cpuc->active_mask))  				continue; @@ -857,6 +924,61 @@ static void intel_pmu_drain_pebs_nhm(struct pt_regs *iregs)  	}  } +static void intel_pmu_drain_pebs_nhm(struct pt_regs *iregs) +{ +	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); +	struct debug_store *ds = cpuc->ds; +	struct pebs_record_nhm *at, *top; +	int n; + +	if (!x86_pmu.pebs_active) +		return; + +	at  = (struct pebs_record_nhm *)(unsigned long)ds->pebs_buffer_base; +	top = (struct pebs_record_nhm *)(unsigned long)ds->pebs_index; + +	ds->pebs_index = ds->pebs_buffer_base; + +	n = top - at; +	if (n <= 0) +		return; + +	/* +	 * Should not happen, we program the threshold at 1 and do not +	 * set a reset value. +	 */ +	WARN_ONCE(n > x86_pmu.max_pebs_events, +		  "Unexpected number of pebs records %d\n", n); + +	return __intel_pmu_drain_pebs_nhm(iregs, at, top); +} + +static void intel_pmu_drain_pebs_hsw(struct pt_regs *iregs) +{ +	struct cpu_hw_events *cpuc = &__get_cpu_var(cpu_hw_events); +	struct debug_store *ds = cpuc->ds; +	struct pebs_record_hsw *at, *top; +	int n; + +	if (!x86_pmu.pebs_active) +		return; + +	at  = (struct pebs_record_hsw *)(unsigned long)ds->pebs_buffer_base; +	top = (struct pebs_record_hsw *)(unsigned long)ds->pebs_index; + +	n = top - at; +	if (n <= 0) +		return; +	/* +	 * Should not happen, we program the threshold at 1 and do not +	 * set a reset value. +	 */ +	WARN_ONCE(n > x86_pmu.max_pebs_events, +		  "Unexpected number of pebs records %d\n", n); + +	return __intel_pmu_drain_pebs_nhm(iregs, at, top); +} +  /*   * BTS, PEBS probe and setup   */ @@ -888,6 +1010,12 @@ void intel_ds_init(void)  			x86_pmu.drain_pebs = intel_pmu_drain_pebs_nhm;  			break; +		case 2: +			pr_cont("PEBS fmt2%c, ", pebs_type); +			x86_pmu.pebs_record_size = sizeof(struct pebs_record_hsw); +			x86_pmu.drain_pebs = intel_pmu_drain_pebs_hsw; +			break; +  		default:  			printk(KERN_CONT "no PEBS fmt%d%c, ", format, pebs_type);  			x86_pmu.pebs = 0; diff --git a/arch/x86/kernel/cpu/perf_event_intel_lbr.c b/arch/x86/kernel/cpu/perf_event_intel_lbr.c index d978353c939..d5be06a5005 100644 --- a/arch/x86/kernel/cpu/perf_event_intel_lbr.c +++ b/arch/x86/kernel/cpu/perf_event_intel_lbr.c @@ -12,6 +12,16 @@ enum {  	LBR_FORMAT_LIP		= 0x01,  	LBR_FORMAT_EIP		= 0x02,  	LBR_FORMAT_EIP_FLAGS	= 0x03, +	LBR_FORMAT_EIP_FLAGS2	= 0x04, +	LBR_FORMAT_MAX_KNOWN    = LBR_FORMAT_EIP_FLAGS2, +}; + +static enum { +	LBR_EIP_FLAGS		= 1, +	LBR_TSX			= 2, +} lbr_desc[LBR_FORMAT_MAX_KNOWN + 1] = { +	[LBR_FORMAT_EIP_FLAGS]  = LBR_EIP_FLAGS, +	[LBR_FORMAT_EIP_FLAGS2] = LBR_EIP_FLAGS | LBR_TSX,  };  /* @@ -56,6 +66,8 @@ enum {  	 LBR_FAR)  #define LBR_FROM_FLAG_MISPRED  (1ULL << 63) +#define LBR_FROM_FLAG_IN_TX    (1ULL << 62) +#define LBR_FROM_FLAG_ABORT    (1ULL << 61)  #define for_each_branch_sample_type(x) \  	for ((x) = PERF_SAMPLE_BRANCH_USER; \ @@ -81,9 +93,13 @@ enum {  	X86_BR_JMP      = 1 << 9, /* jump */  	X86_BR_IRQ      = 1 << 10,/* hw interrupt or trap or fault */  	X86_BR_IND_CALL = 1 << 11,/* indirect calls */ +	X86_BR_ABORT    = 1 << 12,/* transaction abort */ +	X86_BR_IN_TX    = 1 << 13,/* in transaction */ +	X86_BR_NO_TX    = 1 << 14,/* not in transaction */  };  #define X86_BR_PLM (X86_BR_USER | X86_BR_KERNEL) +#define X86_BR_ANYTX (X86_BR_NO_TX | X86_BR_IN_TX)  #define X86_BR_ANY       \  	(X86_BR_CALL    |\ @@ -95,6 +111,7 @@ enum {  	 X86_BR_JCC     |\  	 X86_BR_JMP	 |\  	 X86_BR_IRQ	 |\ +	 X86_BR_ABORT	 |\  	 X86_BR_IND_CALL)  #define X86_BR_ALL (X86_BR_PLM | X86_BR_ANY) @@ -270,21 +287,31 @@ static void intel_pmu_lbr_read_64(struct cpu_hw_events *cpuc)  	for (i = 0; i < x86_pmu.lbr_nr; i++) {  		unsigned long lbr_idx = (tos - i) & mask; -		u64 from, to, mis = 0, pred = 0; +		u64 from, to, mis = 0, pred = 0, in_tx = 0, abort = 0; +		int skip = 0; +		int lbr_flags = lbr_desc[lbr_format];  		rdmsrl(x86_pmu.lbr_from + lbr_idx, from);  		rdmsrl(x86_pmu.lbr_to   + lbr_idx, to); -		if (lbr_format == LBR_FORMAT_EIP_FLAGS) { +		if (lbr_flags & LBR_EIP_FLAGS) {  			mis = !!(from & LBR_FROM_FLAG_MISPRED);  			pred = !mis; -			from = (u64)((((s64)from) << 1) >> 1); +			skip = 1; +		} +		if (lbr_flags & LBR_TSX) { +			in_tx = !!(from & LBR_FROM_FLAG_IN_TX); +			abort = !!(from & LBR_FROM_FLAG_ABORT); +			skip = 3;  		} +		from = (u64)((((s64)from) << skip) >> skip);  		cpuc->lbr_entries[i].from	= from;  		cpuc->lbr_entries[i].to		= to;  		cpuc->lbr_entries[i].mispred	= mis;  		cpuc->lbr_entries[i].predicted	= pred; +		cpuc->lbr_entries[i].in_tx	= in_tx; +		cpuc->lbr_entries[i].abort	= abort;  		cpuc->lbr_entries[i].reserved	= 0;  	}  	cpuc->lbr_stack.nr = i; @@ -310,7 +337,7 @@ void intel_pmu_lbr_read(void)   * - in case there is no HW filter   * - in case the HW filter has errata or limitations   */ -static int intel_pmu_setup_sw_lbr_filter(struct perf_event *event) +static void intel_pmu_setup_sw_lbr_filter(struct perf_event *event)  {  	u64 br_type = event->attr.branch_sample_type;  	int mask = 0; @@ -318,11 +345,8 @@ static int intel_pmu_setup_sw_lbr_filter(struct perf_event *event)  	if (br_type & PERF_SAMPLE_BRANCH_USER)  		mask |= X86_BR_USER; -	if (br_type & PERF_SAMPLE_BRANCH_KERNEL) { -		if (perf_paranoid_kernel() && !capable(CAP_SYS_ADMIN)) -			return -EACCES; +	if (br_type & PERF_SAMPLE_BRANCH_KERNEL)  		mask |= X86_BR_KERNEL; -	}  	/* we ignore BRANCH_HV here */ @@ -337,13 +361,21 @@ static int intel_pmu_setup_sw_lbr_filter(struct perf_event *event)  	if (br_type & PERF_SAMPLE_BRANCH_IND_CALL)  		mask |= X86_BR_IND_CALL; + +	if (br_type & PERF_SAMPLE_BRANCH_ABORT_TX) +		mask |= X86_BR_ABORT; + +	if (br_type & PERF_SAMPLE_BRANCH_IN_TX) +		mask |= X86_BR_IN_TX; + +	if (br_type & PERF_SAMPLE_BRANCH_NO_TX) +		mask |= X86_BR_NO_TX; +  	/*  	 * stash actual user request into reg, it may  	 * be used by fixup code for some CPU  	 */  	event->hw.branch_reg.reg = mask; - -	return 0;  }  /* @@ -391,9 +423,7 @@ int intel_pmu_setup_lbr_filter(struct perf_event *event)  	/*  	 * setup SW LBR filter  	 */ -	ret = intel_pmu_setup_sw_lbr_filter(event); -	if (ret) -		return ret; +	intel_pmu_setup_sw_lbr_filter(event);  	/*  	 * setup HW LBR filter, if any @@ -415,7 +445,7 @@ int intel_pmu_setup_lbr_filter(struct perf_event *event)   * decoded (e.g., text page not present), then X86_BR_NONE is   * returned.   */ -static int branch_type(unsigned long from, unsigned long to) +static int branch_type(unsigned long from, unsigned long to, int abort)  {  	struct insn insn;  	void *addr; @@ -435,6 +465,9 @@ static int branch_type(unsigned long from, unsigned long to)  	if (from == 0 || to == 0)  		return X86_BR_NONE; +	if (abort) +		return X86_BR_ABORT | to_plm; +  	if (from_plm == X86_BR_USER) {  		/*  		 * can happen if measuring at the user level only @@ -581,7 +614,13 @@ intel_pmu_lbr_filter(struct cpu_hw_events *cpuc)  		from = cpuc->lbr_entries[i].from;  		to = cpuc->lbr_entries[i].to; -		type = branch_type(from, to); +		type = branch_type(from, to, cpuc->lbr_entries[i].abort); +		if (type != X86_BR_NONE && (br_sel & X86_BR_ANYTX)) { +			if (cpuc->lbr_entries[i].in_tx) +				type |= X86_BR_IN_TX; +			else +				type |= X86_BR_NO_TX; +		}  		/* if type does not correspond, then discard */  		if (type == X86_BR_NONE || (br_sel & type) != type) { diff --git a/arch/x86/kernel/cpu/perf_event_intel_uncore.c b/arch/x86/kernel/cpu/perf_event_intel_uncore.c index 52441a2af53..1fb6c72717b 100644 --- a/arch/x86/kernel/cpu/perf_event_intel_uncore.c +++ b/arch/x86/kernel/cpu/perf_event_intel_uncore.c @@ -314,8 +314,8 @@ static struct uncore_event_desc snbep_uncore_imc_events[] = {  static struct uncore_event_desc snbep_uncore_qpi_events[] = {  	INTEL_UNCORE_EVENT_DESC(clockticks,       "event=0x14"),  	INTEL_UNCORE_EVENT_DESC(txl_flits_active, "event=0x00,umask=0x06"), -	INTEL_UNCORE_EVENT_DESC(drs_data,         "event=0x02,umask=0x08"), -	INTEL_UNCORE_EVENT_DESC(ncb_data,         "event=0x03,umask=0x04"), +	INTEL_UNCORE_EVENT_DESC(drs_data,         "event=0x102,umask=0x08"), +	INTEL_UNCORE_EVENT_DESC(ncb_data,         "event=0x103,umask=0x04"),  	{ /* end: all zeroes */ },  }; @@ -536,7 +536,7 @@ __snbep_cbox_get_constraint(struct intel_uncore_box *box, struct perf_event *eve  	if (!uncore_box_is_fake(box))  		reg1->alloc |= alloc; -	return 0; +	return NULL;  fail:  	for (; i >= 0; i--) {  		if (alloc & (0x1 << i)) @@ -644,7 +644,7 @@ snbep_pcu_get_constraint(struct intel_uncore_box *box, struct perf_event *event)  	    (!uncore_box_is_fake(box) && reg1->alloc))  		return NULL;  again: -	mask = 0xff << (idx * 8); +	mask = 0xffULL << (idx * 8);  	raw_spin_lock_irqsave(&er->lock, flags);  	if (!__BITS_VALUE(atomic_read(&er->ref), idx, 8) ||  	    !((config1 ^ er->config) & mask)) { @@ -1923,7 +1923,7 @@ static u64 nhmex_mbox_alter_er(struct perf_event *event, int new_idx, bool modif  {  	struct hw_perf_event *hwc = &event->hw;  	struct hw_perf_event_extra *reg1 = &hwc->extra_reg; -	int idx, orig_idx = __BITS_VALUE(reg1->idx, 0, 8); +	u64 idx, orig_idx = __BITS_VALUE(reg1->idx, 0, 8);  	u64 config = reg1->config;  	/* get the non-shared control bits and shift them */ @@ -2723,15 +2723,16 @@ static void uncore_put_event_constraint(struct intel_uncore_box *box, struct per  static int uncore_assign_events(struct intel_uncore_box *box, int assign[], int n)  {  	unsigned long used_mask[BITS_TO_LONGS(UNCORE_PMC_IDX_MAX)]; -	struct event_constraint *c, *constraints[UNCORE_PMC_IDX_MAX]; +	struct event_constraint *c;  	int i, wmin, wmax, ret = 0;  	struct hw_perf_event *hwc;  	bitmap_zero(used_mask, UNCORE_PMC_IDX_MAX);  	for (i = 0, wmin = UNCORE_PMC_IDX_MAX, wmax = 0; i < n; i++) { +		hwc = &box->event_list[i]->hw;  		c = uncore_get_event_constraint(box, box->event_list[i]); -		constraints[i] = c; +		hwc->constraint = c;  		wmin = min(wmin, c->weight);  		wmax = max(wmax, c->weight);  	} @@ -2739,7 +2740,7 @@ static int uncore_assign_events(struct intel_uncore_box *box, int assign[], int  	/* fastpath, try to reuse previous register */  	for (i = 0; i < n; i++) {  		hwc = &box->event_list[i]->hw; -		c = constraints[i]; +		c = hwc->constraint;  		/* never assigned */  		if (hwc->idx == -1) @@ -2759,7 +2760,8 @@ static int uncore_assign_events(struct intel_uncore_box *box, int assign[], int  	}  	/* slow path */  	if (i != n) -		ret = perf_assign_events(constraints, n, wmin, wmax, assign); +		ret = perf_assign_events(box->event_list, n, +					 wmin, wmax, assign);  	if (!assign || ret) {  		for (i = 0; i < n; i++) @@ -3295,7 +3297,7 @@ static void __init uncore_pci_exit(void)  /* CPU hot plug/unplug are serialized by cpu_add_remove_lock mutex */  static LIST_HEAD(boxes_to_free); -static void __cpuinit uncore_kfree_boxes(void) +static void uncore_kfree_boxes(void)  {  	struct intel_uncore_box *box; @@ -3307,7 +3309,7 @@ static void __cpuinit uncore_kfree_boxes(void)  	}  } -static void __cpuinit uncore_cpu_dying(int cpu) +static void uncore_cpu_dying(int cpu)  {  	struct intel_uncore_type *type;  	struct intel_uncore_pmu *pmu; @@ -3326,7 +3328,7 @@ static void __cpuinit uncore_cpu_dying(int cpu)  	}  } -static int __cpuinit uncore_cpu_starting(int cpu) +static int uncore_cpu_starting(int cpu)  {  	struct intel_uncore_type *type;  	struct intel_uncore_pmu *pmu; @@ -3369,7 +3371,7 @@ static int __cpuinit uncore_cpu_starting(int cpu)  	return 0;  } -static int __cpuinit uncore_cpu_prepare(int cpu, int phys_id) +static int uncore_cpu_prepare(int cpu, int phys_id)  {  	struct intel_uncore_type *type;  	struct intel_uncore_pmu *pmu; @@ -3395,7 +3397,7 @@ static int __cpuinit uncore_cpu_prepare(int cpu, int phys_id)  	return 0;  } -static void __cpuinit +static void  uncore_change_context(struct intel_uncore_type **uncores, int old_cpu, int new_cpu)  {  	struct intel_uncore_type *type; @@ -3433,7 +3435,7 @@ uncore_change_context(struct intel_uncore_type **uncores, int old_cpu, int new_c  	}  } -static void __cpuinit uncore_event_exit_cpu(int cpu) +static void uncore_event_exit_cpu(int cpu)  {  	int i, phys_id, target; @@ -3461,7 +3463,7 @@ static void __cpuinit uncore_event_exit_cpu(int cpu)  	uncore_change_context(pci_uncores, cpu, target);  } -static void __cpuinit uncore_event_init_cpu(int cpu) +static void uncore_event_init_cpu(int cpu)  {  	int i, phys_id; @@ -3477,8 +3479,8 @@ static void __cpuinit uncore_event_init_cpu(int cpu)  	uncore_change_context(pci_uncores, -1, cpu);  } -static int - __cpuinit uncore_cpu_notifier(struct notifier_block *self, unsigned long action, void *hcpu) +static int uncore_cpu_notifier(struct notifier_block *self, +			       unsigned long action, void *hcpu)  {  	unsigned int cpu = (long)hcpu; @@ -3518,7 +3520,7 @@ static int  	return NOTIFY_OK;  } -static struct notifier_block uncore_cpu_nb __cpuinitdata = { +static struct notifier_block uncore_cpu_nb = {  	.notifier_call	= uncore_cpu_notifier,  	/*  	 * to migrate uncore events, our notifier should be executed diff --git a/arch/x86/kernel/cpu/perf_event_intel_uncore.h b/arch/x86/kernel/cpu/perf_event_intel_uncore.h index f9528917f6e..47b3d00c9d8 100644 --- a/arch/x86/kernel/cpu/perf_event_intel_uncore.h +++ b/arch/x86/kernel/cpu/perf_event_intel_uncore.h @@ -337,10 +337,10 @@  		 NHMEX_M_PMON_CTL_SET_FLAG_SEL_MASK)  #define NHMEX_M_PMON_ZDP_CTL_FVC_MASK		(((1 << 11) - 1) | (1 << 23)) -#define NHMEX_M_PMON_ZDP_CTL_FVC_EVENT_MASK(n)	(0x7 << (11 + 3 * (n))) +#define NHMEX_M_PMON_ZDP_CTL_FVC_EVENT_MASK(n)	(0x7ULL << (11 + 3 * (n)))  #define WSMEX_M_PMON_ZDP_CTL_FVC_MASK		(((1 << 12) - 1) | (1 << 24)) -#define WSMEX_M_PMON_ZDP_CTL_FVC_EVENT_MASK(n)	(0x7 << (12 + 3 * (n))) +#define WSMEX_M_PMON_ZDP_CTL_FVC_EVENT_MASK(n)	(0x7ULL << (12 + 3 * (n)))  /*   * use the 9~13 bits to select event If the 7th bit is not set, diff --git a/arch/x86/kernel/cpu/powerflags.c b/arch/x86/kernel/cpu/powerflags.c index 7b3fe56b1c2..31f0f335ed2 100644 --- a/arch/x86/kernel/cpu/powerflags.c +++ b/arch/x86/kernel/cpu/powerflags.c @@ -11,10 +11,10 @@ const char *const x86_power_flags[32] = {  	"fid",  /* frequency id control */  	"vid",  /* voltage id control */  	"ttp",  /* thermal trip */ -	"tm", -	"stc", -	"100mhzsteps", -	"hwpstate", +	"tm",	/* hardware thermal control */ +	"stc",	/* software thermal control */ +	"100mhzsteps", /* 100 MHz multiplier control */ +	"hwpstate", /* hardware P-state control */  	"",	/* tsc invariant mapped to constant_tsc */  	"cpb",  /* core performance boost */  	"eff_freq_ro", /* Readonly aperf/mperf */ diff --git a/arch/x86/kernel/cpu/proc.c b/arch/x86/kernel/cpu/proc.c index 37a198bd48c..aee6317b902 100644 --- a/arch/x86/kernel/cpu/proc.c +++ b/arch/x86/kernel/cpu/proc.c @@ -37,8 +37,8 @@ static void show_cpuinfo_misc(struct seq_file *m, struct cpuinfo_x86 *c)  		   static_cpu_has_bug(X86_BUG_FDIV) ? "yes" : "no",  		   static_cpu_has_bug(X86_BUG_F00F) ? "yes" : "no",  		   static_cpu_has_bug(X86_BUG_COMA) ? "yes" : "no", -		   c->hard_math ? "yes" : "no", -		   c->hard_math ? "yes" : "no", +		   static_cpu_has(X86_FEATURE_FPU) ? "yes" : "no", +		   static_cpu_has(X86_FEATURE_FPU) ? "yes" : "no",  		   c->cpuid_level,  		   c->wp_works_ok ? "yes" : "no");  } diff --git a/arch/x86/kernel/cpu/rdrand.c b/arch/x86/kernel/cpu/rdrand.c index feca286c2bb..88db010845c 100644 --- a/arch/x86/kernel/cpu/rdrand.c +++ b/arch/x86/kernel/cpu/rdrand.c @@ -52,7 +52,7 @@ static inline int rdrand_long(unsigned long *v)   */  #define RESEED_LOOP ((512*128)/sizeof(unsigned long)) -void __cpuinit x86_init_rdrand(struct cpuinfo_x86 *c) +void x86_init_rdrand(struct cpuinfo_x86 *c)  {  #ifdef CONFIG_ARCH_RANDOM  	unsigned long tmp; diff --git a/arch/x86/kernel/cpu/scattered.c b/arch/x86/kernel/cpu/scattered.c index d92b5dad15d..f2cc63e9cf0 100644 --- a/arch/x86/kernel/cpu/scattered.c +++ b/arch/x86/kernel/cpu/scattered.c @@ -24,13 +24,13 @@ enum cpuid_regs {  	CR_EBX  }; -void __cpuinit init_scattered_cpuid_features(struct cpuinfo_x86 *c) +void init_scattered_cpuid_features(struct cpuinfo_x86 *c)  {  	u32 max_level;  	u32 regs[4];  	const struct cpuid_bit *cb; -	static const struct cpuid_bit __cpuinitconst cpuid_bits[] = { +	static const struct cpuid_bit cpuid_bits[] = {  		{ X86_FEATURE_DTHERM,		CR_EAX, 0, 0x00000006, 0 },  		{ X86_FEATURE_IDA,		CR_EAX, 1, 0x00000006, 0 },  		{ X86_FEATURE_ARAT,		CR_EAX, 2, 0x00000006, 0 }, diff --git a/arch/x86/kernel/cpu/topology.c b/arch/x86/kernel/cpu/topology.c index 4397e987a1c..4c60eaf0571 100644 --- a/arch/x86/kernel/cpu/topology.c +++ b/arch/x86/kernel/cpu/topology.c @@ -26,7 +26,7 @@   * exists, use it for populating initial_apicid and cpu topology   * detection.   */ -void __cpuinit detect_extended_topology(struct cpuinfo_x86 *c) +void detect_extended_topology(struct cpuinfo_x86 *c)  {  #ifdef CONFIG_SMP  	unsigned int eax, ebx, ecx, edx, sub_index; diff --git a/arch/x86/kernel/cpu/transmeta.c b/arch/x86/kernel/cpu/transmeta.c index 28000743bbb..aa0430d69b9 100644 --- a/arch/x86/kernel/cpu/transmeta.c +++ b/arch/x86/kernel/cpu/transmeta.c @@ -5,7 +5,7 @@  #include <asm/msr.h>  #include "cpu.h" -static void __cpuinit early_init_transmeta(struct cpuinfo_x86 *c) +static void early_init_transmeta(struct cpuinfo_x86 *c)  {  	u32 xlvl; @@ -17,7 +17,7 @@ static void __cpuinit early_init_transmeta(struct cpuinfo_x86 *c)  	}  } -static void __cpuinit init_transmeta(struct cpuinfo_x86 *c) +static void init_transmeta(struct cpuinfo_x86 *c)  {  	unsigned int cap_mask, uk, max, dummy;  	unsigned int cms_rev1, cms_rev2; @@ -98,7 +98,7 @@ static void __cpuinit init_transmeta(struct cpuinfo_x86 *c)  #endif  } -static const struct cpu_dev __cpuinitconst transmeta_cpu_dev = { +static const struct cpu_dev transmeta_cpu_dev = {  	.c_vendor	= "Transmeta",  	.c_ident	= { "GenuineTMx86", "TransmetaCPU" },  	.c_early_init	= early_init_transmeta, diff --git a/arch/x86/kernel/cpu/umc.c b/arch/x86/kernel/cpu/umc.c index fd2c37bf7ac..202759a1412 100644 --- a/arch/x86/kernel/cpu/umc.c +++ b/arch/x86/kernel/cpu/umc.c @@ -8,7 +8,7 @@   * so no special init takes place.   */ -static const struct cpu_dev __cpuinitconst umc_cpu_dev = { +static const struct cpu_dev umc_cpu_dev = {  	.c_vendor	= "UMC",  	.c_ident	= { "UMC UMC UMC" },  	.c_models = { diff --git a/arch/x86/kernel/cpu/vmware.c b/arch/x86/kernel/cpu/vmware.c index 03a36321ec5..7076878404e 100644 --- a/arch/x86/kernel/cpu/vmware.c +++ b/arch/x86/kernel/cpu/vmware.c @@ -122,7 +122,7 @@ static bool __init vmware_platform(void)   * so that the kernel could just trust the hypervisor with providing a   * reliable virtual TSC that is suitable for timekeeping.   */ -static void __cpuinit vmware_set_cpu_features(struct cpuinfo_x86 *c) +static void vmware_set_cpu_features(struct cpuinfo_x86 *c)  {  	set_cpu_cap(c, X86_FEATURE_CONSTANT_TSC);  	set_cpu_cap(c, X86_FEATURE_TSC_RELIABLE); | 
