675357362a
This reverts commit 43858b4f25cf0adc5c2ca9cf5ce5fdf2532941e5. The reason I removed the leave_mm() calls in question is because the heuristic wasn't needed after that patch. With the original version of my PCID series, we never flushed a "lazy cpu" (i.e. a CPU running kernel thread) due a flush on the loaded mm. Unfortunately, that caused architectural issues, so now I've reinstated these flushes on non-PCID systems in: commit b956575bed91 ("x86/mm: Flush more aggressively in lazy TLB mode"). That, in turn, gives us a power management and occasionally performance regression as compared to old kernels: a process that goes into a deep idle state on a given CPU and gets its mm flushed due to activity on a different CPU will wake the idle CPU. Reinstate the old ugly heuristic: if a CPU goes into ACPI C3 or an intel_idle state that is likely to cause a TLB flush gets its mm switched to init_mm before going idle. FWIW, this heuristic is lousy. Whether we should change CR3 before idle isn't a good hint except insofar as the performance hit is a bit lower if the TLB is getting flushed by the idle code anyway. What we really want to know is whether we anticipate being idle long enough that the mm is likely to be flushed before we wake up. This is more a matter of the expected latency than the idle state that gets chosen. This heuristic also completely fails on systems that don't know whether the TLB will be flushed (e.g. AMD systems?). OTOH it may be a bit obsolete anyway -- PCID systems don't presently benefit from this heuristic at all. We also shouldn't do this callback from innermost bit of the idle code due to the RCU nastiness it causes. All the information need is available before rcu_idle_enter() needs to happen. Signed-off-by: Andy Lutomirski <luto@kernel.org> Cc: Borislav Petkov <bp@alien8.de> Cc: Borislav Petkov <bpetkov@suse.de> Cc: Brian Gerst <brgerst@gmail.com> Cc: Denys Vlasenko <dvlasenk@redhat.com> Cc: H. Peter Anvin <hpa@zytor.com> Cc: Josh Poimboeuf <jpoimboe@redhat.com> Cc: Linus Torvalds <torvalds@linux-foundation.org> Cc: Peter Zijlstra <peterz@infradead.org> Cc: Thomas Gleixner <tglx@linutronix.de> Fixes: 43858b4f25cf "x86/mm: Stop calling leave_mm() in idle code" Link: http://lkml.kernel.org/r/c513bbd4e653747213e05bc7062de000bf0202a5.1509793738.git.luto@kernel.org Signed-off-by: Ingo Molnar <mingo@kernel.org>
151 lines
4.1 KiB
C
151 lines
4.1 KiB
C
/*
|
|
* Copyright (C) 1999 VA Linux Systems
|
|
* Copyright (C) 1999 Walt Drummond <drummond@valinux.com>
|
|
* Copyright (C) 2000,2001 J.I. Lee <jung-ik.lee@intel.com>
|
|
* Copyright (C) 2001,2002 Paul Diefenbaugh <paul.s.diefenbaugh@intel.com>
|
|
*
|
|
* ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, write to the Free Software
|
|
* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
|
*
|
|
* ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
|
*/
|
|
|
|
#ifndef _ASM_ACPI_H
|
|
#define _ASM_ACPI_H
|
|
|
|
#ifdef __KERNEL__
|
|
|
|
#include <acpi/pdc_intel.h>
|
|
|
|
#include <linux/init.h>
|
|
#include <linux/numa.h>
|
|
#include <asm/numa.h>
|
|
|
|
#ifdef CONFIG_ACPI
|
|
extern int acpi_lapic;
|
|
#define acpi_disabled 0 /* ACPI always enabled on IA64 */
|
|
#define acpi_noirq 0 /* ACPI always enabled on IA64 */
|
|
#define acpi_pci_disabled 0 /* ACPI PCI always enabled on IA64 */
|
|
#define acpi_strict 1 /* no ACPI spec workarounds on IA64 */
|
|
|
|
static inline bool acpi_has_cpu_in_madt(void)
|
|
{
|
|
return !!acpi_lapic;
|
|
}
|
|
#endif
|
|
#define acpi_processor_cstate_check(x) (x) /* no idle limits on IA64 :) */
|
|
static inline void disable_acpi(void) { }
|
|
|
|
#ifdef CONFIG_IA64_GENERIC
|
|
const char *acpi_get_sysname (void);
|
|
#else
|
|
static inline const char *acpi_get_sysname (void)
|
|
{
|
|
# if defined (CONFIG_IA64_HP_SIM)
|
|
return "hpsim";
|
|
# elif defined (CONFIG_IA64_HP_ZX1)
|
|
return "hpzx1";
|
|
# elif defined (CONFIG_IA64_HP_ZX1_SWIOTLB)
|
|
return "hpzx1_swiotlb";
|
|
# elif defined (CONFIG_IA64_SGI_SN2)
|
|
return "sn2";
|
|
# elif defined (CONFIG_IA64_SGI_UV)
|
|
return "uv";
|
|
# elif defined (CONFIG_IA64_DIG)
|
|
return "dig";
|
|
# elif defined(CONFIG_IA64_DIG_VTD)
|
|
return "dig_vtd";
|
|
# else
|
|
# error Unknown platform. Fix acpi.c.
|
|
# endif
|
|
}
|
|
#endif
|
|
int acpi_request_vector (u32 int_type);
|
|
int acpi_gsi_to_irq (u32 gsi, unsigned int *irq);
|
|
|
|
/* Low-level suspend routine. */
|
|
extern int acpi_suspend_lowlevel(void);
|
|
|
|
extern unsigned long acpi_wakeup_address;
|
|
|
|
/*
|
|
* Record the cpei override flag and current logical cpu. This is
|
|
* useful for CPU removal.
|
|
*/
|
|
extern unsigned int can_cpei_retarget(void);
|
|
extern unsigned int is_cpu_cpei_target(unsigned int cpu);
|
|
extern void set_cpei_target_cpu(unsigned int cpu);
|
|
extern unsigned int get_cpei_target_cpu(void);
|
|
extern void prefill_possible_map(void);
|
|
#ifdef CONFIG_ACPI_HOTPLUG_CPU
|
|
extern int additional_cpus;
|
|
#else
|
|
#define additional_cpus 0
|
|
#endif
|
|
|
|
#ifdef CONFIG_ACPI_NUMA
|
|
#if MAX_NUMNODES > 256
|
|
#define MAX_PXM_DOMAINS MAX_NUMNODES
|
|
#else
|
|
#define MAX_PXM_DOMAINS (256)
|
|
#endif
|
|
extern int pxm_to_nid_map[MAX_PXM_DOMAINS];
|
|
extern int __initdata nid_to_pxm_map[MAX_NUMNODES];
|
|
#endif
|
|
|
|
static inline bool arch_has_acpi_pdc(void) { return true; }
|
|
static inline void arch_acpi_set_pdc_bits(u32 *buf)
|
|
{
|
|
buf[2] |= ACPI_PDC_EST_CAPABILITY_SMP;
|
|
}
|
|
|
|
#define acpi_unlazy_tlb(x)
|
|
|
|
#ifdef CONFIG_ACPI_NUMA
|
|
extern cpumask_t early_cpu_possible_map;
|
|
#define for_each_possible_early_cpu(cpu) \
|
|
for_each_cpu((cpu), &early_cpu_possible_map)
|
|
|
|
static inline void per_cpu_scan_finalize(int min_cpus, int reserve_cpus)
|
|
{
|
|
int low_cpu, high_cpu;
|
|
int cpu;
|
|
int next_nid = 0;
|
|
|
|
low_cpu = cpumask_weight(&early_cpu_possible_map);
|
|
|
|
high_cpu = max(low_cpu, min_cpus);
|
|
high_cpu = min(high_cpu + reserve_cpus, NR_CPUS);
|
|
|
|
for (cpu = low_cpu; cpu < high_cpu; cpu++) {
|
|
cpumask_set_cpu(cpu, &early_cpu_possible_map);
|
|
if (node_cpuid[cpu].nid == NUMA_NO_NODE) {
|
|
node_cpuid[cpu].nid = next_nid;
|
|
next_nid++;
|
|
if (next_nid >= num_online_nodes())
|
|
next_nid = 0;
|
|
}
|
|
}
|
|
}
|
|
|
|
extern void acpi_numa_fixup(void);
|
|
|
|
#endif /* CONFIG_ACPI_NUMA */
|
|
|
|
#endif /*__KERNEL__*/
|
|
|
|
#endif /*_ASM_ACPI_H*/
|