Merge branch 'x86-platform-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/tip (57e88b43) · Commits · e / devices / android_kernel_oneplus_sm8150

MAINTAINERS

+2 −0

Original line number	Diff line number	Diff line
		@@ -6312,6 +6312,7 @@ L: devel@linuxdriverproject.org
		S: Maintained
		F: Documentation/networking/netvsc.txt
		F: arch/x86/include/asm/mshyperv.h
		F: arch/x86/include/asm/trace/hyperv.h
		F: arch/x86/include/uapi/asm/hyperv.h
		F: arch/x86/kernel/cpu/mshyperv.c
		F: arch/x86/hyperv
		@@ -6325,6 +6326,7 @@ F: drivers/uio/uio_hv_generic.c
		F: drivers/video/fbdev/hyperv_fb.c
		F: net/vmw_vsock/hyperv_transport.c
		F: include/linux/hyperv.h
		F: include/uapi/linux/hyperv.h
		F: tools/hv/
		F: Documentation/ABI/stable/sysfs-bus-vmbus

arch/x86/Kbuild

+1 −1

Original line number	Diff line number	Diff line
		@@ -8,7 +8,7 @@ obj-$(CONFIG_KVM) += kvm/
		obj-$(CONFIG_XEN) += xen/

		# Hyper-V paravirtualization support
		obj-$(CONFIG_HYPERVISOR_GUEST) += hyperv/
		obj-$(subst m,y,$(CONFIG_HYPERV)) += hyperv/

		obj-y += realmode/
		obj-y += kernel/

arch/x86/hyperv/Makefile

+1 −1

Original line number	Diff line number	Diff line
		obj-y := hv_init.o
		obj-y := hv_init.o mmu.o

arch/x86/hyperv/hv_init.c

+40 −50

Original line number	Diff line number	Diff line
		@@ -26,6 +26,8 @@
		#include <linux/mm.h>
		#include <linux/clockchips.h>
		#include <linux/hyperv.h>
		#include <linux/slab.h>
		#include <linux/cpuhotplug.h>

		#ifdef CONFIG_HYPERV_TSCPAGE

		@@ -75,10 +77,25 @@ static struct clocksource hyperv_cs_msr = {
		.flags = CLOCK_SOURCE_IS_CONTINUOUS,
		};

		static void *hypercall_pg;
		void *hv_hypercall_pg;
		EXPORT_SYMBOL_GPL(hv_hypercall_pg);
		struct clocksource *hyperv_cs;
		EXPORT_SYMBOL_GPL(hyperv_cs);

		u32 *hv_vp_index;
		EXPORT_SYMBOL_GPL(hv_vp_index);

		static int hv_cpu_init(unsigned int cpu)
		{
		u64 msr_vp_index;

		hv_get_vp_index(msr_vp_index);

		hv_vp_index[smp_processor_id()] = msr_vp_index;

		return 0;
		}

		/*
		* This function is to be invoked early in the boot sequence after the
		* hypervisor has been detected.
		@@ -94,6 +111,16 @@ void hyperv_init(void)
		if (x86_hyper != &x86_hyper_ms_hyperv)
		return;

		/* Allocate percpu VP index */
		hv_vp_index = kmalloc_array(num_possible_cpus(), sizeof(*hv_vp_index),
		GFP_KERNEL);
		if (!hv_vp_index)
		return;

		if (cpuhp_setup_state(CPUHP_AP_ONLINE_DYN, "x86/hyperv_init:online",
		hv_cpu_init, NULL) < 0)
		goto free_vp_index;

		/*
		* Setup the hypercall page and enable hypercalls.
		* 1. Register the guest ID
		@@ -102,17 +129,19 @@ void hyperv_init(void)
		guest_id = generate_guest_id(0, LINUX_VERSION_CODE, 0);
		wrmsrl(HV_X64_MSR_GUEST_OS_ID, guest_id);

		hypercall_pg = __vmalloc(PAGE_SIZE, GFP_KERNEL, PAGE_KERNEL_RX);
		if (hypercall_pg == NULL) {
		hv_hypercall_pg = __vmalloc(PAGE_SIZE, GFP_KERNEL, PAGE_KERNEL_RX);
		if (hv_hypercall_pg == NULL) {
		wrmsrl(HV_X64_MSR_GUEST_OS_ID, 0);
		return;
		goto free_vp_index;
		}

		rdmsrl(HV_X64_MSR_HYPERCALL, hypercall_msr.as_uint64);
		hypercall_msr.enable = 1;
		hypercall_msr.guest_physical_address = vmalloc_to_pfn(hypercall_pg);
		hypercall_msr.guest_physical_address = vmalloc_to_pfn(hv_hypercall_pg);
		wrmsrl(HV_X64_MSR_HYPERCALL, hypercall_msr.as_uint64);

		hyper_alloc_mmu();

		/*
		* Register Hyper-V specific clocksource.
		*/
		@@ -148,6 +177,12 @@ void hyperv_init(void)
		hyperv_cs = &hyperv_cs_msr;
		if (ms_hyperv.features & HV_X64_MSR_TIME_REF_COUNT_AVAILABLE)
		clocksource_register_hz(&hyperv_cs_msr, NSEC_PER_SEC/100);

		return;

		free_vp_index:
		kfree(hv_vp_index);
		hv_vp_index = NULL;
		}

		/*
		@@ -170,51 +205,6 @@ void hyperv_cleanup(void)
		}
		EXPORT_SYMBOL_GPL(hyperv_cleanup);

		/*
		* hv_do_hypercall- Invoke the specified hypercall
		*/
		u64 hv_do_hypercall(u64 control, void input, void output)
		{
		u64 input_address = (input) ? virt_to_phys(input) : 0;
		u64 output_address = (output) ? virt_to_phys(output) : 0;
		#ifdef CONFIG_X86_64
		u64 hv_status = 0;

		if (!hypercall_pg)
		return (u64)ULLONG_MAX;

		__asm__ __volatile__("mov %0, %%r8" : : "r" (output_address) : "r8");
		__asm__ __volatile__("call *%3" : "=a" (hv_status) :
		"c" (control), "d" (input_address),
		"m" (hypercall_pg));

		return hv_status;

		#else

		u32 control_hi = control >> 32;
		u32 control_lo = control & 0xFFFFFFFF;
		u32 hv_status_hi = 1;
		u32 hv_status_lo = 1;
		u32 input_address_hi = input_address >> 32;
		u32 input_address_lo = input_address & 0xFFFFFFFF;
		u32 output_address_hi = output_address >> 32;
		u32 output_address_lo = output_address & 0xFFFFFFFF;

		if (!hypercall_pg)
		return (u64)ULLONG_MAX;

		__asm__ __volatile__ ("call *%8" : "=d"(hv_status_hi),
		"=a"(hv_status_lo) : "d" (control_hi),
		"a" (control_lo), "b" (input_address_hi),
		"c" (input_address_lo), "D"(output_address_hi),
		"S"(output_address_lo), "m" (hypercall_pg));

		return hv_status_lo \| ((u64)hv_status_hi << 32);
		#endif /* !x86_64 */
		}
		EXPORT_SYMBOL_GPL(hv_do_hypercall);

		void hyperv_report_panic(struct pt_regs *regs)
		{
		static bool panic_reported;

arch/x86/hyperv/mmu.c

0 → 100644

+272 −0

Original line number	Diff line number	Diff line
		#define pr_fmt(fmt) "Hyper-V: " fmt

		#include <linux/hyperv.h>
		#include <linux/log2.h>
		#include <linux/slab.h>
		#include <linux/types.h>

		#include <asm/fpu/api.h>
		#include <asm/mshyperv.h>
		#include <asm/msr.h>
		#include <asm/tlbflush.h>

		#define CREATE_TRACE_POINTS
		#include <asm/trace/hyperv.h>

		/* HvFlushVirtualAddressSpace, HvFlushVirtualAddressList hypercalls */
		struct hv_flush_pcpu {
		u64 address_space;
		u64 flags;
		u64 processor_mask;
		u64 gva_list[];
		};

		/* HvFlushVirtualAddressSpaceEx, HvFlushVirtualAddressListEx hypercalls */
		struct hv_flush_pcpu_ex {
		u64 address_space;
		u64 flags;
		struct {
		u64 format;
		u64 valid_bank_mask;
		u64 bank_contents[];
		} hv_vp_set;
		u64 gva_list[];
		};

		/* Each gva in gva_list encodes up to 4096 pages to flush */
		#define HV_TLB_FLUSH_UNIT (4096 * PAGE_SIZE)

		static struct hv_flush_pcpu __percpu *pcpu_flush;

		static struct hv_flush_pcpu_ex __percpu *pcpu_flush_ex;

		/*
		* Fills in gva_list starting from offset. Returns the number of items added.
		*/
		static inline int fill_gva_list(u64 gva_list[], int offset,
		unsigned long start, unsigned long end)
		{
		int gva_n = offset;
		unsigned long cur = start, diff;

		do {
		diff = end > cur ? end - cur : 0;

		gva_list[gva_n] = cur & PAGE_MASK;
		/*
		* Lower 12 bits encode the number of additional
		* pages to flush (in addition to the 'cur' page).
		*/
		if (diff >= HV_TLB_FLUSH_UNIT)
		gva_list[gva_n] \|= ~PAGE_MASK;
		else if (diff)
		gva_list[gva_n] \|= (diff - 1) >> PAGE_SHIFT;

		cur += HV_TLB_FLUSH_UNIT;
		gva_n++;

		} while (cur < end);

		return gva_n - offset;
		}

		/* Return the number of banks in the resulting vp_set */
		static inline int cpumask_to_vp_set(struct hv_flush_pcpu_ex *flush,
		const struct cpumask *cpus)
		{
		int cpu, vcpu, vcpu_bank, vcpu_offset, nr_bank = 1;

		/*
		* Some banks may end up being empty but this is acceptable.
		*/
		for_each_cpu(cpu, cpus) {
		vcpu = hv_cpu_number_to_vp_number(cpu);
		vcpu_bank = vcpu / 64;
		vcpu_offset = vcpu % 64;

		/* valid_bank_mask can represent up to 64 banks */
		if (vcpu_bank >= 64)
		return 0;

		__set_bit(vcpu_offset, (unsigned long *)
		&flush->hv_vp_set.bank_contents[vcpu_bank]);
		if (vcpu_bank >= nr_bank)
		nr_bank = vcpu_bank + 1;
		}
		flush->hv_vp_set.valid_bank_mask = GENMASK_ULL(nr_bank - 1, 0);

		return nr_bank;
		}

		static void hyperv_flush_tlb_others(const struct cpumask *cpus,
		const struct flush_tlb_info *info)
		{
		int cpu, vcpu, gva_n, max_gvas;
		struct hv_flush_pcpu *flush;
		u64 status = U64_MAX;
		unsigned long flags;

		trace_hyperv_mmu_flush_tlb_others(cpus, info);

		if (!pcpu_flush \|\| !hv_hypercall_pg)
		goto do_native;

		if (cpumask_empty(cpus))
		return;

		local_irq_save(flags);

		flush = this_cpu_ptr(pcpu_flush);

		if (info->mm) {
		flush->address_space = virt_to_phys(info->mm->pgd);
		flush->flags = 0;
		} else {
		flush->address_space = 0;
		flush->flags = HV_FLUSH_ALL_VIRTUAL_ADDRESS_SPACES;
		}

		flush->processor_mask = 0;
		if (cpumask_equal(cpus, cpu_present_mask)) {
		flush->flags \|= HV_FLUSH_ALL_PROCESSORS;
		} else {
		for_each_cpu(cpu, cpus) {
		vcpu = hv_cpu_number_to_vp_number(cpu);
		if (vcpu >= 64)
		goto do_native;

		__set_bit(vcpu, (unsigned long *)
		&flush->processor_mask);
		}
		}

		/*
		* We can flush not more than max_gvas with one hypercall. Flush the
		* whole address space if we were asked to do more.
		*/
		max_gvas = (PAGE_SIZE - sizeof(*flush)) / sizeof(flush->gva_list[0]);

		if (info->end == TLB_FLUSH_ALL) {
		flush->flags \|= HV_FLUSH_NON_GLOBAL_MAPPINGS_ONLY;
		status = hv_do_hypercall(HVCALL_FLUSH_VIRTUAL_ADDRESS_SPACE,
		flush, NULL);
		} else if (info->end &&
		((info->end - info->start)/HV_TLB_FLUSH_UNIT) > max_gvas) {
		status = hv_do_hypercall(HVCALL_FLUSH_VIRTUAL_ADDRESS_SPACE,
		flush, NULL);
		} else {
		gva_n = fill_gva_list(flush->gva_list, 0,
		info->start, info->end);
		status = hv_do_rep_hypercall(HVCALL_FLUSH_VIRTUAL_ADDRESS_LIST,
		gva_n, 0, flush, NULL);
		}

		local_irq_restore(flags);

		if (!(status & HV_HYPERCALL_RESULT_MASK))
		return;
		do_native:
		native_flush_tlb_others(cpus, info);
		}

		static void hyperv_flush_tlb_others_ex(const struct cpumask *cpus,
		const struct flush_tlb_info *info)
		{
		int nr_bank = 0, max_gvas, gva_n;
		struct hv_flush_pcpu_ex *flush;
		u64 status = U64_MAX;
		unsigned long flags;

		trace_hyperv_mmu_flush_tlb_others(cpus, info);

		if (!pcpu_flush_ex \|\| !hv_hypercall_pg)
		goto do_native;

		if (cpumask_empty(cpus))
		return;

		local_irq_save(flags);

		flush = this_cpu_ptr(pcpu_flush_ex);

		if (info->mm) {
		flush->address_space = virt_to_phys(info->mm->pgd);
		flush->flags = 0;
		} else {
		flush->address_space = 0;
		flush->flags = HV_FLUSH_ALL_VIRTUAL_ADDRESS_SPACES;
		}

		flush->hv_vp_set.valid_bank_mask = 0;

		if (!cpumask_equal(cpus, cpu_present_mask)) {
		flush->hv_vp_set.format = HV_GENERIC_SET_SPARCE_4K;
		nr_bank = cpumask_to_vp_set(flush, cpus);
		}

		if (!nr_bank) {
		flush->hv_vp_set.format = HV_GENERIC_SET_ALL;
		flush->flags \|= HV_FLUSH_ALL_PROCESSORS;
		}

		/*
		* We can flush not more than max_gvas with one hypercall. Flush the
		* whole address space if we were asked to do more.
		*/
		max_gvas =
		(PAGE_SIZE - sizeof(flush) - nr_bank
		sizeof(flush->hv_vp_set.bank_contents[0])) /
		sizeof(flush->gva_list[0]);

		if (info->end == TLB_FLUSH_ALL) {
		flush->flags \|= HV_FLUSH_NON_GLOBAL_MAPPINGS_ONLY;
		status = hv_do_rep_hypercall(
		HVCALL_FLUSH_VIRTUAL_ADDRESS_SPACE_EX,
		0, nr_bank + 2, flush, NULL);
		} else if (info->end &&
		((info->end - info->start)/HV_TLB_FLUSH_UNIT) > max_gvas) {
		status = hv_do_rep_hypercall(
		HVCALL_FLUSH_VIRTUAL_ADDRESS_SPACE_EX,
		0, nr_bank + 2, flush, NULL);
		} else {
		gva_n = fill_gva_list(flush->gva_list, nr_bank,
		info->start, info->end);
		status = hv_do_rep_hypercall(
		HVCALL_FLUSH_VIRTUAL_ADDRESS_LIST_EX,
		gva_n, nr_bank + 2, flush, NULL);
		}

		local_irq_restore(flags);

		if (!(status & HV_HYPERCALL_RESULT_MASK))
		return;
		do_native:
		native_flush_tlb_others(cpus, info);
		}

		void hyperv_setup_mmu_ops(void)
		{
		if (!(ms_hyperv.hints & HV_X64_REMOTE_TLB_FLUSH_RECOMMENDED))
		return;

		setup_clear_cpu_cap(X86_FEATURE_PCID);

		if (!(ms_hyperv.hints & HV_X64_EX_PROCESSOR_MASKS_RECOMMENDED)) {
		pr_info("Using hypercall for remote TLB flush\n");
		pv_mmu_ops.flush_tlb_others = hyperv_flush_tlb_others;
		} else {
		pr_info("Using ext hypercall for remote TLB flush\n");
		pv_mmu_ops.flush_tlb_others = hyperv_flush_tlb_others_ex;
		}
		}

		void hyper_alloc_mmu(void)
		{
		if (!(ms_hyperv.hints & HV_X64_REMOTE_TLB_FLUSH_RECOMMENDED))
		return;

		if (!(ms_hyperv.hints & HV_X64_EX_PROCESSOR_MASKS_RECOMMENDED))
		pcpu_flush = __alloc_percpu(PAGE_SIZE, PAGE_SIZE);
		else
		pcpu_flush_ex = __alloc_percpu(PAGE_SIZE, PAGE_SIZE);
		}