KVM: arm/arm64: Enforce PTE mappings at stage2 when needed
Commit 6794ad5443 ("KVM: arm/arm64: Fix unintended stage 2 PMD mappings")
made the checks for skipping huge mappings stricter. However, it
introduced a bug: we could still use a huge mapping while ignoring the
flag requesting PTE mappings, because vma_pagesize was not reset to
PAGE_SIZE. Also, the checks did not cover PUD huge pages, which were
under review during the same period. This patch fixes both issues.

Fixes: 6794ad5443 ("KVM: arm/arm64: Fix unintended stage 2 PMD mappings")
Reported-by: Zenghui Yu <yuzenghui@huawei.com>
Cc: Zenghui Yu <yuzenghui@huawei.com>
Cc: Christoffer Dall <christoffer.dall@arm.com>
Signed-off-by: Suzuki K Poulose <suzuki.poulose@arm.com>
Signed-off-by: Marc Zyngier <marc.zyngier@arm.com>
parent 7494cec6cb
commit a80868f398
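The core of the fix is visible in one hunk: the PTE-forcing conditions are now evaluated only once the VMA page size is known, and they reset the mapping granule as well. A minimal sketch of the corrected flow (taken from the diff below, with all surrounding fault-handling context elided):

	vma_pagesize = vma_kernel_pagesize(vma);
	if (logging_active ||
	    !fault_supports_stage2_huge_mapping(memslot, hva, vma_pagesize)) {
		force_pte = true;
		vma_pagesize = PAGE_SIZE;	/* the reset the old code was missing */
	}

With vma_pagesize reliably at PAGE_SIZE in the force_pte case, the later huge-mapping branch in user_mem_abort() no longer needs its own !force_pte guard, which is why the final hunk can drop it.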
@@ -1594,8 +1594,9 @@ static void kvm_send_hwpoison_signal(unsigned long address,
 	send_sig_mceerr(BUS_MCEERR_AR, (void __user *)address, lsb, current);
 }
 
-static bool fault_supports_stage2_pmd_mappings(struct kvm_memory_slot *memslot,
-					       unsigned long hva)
+static bool fault_supports_stage2_huge_mapping(struct kvm_memory_slot *memslot,
+					       unsigned long hva,
+					       unsigned long map_size)
 {
 	gpa_t gpa_start;
 	hva_t uaddr_start, uaddr_end;
@@ -1610,34 +1611,34 @@ static bool fault_supports_stage2_pmd_mappings(struct kvm_memory_slot *memslot,
 
 	/*
 	 * Pages belonging to memslots that don't have the same alignment
-	 * within a PMD for userspace and IPA cannot be mapped with stage-2
-	 * PMD entries, because we'll end up mapping the wrong pages.
+	 * within a PMD/PUD for userspace and IPA cannot be mapped with stage-2
+	 * PMD/PUD entries, because we'll end up mapping the wrong pages.
 	 *
 	 * Consider a layout like the following:
 	 *
 	 *    memslot->userspace_addr:
 	 *    +-----+--------------------+--------------------+---+
-	 *    |abcde|fgh  Stage-1 PMD    |    Stage-1 PMD   tv|xyz|
+	 *    |abcde|fgh  Stage-1 block  |    Stage-1 block tv|xyz|
 	 *    +-----+--------------------+--------------------+---+
 	 *
 	 *    memslot->base_gfn << PAGE_SIZE:
 	 *      +---+--------------------+--------------------+-----+
-	 *      |abc|def  Stage-2 PMD    |    Stage-2 PMD     |tvxyz|
+	 *      |abc|def  Stage-2 block  |    Stage-2 block   |tvxyz|
 	 *      +---+--------------------+--------------------+-----+
 	 *
-	 * If we create those stage-2 PMDs, we'll end up with this incorrect
+	 * If we create those stage-2 blocks, we'll end up with this incorrect
 	 * mapping:
 	 *   d -> f
 	 *   e -> g
 	 *   f -> h
 	 */
-	if ((gpa_start & ~S2_PMD_MASK) != (uaddr_start & ~S2_PMD_MASK))
+	if ((gpa_start & (map_size - 1)) != (uaddr_start & (map_size - 1)))
 		return false;
 
 	/*
 	 * Next, let's make sure we're not trying to map anything not covered
-	 * by the memslot. This means we have to prohibit PMD size mappings
-	 * for the beginning and end of a non-PMD aligned and non-PMD sized
+	 * by the memslot. This means we have to prohibit block size mappings
+	 * for the beginning and end of a non-block aligned and non-block sized
 	 * memory slot (illustrated by the head and tail parts of the
 	 * userspace view above containing pages 'abcde' and 'xyz',
 	 * respectively).
@@ -1646,8 +1647,8 @@ static bool fault_supports_stage2_pmd_mappings(struct kvm_memory_slot *memslot,
 	 * userspace_addr or the base_gfn, as both are equally aligned (per
 	 * the check above) and equally sized.
 	 */
-	return (hva & S2_PMD_MASK) >= uaddr_start &&
-	       (hva & S2_PMD_MASK) + S2_PMD_SIZE <= uaddr_end;
+	return (hva & ~(map_size - 1)) >= uaddr_start &&
+	       (hva & ~(map_size - 1)) + map_size <= uaddr_end;
 }
 
 static int user_mem_abort(struct kvm_vcpu *vcpu, phys_addr_t fault_ipa,
@@ -1676,12 +1677,6 @@ static int user_mem_abort(struct kvm_vcpu *vcpu, phys_addr_t fault_ipa,
 		return -EFAULT;
 	}
 
-	if (!fault_supports_stage2_pmd_mappings(memslot, hva))
-		force_pte = true;
-
-	if (logging_active)
-		force_pte = true;
-
 	/* Let's check if we will get back a huge page backed by hugetlbfs */
 	down_read(&current->mm->mmap_sem);
 	vma = find_vma_intersection(current->mm, hva, hva + 1);
@@ -1692,6 +1687,12 @@ static int user_mem_abort(struct kvm_vcpu *vcpu, phys_addr_t fault_ipa,
 	}
 
 	vma_pagesize = vma_kernel_pagesize(vma);
+	if (logging_active ||
+	    !fault_supports_stage2_huge_mapping(memslot, hva, vma_pagesize)) {
+		force_pte = true;
+		vma_pagesize = PAGE_SIZE;
+	}
+
 	/*
 	 * The stage2 has a minimum of 2 level table (For arm64 see
 	 * kvm_arm_setup_stage2()). Hence, we are guaranteed that we can
@@ -1699,11 +1700,9 @@ static int user_mem_abort(struct kvm_vcpu *vcpu, phys_addr_t fault_ipa,
 	 * As for PUD huge maps, we must make sure that we have at least
 	 * 3 levels, i.e, PMD is not folded.
 	 */
-	if ((vma_pagesize == PMD_SIZE ||
-	     (vma_pagesize == PUD_SIZE && kvm_stage2_has_pmd(kvm))) &&
-	    !force_pte) {
+	if (vma_pagesize == PMD_SIZE ||
+	    (vma_pagesize == PUD_SIZE && kvm_stage2_has_pmd(kvm)))
 		gfn = (fault_ipa & huge_page_mask(hstate_vma(vma))) >> PAGE_SHIFT;
-	}
 	up_read(&current->mm->mmap_sem);
 
 	/* We need minimum second+third level pages */
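For reference, the rewritten helper is pure mask arithmetic: the first check requires the IPA and the userspace address to share the same offset within a map_size-sized block, and the second requires the whole block around hva to lie inside the memslot. A small self-contained demonstration (a sketch: supports_huge() and all addresses here are hypothetical, not kernel code):

	#include <stdbool.h>
	#include <stdint.h>
	#include <stdio.h>

	#define PMD_SIZE (2UL * 1024 * 1024)	/* 2 MiB block on a 4K-page arm64 */

	/* Same two checks as fault_supports_stage2_huge_mapping(). */
	static bool supports_huge(uint64_t gpa_start, uint64_t uaddr_start,
				  uint64_t uaddr_end, uint64_t hva,
				  uint64_t map_size)
	{
		if ((gpa_start & (map_size - 1)) != (uaddr_start & (map_size - 1)))
			return false;
		return (hva & ~(map_size - 1)) >= uaddr_start &&
		       (hva & ~(map_size - 1)) + map_size <= uaddr_end;
	}

	int main(void)
	{
		/* IPA is 2 MiB aligned but the userspace VA is off by one page:
		 * a block mapping would translate the wrong pages ('d -> f'). */
		printf("%d\n", supports_huge(0x80000000, 0x40001000,
					     0x40401000, 0x40002000, PMD_SIZE));	/* 0 */
		/* Same layout with matching offsets: a block mapping is safe. */
		printf("%d\n", supports_huge(0x80000000, 0x40000000,
					     0x40400000, 0x40002000, PMD_SIZE));	/* 1 */
		return 0;
	}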