diff options
Diffstat (limited to 'arch/arm64/mm/context.c')
| -rw-r--r-- | arch/arm64/mm/context.c | 85 | 
1 files changed, 51 insertions, 34 deletions
| diff --git a/arch/arm64/mm/context.c b/arch/arm64/mm/context.c index ab9f5f0fb2c7..301417ae2ba8 100644 --- a/arch/arm64/mm/context.c +++ b/arch/arm64/mm/context.c @@ -39,7 +39,16 @@ static cpumask_t tlb_flush_pending;  #define ASID_MASK		(~GENMASK(asid_bits - 1, 0))  #define ASID_FIRST_VERSION	(1UL << asid_bits) -#define NUM_USER_ASIDS		ASID_FIRST_VERSION + +#ifdef CONFIG_UNMAP_KERNEL_AT_EL0 +#define NUM_USER_ASIDS		(ASID_FIRST_VERSION >> 1) +#define asid2idx(asid)		(((asid) & ~ASID_MASK) >> 1) +#define idx2asid(idx)		(((idx) << 1) & ~ASID_MASK) +#else +#define NUM_USER_ASIDS		(ASID_FIRST_VERSION) +#define asid2idx(asid)		((asid) & ~ASID_MASK) +#define idx2asid(idx)		asid2idx(idx) +#endif  /* Get the ASIDBits supported by the current CPU */  static u32 get_cpu_asid_bits(void) @@ -79,13 +88,6 @@ void verify_cpu_asid_bits(void)  	}  } -static void set_reserved_asid_bits(void) -{ -	if (IS_ENABLED(CONFIG_QCOM_FALKOR_ERRATUM_1003) && -	    cpus_have_const_cap(ARM64_WORKAROUND_QCOM_FALKOR_E1003)) -		__set_bit(FALKOR_RESERVED_ASID, asid_map); -} -  static void flush_context(unsigned int cpu)  {  	int i; @@ -94,14 +96,6 @@ static void flush_context(unsigned int cpu)  	/* Update the list of reserved ASIDs and the ASID bitmap. */  	bitmap_clear(asid_map, 0, NUM_USER_ASIDS); -	set_reserved_asid_bits(); - -	/* -	 * Ensure the generation bump is observed before we xchg the -	 * active_asids. -	 */ -	smp_wmb(); -  	for_each_possible_cpu(i) {  		asid = atomic64_xchg_relaxed(&per_cpu(active_asids, i), 0);  		/* @@ -113,11 +107,14 @@ static void flush_context(unsigned int cpu)  		 */  		if (asid == 0)  			asid = per_cpu(reserved_asids, i); -		__set_bit(asid & ~ASID_MASK, asid_map); +		__set_bit(asid2idx(asid), asid_map);  		per_cpu(reserved_asids, i) = asid;  	} -	/* Queue a TLB invalidate and flush the I-cache if necessary. */ +	/* +	 * Queue a TLB invalidation for each CPU to perform on next +	 * context-switch +	 */  	cpumask_setall(&tlb_flush_pending);  } @@ -165,16 +162,16 @@ static u64 new_context(struct mm_struct *mm, unsigned int cpu)  		 * We had a valid ASID in a previous life, so try to re-use  		 * it if possible.  		 */ -		asid &= ~ASID_MASK; -		if (!__test_and_set_bit(asid, asid_map)) +		if (!__test_and_set_bit(asid2idx(asid), asid_map))  			return newasid;  	}  	/*  	 * Allocate a free ASID. If we can't find one, take a note of the -	 * currently active ASIDs and mark the TLBs as requiring flushes. -	 * We always count from ASID #1, as we use ASID #0 when setting a -	 * reserved TTBR0 for the init_mm. +	 * currently active ASIDs and mark the TLBs as requiring flushes.  We +	 * always count from ASID #2 (index 1), as we use ASID #0 when setting +	 * a reserved TTBR0 for the init_mm and we allocate ASIDs in even/odd +	 * pairs.  	 */  	asid = find_next_zero_bit(asid_map, NUM_USER_ASIDS, cur_idx);  	if (asid != NUM_USER_ASIDS) @@ -191,25 +188,35 @@ static u64 new_context(struct mm_struct *mm, unsigned int cpu)  set_asid:  	__set_bit(asid, asid_map);  	cur_idx = asid; -	return asid | generation; +	return idx2asid(asid) | generation;  }  void check_and_switch_context(struct mm_struct *mm, unsigned int cpu)  {  	unsigned long flags; -	u64 asid; +	u64 asid, old_active_asid;  	asid = atomic64_read(&mm->context.id);  	/* -	 * The memory ordering here is subtle. We rely on the control -	 * dependency between the generation read and the update of -	 * active_asids to ensure that we are synchronised with a -	 * parallel rollover (i.e. this pairs with the smp_wmb() in -	 * flush_context). +	 * The memory ordering here is subtle. +	 * If our active_asids is non-zero and the ASID matches the current +	 * generation, then we update the active_asids entry with a relaxed +	 * cmpxchg. Racing with a concurrent rollover means that either: +	 * +	 * - We get a zero back from the cmpxchg and end up waiting on the +	 *   lock. Taking the lock synchronises with the rollover and so +	 *   we are forced to see the updated generation. +	 * +	 * - We get a valid ASID back from the cmpxchg, which means the +	 *   relaxed xchg in flush_context will treat us as reserved +	 *   because atomic RmWs are totally ordered for a given location.  	 */ -	if (!((asid ^ atomic64_read(&asid_generation)) >> asid_bits) -	    && atomic64_xchg_relaxed(&per_cpu(active_asids, cpu), asid)) +	old_active_asid = atomic64_read(&per_cpu(active_asids, cpu)); +	if (old_active_asid && +	    !((asid ^ atomic64_read(&asid_generation)) >> asid_bits) && +	    atomic64_cmpxchg_relaxed(&per_cpu(active_asids, cpu), +				     old_active_asid, asid))  		goto switch_mm_fastpath;  	raw_spin_lock_irqsave(&cpu_asid_lock, flags); @@ -227,6 +234,9 @@ void check_and_switch_context(struct mm_struct *mm, unsigned int cpu)  	raw_spin_unlock_irqrestore(&cpu_asid_lock, flags);  switch_mm_fastpath: + +	arm64_apply_bp_hardening(); +  	/*  	 * Defer TTBR0_EL1 setting for user threads to uaccess_enable() when  	 * emulating PAN. @@ -235,6 +245,15 @@ switch_mm_fastpath:  		cpu_switch_mm(mm->pgd, mm);  } +/* Errata workaround post TTBRx_EL1 update. */ +asmlinkage void post_ttbr_update_workaround(void) +{ +	asm(ALTERNATIVE("nop; nop; nop", +			"ic iallu; dsb nsh; isb", +			ARM64_WORKAROUND_CAVIUM_27456, +			CONFIG_CAVIUM_ERRATUM_27456)); +} +  static int asids_init(void)  {  	asid_bits = get_cpu_asid_bits(); @@ -250,8 +269,6 @@ static int asids_init(void)  		panic("Failed to allocate bitmap for %lu ASIDs\n",  		      NUM_USER_ASIDS); -	set_reserved_asid_bits(); -  	pr_info("ASID allocator initialised with %lu entries\n", NUM_USER_ASIDS);  	return 0;  } | 
