/* SPDX-License-Identifier: GPL-2.0-or-later */
#ifndef _ASM_POWERPC_PARAVIRT_H
#define _ASM_POWERPC_PARAVIRT_H

#include <linux/jump_label.h>
#include <asm/smp.h>
#ifdef CONFIG_PPC64
#include <asm/paca.h>
#include <asm/lppaca.h>
#include <asm/hvcall.h>
#endif

#ifdef CONFIG_PPC_SPLPAR
#include <linux/smp.h>
#include <asm/kvm_guest.h>
#include <asm/cputhreads.h>

DECLARE_STATIC_KEY_FALSE(shared_processor);

static inline bool is_shared_processor(void)
{
	return static_branch_unlikely(&shared_processor);
}

#ifdef CONFIG_PARAVIRT_TIME_ACCOUNTING
extern struct static_key paravirt_steal_enabled;
extern struct static_key paravirt_steal_rq_enabled;

u64 pseries_paravirt_steal_clock(int cpu);

static inline u64 paravirt_steal_clock(int cpu)
{
	return pseries_paravirt_steal_clock(cpu);
}
#endif

/* If bit 0 is set, the cpu has been ceded, conferred, or preempted */
static inline u32 yield_count_of(int cpu)
{
	__be32 yield_count = READ_ONCE(lppaca_of(cpu).yield_count);

	return be32_to_cpu(yield_count);
}

/*
 * Spinlock code confers and prods, so don't trace the hcalls because the
 * tracing code takes spinlocks which can cause recursion deadlocks.
 *
 * These calls are made while the lock is not held: the lock slowpath yields if
 * it cannot acquire the lock, and the unlock slowpath might prod if a waiter
 * has yielded. So this may not be a problem for simple spin locks because the
 * tracing does not technically recurse on the lock, but we avoid it anyway.
 *
 * However the queued spin lock contended path is more strictly ordered: the
 * H_CONFER hcall is made after the task has queued itself on the lock, so then
 * recursing on that lock will cause the task to then queue up again behind the
 * first instance (or worse: queued spinlocks use tricks that assume a context
 * never waits on more than one spinlock, so such recursion may cause random
 * corruption in the lock code).
 */
static inline void yield_to_preempted(int cpu, u32 yield_count)
{
	plpar_hcall_norets_notrace(H_CONFER, get_hard_smp_processor_id(cpu), yield_count);
}

static inline void prod_cpu(int cpu)
{
	plpar_hcall_norets_notrace(H_PROD, get_hard_smp_processor_id(cpu));
}

static inline void yield_to_any(void)
{
	plpar_hcall_norets_notrace(H_CONFER, -1, 0);
}

static inline bool is_vcpu_idle(int vcpu)
{
	return lppaca_of(vcpu).idle;
}

static inline bool vcpu_is_dispatched(int vcpu)
{
	/*
	 * This is the yield_count. An "odd" value (low bit on) means that
	 * the processor is yielded (either because of an OS yield or a
	 * hypervisor preempt). An even value implies that the processor is
	 * currently executing.
	 */
	return (!(yield_count_of(vcpu) & 1));
}
#else
static inline bool is_shared_processor(void)
{
	return false;
}

static inline u32 yield_count_of(int cpu)
{
	return 0;
}

extern void ___bad_yield_to_preempted(void);
static inline void yield_to_preempted(int cpu, u32 yield_count)
{
	___bad_yield_to_preempted(); /* This would be a bug */
}

extern void ___bad_yield_to_any(void);
static inline void yield_to_any(void)
{
	___bad_yield_to_any(); /* This would be a bug */
}

extern void ___bad_prod_cpu(void);
static inline void prod_cpu(int cpu)
{
	___bad_prod_cpu(); /* This would be a bug */
}

static inline bool is_vcpu_idle(int vcpu)
{
	return false;
}
static inline bool vcpu_is_dispatched(int vcpu)
{
	return true;
}
#endif
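
/*
 * Defining the vcpu_is_preempted macro below lets generic code pick up this
 * implementation instead of the default vcpu_is_preempted() stub, which
 * unconditionally returns false.
 */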
#define vcpu_is_preempted vcpu_is_preempted
static inline bool vcpu_is_preempted(int cpu)
{
	/*
	 * The dispatch/yield bit alone is an imperfect indicator of
	 * whether the hypervisor has dispatched @cpu to run on a physical
	 * processor. When it is clear, @cpu is definitely not preempted.
	 * But when it is set, it means only that it *might* be, subject to
	 * other conditions. So we check other properties of the VM and
	 * @cpu first, resorting to the yield count last.
	 */

	/*
	 * Hypervisor preemption isn't possible in dedicated processor
	 * mode by definition.
	 */
	if (!is_shared_processor())
		return false;

	/*
	 * If the hypervisor has dispatched the target CPU on a physical
	 * processor, then the target CPU is definitely not preempted.
	 */
	if (vcpu_is_dispatched(cpu))
		return false;

	/*
	 * If the target CPU is not dispatched and the guest OS
	 * has not marked the CPU idle, then it is hypervisor preempted.
	 */
	if (!is_vcpu_idle(cpu))
		return true;

#ifdef CONFIG_PPC_SPLPAR
	if (!is_kvm_guest()) {
		int first_cpu, i;

		/*
		 * The result of vcpu_is_preempted() is used in a
		 * speculative way, and is always subject to invalidation
		 * by events internal and external to Linux. While we can
		 * be called in preemptable context (in the Linux sense),
		 * we're not accessing per-cpu resources in a way that can
		 * race destructively with Linux scheduler preemption and
		 * migration, and callers can tolerate the potential for
		 * error introduced by sampling the CPU index without
		 * pinning the task to it. So it is permissible to use
		 * raw_smp_processor_id() here to defeat the preempt debug
		 * warnings that can arise from using smp_processor_id()
		 * in arbitrary contexts.
		 */
		first_cpu = cpu_first_thread_sibling(raw_smp_processor_id());

		/*
		 * The PowerVM hypervisor dispatches VMs on a whole core
		 * basis. So we know that a thread sibling of the executing CPU
		 * cannot have been preempted by the hypervisor, even if it
		 * has called H_CONFER, which will set the yield bit.
		 */
		if (cpu_first_thread_sibling(cpu) == first_cpu)
			return false;

		/*
		 * The specific target CPU was marked by the guest OS as idle,
		 * but also check all other CPUs in the core for PowerVM,
		 * because it does core scheduling: one vCPU of the core being
		 * preempted by the hypervisor implies the other vCPUs can
		 * also be considered preempted.
		 */
		first_cpu = cpu_first_thread_sibling(cpu);
		for (i = first_cpu; i < first_cpu + threads_per_core; i++) {
			if (i == cpu)
				continue;
			if (vcpu_is_dispatched(i))
				return false;
			if (!is_vcpu_idle(i))
				return true;
		}
	}
#endif

	/*
	 * None of the threads in the target CPU's core are running, but none
	 * of them were preempted either. Hence assume the target CPU to be
	 * non-preempted.
	 */
	return false;
}

static inline bool pv_is_native_spin_unlock(void)
{
	return !is_shared_processor();
}

#endif /* _ASM_POWERPC_PARAVIRT_H */
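
/*
 * Illustrative sketch (not part of the upstream header): how a shared-
 * processor spin-wait slowpath typically composes the primitives above,
 * loosely following the splpar spinlock yield helpers elsewhere in the
 * powerpc code. The function and variable names below are invented for the
 * example. The yield count is sampled while it is odd (holder ceded or
 * preempted) and that sampled value is passed back to yield_to_preempted(),
 * so the H_CONFER can be ignored by the hypervisor if the holder has since
 * been dispatched again with a newer yield count.
 */
#if 0	/* example only, not compiled */
static inline void example_spin_yield_to_holder(int holder_cpu)
{
	u32 yield_count;

	/* Dedicated-processor partitions are never hypervisor preempted. */
	if (!is_shared_processor())
		return;

	yield_count = yield_count_of(holder_cpu);
	if ((yield_count & 1) == 0)
		return;	/* holder is currently dispatched, keep spinning */

	/* Confer our remaining timeslice to the preempted lock holder. */
	yield_to_preempted(holder_cpu, yield_count);
}
#endif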