x86/mm: Improve switch_mm() barrier comments

author Andy Lutomirski <luto@kernel.org>
Tue, 12 Jan 2016 20:47:40 +0000 (12:47 -0800)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Sun, 31 Jan 2016 19:28:55 +0000 (11:28 -0800)

diff --git a/arch/x86/include/asm/mmu_context.h b/arch/x86/include/asm/mmu_context.h
index 1edc9cd198b8538bd7d70da33b369d0d7e5743a8..bfd9b2a35a0b14aa879ac9973202ef882dae52d7 100644
--- a/arch/x86/include/asm/mmu_context.h
+++ b/arch/x86/include/asm/mmu_context.h
@@ -132,14 +132,16 @@ static inline void switch_mm(struct mm_struct *prev, struct mm_struct *next,
                  * be sent, and CPU 0's TLB will contain a stale entry.)
                  *
                  * The bad outcome can occur if either CPU's load is
-                * reordered before that CPU's store, so both CPUs much
+                * reordered before that CPU's store, so both CPUs must
                  * execute full barriers to prevent this from happening.
                  *
                  * Thus, switch_mm needs a full barrier between the
                  * store to mm_cpumask and any operation that could load
-                * from next->pgd.  This barrier synchronizes with
-                * remote TLB flushers.  Fortunately, load_cr3 is
-                * serializing and thus acts as a full barrier.
+                * from next->pgd.  TLB fills are special and can happen
+                * due to instruction fetches or for no reason at all,
+                * and neither LOCK nor MFENCE orders them.
+                * Fortunately, load_cr3() is serializing and gives the
+                * ordering guarantee we need.
                  *
                  */
                 load_cr3(next->pgd);
@@ -188,9 +190,8 @@ static inline void switch_mm(struct mm_struct *prev, struct mm_struct *next,
                          * tlb flush IPI delivery. We must reload CR3
                          * to make sure to use no freed page tables.
                          *
-                        * As above, this is a barrier that forces
-                        * TLB repopulation to be ordered after the
-                        * store to mm_cpumask.
+                        * As above, load_cr3() is serializing and orders TLB
+                        * fills with respect to the mm_cpumask write.
                          */
                         load_cr3(next->pgd);
                         trace_tlb_flush(TLB_FLUSH_ON_TASK_SWITCH, TLB_FLUSH_ALL);
author	Andy Lutomirski <luto@kernel.org>
	Tue, 12 Jan 2016 20:47:40 +0000 (12:47 -0800)
committer	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Sun, 31 Jan 2016 19:28:55 +0000 (11:28 -0800)