/*
 *      Intel SMP support routines.
 *
 *      (c) 1995 Alan Cox, Building #3 <alan@redhat.com>
 *      (c) 1998-99, 2000 Ingo Molnar <mingo@redhat.com>
 *      (c) 2002,2003 Andi Kleen, SuSE Labs.
 *
 *      This code is released under the GNU General Public License version 2 or
 *      later.
 */

#include <linux/init.h>

#include <linux/mm.h>
#include <linux/irq.h>
#include <linux/delay.h>
#include <linux/spinlock.h>
#include <linux/smp_lock.h>
#include <linux/kernel_stat.h>
#include <linux/mc146818rtc.h>

#include <asm/mtrr.h>
#include <asm/pgalloc.h>

/*
 *      Some notes on x86 processor bugs affecting SMP operation:
 *
 *      Pentium, Pentium Pro, II, III (and all CPUs) have bugs.
 *      The Linux implications for SMP are handled as follows:
 *
 *      Pentium III / [Xeon]
 *              None of the E1AP-E3AP errata are visible to the user.
 *
 *      E1AP.   see PII A1AP
 *      E2AP.   see PII A2AP
 *      E3AP.   see PII A3AP
 *
 *      Pentium II / [Xeon]
 *              None of the A1AP-A3AP errata are visible to the user.
 *
 *      A1AP.   see PPro 1AP
 *      A2AP.   see PPro 2AP
 *      A3AP.   see PPro 7AP
 *
 *      Pentium Pro
 *              None of the 1AP-9AP errata are visible to the normal user,
 *      except occasional delivery of a 'spurious interrupt' as trap #15.
 *      This is very rare and a non-problem.
 *
 *      1AP.    Linux maps APIC as non-cacheable
 *      2AP.    worked around in hardware
 *      3AP.    fixed in C0 and above steppings microcode update.
 *              Linux does not use excessive STARTUP_IPIs.
 *      4AP.    worked around in hardware
 *      5AP.    symmetric IO mode (normal Linux operation) not affected.
 *              'noapic' mode has vector 0xf filled out properly.
 *      6AP.    'noapic' mode might be affected - fixed in later steppings
 *      7AP.    We do not assume writes to the LVT deasserting IRQs
 *      8AP.    We do not enable low power mode (deep sleep) during MP bootup
 *      9AP.    We do not use mixed mode
 *
 *      Pentium
 *              There is a marginal case where REP MOVS on 100MHz SMP
 *      machines with B stepping processors can fail. XXX should provide
 *      an L1cache=Writethrough or L1cache=off option.
 *
 *              B stepping CPUs may hang. There are hardware workarounds
 *      for this. We warn about it in case your board doesn't have the
 *      workarounds. Basically that's so I can tell anyone with a B stepping
 *      CPU and SMP problems "tough".
 *
 *      Specific items [From Pentium Processor Specification Update]
 *
 *      1AP.    Linux doesn't use remote read
 *      2AP.    Linux doesn't trust APIC errors
 *      3AP.    We work around this
 *      4AP.    Linux never generates 3 interrupts of the same priority
 *              to cause a lost local interrupt.
 *      5AP.    Remote read is never used
 *      6AP.    not affected - worked around in hardware
 *      7AP.    not affected - worked around in hardware
 *      8AP.    worked around in hardware - we get explicit CS errors if not
 *      9AP.    only 'noapic' mode affected. Might generate spurious
 *              interrupts, we log only the first one and count the
 *              rest silently.
 *      10AP.   not affected - worked around in hardware
 *      11AP.   Linux reads the APIC between writes to avoid this, as per
 *              the documentation. Make sure you preserve this as it affects
 *              the C stepping chips too.
 *      12AP.   not affected - worked around in hardware
 *      13AP.   not affected - worked around in hardware
 *      14AP.   we always deassert INIT during bootup
 *      15AP.   not affected - worked around in hardware
 *      16AP.   not affected - worked around in hardware
 *      17AP.   not affected - worked around in hardware
 *      18AP.   not affected - worked around in hardware
 *      19AP.   not affected - worked around in BIOS
 *
 *      If this sounds worrying, believe me these bugs are either ___RARE___,
 *      or are signal timing bugs worked around in hardware, and there's
 *      next to nothing of note from the C stepping onwards.
 */

/* The 'big kernel lock' */
spinlock_cacheline_t kernel_flag_cacheline = {SPIN_LOCK_UNLOCKED};

struct tlb_state cpu_tlbstate[NR_CPUS] __cacheline_aligned = {[0 ... NR_CPUS-1] = { &init_mm, 0, }};

/*
 * the following functions deal with sending IPIs between CPUs.
 *
 * We use 'broadcast', CPU->CPU IPIs and self-IPIs too.
 */

static inline unsigned int __prepare_ICR (unsigned int shortcut, int vector)
{
        unsigned int icr = APIC_DM_FIXED | shortcut | vector | APIC_DEST_LOGICAL;
        return icr;
}

static inline int __prepare_ICR2 (unsigned int mask)
{
        return SET_APIC_DEST_FIELD(mask);
}

static inline void __send_IPI_shortcut(unsigned int shortcut, int vector)
{
        /*
         * Subtle. In the case of the 'never do double writes' workaround
         * we have to lock out interrupts to be safe.  As we don't care
         * about the value read, we use an atomic rmw access to avoid costly
         * cli/sti.  Otherwise we use an even cheaper single atomic write
         * to the APIC.
         */
        unsigned int cfg;

        /*
         * Wait for idle.
         */
        apic_wait_icr_idle();

        /*
         * No need to touch the target chip field
         */
        cfg = __prepare_ICR(shortcut, vector);

        /*
         * Send the IPI. The write to APIC_ICR fires this off.
         */
        apic_write_around(APIC_ICR, cfg);
}

static inline void send_IPI_allbutself(int vector)
{
        /*
         * If there are no other CPUs in the system then we get an APIC
         * send error if we try to broadcast, thus we have to avoid
         * sending IPIs in this case.
         */
        if (smp_num_cpus > 1)
                __send_IPI_shortcut(APIC_DEST_ALLBUT, vector);
}

static inline void send_IPI_all(int vector)
{
        __send_IPI_shortcut(APIC_DEST_ALLINC, vector);
}

void send_IPI_self(int vector)
{
        __send_IPI_shortcut(APIC_DEST_SELF, vector);
}

static inline void send_IPI_mask(int mask, int vector)
{
        unsigned long cfg;
        unsigned long flags;

        __save_flags(flags);
        __cli();

        /*
         * Wait for idle.
         */
        apic_wait_icr_idle();

        /*
         * Prepare the target chip field.
         */
        cfg = __prepare_ICR2(mask);
        apic_write_around(APIC_ICR2, cfg);

        /*
         * Program the ICR.
         */
        cfg = __prepare_ICR(0, vector);

        /*
         * Send the IPI. The write to APIC_ICR fires this off.
         */
        apic_write_around(APIC_ICR, cfg);
        __restore_flags(flags);
}

/*
 *      Smarter SMP flushing macros.
 *              c/o Linus Torvalds.
 *
 *      These mean you can really definitely utterly forget about
 *      writing to user space from interrupts. (It's not allowed anyway.)
 *
 *      Optimizations Manfred Spraul <manfred@colorfullife.com>
 */

static volatile unsigned long flush_cpumask;
static struct mm_struct * flush_mm;
static unsigned long flush_va;
static spinlock_t tlbstate_lock = SPIN_LOCK_UNLOCKED;
#define FLUSH_ALL       0xffffffff

/*
 * We cannot call mmdrop() because we are in interrupt context;
 * instead update mm->cpu_vm_mask.
 */
static void inline leave_mm (unsigned long cpu)
{
        if (cpu_tlbstate[cpu].state == TLBSTATE_OK)
                BUG();
        clear_bit(cpu, &cpu_tlbstate[cpu].active_mm->cpu_vm_mask);
        /* flush the TLB before it goes away; this stops speculative prefetches */
        __flush_tlb();
}

/*
 * The flush IPI assumes that a thread switch happens in this order:
 * [cpu0: the cpu that switches]
 * 1) switch_mm() either 1a) or 1b)
 * 1a) thread switch to a different mm
 * 1a1) clear_bit(cpu, &old_mm->cpu_vm_mask);
 *      Stop ipi delivery for the old mm. This is not synchronized with
 *      the other cpus, but smp_invalidate_interrupt ignores flush ipis
 *      for the wrong mm, and in the worst case we perform a superfluous
 *      tlb flush.
 * 1a2) set cpu_tlbstate to TLBSTATE_OK
 *      Now smp_invalidate_interrupt won't call leave_mm if cpu0
 *      was in lazy tlb mode.
 * 1a3) update cpu_tlbstate[].active_mm
 *      Now cpu0 accepts tlb flushes for the new mm.
 * 1a4) set_bit(cpu, &new_mm->cpu_vm_mask);
 *      Now the other cpus will send tlb flush ipis.
 * 1a5) change cr3.
 * 1b) thread switch without mm change
 *      cpu_tlbstate[].active_mm is correct, cpu0 already handles
 *      flush ipis.
 * 1b1) set cpu_tlbstate to TLBSTATE_OK
 * 1b2) test_and_set the cpu bit in cpu_vm_mask.
 *      Atomically set the bit [other cpus will start sending flush ipis],
 *      and test the bit.
 * 1b3) if the bit was 0: leave_mm was called, flush the tlb.
 * 2) switch %%esp, i.e. current
 *
 * The interrupt must handle 2 special cases:
 * - cr3 is changed before %%esp, i.e. it cannot use current->{active_,}mm.
 * - the cpu performs speculative tlb reads, i.e. even if the cpu only
 *   runs in kernel space, the cpu could load tlb entries for user space
 *   pages.
 *
 * The good news is that cpu_tlbstate is local to each cpu, so there are no
 * write/read ordering problems.
 */
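
/*
 * Illustrative sketch (not part of the original file) of the 1a) path
 * described above, written as a hypothetical switch-to-a-new-mm sequence.
 * The real switch_mm() lives elsewhere in the tree and may differ in
 * detail; only the ordering matters here:
 *
 *      clear_bit(cpu, &prev->cpu_vm_mask);       [1a1: stop flush ipis for prev]
 *      cpu_tlbstate[cpu].state = TLBSTATE_OK;    [1a2: leave lazy tlb mode]
 *      cpu_tlbstate[cpu].active_mm = next;       [1a3: accept flushes for next]
 *      set_bit(cpu, &next->cpu_vm_mask);         [1a4: others now send flush ipis]
 *      <load cr3 with next's page tables>        [1a5: switch address space]
 */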

/*
 * TLB flush IPI:
 *
 * 1) Flush the tlb entries if the cpu uses the mm that's being flushed.
 * 2) Leave the mm if we are in the lazy tlb mode.
 */

asmlinkage void smp_invalidate_interrupt (void)
{
        unsigned long cpu = smp_processor_id();

        if (!test_bit(cpu, &flush_cpumask))
                return;
                /*
                 * This was a BUG() but until someone can quote me the
                 * line from the intel manual that guarantees an IPI to
                 * multiple CPUs is retried _only_ on the erroring CPUs
                 * it's staying as a return.
                 *
                 * BUG();
                 */

        if (flush_mm == cpu_tlbstate[cpu].active_mm) {
                if (cpu_tlbstate[cpu].state == TLBSTATE_OK) {
                        if (flush_va == FLUSH_ALL)
                                local_flush_tlb();
                        else
                                __flush_tlb_one(flush_va);
                } else
                        leave_mm(cpu);
        }
        ack_APIC_irq();
        clear_bit(cpu, &flush_cpumask);
}

static void flush_tlb_others (unsigned long cpumask, struct mm_struct *mm,
                                                unsigned long va)
{
        /*
         * A couple of (to be removed) sanity checks:
         *
         * - we do not send IPIs to not-yet booted CPUs.
         * - current CPU must not be in mask
         * - mask must exist :)
         */
        if (!cpumask)
                BUG();
        if ((cpumask & cpu_online_map) != cpumask)
                BUG();
        if (cpumask & (1 << smp_processor_id()))
                BUG();
        if (!mm)
                BUG();

        /*
         * I'm not happy about this global shared spinlock in the
         * MM hot path, but we'll see how contended it is.
         * Temporarily this turns IRQs off, so that lockups are
         * detected by the NMI watchdog.
         */
        spin_lock(&tlbstate_lock);

        flush_mm = mm;
        flush_va = va;
        atomic_set_mask(cpumask, &flush_cpumask);
        /*
         * We have to send the IPI only to
         * the CPUs affected.
         */
        send_IPI_mask(cpumask, INVALIDATE_TLB_VECTOR);

        while (flush_cpumask)
                /* nothing. lockup detection does not belong here */;

        flush_mm = NULL;
        flush_va = 0;
        spin_unlock(&tlbstate_lock);
}

void flush_tlb_current_task(void)
{
        struct mm_struct *mm = current->mm;
        unsigned long cpu_mask = mm->cpu_vm_mask & ~(1 << smp_processor_id());

        local_flush_tlb();
        if (cpu_mask)
                flush_tlb_others(cpu_mask, mm, FLUSH_ALL);
}

void flush_tlb_mm (struct mm_struct * mm)
{
        unsigned long cpu_mask = mm->cpu_vm_mask & ~(1 << smp_processor_id());

        if (current->active_mm == mm) {
                if (current->mm)
                        local_flush_tlb();
                else
                        leave_mm(smp_processor_id());
        }
        if (cpu_mask)
                flush_tlb_others(cpu_mask, mm, FLUSH_ALL);
}

void flush_tlb_page(struct vm_area_struct * vma, unsigned long va)
{
        struct mm_struct *mm = vma->vm_mm;
        unsigned long cpu_mask = mm->cpu_vm_mask & ~(1 << smp_processor_id());

        if (current->mm) {
                if (current->active_mm == mm)
                        __flush_tlb_one(va);
        } else if (current->active_mm == mm)
                leave_mm(smp_processor_id());

        if (cpu_mask)
                flush_tlb_others(cpu_mask, mm, va);
}

static inline void do_flush_tlb_all_local(void)
{
        unsigned long cpu = smp_processor_id();

        __flush_tlb_all();
        if (cpu_tlbstate[cpu].state == TLBSTATE_LAZY)
                leave_mm(cpu);
}

static void flush_tlb_all_ipi(void* info)
{
        do_flush_tlb_all_local();
}

void flush_tlb_all(void)
{
        smp_call_function(flush_tlb_all_ipi, 0, 1, 1);

        do_flush_tlb_all_local();
}

/*
 * this function sends a 'reschedule' IPI to another CPU.
 * it goes straight through and wastes no time serializing
 * anything. Worst case is that we lose a reschedule ...
 */

void smp_send_reschedule(int cpu)
{
        send_IPI_mask(1 << cpu, RESCHEDULE_VECTOR);
}

/*
 * Structure and data for smp_call_function(). This is designed to minimise
 * static memory requirements. It also looks cleaner.
 */
static spinlock_t call_lock = SPIN_LOCK_UNLOCKED;

struct call_data_struct {
        void (*func) (void *info);
        void *info;
        atomic_t started;
        atomic_t finished;
        int wait;
};

static struct call_data_struct * call_data;

/*
 * this function sends a 'generic call function' IPI to all other CPUs
 * in the system.
 */

int smp_call_function (void (*func) (void *info), void *info, int nonatomic,
                        int wait)
/*
 * [SUMMARY] Run a function on all other CPUs.
 * <func> The function to run. This must be fast and non-blocking.
 * <info> An arbitrary pointer to pass to the function.
 * <nonatomic> currently unused.
 * <wait> If true, wait (atomically) until the function has completed on the
 * other CPUs.
 * [RETURNS] 0 on success, else a negative status code. Does not return until
 * remote CPUs are nearly ready to execute <<func>>, are executing it, or
 * have already executed it.
 *
 * You must not call this function with disabled interrupts or from a
 * hardware interrupt handler or from a bottom half handler.
 */
{
        struct call_data_struct data;
        int cpus = smp_num_cpus-1;

        if (!cpus)
                return 0;

        data.func = func;
        data.info = info;
        atomic_set(&data.started, 0);
        data.wait = wait;
        if (wait)
                atomic_set(&data.finished, 0);

        spin_lock(&call_lock);
        call_data = &data;
        wmb();
        /* Send a message to all other CPUs and wait for them to respond */
        send_IPI_allbutself(CALL_FUNCTION_VECTOR);

        /* Wait for response */
        while (atomic_read(&data.started) != cpus)
                barrier();

        if (wait)
                while (atomic_read(&data.finished) != cpus)
                        barrier();
        spin_unlock(&call_lock);

        return 0;
}
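
/*
 * Illustrative usage sketch (not part of the original file): the helpers
 * example_count_cpu() and example_count_other_cpus() are hypothetical.
 * A caller wraps its per-CPU work in a void (*)(void *) handler and hands
 * it to smp_call_function(); with wait=1 the call only returns once every
 * other online CPU has finished running the handler. Kept inside #if 0 so
 * it does not affect the build.
 */
#if 0
static void example_count_cpu(void *info)
{
        /* runs on each of the other online CPUs, in interrupt context */
        atomic_inc((atomic_t *)info);
}

static void example_count_other_cpus(void)
{
        static atomic_t hits = ATOMIC_INIT(0);

        /* nonatomic is currently unused; wait=1 blocks until completion */
        smp_call_function(example_count_cpu, &hits, 1, 1);
}
#endif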

void smp_stop_cpu(void)
{
        /*
         * Remove this CPU:
         */
        clear_bit(smp_processor_id(), &cpu_online_map);
        __cli();
        disable_local_APIC();
        __sti();
}

static void smp_really_stop_cpu(void *dummy)
{
        smp_stop_cpu();
        for (;;)
                asm("hlt");
}

/*
 * this function calls the 'stop' function on all other CPUs in the system.
 */

void smp_send_stop(void)
{
        smp_call_function(smp_really_stop_cpu, NULL, 1, 0);
        smp_stop_cpu();
}

/*
 * Reschedule callback. Nothing to do,
 * all the work is done automatically when
 * we return from the interrupt.
 */
asmlinkage void smp_reschedule_interrupt(void)
{
        ack_APIC_irq();
}

asmlinkage void smp_call_function_interrupt(void)
{
        void (*func) (void *info) = call_data->func;
        void *info = call_data->info;
        int wait = call_data->wait;

        ack_APIC_irq();
        /*
         * Notify the initiating CPU that I've grabbed the data and am
         * about to execute the function.
         */
        mb();
        atomic_inc(&call_data->started);
        /*
         * At this point the info structure may be out of scope unless wait==1.
         */
        (*func)(info);
        if (wait) {
                mb();
                atomic_inc(&call_data->finished);
        }
}
