123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666 |
- /*
- * Copyright (C) 2009,2010,2011 Imagination Technologies Ltd.
- *
- * Copyright (C) 2002 ARM Limited, All Rights Reserved.
- *
- * This program is free software; you can redistribute it and/or modify
- * it under the terms of the GNU General Public License version 2 as
- * published by the Free Software Foundation.
- */
- #include <linux/atomic.h>
- #include <linux/completion.h>
- #include <linux/delay.h>
- #include <linux/init.h>
- #include <linux/spinlock.h>
- #include <linux/sched.h>
- #include <linux/interrupt.h>
- #include <linux/cache.h>
- #include <linux/profile.h>
- #include <linux/errno.h>
- #include <linux/mm.h>
- #include <linux/err.h>
- #include <linux/cpu.h>
- #include <linux/smp.h>
- #include <linux/seq_file.h>
- #include <linux/irq.h>
- #include <linux/bootmem.h>
- #include <asm/cacheflush.h>
- #include <asm/cachepart.h>
- #include <asm/core_reg.h>
- #include <asm/cpu.h>
- #include <asm/global_lock.h>
- #include <asm/metag_mem.h>
- #include <asm/mmu_context.h>
- #include <asm/pgtable.h>
- #include <asm/pgalloc.h>
- #include <asm/processor.h>
- #include <asm/setup.h>
- #include <asm/tlbflush.h>
- #include <asm/hwthread.h>
- #include <asm/traps.h>
- #define SYSC_DCPART(n) (SYSC_DCPART0 + SYSC_xCPARTn_STRIDE * (n))
- #define SYSC_ICPART(n) (SYSC_ICPART0 + SYSC_xCPARTn_STRIDE * (n))
- DECLARE_PER_CPU(PTBI, pTBI);
- void *secondary_data_stack;
- /*
- * structures for inter-processor calls
- * - A collection of single bit ipi messages.
- */
- struct ipi_data {
- spinlock_t lock;
- unsigned long ipi_count;
- unsigned long bits;
- };
- static DEFINE_PER_CPU(struct ipi_data, ipi_data) = {
- .lock = __SPIN_LOCK_UNLOCKED(ipi_data.lock),
- };
- static DEFINE_SPINLOCK(boot_lock);
- static DECLARE_COMPLETION(cpu_running);
- /*
- * "thread" is assumed to be a valid Meta hardware thread ID.
- */
- static int boot_secondary(unsigned int thread, struct task_struct *idle)
- {
- u32 val;
- /*
- * set synchronisation state between this boot processor
- * and the secondary one
- */
- spin_lock(&boot_lock);
- core_reg_write(TXUPC_ID, 0, thread, (unsigned int)secondary_startup);
- core_reg_write(TXUPC_ID, 1, thread, 0);
- /*
- * Give the thread privilege (PSTAT) and clear potentially problematic
- * bits in the process (namely ISTAT, CBMarker, CBMarkerI, LSM_STEP).
- */
- core_reg_write(TXUCT_ID, TXSTATUS_REGNUM, thread, TXSTATUS_PSTAT_BIT);
- /* Clear the minim enable bit. */
- val = core_reg_read(TXUCT_ID, TXPRIVEXT_REGNUM, thread);
- core_reg_write(TXUCT_ID, TXPRIVEXT_REGNUM, thread, val & ~0x80);
- /*
- * set the ThreadEnable bit (0x1) in the TXENABLE register
- * for the specified thread - off it goes!
- */
- val = core_reg_read(TXUCT_ID, TXENABLE_REGNUM, thread);
- core_reg_write(TXUCT_ID, TXENABLE_REGNUM, thread, val | 0x1);
- /*
- * now the secondary core is starting up let it run its
- * calibrations, then wait for it to finish
- */
- spin_unlock(&boot_lock);
- return 0;
- }
- /**
- * describe_cachepart_change: describe a change to cache partitions.
- * @thread: Hardware thread number.
- * @label: Label of cache type, e.g. "dcache" or "icache".
- * @sz: Total size of the cache.
- * @old: Old cache partition configuration (*CPART* register).
- * @new: New cache partition configuration (*CPART* register).
- *
- * If the cache partition has changed, prints a message to the log describing
- * those changes.
- */
- static void describe_cachepart_change(unsigned int thread, const char *label,
- unsigned int sz, unsigned int old,
- unsigned int new)
- {
- unsigned int lor1, land1, gor1, gand1;
- unsigned int lor2, land2, gor2, gand2;
- unsigned int diff = old ^ new;
- if (!diff)
- return;
- pr_info("Thread %d: %s partition changed:", thread, label);
- if (diff & (SYSC_xCPARTL_OR_BITS | SYSC_xCPARTL_AND_BITS)) {
- lor1 = (old & SYSC_xCPARTL_OR_BITS) >> SYSC_xCPARTL_OR_S;
- lor2 = (new & SYSC_xCPARTL_OR_BITS) >> SYSC_xCPARTL_OR_S;
- land1 = (old & SYSC_xCPARTL_AND_BITS) >> SYSC_xCPARTL_AND_S;
- land2 = (new & SYSC_xCPARTL_AND_BITS) >> SYSC_xCPARTL_AND_S;
- pr_cont(" L:%#x+%#x->%#x+%#x",
- (lor1 * sz) >> 4,
- ((land1 + 1) * sz) >> 4,
- (lor2 * sz) >> 4,
- ((land2 + 1) * sz) >> 4);
- }
- if (diff & (SYSC_xCPARTG_OR_BITS | SYSC_xCPARTG_AND_BITS)) {
- gor1 = (old & SYSC_xCPARTG_OR_BITS) >> SYSC_xCPARTG_OR_S;
- gor2 = (new & SYSC_xCPARTG_OR_BITS) >> SYSC_xCPARTG_OR_S;
- gand1 = (old & SYSC_xCPARTG_AND_BITS) >> SYSC_xCPARTG_AND_S;
- gand2 = (new & SYSC_xCPARTG_AND_BITS) >> SYSC_xCPARTG_AND_S;
- pr_cont(" G:%#x+%#x->%#x+%#x",
- (gor1 * sz) >> 4,
- ((gand1 + 1) * sz) >> 4,
- (gor2 * sz) >> 4,
- ((gand2 + 1) * sz) >> 4);
- }
- if (diff & SYSC_CWRMODE_BIT)
- pr_cont(" %sWR",
- (new & SYSC_CWRMODE_BIT) ? "+" : "-");
- if (diff & SYSC_DCPART_GCON_BIT)
- pr_cont(" %sGCOn",
- (new & SYSC_DCPART_GCON_BIT) ? "+" : "-");
- pr_cont("\n");
- }
- /**
- * setup_smp_cache: ensure cache coherency for new SMP thread.
- * @thread: New hardware thread number.
- *
- * Ensures that coherency is enabled and that the threads share the same cache
- * partitions.
- */
- static void setup_smp_cache(unsigned int thread)
- {
- unsigned int this_thread, lflags;
- unsigned int dcsz, dcpart_this, dcpart_old, dcpart_new;
- unsigned int icsz, icpart_old, icpart_new;
- /*
- * Copy over the current thread's cache partition configuration to the
- * new thread so that they share cache partitions.
- */
- __global_lock2(lflags);
- this_thread = hard_processor_id();
- /* Share dcache partition */
- dcpart_this = metag_in32(SYSC_DCPART(this_thread));
- dcpart_old = metag_in32(SYSC_DCPART(thread));
- dcpart_new = dcpart_this;
- #if PAGE_OFFSET < LINGLOBAL_BASE
- /*
- * For the local data cache to be coherent the threads must also have
- * GCOn enabled.
- */
- dcpart_new |= SYSC_DCPART_GCON_BIT;
- metag_out32(dcpart_new, SYSC_DCPART(this_thread));
- #endif
- metag_out32(dcpart_new, SYSC_DCPART(thread));
- /* Share icache partition too */
- icpart_new = metag_in32(SYSC_ICPART(this_thread));
- icpart_old = metag_in32(SYSC_ICPART(thread));
- metag_out32(icpart_new, SYSC_ICPART(thread));
- __global_unlock2(lflags);
- /*
- * Log if the cache partitions were altered so the user is aware of any
- * potential unintentional cache wastage.
- */
- dcsz = get_dcache_size();
- icsz = get_dcache_size();
- describe_cachepart_change(this_thread, "dcache", dcsz,
- dcpart_this, dcpart_new);
- describe_cachepart_change(thread, "dcache", dcsz,
- dcpart_old, dcpart_new);
- describe_cachepart_change(thread, "icache", icsz,
- icpart_old, icpart_new);
- }
- int __cpu_up(unsigned int cpu, struct task_struct *idle)
- {
- unsigned int thread = cpu_2_hwthread_id[cpu];
- int ret;
- load_pgd(swapper_pg_dir, thread);
- flush_tlb_all();
- setup_smp_cache(thread);
- /*
- * Tell the secondary CPU where to find its idle thread's stack.
- */
- secondary_data_stack = task_stack_page(idle);
- wmb();
- /*
- * Now bring the CPU into our world.
- */
- ret = boot_secondary(thread, idle);
- if (ret == 0) {
- /*
- * CPU was successfully started, wait for it
- * to come online or time out.
- */
- wait_for_completion_timeout(&cpu_running,
- msecs_to_jiffies(1000));
- if (!cpu_online(cpu))
- ret = -EIO;
- }
- secondary_data_stack = NULL;
- if (ret) {
- pr_crit("CPU%u: processor failed to boot\n", cpu);
- /*
- * FIXME: We need to clean up the new idle thread. --rmk
- */
- }
- return ret;
- }
- #ifdef CONFIG_HOTPLUG_CPU
- /*
- * __cpu_disable runs on the processor to be shutdown.
- */
- int __cpu_disable(void)
- {
- unsigned int cpu = smp_processor_id();
- /*
- * Take this CPU offline. Once we clear this, we can't return,
- * and we must not schedule until we're ready to give up the cpu.
- */
- set_cpu_online(cpu, false);
- /*
- * OK - migrate IRQs away from this CPU
- */
- migrate_irqs();
- /*
- * Flush user cache and TLB mappings, and then remove this CPU
- * from the vm mask set of all processes.
- */
- flush_cache_all();
- local_flush_tlb_all();
- clear_tasks_mm_cpumask(cpu);
- return 0;
- }
- /*
- * called on the thread which is asking for a CPU to be shutdown -
- * waits until shutdown has completed, or it is timed out.
- */
- void __cpu_die(unsigned int cpu)
- {
- if (!cpu_wait_death(cpu, 1))
- pr_err("CPU%u: unable to kill\n", cpu);
- }
- /*
- * Called from the idle thread for the CPU which has been shutdown.
- *
- * Note that we do not return from this function. If this cpu is
- * brought online again it will need to run secondary_startup().
- */
- void cpu_die(void)
- {
- local_irq_disable();
- idle_task_exit();
- (void)cpu_report_death();
- asm ("XOR TXENABLE, D0Re0,D0Re0\n");
- }
- #endif /* CONFIG_HOTPLUG_CPU */
- /*
- * Called by both boot and secondaries to move global data into
- * per-processor storage.
- */
- void smp_store_cpu_info(unsigned int cpuid)
- {
- struct cpuinfo_metag *cpu_info = &per_cpu(cpu_data, cpuid);
- cpu_info->loops_per_jiffy = loops_per_jiffy;
- }
- /*
- * This is the secondary CPU boot entry. We're using this CPUs
- * idle thread stack and the global page tables.
- */
- asmlinkage void secondary_start_kernel(void)
- {
- struct mm_struct *mm = &init_mm;
- unsigned int cpu = smp_processor_id();
- /*
- * All kernel threads share the same mm context; grab a
- * reference and switch to it.
- */
- atomic_inc(&mm->mm_users);
- atomic_inc(&mm->mm_count);
- current->active_mm = mm;
- cpumask_set_cpu(cpu, mm_cpumask(mm));
- enter_lazy_tlb(mm, current);
- local_flush_tlb_all();
- /*
- * TODO: Some day it might be useful for each Linux CPU to
- * have its own TBI structure. That would allow each Linux CPU
- * to run different interrupt handlers for the same IRQ
- * number.
- *
- * For now, simply copying the pointer to the boot CPU's TBI
- * structure is sufficient because we always want to run the
- * same interrupt handler whatever CPU takes the interrupt.
- */
- per_cpu(pTBI, cpu) = __TBI(TBID_ISTAT_BIT);
- if (!per_cpu(pTBI, cpu))
- panic("No TBI found!");
- per_cpu_trap_init(cpu);
- preempt_disable();
- setup_priv();
- notify_cpu_starting(cpu);
- pr_info("CPU%u (thread %u): Booted secondary processor\n",
- cpu, cpu_2_hwthread_id[cpu]);
- calibrate_delay();
- smp_store_cpu_info(cpu);
- /*
- * OK, now it's safe to let the boot CPU continue
- */
- set_cpu_online(cpu, true);
- complete(&cpu_running);
- /*
- * Enable local interrupts.
- */
- tbi_startup_interrupt(TBID_SIGNUM_TRT);
- local_irq_enable();
- /*
- * OK, it's off to the idle thread for us
- */
- cpu_startup_entry(CPUHP_ONLINE);
- }
- void __init smp_cpus_done(unsigned int max_cpus)
- {
- int cpu;
- unsigned long bogosum = 0;
- for_each_online_cpu(cpu)
- bogosum += per_cpu(cpu_data, cpu).loops_per_jiffy;
- pr_info("SMP: Total of %d processors activated (%lu.%02lu BogoMIPS).\n",
- num_online_cpus(),
- bogosum / (500000/HZ),
- (bogosum / (5000/HZ)) % 100);
- }
- void __init smp_prepare_cpus(unsigned int max_cpus)
- {
- unsigned int cpu = smp_processor_id();
- init_new_context(current, &init_mm);
- current_thread_info()->cpu = cpu;
- smp_store_cpu_info(cpu);
- init_cpu_present(cpu_possible_mask);
- }
- void __init smp_prepare_boot_cpu(void)
- {
- unsigned int cpu = smp_processor_id();
- per_cpu(pTBI, cpu) = __TBI(TBID_ISTAT_BIT);
- if (!per_cpu(pTBI, cpu))
- panic("No TBI found!");
- }
- static void smp_cross_call(cpumask_t callmap, enum ipi_msg_type msg);
- static void send_ipi_message(const struct cpumask *mask, enum ipi_msg_type msg)
- {
- unsigned long flags;
- unsigned int cpu;
- cpumask_t map;
- cpumask_clear(&map);
- local_irq_save(flags);
- for_each_cpu(cpu, mask) {
- struct ipi_data *ipi = &per_cpu(ipi_data, cpu);
- spin_lock(&ipi->lock);
- /*
- * KICK interrupts are queued in hardware so we'll get
- * multiple interrupts if we call smp_cross_call()
- * multiple times for one msg. The problem is that we
- * only have one bit for each message - we can't queue
- * them in software.
- *
- * The first time through ipi_handler() we'll clear
- * the msg bit, having done all the work. But when we
- * return we'll get _another_ interrupt (and another,
- * and another until we've handled all the queued
- * KICKs). Running ipi_handler() when there's no work
- * to do is bad because that's how kick handler
- * chaining detects who the KICK was intended for.
- * See arch/metag/kernel/kick.c for more details.
- *
- * So only add 'cpu' to 'map' if we haven't already
- * queued a KICK interrupt for 'msg'.
- */
- if (!(ipi->bits & (1 << msg))) {
- ipi->bits |= 1 << msg;
- cpumask_set_cpu(cpu, &map);
- }
- spin_unlock(&ipi->lock);
- }
- /*
- * Call the platform specific cross-CPU call function.
- */
- smp_cross_call(map, msg);
- local_irq_restore(flags);
- }
- void arch_send_call_function_ipi_mask(const struct cpumask *mask)
- {
- send_ipi_message(mask, IPI_CALL_FUNC);
- }
- void arch_send_call_function_single_ipi(int cpu)
- {
- send_ipi_message(cpumask_of(cpu), IPI_CALL_FUNC);
- }
- void show_ipi_list(struct seq_file *p)
- {
- unsigned int cpu;
- seq_puts(p, "IPI:");
- for_each_present_cpu(cpu)
- seq_printf(p, " %10lu", per_cpu(ipi_data, cpu).ipi_count);
- seq_putc(p, '\n');
- }
- static DEFINE_SPINLOCK(stop_lock);
- /*
- * Main handler for inter-processor interrupts
- *
- * For Meta, the ipimask now only identifies a single
- * category of IPI (Bit 1 IPIs have been replaced by a
- * different mechanism):
- *
- * Bit 0 - Inter-processor function call
- */
- static int do_IPI(void)
- {
- unsigned int cpu = smp_processor_id();
- struct ipi_data *ipi = &per_cpu(ipi_data, cpu);
- unsigned long msgs, nextmsg;
- int handled = 0;
- ipi->ipi_count++;
- spin_lock(&ipi->lock);
- msgs = ipi->bits;
- nextmsg = msgs & -msgs;
- ipi->bits &= ~nextmsg;
- spin_unlock(&ipi->lock);
- if (nextmsg) {
- handled = 1;
- nextmsg = ffz(~nextmsg);
- switch (nextmsg) {
- case IPI_RESCHEDULE:
- scheduler_ipi();
- break;
- case IPI_CALL_FUNC:
- generic_smp_call_function_interrupt();
- break;
- default:
- pr_crit("CPU%u: Unknown IPI message 0x%lx\n",
- cpu, nextmsg);
- break;
- }
- }
- return handled;
- }
- void smp_send_reschedule(int cpu)
- {
- send_ipi_message(cpumask_of(cpu), IPI_RESCHEDULE);
- }
- static void stop_this_cpu(void *data)
- {
- unsigned int cpu = smp_processor_id();
- if (system_state == SYSTEM_BOOTING ||
- system_state == SYSTEM_RUNNING) {
- spin_lock(&stop_lock);
- pr_crit("CPU%u: stopping\n", cpu);
- dump_stack();
- spin_unlock(&stop_lock);
- }
- set_cpu_online(cpu, false);
- local_irq_disable();
- hard_processor_halt(HALT_OK);
- }
- void smp_send_stop(void)
- {
- smp_call_function(stop_this_cpu, NULL, 0);
- }
- /*
- * not supported here
- */
- int setup_profiling_timer(unsigned int multiplier)
- {
- return -EINVAL;
- }
- /*
- * We use KICKs for inter-processor interrupts.
- *
- * For every CPU in "callmap" the IPI data must already have been
- * stored in that CPU's "ipi_data" member prior to calling this
- * function.
- */
- static void kick_raise_softirq(cpumask_t callmap, unsigned int irq)
- {
- int cpu;
- for_each_cpu(cpu, &callmap) {
- unsigned int thread;
- thread = cpu_2_hwthread_id[cpu];
- BUG_ON(thread == BAD_HWTHREAD_ID);
- metag_out32(1, T0KICKI + (thread * TnXKICK_STRIDE));
- }
- }
- static TBIRES ipi_handler(TBIRES State, int SigNum, int Triggers,
- int Inst, PTBI pTBI, int *handled)
- {
- *handled = do_IPI();
- return State;
- }
- static struct kick_irq_handler ipi_irq = {
- .func = ipi_handler,
- };
- static void smp_cross_call(cpumask_t callmap, enum ipi_msg_type msg)
- {
- kick_raise_softirq(callmap, 1);
- }
- static inline unsigned int get_core_count(void)
- {
- int i;
- unsigned int ret = 0;
- for (i = 0; i < CONFIG_NR_CPUS; i++) {
- if (core_reg_read(TXUCT_ID, TXENABLE_REGNUM, i))
- ret++;
- }
- return ret;
- }
- /*
- * Initialise the CPU possible map early - this describes the CPUs
- * which may be present or become present in the system.
- */
- void __init smp_init_cpus(void)
- {
- unsigned int i, ncores = get_core_count();
- /* If no hwthread_map early param was set use default mapping */
- for (i = 0; i < NR_CPUS; i++)
- if (cpu_2_hwthread_id[i] == BAD_HWTHREAD_ID) {
- cpu_2_hwthread_id[i] = i;
- hwthread_id_2_cpu[i] = i;
- }
- for (i = 0; i < ncores; i++)
- set_cpu_possible(i, true);
- kick_register_func(&ipi_irq);
- }
|