[RFC PATCH v1 1/1] powerpc/85xx: Wakeup kexec smp slave cpus in second kernel

Yang,Wei Wei.Yang at windriver.com
Wed Sep 4 11:46:45 EST 2013


On 08/31/2013 05:12 PM, Yu Chen wrote:
> >From 1ccf579b871dfd5938ce958f729361a203485c74 Mon Sep 17 00:00:00 2001
> From: Yu Chen <chenyu105 at gmail.com>
> Date: Sat, 31 Aug 2013 23:52:31 +0800
> Subject: [PATCH]  powerpc/85xx: Wakeup kexec smp slave cpus in second kernel
>
> In current 85xx smp kexec implementation,master cpu reset slave cpus
> by mpic_reset_core,
> before jump to second kernel.In order to wake slave cpus up in second
> kernel,we debug
> this patch on p2041rdb.

What problem causes that you do the modification? I am just curious as 
kexec feature always is fine on our
P2041RDB board.:-)

Wei
>
> The main principle of this patch,is to get slave cpus polling for flag
> to change,
> thus waiting for master cpu to set it with non-zero cpu number(see misc_32.S).
> This flag is placed in kexec control page,so it would not be
> overlapped when copying kimage.
> The master cpu put flag's physical address in r28 as a parameter
> passed to second kernel,
> so the latter knows how to wake slave cpus up in smp_85xx_kick_cpu.
> The pseudo-code may be like:
> void slave_cpu_spin(void)
> {
>          int cpu = smp_processor_id();
>          while (*kexec_poll != cpu)
>                  ;
>          /*slave wakeup and jump*/
>          jump(*(kexec_poll+1));
> }
>
> void master_cpu_wakeup(unsigned long *kexec_poll, int cpu)
> {
>          *(kexec_poll+1) = __early_start;
>          mb();
>          *kexec_poll = cpu;
> }
>
> However,after applied this patch,we got some kernel exception during
> booting second kernel,
> I'm not sure if it's caused by improper treament of cache,or tlb,or
> other.So I put this
> patch here hoping someone can check and review it.
>
> Signed-off-by: Yu Chen <chenyu105 at gmail.com>
> ---
>   arch/powerpc/kernel/head_fsl_booke.S |    7 ++
>   arch/powerpc/kernel/misc_32.S        |   66 +++++++++++++-
>   arch/powerpc/platforms/85xx/smp.c    |  166 ++++++++++++++++++++++++++++++----
>   3 files changed, 222 insertions(+), 17 deletions(-)
>   mode change 100644 => 100755 arch/powerpc/kernel/head_fsl_booke.S
>   mode change 100644 => 100755 arch/powerpc/kernel/misc_32.S
>   mode change 100644 => 100755 arch/powerpc/platforms/85xx/smp.c
>
> diff --git a/arch/powerpc/kernel/head_fsl_booke.S
> b/arch/powerpc/kernel/head_fsl_booke.S
> old mode 100644
> new mode 100755
> index d10a7ca..63c8392
> --- a/arch/powerpc/kernel/head_fsl_booke.S
> +++ b/arch/powerpc/kernel/head_fsl_booke.S
> @@ -178,6 +178,13 @@ _ENTRY(__early_start)
>        * This is where the main kernel code starts.
>        */
>
> +#if defined(CONFIG_KEXEC) && defined(CONFIG_SMP)
> +    /* r28 contain position where slave cpus spin*/
> +    lis    r1,kexec_poll_phy at h
> +    ori    r1,r1,kexec_poll_phy at l
> +    stw    r28,0(r1)
> +#endif
> +
>       /* ptr to current */
>       lis    r2,init_task at h
>       ori    r2,r2,init_task at l
> diff --git a/arch/powerpc/kernel/misc_32.S b/arch/powerpc/kernel/misc_32.S
> old mode 100644
> new mode 100755
> index e469f30..d9eefc2
> --- a/arch/powerpc/kernel/misc_32.S
> +++ b/arch/powerpc/kernel/misc_32.S
> @@ -120,7 +120,7 @@ _GLOBAL(reloc_got2)
>       addi    r4,r4,1b at l
>       subf    r0,r4,r0
>       add    r7,r0,r7
> -2:    lwz    r0,0(r7)
> +    2:    lwz    r0,0(r7)
>       add    r0,r0,r3
>       stw    r0,0(r7)
>       addi    r7,r7,4
> @@ -692,6 +692,7 @@ _GLOBAL(__main)
>       blr
>
>   #ifdef CONFIG_KEXEC
> +#define KEXEC_MAGIC 0xdeadbeef
>       /*
>        * Must be relocatable PIC code callable as a C function.
>        */
> @@ -707,6 +708,16 @@ relocate_new_kernel:
>       mr    r30, r4
>       mr    r31, r5
>
> +#ifdef CONFIG_SMP
> +    bl    1f
> +1:    mflr    r8
> +    addi    r8,r8,kexec_flag-1b
> +    lis     r7,PAGE_OFFSET at h
> +    ori     r7,r7,PAGE_OFFSET at l
> +    /*r28 contain slave cpu spin physical address */
> +    subf    r28, r7, r8
> +#endif
> +
>   #define ENTRY_MAPPING_KEXEC_SETUP
>   #include "fsl_booke_entry_mapping.S"
>   #undef ENTRY_MAPPING_KEXEC_SETUP
> @@ -1172,4 +1183,57 @@ relocate_new_kernel_end:
>       .globl relocate_new_kernel_size
>   relocate_new_kernel_size:
>       .long relocate_new_kernel_end - relocate_new_kernel
> +#ifdef CONFIG_FSL_BOOKE
> +    /**
> +    * Slave cpus wait for kexec_flag to change
> +    */
> +    .globl relocate_smp_cpu_offset
> +relocate_smp_cpu_offset:
> +    .long relocate_smp_cpu_wait-relocate_new_kernel
> +
> +    .globl relocate_smp_cpu_wait
> +relocate_smp_cpu_wait:
> +
> +    bl    1f
> +1:    mflr    r5
> +    addi    r5,r5,kexec_flag-1b
> +    /*see if anyone calls me?*/
> +    mfspr   r24,SPRN_PIR
> +99:    lwz    r4,4(r5)
> +    cmpw    r4,r24
> +    msync
> +    bne        99b
> +
> +    msync
> +    /*r4 contains jump address*/
> +    lwz    r4,8(r5)
> +    msync
> +    lis    r5,MSR_KERNEL at h
> +    ori    r5,r5,MSR_KERNEL at l
> +    msync
> +    isync
> +    mtspr    SPRN_SRR1, r5
> +    mtspr    SPRN_SRR0, r4
> +    msync
> +    isync
> +    rfi
> +    isync
> +1:    b    1b
> +
> +    /**
> +    * kexec_flag indicates a kexec magic
> +    * kexec_flag+4 bytes supposed to be set with cpu number
> +    * kexec_flag+8 countain addr for slave cpu to jump into
> +    */
> +    .globl kexec_flag
> +kexec_flag:
> +    .long   KEXEC_MAGIC
> +    .long    0
> +    .long    0
> +relocate_smp_cpu_wait_end:
> +    .globl relocate_smp_cpu_size
> +relocate_smp_cpu_size:
> +    .long relocate_smp_cpu_wait_end-relocate_smp_cpu_wait
> +#endif
> +
>   #endif
> diff --git a/arch/powerpc/platforms/85xx/smp.c
> b/arch/powerpc/platforms/85xx/smp.c
> old mode 100644
> new mode 100755
> index 5ced4f5..c4f5c4c
> --- a/arch/powerpc/platforms/85xx/smp.c
> +++ b/arch/powerpc/platforms/85xx/smp.c
> @@ -140,6 +140,70 @@ static inline u32 read_spin_table_addr_l(void *spin_table)
>           (ulong)spin_table + sizeof(struct epapr_spin_table));
>       return in_be32(&((struct epapr_spin_table *)spin_table)->addr_l);
>   }
> +#ifdef CONFIG_KEXEC
> +
> +#define KEXEC_MAGIC 0xdeadbeef
> +#define KEXEC_RESERVE_LIMIT 0x10
> +unsigned long kexec_poll_phy;
> +extern void reserve_kexec_bootmem(unsigned long poll_phy, int size);
> +
> +/*
> + * Reserved bootmem for slave cpus kexec spin area.
> + */
> +void mpc85xx_smp_reserve_kexec(void)
> +{
> +    unsigned long kexec_poll_virt;
> +    unsigned long *kexec_magic_virt;
> +
> +    if (!kexec_poll_phy ||
> +            kexec_poll_phy >= __max_low_memory)
> +        return;
> +
> +    kexec_poll_virt = (unsigned long)phys_to_virt(kexec_poll_phy);
> +    kexec_magic_virt = (unsigned long *)kexec_poll_virt;
> +
> +    if (*kexec_magic_virt == KEXEC_MAGIC)
> +        reserve_kexec_bootmem(kexec_poll_phy, KEXEC_RESERVE_LIMIT);
> +}
> +
> +/*
> + * Kick slave cpus from kexec spin area.
> + */
> +int mpc85xx_smp_kick_kexec_cpus(int nr)
> +{
> +    unsigned long  kexec_poll_virt;
> +    unsigned long *kexec_flag_virt;
> +    unsigned long *kexec_magic_virt;
> +    unsigned long *kexec_jump_virt;
> +
> +    /*verify accessible*/
> +    if (!kexec_poll_phy ||
> +            kexec_poll_phy >= __max_low_memory)
> +        return -EBUSY;
> +
> +    kexec_poll_virt = (unsigned long)phys_to_virt(kexec_poll_phy);
> +
> +    kexec_magic_virt = (unsigned long *)kexec_poll_virt;
> +    kexec_flag_virt = (unsigned long *)kexec_poll_virt + 1;
> +    kexec_jump_virt = (unsigned long *)kexec_poll_virt + 2;
> +
> +    /*verify a valid kexec kick*/
> +    if (*kexec_magic_virt == KEXEC_MAGIC) {
> +        flush_dcache_range((ulong)kexec_poll_virt,
> +        (ulong)kexec_poll_virt + L1_CACHE_BYTES-1);
> +        *kexec_jump_virt = (unsigned long)__early_start;
> +        mb();
> +        /*kick cpu[nr] up*/
> +        *kexec_flag_virt = nr;
> +        mb();
> +        flush_dcache_range((ulong)kexec_poll_virt,
> +        (ulong)kexec_poll_virt + L1_CACHE_BYTES-1);
> +
> +        return 0;
> +    }
> +    return -EBUSY;
> +}
> +#endif
>
>   static int smp_85xx_kick_cpu(int nr)
>   {
> @@ -181,6 +245,10 @@ static int smp_85xx_kick_cpu(int nr)
>
>       local_irq_save(flags);
>   #ifdef CONFIG_PPC32
> +#ifdef CONFIG_KEXEC
> +    if (!mpc85xx_smp_kick_kexec_cpus(nr))
> +        goto kexec_kick_done;
> +#endif
>   #ifdef CONFIG_HOTPLUG_CPU
>       /* Corresponding to generic_set_cpu_dead() */
>       generic_set_cpu_up(nr);
> @@ -225,7 +293,9 @@ static int smp_85xx_kick_cpu(int nr)
>       out_be32(&spin_table->pir, hw_cpu);
>       out_be32(&spin_table->addr_l, __pa(__early_start));
>       flush_spin_table(spin_table);
> -
> +#ifdef CONFIG_KEXEC
> +kexec_kick_done:
> +#endif
>       /* Wait a bit for the CPU to ack. */
>       if (!spin_event_timeout(__secondary_hold_acknowledge == hw_cpu,
>                       10000, 100)) {
> @@ -266,7 +336,13 @@ struct smp_ops_t smp_85xx_ops = {
>   };
>
>   #ifdef CONFIG_KEXEC
> +
>   atomic_t kexec_down_cpus = ATOMIC_INIT(0);
> +atomic_t kexec_ready_to_reboot = ATOMIC_INIT(0);
> +atomic_t kexec_slave_finish = ATOMIC_INIT(0);
> +unsigned long wait_code_buffer;
> +static struct kimage *save_image;
> +extern const unsigned int relocate_smp_cpu_size;
>
>   void mpc85xx_smp_kexec_cpu_down(int crash_shutdown, int secondary)
>   {
> @@ -274,8 +350,29 @@ void mpc85xx_smp_kexec_cpu_down(int
> crash_shutdown, int secondary)
>
>       if (secondary) {
>           atomic_inc(&kexec_down_cpus);
> -        /* loop forever */
> -        while (1);
> +        mb();
> +
> +        if (crash_shutdown) {
> +            /* loop forever */
> +            while (1)
> +                ;
> +        } else {
> +            while (!atomic_read(&kexec_ready_to_reboot))
> +                cpu_relax();
> +            /*flush destination*/
> +            if (save_image)
> +                mpc85xx_smp_flush_dcache_kexec(save_image, 1);
> +
> +            flush_icache_range(wait_code_buffer,
> +                wait_code_buffer + relocate_smp_cpu_size);
> +            flush_dcache_range(wait_code_buffer,
> +                wait_code_buffer + relocate_smp_cpu_size);
> +
> +            atomic_inc(&kexec_slave_finish);
> +
> +            ((void (*)(void)) wait_code_buffer)();
> +            /* NOTREACHED */
> +        }
>       }
>   }
>
> @@ -285,13 +382,23 @@ static void mpc85xx_smp_kexec_down(void *arg)
>           ppc_md.kexec_cpu_down(0,1);
>   }
>
> -static void map_and_flush(unsigned long paddr)
> +static void map_and_flush(unsigned long paddr, int atomic)
>   {
>       struct page *page = pfn_to_page(paddr >> PAGE_SHIFT);
> -    unsigned long kaddr  = (unsigned long)kmap(page);
> +    unsigned long kaddr;
> +
> +    if (atomic)
> +        kaddr  = (unsigned long)kmap_atomic(page);
> +    else
> +        kaddr  = (unsigned long)kmap(page);
>
>       flush_dcache_range(kaddr, kaddr + PAGE_SIZE);
> -    kunmap(page);
> +    flush_icache_range(kaddr, kaddr + PAGE_SIZE);
> +
> +    if (atomic)
> +        kunmap_atomic((void *)kaddr);
> +    else
> +        kunmap(page);
>   }
>
>   /**
> @@ -300,7 +407,7 @@ static void map_and_flush(unsigned long paddr)
>    * are performed out of an overabundance of caution as interrupts are not
>    * disabled yet and we can switch cores
>    */
> -static void mpc85xx_smp_flush_dcache_kexec(struct kimage *image)
> +static void mpc85xx_smp_flush_dcache_kexec(struct kimage *image, int atomic)
>   {
>       kimage_entry_t *ptr, entry;
>       unsigned long paddr;
> @@ -312,18 +419,18 @@ static void
> mpc85xx_smp_flush_dcache_kexec(struct kimage *image)
>                ptr = (entry & IND_INDIRECTION) ?
>                   phys_to_virt(entry & PAGE_MASK) : ptr + 1) {
>               if (!(entry & IND_DESTINATION)) {
> -                map_and_flush(entry);
> +                map_and_flush(entry, atomic);
>               }
>           }
>           /* flush out last IND_DONE page */
> -        map_and_flush(entry);
> +        map_and_flush(entry, atomic);
>       } else {
>           /* crash type kexec images are copied to the crash region */
>           for (i = 0; i < image->nr_segments; i++) {
>               struct kexec_segment *seg = &image->segment[i];
>               for (paddr = seg->mem; paddr < seg->mem + seg->memsz;
>                    paddr += PAGE_SIZE) {
> -                map_and_flush(paddr);
> +                map_and_flush(paddr, atomic);
>               }
>           }
>       }
> @@ -335,13 +442,18 @@ static void
> mpc85xx_smp_flush_dcache_kexec(struct kimage *image)
>
>   static void mpc85xx_smp_machine_kexec(struct kimage *image)
>   {
> +    extern const unsigned char  relocate_smp_cpu_wait[];
> +    extern const unsigned int relocate_smp_cpu_offset;
>       int timeout = INT_MAX;
>       int i, num_cpus = num_present_cpus();
>
>       mpc85xx_smp_flush_dcache_kexec(image);
>
> -    if (image->type == KEXEC_TYPE_DEFAULT)
> +    if (image->type == KEXEC_TYPE_DEFAULT) {
> +        save_image = image;
> +        mb();
>           smp_call_function(mpc85xx_smp_kexec_down, NULL, 0);
> +    }
>
>       while ( (atomic_read(&kexec_down_cpus) != (num_cpus - 1)) &&
>           ( timeout > 0 ) )
> @@ -352,12 +464,34 @@ static void mpc85xx_smp_machine_kexec(struct
> kimage *image)
>       if ( !timeout )
>           printk(KERN_ERR "Unable to bring down secondary cpu(s)");
>
> -    for_each_online_cpu(i)
> -    {
> -        if ( i == smp_processor_id() ) continue;
> -        mpic_reset_core(i);
> -    }
> +    if (image->type == KEXEC_TYPE_DEFAULT) {
>
> +        wait_code_buffer =
> +        (unsigned long)page_address(image->control_code_page)+
> +                relocate_smp_cpu_offset;
> +
> +        /* copy slave cpu spin code to the control code page */
> +        memcpy((void *)wait_code_buffer, relocate_smp_cpu_wait,
> +                        relocate_smp_cpu_size);
> +        atomic_set(&kexec_ready_to_reboot, 1);
> +        mb();
> +        timeout = INT_MAX;
> +
> +        while ((atomic_read(&kexec_slave_finish) != (num_cpus-1)) &&
> +            (timeout > 0))
> +            timeout--;
> +
> +        if (!timeout)
> +            printk(KERN_ERR "Unable to wait for secondary cpu(s) to
> flush caches\n");
> +
> +        } else {
> +        for_each_online_cpu(i)
> +        {
> +            if (i == smp_processor_id())
> +                continue;
> +            mpic_reset_core(i);
> +        }
> +    }
>       default_machine_kexec(image);
>   }
>   #endif /* CONFIG_KEXEC */



More information about the Linuxppc-dev mailing list