*/
 int copy_thread(struct task_struct *p, const struct kernel_clone_args *args)
 {
-       unsigned long clone_flags = args->flags;
-       unsigned long usp = args->stack;
-       unsigned long tls = args->tls;
-       struct pt_regs *childregs, *kregs;
+       struct pt_regs *kregs; /* Switch frame regs */
        extern void ret_from_fork(void);
        extern void ret_from_fork_scv(void);
        extern void ret_from_kernel_thread(void);
 
        klp_init_thread_info(p);
 
-       /* Create initial stack frame. */
-       sp -= STACK_USER_INT_FRAME_SIZE;
-       *(unsigned long *)(sp + STACK_INT_FRAME_MARKER) = STACK_FRAME_REGS_MARKER;
-
-       /* Copy registers */
-       childregs = (struct pt_regs *)(sp + STACK_INT_FRAME_REGS);
-       if (unlikely(args->fn)) {
+       if (unlikely(p->flags & PF_KTHREAD)) {
                /* kernel thread */
+
+               /* Create initial minimum stack frame. */
+               sp -= STACK_FRAME_MIN_SIZE;
                ((unsigned long *)sp)[0] = 0;
-               memset(childregs, 0, sizeof(struct pt_regs));
-               childregs->gpr[1] = sp + STACK_USER_INT_FRAME_SIZE;
-#ifdef CONFIG_PPC64
-               clear_tsk_thread_flag(p, TIF_32BIT);
-               childregs->softe = IRQS_ENABLED;
-#endif
-               p->thread.regs = NULL;  /* no user register state */
-               ti->flags |= _TIF_RESTOREALL;
+
                f = ret_from_kernel_thread;
+               p->thread.regs = NULL;  /* no user register state */
+               clear_tsk_compat_task(p);
        } else {
                /* user thread */
-               struct pt_regs *regs = current_pt_regs();
-               *childregs = *regs;
-               if (usp)
-                       childregs->gpr[1] = usp;
-               ((unsigned long *)sp)[0] = childregs->gpr[1];
-               p->thread.regs = childregs;
-               if (clone_flags & CLONE_SETTLS) {
-                       if (!is_32bit_task())
-                               childregs->gpr[13] = tls;
+               struct pt_regs *childregs;
+
+               /* Create initial user return stack frame. */
+               sp -= STACK_USER_INT_FRAME_SIZE;
+               *(unsigned long *)(sp + STACK_INT_FRAME_MARKER) = STACK_FRAME_REGS_MARKER;
+
+               childregs = (struct pt_regs *)(sp + STACK_INT_FRAME_REGS);
+
+               if (unlikely(args->fn)) {
+                       /*
+                        * A user space thread, but it first runs a kernel
+                        * thread, and then returns as though it had called
+                        * execve rather than fork, so user regs will be
+                        * filled in (e.g., by kernel_execve()).
+                        */
+                       ((unsigned long *)sp)[0] = 0;
+                       memset(childregs, 0, sizeof(struct pt_regs));
+#ifdef CONFIG_PPC64
+                       childregs->softe = IRQS_ENABLED;
+#endif
+                       ti->flags |= _TIF_RESTOREALL;
+                       f = ret_from_kernel_thread;
+               } else {
+                       struct pt_regs *regs = current_pt_regs();
+                       unsigned long clone_flags = args->flags;
+                       unsigned long usp = args->stack;
+
+                       /* Copy registers */
+                       *childregs = *regs;
+                       if (usp)
+                               childregs->gpr[1] = usp;
+                       ((unsigned long *)sp)[0] = childregs->gpr[1];
+#ifdef CONFIG_PPC_IRQ_SOFT_MASK_DEBUG
+                       WARN_ON_ONCE(childregs->softe != IRQS_ENABLED);
+#endif
+                       if (clone_flags & CLONE_SETTLS) {
+                               unsigned long tls = args->tls;
+
+                               if (!is_32bit_task())
+                                       childregs->gpr[13] = tls;
+                               else
+                                       childregs->gpr[2] = tls;
+                       }
+
+                       if (trap_is_scv(regs))
+                               f = ret_from_fork_scv;
                        else
-                               childregs->gpr[2] = tls;
+                               f = ret_from_fork;
                }
 
-               if (trap_is_scv(regs))
-                       f = ret_from_fork_scv;
-               else
-                       f = ret_from_fork;
+#ifdef CONFIG_PPC64
+               if (cpu_has_feature(CPU_FTR_HAS_PPR))
+                       childregs->ppr = DEFAULT_PPR;
+#endif
+
+               childregs->msr &= ~(MSR_FP|MSR_VEC|MSR_VSX);
+               p->thread.regs = childregs;
        }
-       childregs->msr &= ~(MSR_FP|MSR_VEC|MSR_VSX);
 
        /*
         * The way this works is that at some point in the future
                p->thread.dscr_inherit = current->thread.dscr_inherit;
                p->thread.dscr = mfspr(SPRN_DSCR);
        }
-       if (cpu_has_feature(CPU_FTR_HAS_PPR))
-               childregs->ppr = DEFAULT_PPR;
 
        p->thread.tidr = 0;
 #endif