Преглед на файлове

patch from njk: make x86_64 __uniclone branchless.

Rich Felker преди 14 години
родител
ревизия
22cd9cae81
променени са 1 файла, в които са добавени 6 реда и са изтрити 6 реда
  1. 6 6
      src/thread/x86_64/clone.s

+ 6 - 6
src/thread/x86_64/clone.s

@@ -4,6 +4,7 @@
 .type   __uniclone,%function
 /* rdi = child_stack, rsi = start, rdx = pthread_struct */
 __uniclone:
+        subq    $8,%rsp         /* pad parent stack to prevent branch later */
         subq    $16,%rdi        /* grow child_stack */
         mov     %rsi,8(%rdi)    /* push start onto child_stack as return ptr */
         mov     %rdx,0(%rdi)    /* push pthread_struct onto child_stack */
@@ -13,10 +14,9 @@ __uniclone:
         movl    $56,%eax        /* clone syscall number */
         movl    $0x7d0f00,%edi  /* rdi = flags */
         mov     %r10,%rdx       /* rdx = parent_id */
-	syscall                 /* clone(flags, child_stack, parent_id,
-	                         *       child_id, tls) */
-	test	%rax,%rax
-	jnz	1f              /* if we're in the parent -> goto 1f */
-        pop     %rdi            /* restore pthread_struct from child stack */
-1:      ret
+        syscall                 /* clone(flags, child_stack, parent_id,
+                                 *       child_id, tls) */
+        pop     %rdi            /* child stack: restore pthread_struct
+                                 * parent stack: undo rsp displacement */
+        ret
 .size __uniclone,.-__uniclone