Edit

kc3-lang/libffi/src/powerpc/linux64.S

Branch :

  • Show log

    Commit

  • Author : Alan Modra
    Date : 2014-11-10 09:42:31
    Hash : fa1040c1
    Message : GO closures for powerpc linux Plus .cfi async unwind info, rearrangement of ffi_call_linux64 and ffi_call_SYSV function params to avoid register copies, tweaks to trampolines. * src/powerpc/ffitarget.h (FFI_GO_CLOSURES): Define. * src/powerpc/ffi.c (ffi_call_int): New function with extra closure param, and args rearranged on ffi_call_linux64 and ffi_call_SYSV calls, extracted from .. (ffi_call): ..here. (ffi_call_go, ffi_prep_go_closure): New functions. * src/powerpc/ffi_linux64.c (ffi_prep_closure_loc_linux64): Make hidden. Only flush insn part of ELFv2 trampoline. Don't shuffle ELFv1 trampoline. (ffi_closure_helper_LINUX64): Replace closure param with cif, fun, user_data params. * src/powerpc/ffi_powerpc.h (ffi_go_closure_sysv): Declare. (ffi_go_closure_linux64): Declare. (ffi_call_SYSV, fi_call_LINUX64): Update. (ffi_prep_closure_loc_sysv, ffi_prep_closure_loc_linux64): Declare. (ffi_closure_helper_SYSV, ffi_closure_helper_LINUX64): Update. * src/powerpc/ffi_sysv.c (ASM_NEEDS_REGISTERS): Increase to 6. (ffi_prep_closure_loc_sysv): Use bcl in trampoline, put data words last, flush just the insn part. (ffi_closure_helper_SYSV): Replace closure param with cif, fun and user_data params. * src/powerpc/linux64.S (ffi_call_LINUX64): Replace hand-written .eh_frame with .cfi directives. Adjust for changed param order. Pass extra "closure" param to user function in static chain. Add .cfi directives to describe epilogue. Don't provide traceback table for ELFv2 or _CALL_LINUX. * src/powerpc/linux64_closure.S (ffi_closure_LINUX64): Replace hand-written .eh_frame with .cfi directives. Adjust for changed ffi_closure_helper_LINUX64 params. Add .cfi directives to describe epilogue. Don't provide traceback table for ELFv2 or _CALL_LINUX. (ffi_go_closure_linux64): New function. * src/powerpc/sysv.S: Remove redundant .globl ffi_prep_args_SYSV. (ffi_call_SYSV): Make hidden. Replace hand-written .eh_frame with .cfi directives. Adjust for changed params. Pass extra "closure" param to user function in static chain. Add .cfi directives to describe epilogue. * src/powerpc/ppc_closure.S (ffi_closure_SYSV): Make hidden. Replace hand-written .eh_frame with .cfi directives. Adjust for changed ffi_closure_helper_SYSV params. Add .cfi directives to describe epilogue. Don't just use nops in the dead __NO_FPRS__ epilogues. (ffi_go_closure_sysv): New function.

  • src/powerpc/linux64.S
  • /* -----------------------------------------------------------------------
       sysv.h - Copyright (c) 2003 Jakub Jelinek <jakub@redhat.com>
    	    Copyright (c) 2008 Red Hat, Inc.
    
       PowerPC64 Assembly glue.
    
       Permission is hereby granted, free of charge, to any person obtaining
       a copy of this software and associated documentation files (the
       ``Software''), to deal in the Software without restriction, including
       without limitation the rights to use, copy, modify, merge, publish,
       distribute, sublicense, and/or sell copies of the Software, and to
       permit persons to whom the Software is furnished to do so, subject to
       the following conditions:
    
       The above copyright notice and this permission notice shall be included
       in all copies or substantial portions of the Software.
    
       THE SOFTWARE IS PROVIDED ``AS IS'', WITHOUT WARRANTY OF ANY KIND,
       EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
       MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
       NONINFRINGEMENT.  IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
       HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
       WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
       OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
       DEALINGS IN THE SOFTWARE.
       ----------------------------------------------------------------------- */
    
    #define LIBFFI_ASM
    #include <fficonfig.h>
    #include <ffi.h>
    
    #ifdef POWERPC64
    	.hidden	ffi_call_LINUX64
    	.globl	ffi_call_LINUX64
    	.text
    	.cfi_startproc
    # if _CALL_ELF == 2
    ffi_call_LINUX64:
    	addis	%r2, %r12, .TOC.-ffi_call_LINUX64@ha
    	addi	%r2, %r2, .TOC.-ffi_call_LINUX64@l
    	.localentry ffi_call_LINUX64, . - ffi_call_LINUX64
    # else
    	.section	".opd","aw"
    	.align	3
    ffi_call_LINUX64:
    #  ifdef _CALL_LINUX
    	.quad	.L.ffi_call_LINUX64,.TOC.@tocbase,0
    	.type	ffi_call_LINUX64,@function
    	.text
    .L.ffi_call_LINUX64:
    #  else
    	.hidden	.ffi_call_LINUX64
    	.globl	.ffi_call_LINUX64
    	.quad	.ffi_call_LINUX64,.TOC.@tocbase,0
    	.size	ffi_call_LINUX64,24
    	.type	.ffi_call_LINUX64,@function
    	.text
    .ffi_call_LINUX64:
    #  endif
    # endif
    	mflr	%r0
    	std	%r28, -32(%r1)
    	std	%r29, -24(%r1)
    	std	%r30, -16(%r1)
    	std	%r31, -8(%r1)
    	std	%r7, 8(%r1)	/* closure, saved in cr field.  */
    	std	%r0, 16(%r1)
    
    	mr	%r28, %r1	/* our AP.  */
    	.cfi_def_cfa_register 28
    	.cfi_offset 65, 16
    	.cfi_offset 31, -8
    	.cfi_offset 30, -16
    	.cfi_offset 29, -24
    	.cfi_offset 28, -32
    
    	stdux	%r1, %r1, %r8
    	mr	%r31, %r6	/* flags, */
    	mr	%r30, %r5	/* rvalue, */
    	mr	%r29, %r4	/* function address.  */
    /* Save toc pointer, not for the ffi_prep_args64 call, but for the later
       bctrl function call.  */
    # if _CALL_ELF == 2
    	std	%r2, 24(%r1)
    # else
    	std	%r2, 40(%r1)
    # endif
    
    	/* Call ffi_prep_args64.  */
    	mr	%r4, %r1
    # if defined _CALL_LINUX || _CALL_ELF == 2
    	bl	ffi_prep_args64
    # else
    	bl	.ffi_prep_args64
    # endif
    
    # if _CALL_ELF == 2
    	mr	%r12, %r29
    # else
    	ld	%r12, 0(%r29)
    	ld	%r2, 8(%r29)
    # endif
    	/* Now do the call.  */
    	/* Set up cr1 with bits 4-7 of the flags.  */
    	mtcrf	0x40, %r31
    
    	/* Get the address to call into CTR.  */
    	mtctr	%r12
    	/* Load all those argument registers.  */
    	ld	%r3, -32-(8*8)(%r28)
    	ld	%r4, -32-(7*8)(%r28)
    	ld	%r5, -32-(6*8)(%r28)
    	ld	%r6, -32-(5*8)(%r28)
    	bf-	5, 1f
    	ld	%r7, -32-(4*8)(%r28)
    	ld	%r8, -32-(3*8)(%r28)
    	ld	%r9, -32-(2*8)(%r28)
    	ld	%r10, -32-(1*8)(%r28)
    1:
    
    	/* Load all the FP registers.  */
    	bf-	6, 2f
    	lfd	%f1, -32-(21*8)(%r28)
    	lfd	%f2, -32-(20*8)(%r28)
    	lfd	%f3, -32-(19*8)(%r28)
    	lfd	%f4, -32-(18*8)(%r28)
    	lfd	%f5, -32-(17*8)(%r28)
    	lfd	%f6, -32-(16*8)(%r28)
    	lfd	%f7, -32-(15*8)(%r28)
    	lfd	%f8, -32-(14*8)(%r28)
    	lfd	%f9, -32-(13*8)(%r28)
    	lfd	%f10, -32-(12*8)(%r28)
    	lfd	%f11, -32-(11*8)(%r28)
    	lfd	%f12, -32-(10*8)(%r28)
    	lfd	%f13, -32-(9*8)(%r28)
    2:
    
    	/* Make the call.  */
    	ld	%r11, 8(%r28)
    	bctrl
    
    	/* This must follow the call immediately, the unwinder
    	   uses this to find out if r2 has been saved or not.  */
    # if _CALL_ELF == 2
    	ld	%r2, 24(%r1)
    # else
    	ld	%r2, 40(%r1)
    # endif
    
    	/* Now, deal with the return value.  */
    	mtcrf	0x01, %r31
    	bt	31, .Lstruct_return_value
    	bt	30, .Ldone_return_value
    	bt	29, .Lfp_return_value
    	std	%r3, 0(%r30)
    	/* Fall through...  */
    
    .Ldone_return_value:
    	/* Restore the registers we used and return.  */
    	mr	%r1, %r28
    	.cfi_def_cfa_register 1
    	ld	%r0, 16(%r28)
    	ld	%r28, -32(%r28)
    	mtlr	%r0
    	ld	%r29, -24(%r1)
    	ld	%r30, -16(%r1)
    	ld	%r31, -8(%r1)
    	blr
    
    .Lfp_return_value:
    	.cfi_def_cfa_register 28
    	bf	28, .Lfloat_return_value
    	stfd	%f1, 0(%r30)
    	mtcrf	0x02, %r31 /* cr6  */
    	bf	27, .Ldone_return_value
    	stfd	%f2, 8(%r30)
    	b	.Ldone_return_value
    .Lfloat_return_value:
    	stfs	%f1, 0(%r30)
    	b	.Ldone_return_value
    
    .Lstruct_return_value:
    	bf	29, .Lsmall_struct
    	bf	28, .Lfloat_homog_return_value
    	stfd	%f1, 0(%r30)
    	stfd	%f2, 8(%r30)
    	stfd	%f3, 16(%r30)
    	stfd	%f4, 24(%r30)
    	stfd	%f5, 32(%r30)
    	stfd	%f6, 40(%r30)
    	stfd	%f7, 48(%r30)
    	stfd	%f8, 56(%r30)
    	b	.Ldone_return_value
    
    .Lfloat_homog_return_value:
    	stfs	%f1, 0(%r30)
    	stfs	%f2, 4(%r30)
    	stfs	%f3, 8(%r30)
    	stfs	%f4, 12(%r30)
    	stfs	%f5, 16(%r30)
    	stfs	%f6, 20(%r30)
    	stfs	%f7, 24(%r30)
    	stfs	%f8, 28(%r30)
    	b	.Ldone_return_value
    
    .Lsmall_struct:
    	std	%r3, 0(%r30)
    	std	%r4, 8(%r30)
    	b	.Ldone_return_value
    
    	.cfi_endproc
    # if _CALL_ELF == 2
    	.size	ffi_call_LINUX64,.-ffi_call_LINUX64
    # else
    #  ifdef _CALL_LINUX
    	.size	ffi_call_LINUX64,.-.L.ffi_call_LINUX64
    #  else
    	.long	0
    	.byte	0,12,0,1,128,4,0,0
    	.size	.ffi_call_LINUX64,.-.ffi_call_LINUX64
    #  endif
    # endif
    
    #endif
    
    #if (defined __ELF__ && defined __linux__) || _CALL_ELF == 2
    	.section	.note.GNU-stack,"",@progbits
    #endif