/* -----------------------------------------------------------------------
   aix.S - Copyright (c) 2002, 2009 Free Software Foundation, Inc.
   based on darwin.S by John Hornkvist

   PowerPC Assembly glue.

   Permission is hereby granted, free of charge, to any person obtaining
   a copy of this software and associated documentation files (the
   ``Software''), to deal in the Software without restriction, including
   without limitation the rights to use, copy, modify, merge, publish,
   distribute, sublicense, and/or sell copies of the Software, and to
   permit persons to whom the Software is furnished to do so, subject to
   the following conditions:

   The above copyright notice and this permission notice shall be included
   in all copies or substantial portions of the Software.

   THE SOFTWARE IS PROVIDED ``AS IS'', WITHOUT WARRANTY OF ANY KIND, EXPRESS
   OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
   MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
   IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY CLAIM, DAMAGES OR
   OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
   ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
   OTHER DEALINGS IN THE SOFTWARE.
   ----------------------------------------------------------------------- */

     /* Symbolic register names.  Each name is bound to its own register
        number so the code below can write r3 / f1 instead of bare
        numerals.  */

     /* General-purpose registers r0-r31.  */
     .set    r0,  0
     .set    r1,  1
     .set    r2,  2
     .set    r3,  3
     .set    r4,  4
     .set    r5,  5
     .set    r6,  6
     .set    r7,  7
     .set    r8,  8
     .set    r9,  9
     .set    r10, 10
     .set    r11, 11
     .set    r12, 12
     .set    r13, 13
     .set    r14, 14
     .set    r15, 15
     .set    r16, 16
     .set    r17, 17
     .set    r18, 18
     .set    r19, 19
     .set    r20, 20
     .set    r21, 21
     .set    r22, 22
     .set    r23, 23
     .set    r24, 24
     .set    r25, 25
     .set    r26, 26
     .set    r27, 27
     .set    r28, 28
     .set    r29, 29
     .set    r30, 30
     .set    r31, 31

     /* Floating-point registers f0-f21.  */
     .set    f0,  0
     .set    f1,  1
     .set    f2,  2
     .set    f3,  3
     .set    f4,  4
     .set    f5,  5
     .set    f6,  6
     .set    f7,  7
     .set    f8,  8
     .set    f9,  9
     .set    f10, 10
     .set    f11, 11
     .set    f12, 12
     .set    f13, 13
     .set    f14, 14
     .set    f15, 15
     .set    f16, 16
     .set    f17, 17
     .set    f18, 18
     .set    f19, 19
     .set    f20, 20
     .set    f21, 21

     /* Entry point of the argument-marshalling helper; it is defined in
        another object and reached with a direct `bl'.  */
     .extern .ffi_prep_args

/* Preprocessor preamble.  LIBFFI_ASM is defined before the headers are
   pulled in so that they can tell they are being included from an
   assembly source.  JUMPTARGET() and L() are identity macros: they
   expand to their argument unchanged and exist only so that label
   references can be written as L(name).  */
#define LIBFFI_ASM
#include <fficonfig.h>
#include <ffi.h>
#define JUMPTARGET(name) name
#define L(x) x

     .file "aix.S"
     .toc

        /* void ffi_call_AIX(extended_cif *ecif, unsigned long bytes,
         *                   unsigned int flags, unsigned int *rvalue,
         *                   void (*fn)(),
         *                   void (*prep_args)(extended_cif*, unsigned *const));
         * r3=ecif, r4=bytes, r5=flags, r6=rvalue, r7=fn, r8=prep_args
         */

/* ffi_call_AIX -- build an outgoing call frame, let ffi_prep_args fill
   it, call the target through its function descriptor and store the
   result.

   On entry:
     r3 = ecif      handed on unchanged to ffi_prep_args
     r4 = bytes     added to r1 to create the new frame (so the caller
                    is presumably expected to pass the size negated --
                    confirm against the C caller)
     r5 = flags     copied into CR fields 1 and 7 to steer FP-argument
                    loading and return-value storing
     r6 = rvalue    address the result is stored to
     r7 = fn        address of the target's function descriptor
     r8             not referenced; .ffi_prep_args is called directly

   Register use across the call (all saved and restored here):
     r28 = caller's stack pointer ("AP"), r29 = fn, r30 = rvalue,
     r31 = flags.

   The 64-bit and 32-bit bodies are alternatives selected by __64BIT__;
   exactly one of them is assembled, which is why both may define the
   same labels.  */

        .csect .text[PR]
        .align 2
        .globl ffi_call_AIX
        .globl .ffi_call_AIX

        /* Function descriptor: entry address, TOC anchor, and a zero
           third word.  */
        .csect ffi_call_AIX[DS]
ffi_call_AIX:
#ifdef __64BIT__
        .llong .ffi_call_AIX, TOC[tc0], 0
        .csect .text[PR]
.ffi_call_AIX:
        /* Save registers we use.  r28-r31 go just below the caller's
           stack pointer, the return address at 16(r1).  */
        mflr    r0

        std     r28,-32(r1)
        std     r29,-24(r1)
        std     r30,-16(r1)
        std     r31, -8(r1)

        std     r0, 16(r1)
        mr      r28, r1         /* our AP.  */
        stdux   r1, r1, r4      /* r1 += bytes; old r1 stored at new 0(r1).  */

        /* Save arguments over call...  */
        mr      r31, r5         /* flags, */
        mr      r30, r6         /* rvalue, */
        mr      r29, r7         /* function address.  */
        std     r2, 40(r1)      /* our TOC pointer, reloaded after the call.  */

        /* Call ffi_prep_args with r3 = ecif (still intact) and
           r4 = the new stack pointer.  */
        mr      r4, r1
        bl      .ffi_prep_args
        nop                     /* presumably the linker's TOC-reload slot.  */

        /* Now do the call.  Unpack the three-word descriptor at fn:
           entry address, TOC pointer, third word.  */
        ld      r0, 0(r29)
        ld      r2, 8(r29)
        ld      r11, 16(r29)
        /* Set up cr1 with bits 4-7 of the flags.  */
        mtcrf   0x40, r31
        mtctr   r0
        /* Load all those argument registers.  */
        /* We have set up a nice stack frame, just load it into registers.  */
        ld      r3, 40+(1*8)(r1)
        ld      r4, 40+(2*8)(r1)
        ld      r5, 40+(3*8)(r1)
        ld      r6, 40+(4*8)(r1)
        nop
        ld      r7, 40+(5*8)(r1)
        ld      r8, 40+(6*8)(r1)
        ld      r9, 40+(7*8)(r1)
        ld      r10,40+(8*8)(r1)

L1:
        /* Load all the FP registers -- skipped when CR bit 6 is clear.
           The 13 doubles sit directly below the r28-r31 save slots,
           addressed from the caller's stack pointer.  */
        bf      6,L2            /* 2f + 0x18 */
        lfd     f1,-32-(13*8)(r28)
        lfd     f2,-32-(12*8)(r28)
        lfd     f3,-32-(11*8)(r28)
        lfd     f4,-32-(10*8)(r28)
        nop
        lfd     f5,-32-(9*8)(r28)
        lfd     f6,-32-(8*8)(r28)
        lfd     f7,-32-(7*8)(r28)
        lfd     f8,-32-(6*8)(r28)
        nop
        lfd     f9,-32-(5*8)(r28)
        lfd     f10,-32-(4*8)(r28)
        lfd     f11,-32-(3*8)(r28)
        lfd     f12,-32-(2*8)(r28)
        nop
        lfd     f13,-32-(1*8)(r28)

L2:
        /* Make the call, then restore our own TOC pointer.  */
        bctrl
        ld      r2, 40(r1)

        /* Now, deal with the return value.  CR field 7 receives flag
           bits 28-31:
             bit 30 set   -> store nothing
             bit 29 set   -> result is in the FP registers
             otherwise    -> store r3 as a doubleword.  */
        mtcrf   0x01, r31

        bt      30, L(done_return_value)
        bt      29, L(fp_return_value)
        std     r3, 0(r30)

        /* Fall through...  */

L(done_return_value):
        /* Restore the registers we used and return.  */
        mr      r1, r28
        ld      r0, 16(r28)
        ld      r28, -32(r1)
        mtlr    r0
        ld      r29, -24(r1)
        ld      r30, -16(r1)
        ld      r31, -8(r1)
        blr

L(fp_return_value):
        /* Bit 28 clear -> single precision.  Otherwise store f1 as a
           double and, when bit 31 is also set, f2 right after it.  */
        bf      28, L(float_return_value)
        stfd    f1, 0(r30)
        bf      31, L(done_return_value)
        stfd    f2, 8(r30)
        b       L(done_return_value)

L(float_return_value):
        stfs    f1, 0(r30)
        b       L(done_return_value)

#else /* ! __64BIT__ */

        .long .ffi_call_AIX, TOC[tc0], 0
        .csect .text[PR]
.ffi_call_AIX:
        /* Save registers we use.  r28-r31 go just below the caller's
           stack pointer, the return address at 8(r1).  */
        mflr    r0

        stw     r28,-16(r1)
        stw     r29,-12(r1)
        stw     r30, -8(r1)
        stw     r31, -4(r1)

        stw     r0, 8(r1)
        mr      r28, r1         /* our AP.  */
        stwux   r1, r1, r4      /* r1 += bytes; old r1 stored at new 0(r1).  */

        /* Save arguments over call...  */
        mr      r31, r5         /* flags, */
        mr      r30, r6         /* rvalue, */
        mr      r29, r7         /* function address, */
        stw     r2, 20(r1)      /* our TOC pointer, reloaded after the call.  */

        /* Call ffi_prep_args with r3 = ecif (still intact) and
           r4 = the new stack pointer.  */
        mr      r4, r1
        bl      .ffi_prep_args
        nop                     /* presumably the linker's TOC-reload slot.  */

        /* Now do the call.  Unpack the three-word descriptor at fn:
           entry address, TOC pointer, third word.  */
        lwz     r0, 0(r29)
        lwz     r2, 4(r29)
        lwz     r11, 8(r29)
        /* Set up cr1 with bits 4-7 of the flags.  */
        mtcrf   0x40, r31
        mtctr   r0
        /* Load all those argument registers.  */
        /* We have set up a nice stack frame, just load it into registers.  */
        lwz     r3, 20+(1*4)(r1)
        lwz     r4, 20+(2*4)(r1)
        lwz     r5, 20+(3*4)(r1)
        lwz     r6, 20+(4*4)(r1)
        nop
        lwz     r7, 20+(5*4)(r1)
        lwz     r8, 20+(6*4)(r1)
        lwz     r9, 20+(7*4)(r1)
        lwz     r10,20+(8*4)(r1)

L1:
        /* Load all the FP registers -- skipped when CR bit 6 is clear.
           The 13 doubles sit directly below the r28-r31 save slots,
           addressed from the caller's stack pointer.  */
        bf      6,L2            /* 2f + 0x18 */
        lfd     f1,-16-(13*8)(r28)
        lfd     f2,-16-(12*8)(r28)
        lfd     f3,-16-(11*8)(r28)
        lfd     f4,-16-(10*8)(r28)
        nop
        lfd     f5,-16-(9*8)(r28)
        lfd     f6,-16-(8*8)(r28)
        lfd     f7,-16-(7*8)(r28)
        lfd     f8,-16-(6*8)(r28)
        nop
        lfd     f9,-16-(5*8)(r28)
        lfd     f10,-16-(4*8)(r28)
        lfd     f11,-16-(3*8)(r28)
        lfd     f12,-16-(2*8)(r28)
        nop
        lfd     f13,-16-(1*8)(r28)

L2:
        /* Make the call, then restore our own TOC pointer.  */
        bctrl
        lwz     r2, 20(r1)

        /* Now, deal with the return value.  CR field 7 receives flag
           bits 28-31:
             bit 30 set   -> store nothing
             bit 29 set   -> result is in the FP registers
             otherwise    -> store r3, and r4 as well when bit 28 is
                             set (two-word result).  */
        mtcrf   0x01, r31

        bt      30, L(done_return_value)
        bt      29, L(fp_return_value)
        stw     r3, 0(r30)
        bf      28, L(done_return_value)
        stw     r4, 4(r30)

        /* Fall through...  */

L(done_return_value):
        /* Restore the registers we used and return.  */
        mr      r1, r28
        lwz     r0, 8(r28)
        lwz     r28,-16(r1)
        mtlr    r0
        lwz     r29,-12(r1)
        lwz     r30, -8(r1)
        lwz     r31, -4(r1)
        blr

L(fp_return_value):
        /* Bit 28 clear -> single precision, otherwise store f1 as a
           double.  */
        bf      28, L(float_return_value)
        stfd    f1, 0(r30)
        b       L(done_return_value)

L(float_return_value):
        stfs    f1, 0(r30)
        b       L(done_return_value)

#endif

        /* Zero word followed by eight descriptor bytes -- presumably
           the AIX traceback table for this routine; confirm the field
           values against the traceback-table layout before editing.  */
        .long 0
        .byte 0,0,0,1,128,4,0,0

/* END(ffi_call_AIX) */

/* ffi_call_DARWIN -- stub entry point.  The body is a single `blr', so
   a call through this symbol returns immediately without touching any
   register or memory.  */

        .csect .text[PR]
        .align 2
        .globl ffi_call_DARWIN
        .globl .ffi_call_DARWIN

        /* Function descriptor: entry address, TOC anchor, and a zero
           third word.  Pointer-sized entries, hence .llong in 64-bit
           mode and .long otherwise.  */
        .csect ffi_call_DARWIN[DS]
ffi_call_DARWIN:
#ifdef __64BIT__
        .llong .ffi_call_DARWIN, TOC[tc0], 0
#else
        .long .ffi_call_DARWIN, TOC[tc0], 0
#endif

        .csect .text[PR]
.ffi_call_DARWIN:
        blr

        /* Zero word followed by eight zero bytes -- presumably the
           (empty) AIX traceback table for this routine.  */
        .long 0
        .byte 0,0,0,0,0,0,0,0

/* END(ffi_call_DARWIN) */