/* -----------------------------------------------------------------------
   v8.S - Copyright (c) 2013  The Written Word, Inc.
	  Copyright (c) 1996, 1997, 2003, 2004, 2008  Red Hat, Inc.

   SPARC Foreign Function Interface

   Permission is hereby granted, free of charge, to any person obtaining
   a copy of this software and associated documentation files (the
   ``Software''), to deal in the Software without restriction, including
   without limitation the rights to use, copy, modify, merge, publish,
   distribute, sublicense, and/or sell copies of the Software, and to
   permit persons to whom the Software is furnished to do so, subject to
   the following conditions:

   The above copyright notice and this permission notice shall be included
   in all copies or substantial portions of the Software.

   THE SOFTWARE IS PROVIDED ``AS IS'', WITHOUT WARRANTY OF ANY KIND,
   EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
   MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
   NONINFRINGEMENT.  IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
   HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
   WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
   OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
   DEALINGS IN THE SOFTWARE.
   ----------------------------------------------------------------------- */

#define LIBFFI_ASM
#include <fficonfig.h>
#include <ffi.h>
#include <ffi_cfi.h>
#include "internal.h"

#ifndef SPARC64

#define C2(X, Y)  X ## Y
#define C1(X, Y)  C2(X, Y)

#ifdef __USER_LABEL_PREFIX__
# define C(Y)	C1(__USER_LABEL_PREFIX__, Y)
#else
# define C(Y)	Y
#endif
#define L(Y)	C1(.L, Y)

	.text

#ifndef __GNUC__
        .align 8
	.globl	C(ffi_flush_icache)
	.type	C(ffi_flush_icache),#function
	FFI_HIDDEN(C(ffi_flush_icache))

C(ffi_flush_icache):
	cfi_startproc
1:	iflush %o0
	iflush %o+8
	nop
	nop
	nop
	nop
	nop
	retl
	 nop
	cfi_endproc
	.size	C(ffi_flush_icache), . - C(ffi_flush_icache)
#endif

#if defined(__sun__) && defined(__svr4__)
# define E(INDEX)	.align 16
#else
# define E(INDEX)	.align 16; .org 2b + INDEX * 16
#endif

        .align 8
	.globl	C(ffi_call_v8)
	.type	C(ffi_call_v8),#function
	FFI_HIDDEN(C(ffi_call_v8))

C(ffi_call_v8):
	cfi_startproc
	! Allocate a stack frame sized by ffi_call.
	save	%sp, %o4, %sp
	cfi_def_cfa_register(%fp)
	cfi_window_save
	cfi_register(%o7, %i7)

	mov	%i0, %o0		! copy cif
	add	%sp, 64+32, %o1		! load args area
	mov	%i2, %o2		! copy rvalue
	call	C(ffi_prep_args_v8)
	 mov	%i3, %o3		! copy avalue

	add	%sp, 32, %sp		! deallocate prep frame
	and	%o0, SPARC_FLAG_RET_MASK, %l0	! save return type
	srl	%o0, SPARC_SIZEMASK_SHIFT, %l1	! save return size
	ld	[%sp+64+4], %o0		! load all argument registers
	ld	[%sp+64+8], %o1
	ld	[%sp+64+12], %o2
	ld	[%sp+64+16], %o3
	cmp	%l0, SPARC_RET_STRUCT	! struct return needs an unimp 4
	ld	[%sp+64+20], %o4
	be	8f
	 ld	[%sp+64+24], %o5

	! Call foreign function
	call	%i1
	 mov	%i5, %g2		! load static chain

0:	call	1f		! load pc in %o7
	 sll	%l0, 4, %l0
1:	add	%o7, %l0, %o7	! o7 = 0b + ret_type*16
	jmp	%o7+(2f-0b)
	 nop

	! Note that each entry is 4 insns, enforced by the E macro.
	.align	16
2:
E(SPARC_RET_VOID)
	ret
	 restore
E(SPARC_RET_STRUCT)
	unimp
E(SPARC_RET_UINT8)
	and	%o0, 0xff, %o0
	st	%o0, [%i2]
	ret
	 restore
E(SPARC_RET_SINT8)
	sll	%o0, 24, %o0
	b	7f
	 sra	%o0, 24, %o0
E(SPARC_RET_UINT16)
	sll	%o0, 16, %o0
	b	7f
	 srl	%o0, 16, %o0
E(SPARC_RET_SINT16)
	sll	%o0, 16, %o0
	b	7f
	 sra	%o0, 16, %o0
E(SPARC_RET_UINT32)
7:	st	%o0, [%i2]
	ret
	 restore
E(SP_V8_RET_CPLX16)
	sth	%o0, [%i2+2]
	b	9f
	 srl	%o0, 16, %o0
E(SPARC_RET_INT64)
	st	%o0, [%i2]
	st	%o1, [%i2+4]
	ret
	 restore
E(SPARC_RET_INT128)
	std	%o0, [%i2]
	std	%o2, [%i2+8]
	ret
	 restore
E(SPARC_RET_F_8)
	st	%f7, [%i2+7*4]
	nop
	st	%f6, [%i2+6*4]
	nop
E(SPARC_RET_F_6)
	st	%f5, [%i2+5*4]
	nop
	st	%f4, [%i2+4*4]
	nop
E(SPARC_RET_F_4)
	st	%f3, [%i2+3*4]
	nop
	st	%f2, [%i2+2*4]
	nop
E(SPARC_RET_F_2)
	st	%f1, [%i2+4]
	st	%f0, [%i2]
	ret
	 restore
E(SP_V8_RET_CPLX8)
	stb	%o0, [%i2+1]
	b	0f
	 srl	%o0, 8, %o0
E(SPARC_RET_F_1)
	st	%f0, [%i2]
	ret
	 restore

	.align	8
9:	sth	%o0, [%i2]
	ret
	 restore
	.align	8
0:	stb	%o0, [%i2]
	ret
	 restore

	! Struct returning functions expect and skip the unimp here.
	! To make it worse, conforming callees examine the unimp and
	! make sure the low 12 bits of the unimp match the size of
	! the struct being returned.
	.align	8
8:	call	1f				! load pc in %o7
	 sll	%l1, 2, %l0			! size * 4
1:	sll	%l1, 4, %l1			! size * 16
	add	%l0, %l1, %l0			! size * 20
	add	%o7, %l0, %o7			! o7 = 8b + size*20
	jmp	%o7+(2f-8b)
	 mov	%i5, %g2			! load static chain
2:

/* The Sun assembler doesn't understand .rept 0x1000.  */
#define rept1			\
	call	%i1;		\
	 nop;			\
	unimp	(. - 2b) / 20;	\
	ret;			\
	 restore

#define rept16				\
	rept1; rept1; rept1; rept1;	\
	rept1; rept1; rept1; rept1;	\
	rept1; rept1; rept1; rept1;	\
	rept1; rept1; rept1; rept1

#define rept256				\
	rept16; rept16; rept16; rept16;	\
	rept16; rept16; rept16; rept16;	\
	rept16; rept16; rept16; rept16;	\
	rept16; rept16; rept16; rept16

	rept256; rept256; rept256; rept256
	rept256; rept256; rept256; rept256
	rept256; rept256; rept256; rept256
	rept256; rept256; rept256; rept256

	cfi_endproc
	.size	C(ffi_call_v8),. - C(ffi_call_v8)


/* 16*4 register window + 1*4 struct return + 6*4 args backing store
   + 8*4 return storage + 1*4 alignment.  */
#define	STACKFRAME	(16*4 + 4 + 6*4 + 8*4 + 4)

/* ffi_closure_v8(...)

   Receives the closure argument in %g2.   */

#ifdef HAVE_AS_REGISTER_PSEUDO_OP
	.register	%g2, #scratch
#endif

	.align 8
	.globl	C(ffi_go_closure_v8)
	.type	C(ffi_go_closure_v8),#function
	FFI_HIDDEN(C(ffi_go_closure_v8))

C(ffi_go_closure_v8):
	cfi_startproc
	save	%sp, -STACKFRAME, %sp
	cfi_def_cfa_register(%fp)
	cfi_window_save
	cfi_register(%o7, %i7)

	ld	[%g2+4], %o0			! load cif
	ld	[%g2+8], %o1			! load fun
	b	0f
	 mov	%g2, %o2			! load user_data
	cfi_endproc
	.size	C(ffi_go_closure_v8), . - C(ffi_go_closure_v8)

	.align 8
	.globl	C(ffi_closure_v8)
	.type	C(ffi_closure_v8),#function
	FFI_HIDDEN(C(ffi_closure_v8))

C(ffi_closure_v8):
	cfi_startproc
	save	%sp, -STACKFRAME, %sp
	cfi_def_cfa_register(%fp)
	cfi_window_save
	cfi_register(%o7, %i7)

	ld	[%g2+FFI_TRAMPOLINE_SIZE], %o0		! load cif
	ld	[%g2+FFI_TRAMPOLINE_SIZE+4], %o1	! load fun
	ld	[%g2+FFI_TRAMPOLINE_SIZE+8], %o2	! load user_data
0:
	! Store all of the potential argument registers in va_list format.
	st	%i0, [%fp+68+0]
	st	%i1, [%fp+68+4]
	st	%i2, [%fp+68+8]
	st	%i3, [%fp+68+12]
	st	%i4, [%fp+68+16]
	st	%i5, [%fp+68+20]

	! Call ffi_closure_sparc_inner to do the bulk of the work.
	add	%fp, -8*4, %o3
	call	ffi_closure_sparc_inner_v8
	 add	%fp,  64, %o4

0:	call	1f
	 and	%o0, SPARC_FLAG_RET_MASK, %o0
1:	sll	%o0, 4, %o0	! o0 = o0 * 16
	add	%o7, %o0, %o7	! o7 = 0b + o0*16
	jmp	%o7+(2f-0b)
	 add	%fp, -8*4, %i2
	 
	! Note that each entry is 4 insns, enforced by the E macro.
	.align	16
2:
E(SPARC_RET_VOID)
	ret
	 restore
E(SPARC_RET_STRUCT)
	ld	[%i2], %i0
	jmp	%i7+12
	 restore
E(SPARC_RET_UINT8)
	ldub	[%i2+3], %i0
	ret
	 restore
E(SPARC_RET_SINT8)
	ldsb	[%i2+3], %i0
	ret
	 restore
E(SPARC_RET_UINT16)
	lduh	[%i2+2], %i0
	ret
	 restore
E(SPARC_RET_SINT16)
	ldsh	[%i2+2], %i0
	ret
	 restore
E(SPARC_RET_UINT32)
	ld	[%i2], %i0
	ret
	 restore
E(SP_V8_RET_CPLX16)
	ld	[%i2], %i0
	ret
	 restore
E(SPARC_RET_INT64)
	ldd	[%i2], %i0
	ret
	 restore
E(SPARC_RET_INT128)
	ldd	[%i2], %i0
	ldd	[%i2+8], %i2
	ret
	 restore
E(SPARC_RET_F_8)
	ld	[%i2+7*4], %f7
	nop
	ld	[%i2+6*4], %f6
	nop
E(SPARC_RET_F_6)
	ld	[%i2+5*4], %f5
	nop
	ld	[%i2+4*4], %f4
	nop
E(SPARC_RET_F_4)
	ld	[%i2+3*4], %f3
	nop
	ld	[%i2+2*4], %f2
	nop
E(SPARC_RET_F_2)
	ldd	[%i2], %f0
	ret
	 restore
E(SP_V8_RET_CPLX8)
	lduh	[%i2], %i0
	ret
	 restore
E(SPARC_RET_F_1)
	ld	[%i2], %f0
	ret
	 restore

	cfi_endproc
	.size	C(ffi_closure_v8), . - C(ffi_closure_v8)
#endif /* !SPARC64 */
#if defined __ELF__ && defined __linux__
	.section	.note.GNU-stack,"",@progbits
#endif
