/* libffi support for Altera Nios II.
Copyright (c) 2013 Mentor Graphics.
Permission is hereby granted, free of charge, to any person obtaining
a copy of this software and associated documentation files (the
``Software''), to deal in the Software without restriction, including
without limitation the rights to use, copy, modify, merge, publish,
distribute, sublicense, and/or sell copies of the Software, and to
permit persons to whom the Software is furnished to do so, subject to
the following conditions:
The above copyright notice and this permission notice shall be
included in all copies or substantial portions of the Software.
THE SOFTWARE IS PROVIDED ``AS IS'', WITHOUT WARRANTY OF ANY KIND,
EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. */
#include <ffi.h>
#include <ffi_common.h>
#include <stdlib.h>
/* The Nios II Processor Reference Handbook defines the procedure call
ABI as follows.
Arguments are passed as if a structure containing the types of
the arguments were constructed. The first 16 bytes are passed in r4
through r7, the remainder on the stack. The first 16 bytes of a function
taking variable arguments are passed in r4-r7 in the same way.
Return values of types up to 8 bytes are returned in r2 and r3. For
return values greater than 8 bytes, the caller must allocate memory for
the result and pass the address as if it were argument 0.
While this isn't specified explicitly in the ABI documentation, GCC
promotes integral arguments smaller than int size to 32 bits.
Also of note, the ABI specifies that all structure objects are
aligned to 32 bits even if all their fields have a smaller natural
alignment. See FFI_AGGREGATE_ALIGNMENT. */
/* Entry points implemented in assembly language.

   ffi_call_sysv receives the argument-marshalling callback, the
   extended cif describing the call, the size in bytes of the parameter
   block and the function to call; ffi_call treats its 64-bit return
   value as the contents of r2 and r3 after the call.

   ffi_closure_sysv is the routine that closure trampolines jump to.  */
extern UINT64 ffi_call_sysv (void (*prep_args) (char *, extended_cif *),
                             extended_cif *ecif,
                             unsigned int bytes,
                             void (*fn) (void));

extern void ffi_closure_sysv (void);
/* Machine-dependent part of cif preparation: normalise the size of the
   parameter block recorded in CIF.  Always returns FFI_OK.  */
ffi_status ffi_prep_cif_machdep (ffi_cif *cif)
{
  /* The low-level call function is simpler when the parameter block
     never holds fewer than 16 bytes, so small blocks are bumped up to
     that size.  Anything larger is rounded up to a multiple of 4 bytes
     so that the stack pointer keeps its 32-bit alignment.  */
  cif->bytes = (cif->bytes < 16) ? 16 : ((cif->bytes + 3) & ~3);

  return FFI_OK;
}
/* ffi_prep_args is called by the assembly routine to transfer arguments
   to the stack using the pointers in the ecif array.

   STACK is the start of the parameter block to fill in.
   ECIF  supplies the cif (argument count and types, return type), the
         array of pointers to the argument values, and the return-value
         buffer.

   Note that the stack buffer is big enough to fit all the arguments,
   but the first 16 bytes will be copied to registers for the actual
   call.  */
void ffi_prep_args (char *stack, extended_cif *ecif)
{
  char *argp = stack;
  unsigned int i;

  /* The implicit return value pointer is passed as if it were a hidden
     first argument.  */
  if (ecif->cif->rtype->type == FFI_TYPE_STRUCT
      && ecif->cif->rtype->size > 8)
    {
      (*(void **) argp) = ecif->rvalue;
      argp += 4;
    }

  for (i = 0; i < ecif->cif->nargs; i++)
    {
      void *avalue = ecif->avalue[i];
      ffi_type *atype = ecif->cif->arg_types[i];
      size_t size = atype->size;
      size_t alignment = atype->alignment;

      /* Align argp as appropriate for the argument type.  */
      if ((alignment - 1) & (unsigned) argp)
        argp = (char *) ALIGN (argp, alignment);

      /* Copy the argument, promoting integral types smaller than a
         word to word size.  */
      if (size < sizeof (int))
        {
          /* The slot occupies a full word even though the value is
             narrower.  */
          size = sizeof (int);
          switch (atype->type)
            {
            case FFI_TYPE_SINT8:
              *(signed int *) argp = (signed int) *(SINT8 *) avalue;
              break;

            case FFI_TYPE_UINT8:
              *(unsigned int *) argp = (unsigned int) *(UINT8 *) avalue;
              break;

            case FFI_TYPE_SINT16:
              *(signed int *) argp = (signed int) *(SINT16 *) avalue;
              break;

            case FFI_TYPE_UINT16:
              *(unsigned int *) argp = (unsigned int) *(UINT16 *) avalue;
              break;

            case FFI_TYPE_STRUCT:
              /* Small structs are copied as-is; only their own bytes
                 are written into the word-sized slot.  */
              memcpy (argp, avalue, atype->size);
              break;

            default:
              FFI_ASSERT(0);
            }
        }
      else
        {
          /* Word-sized and larger values are copied bytewise.  A
             word-sized argument is not necessarily an integer (it may
             be a float, a pointer or a small struct), so reading it
             through a UINT32 lvalue would break the effective-type
             rules and would assume the caller's storage is
             word-aligned; memcpy produces the same bytes without
             either assumption.  */
          memcpy (argp, avalue, size);
        }

      argp += size;
    }
}
/* Invoke FN as described by the prepared CIF.  AVALUE is the array of
   pointers to the argument values.  RVALUE, when non-null, is the
   caller's buffer for the return value.  */
void ffi_call (ffi_cif *cif, void (*fn) (void), void *rvalue, void **avalue)
{
  /* Struct results wider than 8 bytes are not returned in registers;
     they are passed by reference as an implicit argument.  */
  const int by_reference = (cif->rtype->type == FFI_TYPE_STRUCT
                            && cif->rtype->size > 8);
  extended_cif call;
  UINT64 regs;

  call.cif = cif;
  call.avalue = avalue;
  call.rvalue = rvalue;

  /* In the by-reference case a buffer is needed even when the caller
     did not provide one, so allocate a temporary one.  */
  if (by_reference && rvalue == NULL)
    call.rvalue = alloca (cif->rtype->size);

  regs = ffi_call_sysv (ffi_prep_args, &call, cif->bytes, fn);

  /* Nothing is copied back when the caller gave no buffer, or when the
     result was passed by reference instead of in registers.  */
  if (rvalue == NULL || by_reference)
    return;

  /* REGS holds the 64 bits that FN returned in r2 and r3.  Store as
     much of it as the return type calls for.  */
  switch (cif->rtype->size)
    {
    case 1:
      *(UINT8 *) rvalue = (UINT8) regs;
      break;

    case 2:
      *(UINT16 *) rvalue = (UINT16) regs;
      break;

    case 4:
      *(UINT32 *) rvalue = (UINT32) regs;
      break;

    case 8:
      *(UINT64 *) rvalue = (UINT64) regs;
      break;

    default:
      /* Any other size is copied bytewise.  */
      memcpy (rvalue, (void *) &regs, cif->rtype->size);
      break;
    }
}
/* This function is invoked from the closure trampoline to invoke
   CLOSURE with argument block ARGS.  Parse ARGS according to
   CLOSURE->cif and invoke CLOSURE->fun.

   ARGS     points at the argument block.
   CLOSURE  supplies the cif, the user function and its user data.

   Returns the 64-bit value that the user function stored through the
   return pointer, or 0 if it stored nothing there (for instance when
   the result went to the caller's hidden return buffer instead).  */
static UINT64
ffi_closure_helper (unsigned char *args,
                    ffi_closure *closure)
{
  ffi_cif *cif = closure->cif;
  unsigned char *argp = args;
  void **parsed_args = alloca (cif->nargs * sizeof (void *));
  /* Start from zero so the value returned below is never indeterminate,
     even when the user function writes fewer than 8 bytes or writes to
     the hidden return buffer rather than to RESULT.  */
  UINT64 result = 0;
  void *retptr;
  unsigned int i;

  /* First figure out what to do about the return type.  If this is the
     big-structure-return case, the first arg is the hidden return buffer
     allocated by the caller.  */
  if (cif->rtype->type == FFI_TYPE_STRUCT
      && cif->rtype->size > 8)
    {
      retptr = *((void **) argp);
      argp += 4;
    }
  else
    retptr = (void *) &result;

  /* Fill in the array of argument pointers.  */
  for (i = 0; i < cif->nargs; i++)
    {
      size_t size = cif->arg_types[i]->size;
      size_t alignment = cif->arg_types[i]->alignment;

      /* Align argp as appropriate for the argument type.  The cast
         matches argp's own type, avoiding a pointer-signedness
         mismatch.  */
      if ((alignment - 1) & (unsigned) argp)
        argp = (unsigned char *) ALIGN (argp, alignment);

      /* Arguments smaller than an int are promoted to int.  */
      if (size < sizeof (int))
        size = sizeof (int);

      /* Store the pointer.  */
      parsed_args[i] = argp;
      argp += size;
    }

  /* Call the user-supplied function.  */
  (closure->fun) (cif, retptr, parsed_args, closure->user_data);
  return result;
}
/* Initialize CLOSURE with a trampoline to call FUN with
CIF and USER_DATA.
Returns FFI_BAD_ABI, leaving CLOSURE untouched, if CIF does not use the
FFI_SYSV ABI; otherwise writes the seven-word trampoline into
CLOSURE->tramp, flushes the caches for it, records CIF, FUN and
USER_DATA in CLOSURE and returns FFI_OK.
CODELOC is accepted as part of the interface but is not referenced
by this function. */
ffi_status
ffi_prep_closure_loc (ffi_closure* closure,
ffi_cif* cif,
void (*fun) (ffi_cif*, void*, void**, void*),
void *user_data,
void *codeloc)
{
/* The trampoline storage is written as 32-bit words. */
unsigned int *tramp = (unsigned int *) &closure->tramp[0];
int i;
if (cif->abi != FFI_SYSV)
return FFI_BAD_ABI;
/* The trampoline looks like:
movhi r8, %hi(ffi_closure_sysv)
ori r8, r8, %lo(ffi_closure_sysv)
movhi r9, %hi(ffi_closure_helper)
ori r9, r9, %lo(ffi_closure_helper)
movhi r10, %hi(closure)
ori r10, r10, %lo(closure)
jmp r8
and then ffi_closure_sysv retrieves the closure pointer out of r10
in addition to the arguments passed in the normal way for the call,
and invokes ffi_closure_helper. We encode the pointer to
ffi_closure_helper in the trampoline because making a PIC call
to it in ffi_closure_sysv would be messy (it would have to indirect
through the GOT). */
/* HI and LO extract the upper and lower 16 bits of an address after
converting it to unsigned int. */
#define HI(x) ((((unsigned int) (x)) >> 16) & 0xffff)
#define LO(x) (((unsigned int) (x)) & 0xffff)
/* One word per instruction, in the order listed above.
NOTE(review): the shifts look like a layout with register fields at
bits 27 and 22, a 16-bit immediate at bit 6 and the opcode in the low
6 bits -- confirm against the Nios II instruction set reference. */
tramp[0] = (0 << 27) | (8 << 22) | (HI (ffi_closure_sysv) << 6) | 0x34;
tramp[1] = (8 << 27) | (8 << 22) | (LO (ffi_closure_sysv) << 6) | 0x14;
tramp[2] = (0 << 27) | (9 << 22) | (HI (ffi_closure_helper) << 6) | 0x34;
tramp[3] = (9 << 27) | (9 << 22) | (LO (ffi_closure_helper) << 6) | 0x14;
tramp[4] = (0 << 27) | (10 << 22) | (HI (closure) << 6) | 0x34;
tramp[5] = (10 << 27) | (10 << 22) | (LO (closure) << 6) | 0x14;
tramp[6] = (8 << 27) | (0x0d << 11) | 0x3a;
#undef HI
#undef LO
/* Flush the caches.
See Example 9-4 in the Nios II Software Developer's Handbook.
Each of the seven trampoline words gets a flushd and a flushi on its
address, followed by a single flushp. */
for (i = 0; i < 7; i++)
asm volatile ("flushd 0(%0); flushi %0" :: "r"(tramp + i) : "memory");
asm volatile ("flushp" ::: "memory");
/* Record what ffi_closure_helper reads back from the closure when the
trampoline is entered. */
closure->cif = cif;
closure->fun = fun;
closure->user_data = user_data;
return FFI_OK;
}