| /* ----------------------------------------------------------------------- |
| ffi64.c - Copyright (c) 2013 The Written Word, Inc. |
| Copyright (c) 2011 Anthony Green |
| Copyright (c) 2008, 2010 Red Hat, Inc. |
| Copyright (c) 2002, 2007 Bo Thorsen <bo@suse.de> |
| |
| x86-64 Foreign Function Interface |
| |
| Permission is hereby granted, free of charge, to any person obtaining |
| a copy of this software and associated documentation files (the |
| ``Software''), to deal in the Software without restriction, including |
| without limitation the rights to use, copy, modify, merge, publish, |
| distribute, sublicense, and/or sell copies of the Software, and to |
| permit persons to whom the Software is furnished to do so, subject to |
| the following conditions: |
| |
| The above copyright notice and this permission notice shall be included |
| in all copies or substantial portions of the Software. |
| |
| THE SOFTWARE IS PROVIDED ``AS IS'', WITHOUT WARRANTY OF ANY KIND, |
| EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF |
| MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND |
| NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT |
| HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, |
| WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, |
| OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER |
| DEALINGS IN THE SOFTWARE. |
| ----------------------------------------------------------------------- */ |
| |
| #include <ffi.h> |
| #include <ffi_common.h> |
| |
| #include <stdlib.h> |
| #include <stdarg.h> |
| #include <stdint.h> |
| #include "internal64.h" |
| |
| #ifdef __x86_64__ |
| |
| #define MAX_GPR_REGS 6 |
| #define MAX_SSE_REGS 8 |
| |
| #if defined(__INTEL_COMPILER) |
| #include "xmmintrin.h" |
| #define UINT128 __m128 |
| #else |
| #if defined(__SUNPRO_C) |
| #include <sunmedia_types.h> |
| #define UINT128 __m128i |
| #else |
| #define UINT128 __int128_t |
| #endif |
| #endif |
| |
| union big_int_union |
| { |
| UINT32 i32; |
| UINT64 i64; |
| UINT128 i128; |
| }; |
| |
| struct register_args |
| { |
| /* Registers for argument passing. */ |
| UINT64 gpr[MAX_GPR_REGS]; |
| union big_int_union sse[MAX_SSE_REGS]; |
| UINT64 rax; /* ssecount */ |
| UINT64 r10; /* static chain */ |
| }; |
| |
| extern void ffi_call_unix64 (void *args, unsigned long bytes, unsigned flags, |
| void *raddr, void (*fnaddr)(void)) FFI_HIDDEN; |
| |
| /* All reference to register classes here is identical to the code in |
| gcc/config/i386/i386.c. Do *not* change one without the other. */ |
| |
| /* Register class used for passing given 64bit part of the argument. |
| These represent classes as documented by the PS ABI, with the |
| exception of SSESF, SSEDF classes, that are basically SSE class, |
| just gcc will use SF or DFmode move instead of DImode to avoid |
| reformatting penalties. |
| |
| Similary we play games with INTEGERSI_CLASS to use cheaper SImode moves |
| whenever possible (upper half does contain padding). */ |
| enum x86_64_reg_class |
| { |
| X86_64_NO_CLASS, |
| X86_64_INTEGER_CLASS, |
| X86_64_INTEGERSI_CLASS, |
| X86_64_SSE_CLASS, |
| X86_64_SSESF_CLASS, |
| X86_64_SSEDF_CLASS, |
| X86_64_SSEUP_CLASS, |
| X86_64_X87_CLASS, |
| X86_64_X87UP_CLASS, |
| X86_64_COMPLEX_X87_CLASS, |
| X86_64_MEMORY_CLASS |
| }; |
| |
| #define MAX_CLASSES 4 |
| |
| #define SSE_CLASS_P(X) ((X) >= X86_64_SSE_CLASS && X <= X86_64_SSEUP_CLASS) |
| |
| /* x86-64 register passing implementation. See x86-64 ABI for details. Goal |
| of this code is to classify each 8bytes of incoming argument by the register |
| class and assign registers accordingly. */ |
| |
| /* Return the union class of CLASS1 and CLASS2. |
| See the x86-64 PS ABI for details. */ |
| |
| static enum x86_64_reg_class |
| merge_classes (enum x86_64_reg_class class1, enum x86_64_reg_class class2) |
| { |
| /* Rule #1: If both classes are equal, this is the resulting class. */ |
| if (class1 == class2) |
| return class1; |
| |
| /* Rule #2: If one of the classes is NO_CLASS, the resulting class is |
| the other class. */ |
| if (class1 == X86_64_NO_CLASS) |
| return class2; |
| if (class2 == X86_64_NO_CLASS) |
| return class1; |
| |
| /* Rule #3: If one of the classes is MEMORY, the result is MEMORY. */ |
| if (class1 == X86_64_MEMORY_CLASS || class2 == X86_64_MEMORY_CLASS) |
| return X86_64_MEMORY_CLASS; |
| |
| /* Rule #4: If one of the classes is INTEGER, the result is INTEGER. */ |
| if ((class1 == X86_64_INTEGERSI_CLASS && class2 == X86_64_SSESF_CLASS) |
| || (class2 == X86_64_INTEGERSI_CLASS && class1 == X86_64_SSESF_CLASS)) |
| return X86_64_INTEGERSI_CLASS; |
| if (class1 == X86_64_INTEGER_CLASS || class1 == X86_64_INTEGERSI_CLASS |
| || class2 == X86_64_INTEGER_CLASS || class2 == X86_64_INTEGERSI_CLASS) |
| return X86_64_INTEGER_CLASS; |
| |
| /* Rule #5: If one of the classes is X87, X87UP, or COMPLEX_X87 class, |
| MEMORY is used. */ |
| if (class1 == X86_64_X87_CLASS |
| || class1 == X86_64_X87UP_CLASS |
| || class1 == X86_64_COMPLEX_X87_CLASS |
| || class2 == X86_64_X87_CLASS |
| || class2 == X86_64_X87UP_CLASS |
| || class2 == X86_64_COMPLEX_X87_CLASS) |
| return X86_64_MEMORY_CLASS; |
| |
| /* Rule #6: Otherwise class SSE is used. */ |
| return X86_64_SSE_CLASS; |
| } |
| |
| /* Classify the argument of type TYPE and mode MODE. |
| CLASSES will be filled by the register class used to pass each word |
| of the operand. The number of words is returned. In case the parameter |
| should be passed in memory, 0 is returned. As a special case for zero |
| sized containers, classes[0] will be NO_CLASS and 1 is returned. |
| |
| See the x86-64 PS ABI for details. |
| */ |
| static size_t |
| classify_argument (ffi_type *type, enum x86_64_reg_class classes[], |
| size_t byte_offset) |
| { |
| switch (type->type) |
| { |
| case FFI_TYPE_UINT8: |
| case FFI_TYPE_SINT8: |
| case FFI_TYPE_UINT16: |
| case FFI_TYPE_SINT16: |
| case FFI_TYPE_UINT32: |
| case FFI_TYPE_SINT32: |
| case FFI_TYPE_UINT64: |
| case FFI_TYPE_SINT64: |
| case FFI_TYPE_POINTER: |
| do_integer: |
| { |
| size_t size = byte_offset + type->size; |
| |
| if (size <= 4) |
| { |
| classes[0] = X86_64_INTEGERSI_CLASS; |
| return 1; |
| } |
| else if (size <= 8) |
| { |
| classes[0] = X86_64_INTEGER_CLASS; |
| return 1; |
| } |
| else if (size <= 12) |
| { |
| classes[0] = X86_64_INTEGER_CLASS; |
| classes[1] = X86_64_INTEGERSI_CLASS; |
| return 2; |
| } |
| else if (size <= 16) |
| { |
| classes[0] = classes[1] = X86_64_INTEGER_CLASS; |
| return 2; |
| } |
| else |
| FFI_ASSERT (0); |
| } |
| case FFI_TYPE_FLOAT: |
| if (!(byte_offset % 8)) |
| classes[0] = X86_64_SSESF_CLASS; |
| else |
| classes[0] = X86_64_SSE_CLASS; |
| return 1; |
| case FFI_TYPE_DOUBLE: |
| classes[0] = X86_64_SSEDF_CLASS; |
| return 1; |
| #if FFI_TYPE_LONGDOUBLE != FFI_TYPE_DOUBLE |
| case FFI_TYPE_LONGDOUBLE: |
| classes[0] = X86_64_X87_CLASS; |
| classes[1] = X86_64_X87UP_CLASS; |
| return 2; |
| #endif |
| case FFI_TYPE_STRUCT: |
| { |
| const size_t UNITS_PER_WORD = 8; |
| size_t words = (type->size + UNITS_PER_WORD - 1) / UNITS_PER_WORD; |
| ffi_type **ptr; |
| int i; |
| enum x86_64_reg_class subclasses[MAX_CLASSES]; |
| |
| /* If the struct is larger than 32 bytes, pass it on the stack. */ |
| if (type->size > 32) |
| return 0; |
| |
| for (i = 0; i < words; i++) |
| classes[i] = X86_64_NO_CLASS; |
| |
| /* Zero sized arrays or structures are NO_CLASS. We return 0 to |
| signalize memory class, so handle it as special case. */ |
| if (!words) |
| { |
| case FFI_TYPE_VOID: |
| classes[0] = X86_64_NO_CLASS; |
| return 1; |
| } |
| |
| /* Merge the fields of structure. */ |
| for (ptr = type->elements; *ptr != NULL; ptr++) |
| { |
| size_t num; |
| |
| byte_offset = ALIGN (byte_offset, (*ptr)->alignment); |
| |
| num = classify_argument (*ptr, subclasses, byte_offset % 8); |
| if (num == 0) |
| return 0; |
| for (i = 0; i < num; i++) |
| { |
| size_t pos = byte_offset / 8; |
| classes[i + pos] = |
| merge_classes (subclasses[i], classes[i + pos]); |
| } |
| |
| byte_offset += (*ptr)->size; |
| } |
| |
| if (words > 2) |
| { |
| /* When size > 16 bytes, if the first one isn't |
| X86_64_SSE_CLASS or any other ones aren't |
| X86_64_SSEUP_CLASS, everything should be passed in |
| memory. */ |
| if (classes[0] != X86_64_SSE_CLASS) |
| return 0; |
| |
| for (i = 1; i < words; i++) |
| if (classes[i] != X86_64_SSEUP_CLASS) |
| return 0; |
| } |
| |
| /* Final merger cleanup. */ |
| for (i = 0; i < words; i++) |
| { |
| /* If one class is MEMORY, everything should be passed in |
| memory. */ |
| if (classes[i] == X86_64_MEMORY_CLASS) |
| return 0; |
| |
| /* The X86_64_SSEUP_CLASS should be always preceded by |
| X86_64_SSE_CLASS or X86_64_SSEUP_CLASS. */ |
| if (classes[i] == X86_64_SSEUP_CLASS |
| && classes[i - 1] != X86_64_SSE_CLASS |
| && classes[i - 1] != X86_64_SSEUP_CLASS) |
| { |
| /* The first one should never be X86_64_SSEUP_CLASS. */ |
| FFI_ASSERT (i != 0); |
| classes[i] = X86_64_SSE_CLASS; |
| } |
| |
| /* If X86_64_X87UP_CLASS isn't preceded by X86_64_X87_CLASS, |
| everything should be passed in memory. */ |
| if (classes[i] == X86_64_X87UP_CLASS |
| && (classes[i - 1] != X86_64_X87_CLASS)) |
| { |
| /* The first one should never be X86_64_X87UP_CLASS. */ |
| FFI_ASSERT (i != 0); |
| return 0; |
| } |
| } |
| return words; |
| } |
| case FFI_TYPE_COMPLEX: |
| { |
| ffi_type *inner = type->elements[0]; |
| switch (inner->type) |
| { |
| case FFI_TYPE_INT: |
| case FFI_TYPE_UINT8: |
| case FFI_TYPE_SINT8: |
| case FFI_TYPE_UINT16: |
| case FFI_TYPE_SINT16: |
| case FFI_TYPE_UINT32: |
| case FFI_TYPE_SINT32: |
| case FFI_TYPE_UINT64: |
| case FFI_TYPE_SINT64: |
| goto do_integer; |
| |
| case FFI_TYPE_FLOAT: |
| classes[0] = X86_64_SSE_CLASS; |
| if (byte_offset % 8) |
| { |
| classes[1] = X86_64_SSESF_CLASS; |
| return 2; |
| } |
| return 1; |
| case FFI_TYPE_DOUBLE: |
| classes[0] = classes[1] = X86_64_SSEDF_CLASS; |
| return 2; |
| #if FFI_TYPE_LONGDOUBLE != FFI_TYPE_DOUBLE |
| case FFI_TYPE_LONGDOUBLE: |
| classes[0] = X86_64_COMPLEX_X87_CLASS; |
| return 1; |
| #endif |
| } |
| } |
| } |
| abort(); |
| } |
| |
| /* Examine the argument and return set number of register required in each |
| class. Return zero iff parameter should be passed in memory, otherwise |
| the number of registers. */ |
| |
| static size_t |
| examine_argument (ffi_type *type, enum x86_64_reg_class classes[MAX_CLASSES], |
| _Bool in_return, int *pngpr, int *pnsse) |
| { |
| size_t n; |
| int i, ngpr, nsse; |
| |
| n = classify_argument (type, classes, 0); |
| if (n == 0) |
| return 0; |
| |
| ngpr = nsse = 0; |
| for (i = 0; i < n; ++i) |
| switch (classes[i]) |
| { |
| case X86_64_INTEGER_CLASS: |
| case X86_64_INTEGERSI_CLASS: |
| ngpr++; |
| break; |
| case X86_64_SSE_CLASS: |
| case X86_64_SSESF_CLASS: |
| case X86_64_SSEDF_CLASS: |
| nsse++; |
| break; |
| case X86_64_NO_CLASS: |
| case X86_64_SSEUP_CLASS: |
| break; |
| case X86_64_X87_CLASS: |
| case X86_64_X87UP_CLASS: |
| case X86_64_COMPLEX_X87_CLASS: |
| return in_return != 0; |
| default: |
| abort (); |
| } |
| |
| *pngpr = ngpr; |
| *pnsse = nsse; |
| |
| return n; |
| } |
| |
| /* Perform machine dependent cif processing. */ |
| |
| ffi_status |
| ffi_prep_cif_machdep (ffi_cif *cif) |
| { |
| int gprcount, ssecount, i, avn, ngpr, nsse, flags; |
| enum x86_64_reg_class classes[MAX_CLASSES]; |
| size_t bytes, n, rtype_size; |
| ffi_type *rtype; |
| |
| if (cif->abi != FFI_UNIX64) |
| return FFI_BAD_ABI; |
| |
| gprcount = ssecount = 0; |
| |
| rtype = cif->rtype; |
| rtype_size = rtype->size; |
| switch (rtype->type) |
| { |
| case FFI_TYPE_VOID: |
| flags = UNIX64_RET_VOID; |
| break; |
| case FFI_TYPE_UINT8: |
| flags = UNIX64_RET_UINT8; |
| break; |
| case FFI_TYPE_SINT8: |
| flags = UNIX64_RET_SINT8; |
| break; |
| case FFI_TYPE_UINT16: |
| flags = UNIX64_RET_UINT16; |
| break; |
| case FFI_TYPE_SINT16: |
| flags = UNIX64_RET_SINT16; |
| break; |
| case FFI_TYPE_UINT32: |
| flags = UNIX64_RET_UINT32; |
| break; |
| case FFI_TYPE_INT: |
| case FFI_TYPE_SINT32: |
| flags = UNIX64_RET_SINT32; |
| break; |
| case FFI_TYPE_UINT64: |
| case FFI_TYPE_SINT64: |
| flags = UNIX64_RET_INT64; |
| break; |
| case FFI_TYPE_POINTER: |
| flags = (sizeof(void *) == 4 ? UNIX64_RET_UINT32 : UNIX64_RET_INT64); |
| break; |
| case FFI_TYPE_FLOAT: |
| flags = UNIX64_RET_XMM32; |
| break; |
| case FFI_TYPE_DOUBLE: |
| flags = UNIX64_RET_XMM64; |
| break; |
| case FFI_TYPE_LONGDOUBLE: |
| flags = UNIX64_RET_X87; |
| break; |
| case FFI_TYPE_STRUCT: |
| n = examine_argument (cif->rtype, classes, 1, &ngpr, &nsse); |
| if (n == 0) |
| { |
| /* The return value is passed in memory. A pointer to that |
| memory is the first argument. Allocate a register for it. */ |
| gprcount++; |
| /* We don't have to do anything in asm for the return. */ |
| flags = UNIX64_RET_VOID | UNIX64_FLAG_RET_IN_MEM; |
| } |
| else |
| { |
| _Bool sse0 = SSE_CLASS_P (classes[0]); |
| |
| if (rtype_size == 4 && sse0) |
| flags = UNIX64_RET_XMM32; |
| else if (rtype_size == 8) |
| flags = sse0 ? UNIX64_RET_XMM64 : UNIX64_RET_INT64; |
| else |
| { |
| _Bool sse1 = n == 2 && SSE_CLASS_P (classes[1]); |
| if (sse0 && sse1) |
| flags = UNIX64_RET_ST_XMM0_XMM1; |
| else if (sse0) |
| flags = UNIX64_RET_ST_XMM0_RAX; |
| else if (sse1) |
| flags = UNIX64_RET_ST_RAX_XMM0; |
| else |
| flags = UNIX64_RET_ST_RAX_RDX; |
| flags |= rtype_size << UNIX64_SIZE_SHIFT; |
| } |
| } |
| break; |
| case FFI_TYPE_COMPLEX: |
| switch (rtype->elements[0]->type) |
| { |
| case FFI_TYPE_UINT8: |
| case FFI_TYPE_SINT8: |
| case FFI_TYPE_UINT16: |
| case FFI_TYPE_SINT16: |
| case FFI_TYPE_INT: |
| case FFI_TYPE_UINT32: |
| case FFI_TYPE_SINT32: |
| case FFI_TYPE_UINT64: |
| case FFI_TYPE_SINT64: |
| flags = UNIX64_RET_ST_RAX_RDX | (rtype_size << UNIX64_SIZE_SHIFT); |
| break; |
| case FFI_TYPE_FLOAT: |
| flags = UNIX64_RET_XMM64; |
| break; |
| case FFI_TYPE_DOUBLE: |
| flags = UNIX64_RET_ST_XMM0_XMM1 | (16 << UNIX64_SIZE_SHIFT); |
| break; |
| #if FFI_TYPE_LONGDOUBLE != FFI_TYPE_DOUBLE |
| case FFI_TYPE_LONGDOUBLE: |
| flags = UNIX64_RET_X87_2; |
| break; |
| #endif |
| default: |
| return FFI_BAD_TYPEDEF; |
| } |
| break; |
| default: |
| return FFI_BAD_TYPEDEF; |
| } |
| |
| /* Go over all arguments and determine the way they should be passed. |
| If it's in a register and there is space for it, let that be so. If |
| not, add it's size to the stack byte count. */ |
| for (bytes = 0, i = 0, avn = cif->nargs; i < avn; i++) |
| { |
| if (examine_argument (cif->arg_types[i], classes, 0, &ngpr, &nsse) == 0 |
| || gprcount + ngpr > MAX_GPR_REGS |
| || ssecount + nsse > MAX_SSE_REGS) |
| { |
| long align = cif->arg_types[i]->alignment; |
| |
| if (align < 8) |
| align = 8; |
| |
| bytes = ALIGN (bytes, align); |
| bytes += cif->arg_types[i]->size; |
| } |
| else |
| { |
| gprcount += ngpr; |
| ssecount += nsse; |
| } |
| } |
| if (ssecount) |
| flags |= UNIX64_FLAG_XMM_ARGS; |
| |
| cif->flags = flags; |
| cif->bytes = ALIGN (bytes, 8); |
| |
| return FFI_OK; |
| } |
| |
| static void |
| ffi_call_int (ffi_cif *cif, void (*fn)(void), void *rvalue, |
| void **avalue, void *closure) |
| { |
| enum x86_64_reg_class classes[MAX_CLASSES]; |
| char *stack, *argp; |
| ffi_type **arg_types; |
| int gprcount, ssecount, ngpr, nsse, i, avn, flags; |
| struct register_args *reg_args; |
| |
| /* Can't call 32-bit mode from 64-bit mode. */ |
| FFI_ASSERT (cif->abi == FFI_UNIX64); |
| |
| /* If the return value is a struct and we don't have a return value |
| address then we need to make one. Otherwise we can ignore it. */ |
| flags = cif->flags; |
| if (rvalue == NULL) |
| { |
| if (flags & UNIX64_FLAG_RET_IN_MEM) |
| rvalue = alloca (cif->rtype->size); |
| else |
| flags = UNIX64_RET_VOID; |
| } |
| |
| /* Allocate the space for the arguments, plus 4 words of temp space. */ |
| stack = alloca (sizeof (struct register_args) + cif->bytes + 4*8); |
| reg_args = (struct register_args *) stack; |
| argp = stack + sizeof (struct register_args); |
| |
| reg_args->r10 = (uintptr_t) closure; |
| |
| gprcount = ssecount = 0; |
| |
| /* If the return value is passed in memory, add the pointer as the |
| first integer argument. */ |
| if (flags & UNIX64_FLAG_RET_IN_MEM) |
| reg_args->gpr[gprcount++] = (unsigned long) rvalue; |
| |
| avn = cif->nargs; |
| arg_types = cif->arg_types; |
| |
| for (i = 0; i < avn; ++i) |
| { |
| size_t n, size = arg_types[i]->size; |
| |
| n = examine_argument (arg_types[i], classes, 0, &ngpr, &nsse); |
| if (n == 0 |
| || gprcount + ngpr > MAX_GPR_REGS |
| || ssecount + nsse > MAX_SSE_REGS) |
| { |
| long align = arg_types[i]->alignment; |
| |
| /* Stack arguments are *always* at least 8 byte aligned. */ |
| if (align < 8) |
| align = 8; |
| |
| /* Pass this argument in memory. */ |
| argp = (void *) ALIGN (argp, align); |
| memcpy (argp, avalue[i], size); |
| argp += size; |
| } |
| else |
| { |
| /* The argument is passed entirely in registers. */ |
| char *a = (char *) avalue[i]; |
| int j; |
| |
| for (j = 0; j < n; j++, a += 8, size -= 8) |
| { |
| switch (classes[j]) |
| { |
| case X86_64_NO_CLASS: |
| case X86_64_SSEUP_CLASS: |
| break; |
| case X86_64_INTEGER_CLASS: |
| case X86_64_INTEGERSI_CLASS: |
| /* Sign-extend integer arguments passed in general |
| purpose registers, to cope with the fact that |
| LLVM incorrectly assumes that this will be done |
| (the x86-64 PS ABI does not specify this). */ |
| switch (arg_types[i]->type) |
| { |
| case FFI_TYPE_SINT8: |
| reg_args->gpr[gprcount] = (SINT64) *((SINT8 *) a); |
| break; |
| case FFI_TYPE_SINT16: |
| reg_args->gpr[gprcount] = (SINT64) *((SINT16 *) a); |
| break; |
| case FFI_TYPE_SINT32: |
| reg_args->gpr[gprcount] = (SINT64) *((SINT32 *) a); |
| break; |
| default: |
| reg_args->gpr[gprcount] = 0; |
| memcpy (®_args->gpr[gprcount], a, size); |
| } |
| gprcount++; |
| break; |
| case X86_64_SSE_CLASS: |
| case X86_64_SSEDF_CLASS: |
| reg_args->sse[ssecount++].i64 = *(UINT64 *) a; |
| break; |
| case X86_64_SSESF_CLASS: |
| reg_args->sse[ssecount++].i32 = *(UINT32 *) a; |
| break; |
| default: |
| abort(); |
| } |
| } |
| } |
| } |
| reg_args->rax = ssecount; |
| |
| ffi_call_unix64 (stack, cif->bytes + sizeof (struct register_args), |
| flags, rvalue, fn); |
| } |
| |
| void |
| ffi_call (ffi_cif *cif, void (*fn)(void), void *rvalue, void **avalue) |
| { |
| ffi_call_int (cif, fn, rvalue, avalue, NULL); |
| } |
| |
| void |
| ffi_call_go (ffi_cif *cif, void (*fn)(void), void *rvalue, |
| void **avalue, void *closure) |
| { |
| ffi_call_int (cif, fn, rvalue, avalue, closure); |
| } |
| |
| extern void ffi_closure_unix64(void) FFI_HIDDEN; |
| extern void ffi_closure_unix64_sse(void) FFI_HIDDEN; |
| |
| ffi_status |
| ffi_prep_closure_loc (ffi_closure* closure, |
| ffi_cif* cif, |
| void (*fun)(ffi_cif*, void*, void**, void*), |
| void *user_data, |
| void *codeloc) |
| { |
| static const unsigned char trampoline[16] = { |
| /* leaq -0x7(%rip),%r10 # 0x0 */ |
| 0x4c, 0x8d, 0x15, 0xf9, 0xff, 0xff, 0xff, |
| /* jmpq *0x3(%rip) # 0x10 */ |
| 0xff, 0x25, 0x03, 0x00, 0x00, 0x00, |
| /* nopl (%rax) */ |
| 0x0f, 0x1f, 0x00 |
| }; |
| void (*dest)(void); |
| char *tramp = closure->tramp; |
| |
| if (cif->abi != FFI_UNIX64) |
| return FFI_BAD_ABI; |
| |
| if (cif->flags & UNIX64_FLAG_XMM_ARGS) |
| dest = ffi_closure_unix64_sse; |
| else |
| dest = ffi_closure_unix64; |
| |
| memcpy (tramp, trampoline, sizeof(trampoline)); |
| *(UINT64 *)(tramp + 16) = (uintptr_t)dest; |
| |
| closure->cif = cif; |
| closure->fun = fun; |
| closure->user_data = user_data; |
| |
| return FFI_OK; |
| } |
| |
| int FFI_HIDDEN |
| ffi_closure_unix64_inner(ffi_cif *cif, |
| void (*fun)(ffi_cif*, void*, void**, void*), |
| void *user_data, |
| void *rvalue, |
| struct register_args *reg_args, |
| char *argp) |
| { |
| void **avalue; |
| ffi_type **arg_types; |
| long i, avn; |
| int gprcount, ssecount, ngpr, nsse; |
| int flags; |
| |
| avn = cif->nargs; |
| flags = cif->flags; |
| avalue = alloca(avn * sizeof(void *)); |
| gprcount = ssecount = 0; |
| |
| if (flags & UNIX64_FLAG_RET_IN_MEM) |
| { |
| /* On return, %rax will contain the address that was passed |
| by the caller in %rdi. */ |
| void *r = (void *)(uintptr_t)reg_args->gpr[gprcount++]; |
| *(void **)rvalue = r; |
| rvalue = r; |
| flags = (sizeof(void *) == 4 ? UNIX64_RET_UINT32 : UNIX64_RET_INT64); |
| } |
| |
| arg_types = cif->arg_types; |
| for (i = 0; i < avn; ++i) |
| { |
| enum x86_64_reg_class classes[MAX_CLASSES]; |
| size_t n; |
| |
| n = examine_argument (arg_types[i], classes, 0, &ngpr, &nsse); |
| if (n == 0 |
| || gprcount + ngpr > MAX_GPR_REGS |
| || ssecount + nsse > MAX_SSE_REGS) |
| { |
| long align = arg_types[i]->alignment; |
| |
| /* Stack arguments are *always* at least 8 byte aligned. */ |
| if (align < 8) |
| align = 8; |
| |
| /* Pass this argument in memory. */ |
| argp = (void *) ALIGN (argp, align); |
| avalue[i] = argp; |
| argp += arg_types[i]->size; |
| } |
| /* If the argument is in a single register, or two consecutive |
| integer registers, then we can use that address directly. */ |
| else if (n == 1 |
| || (n == 2 && !(SSE_CLASS_P (classes[0]) |
| || SSE_CLASS_P (classes[1])))) |
| { |
| /* The argument is in a single register. */ |
| if (SSE_CLASS_P (classes[0])) |
| { |
| avalue[i] = ®_args->sse[ssecount]; |
| ssecount += n; |
| } |
| else |
| { |
| avalue[i] = ®_args->gpr[gprcount]; |
| gprcount += n; |
| } |
| } |
| /* Otherwise, allocate space to make them consecutive. */ |
| else |
| { |
| char *a = alloca (16); |
| int j; |
| |
| avalue[i] = a; |
| for (j = 0; j < n; j++, a += 8) |
| { |
| if (SSE_CLASS_P (classes[j])) |
| memcpy (a, ®_args->sse[ssecount++], 8); |
| else |
| memcpy (a, ®_args->gpr[gprcount++], 8); |
| } |
| } |
| } |
| |
| /* Invoke the closure. */ |
| fun (cif, rvalue, avalue, user_data); |
| |
| /* Tell assembly how to perform return type promotions. */ |
| return flags; |
| } |
| |
| extern void ffi_go_closure_unix64(void) FFI_HIDDEN; |
| extern void ffi_go_closure_unix64_sse(void) FFI_HIDDEN; |
| |
| ffi_status |
| ffi_prep_go_closure (ffi_go_closure* closure, ffi_cif* cif, |
| void (*fun)(ffi_cif*, void*, void**, void*)) |
| { |
| if (cif->abi != FFI_UNIX64) |
| return FFI_BAD_ABI; |
| |
| closure->tramp = (cif->flags & UNIX64_FLAG_XMM_ARGS |
| ? ffi_go_closure_unix64_sse |
| : ffi_go_closure_unix64); |
| closure->cif = cif; |
| closure->fun = fun; |
| |
| return FFI_OK; |
| } |
| |
| #endif /* __x86_64__ */ |