1186 lines
43 KiB
C
1186 lines
43 KiB
C
/*
|
|
* Relay calls helper routines
|
|
*
|
|
* Copyright 1993 Robert J. Amstadt
|
|
* Copyright 1995 Martin von Loewis
|
|
* Copyright 1995, 1996, 1997 Alexandre Julliard
|
|
* Copyright 1997 Eric Youngdale
|
|
* Copyright 1999 Ulrich Weigand
|
|
*
|
|
* This library is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* This library is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with this library; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
|
|
*/
|
|
|
|
#include "config.h"
|
|
#include "wine/port.h"
|
|
|
|
#include <ctype.h>
|
|
#include <stdarg.h>
|
|
|
|
#define __WINESRC__ /* FIXME: for WINE_VM86_TEB_INFO */
|
|
#include "winternl.h"
|
|
#include "wine/winbase16.h"
|
|
|
|
#include "build.h"
|
|
|
|
/* offset of a structure field relative to the start of the struct */
|
|
#define STRUCTOFFSET(type,field) ((int)FIELD_OFFSET(type,field))
|
|
|
|
/* offset of register relative to the start of the CONTEXT struct */
|
|
#define CONTEXTOFFSET(reg) STRUCTOFFSET(CONTEXT86,reg)
|
|
|
|
/* offset of register relative to the start of the STACK16FRAME struct */
|
|
#define STACK16OFFSET(reg) STRUCTOFFSET(STACK16FRAME,reg)
|
|
|
|
/* offset of register relative to the start of the STACK32FRAME struct */
|
|
#define STACK32OFFSET(reg) STRUCTOFFSET(STACK32FRAME,reg)
|
|
|
|
/* offset of the stack pointer relative to %fs:(0) */
|
|
#define STACKOFFSET 0xc0 /* STRUCTOFFSET(TEB,WOW32Reserved) */
|
|
|
|
/* fix this if the ntdll_thread_regs structure is changed */
|
|
#define GS_OFFSET 0x1d8 /* STRUCTOFFSET(TEB,SystemReserved2) + STRUCTOFFSET(ntdll_thread_data,gs) */
|
|
|
|
static void function_header( const char *name )
|
|
{
|
|
output( "\n\t.align %d\n", get_alignment(4) );
|
|
output( "\t%s\n", func_declaration(name) );
|
|
output( "%s\n", asm_globl(name) );
|
|
}
|
|
|
|
|
|
/*******************************************************************
|
|
* BuildCallFrom16Core
|
|
*
|
|
* This routine builds the core routines used in 16->32 thunks:
|
|
* CallFrom16Word, CallFrom16Long, CallFrom16Register, and CallFrom16Thunk.
|
|
*
|
|
* These routines are intended to be called via a far call (with 32-bit
|
|
* operand size) from 16-bit code. The 16-bit code stub must push %bp,
|
|
* the 32-bit entry point to be called, and the argument conversion
|
|
* routine to be used (see stack layout below).
|
|
*
|
|
* The core routine completes the STACK16FRAME on the 16-bit stack and
|
|
* switches to the 32-bit stack. Then, the argument conversion routine
|
|
* is called; it gets passed the 32-bit entry point and a pointer to the
|
|
* 16-bit arguments (on the 16-bit stack) as parameters. (You can either
|
|
* use conversion routines automatically generated by BuildCallFrom16,
|
|
* or write your own for special purposes.)
|
|
*
|
|
* The conversion routine must call the 32-bit entry point, passing it
|
|
* the converted arguments, and return its return value to the core.
|
|
* After the conversion routine has returned, the core switches back
|
|
* to the 16-bit stack, converts the return value to the DX:AX format
|
|
* (CallFrom16Long), and returns to the 16-bit call stub. All parameters,
|
|
* including %bp, are popped off the stack.
|
|
*
|
|
* The 16-bit call stub now returns to the caller, popping the 16-bit
|
|
* arguments if necessary (pascal calling convention).
|
|
*
|
|
* In the case of a 'register' function, CallFrom16Register fills a
|
|
* CONTEXT86 structure with the values all registers had at the point
|
|
* the first instruction of the 16-bit call stub was about to be
|
|
* executed. A pointer to this CONTEXT86 is passed as third parameter
|
|
* to the argument conversion routine, which typically passes it on
|
|
* to the called 32-bit entry point.
|
|
*
|
|
* CallFrom16Thunk is a special variant used by the implementation of
|
|
* the Win95 16->32 thunk functions C16ThkSL and C16ThkSL01 and is
|
|
* implemented as follows:
|
|
* On entry, the EBX register is set up to contain a flat pointer to the
|
|
* 16-bit stack such that EBX+22 points to the first argument.
|
|
* Then, the entry point is called, while EBP is set up to point
|
|
* to the return address (on the 32-bit stack).
|
|
* The called function returns with CX set to the number of bytes
|
|
* to be popped of the caller's stack.
|
|
*
|
|
* Stack layout upon entry to the core routine (STACK16FRAME):
|
|
* ... ...
|
|
* (sp+24) word first 16-bit arg
|
|
* (sp+22) word cs
|
|
* (sp+20) word ip
|
|
* (sp+18) word bp
|
|
* (sp+14) long 32-bit entry point (reused for Win16 mutex recursion count)
|
|
* (sp+12) word ip of actual entry point (necessary for relay debugging)
|
|
* (sp+8) long relay (argument conversion) function entry point
|
|
* (sp+4) long cs of 16-bit entry point
|
|
* (sp) long ip of 16-bit entry point
|
|
*
|
|
* Added on the stack:
|
|
* (sp-2) word saved gs
|
|
* (sp-4) word saved fs
|
|
* (sp-6) word saved es
|
|
* (sp-8) word saved ds
|
|
* (sp-12) long saved ebp
|
|
* (sp-16) long saved ecx
|
|
* (sp-20) long saved edx
|
|
* (sp-24) long saved previous stack
|
|
*/
|
|
static void BuildCallFrom16Core( int reg_func, int thunk )
|
|
{
|
|
/* Function header */
|
|
if (thunk) function_header( "__wine_call_from_16_thunk" );
|
|
else if (reg_func) function_header( "__wine_call_from_16_regs" );
|
|
else function_header( "__wine_call_from_16" );
|
|
|
|
/* Create STACK16FRAME (except STACK32FRAME link) */
|
|
output( "\tpushw %%gs\n" );
|
|
output( "\tpushw %%fs\n" );
|
|
output( "\tpushw %%es\n" );
|
|
output( "\tpushw %%ds\n" );
|
|
output( "\tpushl %%ebp\n" );
|
|
output( "\tpushl %%ecx\n" );
|
|
output( "\tpushl %%edx\n" );
|
|
|
|
/* Save original EFlags register */
|
|
if (reg_func) output( "\tpushfl\n" );
|
|
|
|
if ( UsePIC )
|
|
{
|
|
output( "\tcall 1f\n" );
|
|
output( "1:\tpopl %%ecx\n" );
|
|
output( "\t.byte 0x2e\n\tmovl %s-1b(%%ecx),%%edx\n", asm_name("CallTo16_DataSelector") );
|
|
}
|
|
else
|
|
output( "\t.byte 0x2e\n\tmovl %s,%%edx\n", asm_name("CallTo16_DataSelector") );
|
|
|
|
/* Load 32-bit segment registers */
|
|
output( "\tmovw %%dx, %%ds\n" );
|
|
output( "\tmovw %%dx, %%es\n" );
|
|
|
|
if ( UsePIC )
|
|
output( "\tmovw %s-1b(%%ecx), %%fs\n", asm_name("CallTo16_TebSelector") );
|
|
else
|
|
output( "\tmovw %s, %%fs\n", asm_name("CallTo16_TebSelector") );
|
|
|
|
output( "\t.byte 0x64\n\tmov (%d),%%gs\n", GS_OFFSET );
|
|
|
|
/* Translate STACK16FRAME base to flat offset in %edx */
|
|
output( "\tmovw %%ss, %%dx\n" );
|
|
output( "\tandl $0xfff8, %%edx\n" );
|
|
output( "\tshrl $1, %%edx\n" );
|
|
if (UsePIC)
|
|
{
|
|
output( "\taddl wine_ldt_copy_ptr-1b(%%ecx),%%edx\n" );
|
|
output( "\tmovl (%%edx), %%edx\n" );
|
|
}
|
|
else
|
|
output( "\tmovl %s(%%edx), %%edx\n", asm_name("wine_ldt_copy") );
|
|
output( "\tmovzwl %%sp, %%ebp\n" );
|
|
output( "\tleal %d(%%ebp,%%edx), %%edx\n", reg_func ? 0 : -4 );
|
|
|
|
/* Get saved flags into %ecx */
|
|
if (reg_func) output( "\tpopl %%ecx\n" );
|
|
|
|
/* Get the 32-bit stack pointer from the TEB and complete STACK16FRAME */
|
|
output( "\t.byte 0x64\n\tmovl (%d), %%ebp\n", STACKOFFSET );
|
|
output( "\tpushl %%ebp\n" );
|
|
|
|
/* Switch stacks */
|
|
output( "\t.byte 0x64\n\tmovw %%ss, (%d)\n", STACKOFFSET + 2 );
|
|
output( "\t.byte 0x64\n\tmovw %%sp, (%d)\n", STACKOFFSET );
|
|
output( "\tpushl %%ds\n" );
|
|
output( "\tpopl %%ss\n" );
|
|
output( "\tmovl %%ebp, %%esp\n" );
|
|
output( "\taddl $%d, %%ebp\n", STACK32OFFSET(ebp) );
|
|
|
|
|
|
/* At this point:
|
|
STACK16FRAME is completely set up
|
|
DS, ES, SS: flat data segment
|
|
FS: current TEB
|
|
ESP: points to last STACK32FRAME
|
|
EBP: points to ebp member of last STACK32FRAME
|
|
EDX: points to current STACK16FRAME
|
|
ECX: contains saved flags
|
|
all other registers: unchanged */
|
|
|
|
/* Special case: C16ThkSL stub */
|
|
if ( thunk )
|
|
{
|
|
/* Set up registers as expected and call thunk */
|
|
output( "\tleal %d(%%edx), %%ebx\n", (int)sizeof(STACK16FRAME)-22 );
|
|
output( "\tleal -4(%%esp), %%ebp\n" );
|
|
|
|
output( "\tcall *%d(%%edx)\n", STACK16OFFSET(entry_point) );
|
|
|
|
/* Switch stack back */
|
|
output( "\t.byte 0x64\n\tmovw (%d), %%ss\n", STACKOFFSET+2 );
|
|
output( "\t.byte 0x64\n\tmovzwl (%d), %%esp\n", STACKOFFSET );
|
|
output( "\t.byte 0x64\n\tpopl (%d)\n", STACKOFFSET );
|
|
|
|
/* Restore registers and return directly to caller */
|
|
output( "\taddl $8, %%esp\n" );
|
|
output( "\tpopl %%ebp\n" );
|
|
output( "\tpopw %%ds\n" );
|
|
output( "\tpopw %%es\n" );
|
|
output( "\tpopw %%fs\n" );
|
|
output( "\tpopw %%gs\n" );
|
|
output( "\taddl $20, %%esp\n" );
|
|
|
|
output( "\txorb %%ch, %%ch\n" );
|
|
output( "\tpopl %%ebx\n" );
|
|
output( "\taddw %%cx, %%sp\n" );
|
|
output( "\tpush %%ebx\n" );
|
|
|
|
output( "\t.byte 0x66\n" );
|
|
output( "\tlret\n" );
|
|
|
|
return;
|
|
}
|
|
|
|
|
|
/* Build register CONTEXT */
|
|
if ( reg_func )
|
|
{
|
|
output( "\tsubl $%d, %%esp\n", (int)sizeof(CONTEXT86) );
|
|
|
|
output( "\tmovl %%ecx, %d(%%esp)\n", CONTEXTOFFSET(EFlags) );
|
|
|
|
output( "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(Eax) );
|
|
output( "\tmovl %%ebx, %d(%%esp)\n", CONTEXTOFFSET(Ebx) );
|
|
output( "\tmovl %%esi, %d(%%esp)\n", CONTEXTOFFSET(Esi) );
|
|
output( "\tmovl %%edi, %d(%%esp)\n", CONTEXTOFFSET(Edi) );
|
|
|
|
output( "\tmovl %d(%%edx), %%eax\n", STACK16OFFSET(ebp) );
|
|
output( "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(Ebp) );
|
|
output( "\tmovl %d(%%edx), %%eax\n", STACK16OFFSET(ecx) );
|
|
output( "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(Ecx) );
|
|
output( "\tmovl %d(%%edx), %%eax\n", STACK16OFFSET(edx) );
|
|
output( "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(Edx) );
|
|
|
|
output( "\tmovzwl %d(%%edx), %%eax\n", STACK16OFFSET(ds) );
|
|
output( "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(SegDs) );
|
|
output( "\tmovzwl %d(%%edx), %%eax\n", STACK16OFFSET(es) );
|
|
output( "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(SegEs) );
|
|
output( "\tmovzwl %d(%%edx), %%eax\n", STACK16OFFSET(fs) );
|
|
output( "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(SegFs) );
|
|
output( "\tmovzwl %d(%%edx), %%eax\n", STACK16OFFSET(gs) );
|
|
output( "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(SegGs) );
|
|
|
|
output( "\tmovzwl %d(%%edx), %%eax\n", STACK16OFFSET(cs) );
|
|
output( "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(SegCs) );
|
|
output( "\tmovzwl %d(%%edx), %%eax\n", STACK16OFFSET(ip) );
|
|
output( "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(Eip) );
|
|
|
|
output( "\t.byte 0x64\n\tmovzwl (%d), %%eax\n", STACKOFFSET+2 );
|
|
output( "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(SegSs) );
|
|
output( "\t.byte 0x64\n\tmovzwl (%d), %%eax\n", STACKOFFSET );
|
|
output( "\taddl $%d, %%eax\n", STACK16OFFSET(ip) );
|
|
output( "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(Esp) );
|
|
#if 0
|
|
output( "\tfsave %d(%%esp)\n", CONTEXTOFFSET(FloatSave) );
|
|
#endif
|
|
|
|
/* Push address of CONTEXT86 structure -- popped by the relay routine */
|
|
output( "\tmovl %%esp,%%eax\n" );
|
|
output( "\tandl $~15,%%esp\n" );
|
|
output( "\tsubl $4,%%esp\n" );
|
|
output( "\tpushl %%eax\n" );
|
|
}
|
|
else
|
|
{
|
|
output( "\tsubl $8,%%esp\n" );
|
|
output( "\tandl $~15,%%esp\n" );
|
|
output( "\taddl $8,%%esp\n" );
|
|
}
|
|
|
|
/* Call relay routine (which will call the API entry point) */
|
|
output( "\tleal %d(%%edx), %%eax\n", (int)sizeof(STACK16FRAME) );
|
|
output( "\tpushl %%eax\n" );
|
|
output( "\tpushl %d(%%edx)\n", STACK16OFFSET(entry_point) );
|
|
output( "\tcall *%d(%%edx)\n", STACK16OFFSET(relay) );
|
|
|
|
if ( reg_func )
|
|
{
|
|
output( "\tleal -%d(%%ebp), %%ebx\n", (int)sizeof(CONTEXT) + STACK32OFFSET(ebp) );
|
|
|
|
/* Switch stack back */
|
|
output( "\t.byte 0x64\n\tmovw (%d), %%ss\n", STACKOFFSET+2 );
|
|
output( "\t.byte 0x64\n\tmovzwl (%d), %%esp\n", STACKOFFSET );
|
|
output( "\t.byte 0x64\n\tpopl (%d)\n", STACKOFFSET );
|
|
|
|
/* Get return address to CallFrom16 stub */
|
|
output( "\taddw $%d, %%sp\n", STACK16OFFSET(callfrom_ip)-4 );
|
|
output( "\tpopl %%eax\n" );
|
|
output( "\tpopl %%edx\n" );
|
|
|
|
/* Restore all registers from CONTEXT */
|
|
output( "\tmovw %d(%%ebx), %%ss\n", CONTEXTOFFSET(SegSs) );
|
|
output( "\tmovl %d(%%ebx), %%esp\n", CONTEXTOFFSET(Esp) );
|
|
output( "\taddl $4, %%esp\n" ); /* room for final return address */
|
|
|
|
output( "\tpushw %d(%%ebx)\n", CONTEXTOFFSET(SegCs) );
|
|
output( "\tpushw %d(%%ebx)\n", CONTEXTOFFSET(Eip) );
|
|
output( "\tpushl %%edx\n" );
|
|
output( "\tpushl %%eax\n" );
|
|
output( "\tpushl %d(%%ebx)\n", CONTEXTOFFSET(EFlags) );
|
|
output( "\tpushl %d(%%ebx)\n", CONTEXTOFFSET(SegDs) );
|
|
|
|
output( "\tpushl %d(%%ebx)\n", CONTEXTOFFSET(SegEs) );
|
|
output( "\tpopl %%es\n" );
|
|
output( "\tpushl %d(%%ebx)\n", CONTEXTOFFSET(SegFs) );
|
|
output( "\tpopl %%fs\n" );
|
|
output( "\tpushl %d(%%ebx)\n", CONTEXTOFFSET(SegGs) );
|
|
output( "\tpopl %%gs\n" );
|
|
|
|
output( "\tmovl %d(%%ebx), %%ebp\n", CONTEXTOFFSET(Ebp) );
|
|
output( "\tmovl %d(%%ebx), %%esi\n", CONTEXTOFFSET(Esi) );
|
|
output( "\tmovl %d(%%ebx), %%edi\n", CONTEXTOFFSET(Edi) );
|
|
output( "\tmovl %d(%%ebx), %%eax\n", CONTEXTOFFSET(Eax) );
|
|
output( "\tmovl %d(%%ebx), %%edx\n", CONTEXTOFFSET(Edx) );
|
|
output( "\tmovl %d(%%ebx), %%ecx\n", CONTEXTOFFSET(Ecx) );
|
|
output( "\tmovl %d(%%ebx), %%ebx\n", CONTEXTOFFSET(Ebx) );
|
|
|
|
output( "\tpopl %%ds\n" );
|
|
output( "\tpopfl\n" );
|
|
output( "\tlret\n" );
|
|
}
|
|
else
|
|
{
|
|
/* Switch stack back */
|
|
output( "\t.byte 0x64\n\tmovw (%d), %%ss\n", STACKOFFSET+2 );
|
|
output( "\t.byte 0x64\n\tmovzwl (%d), %%esp\n", STACKOFFSET );
|
|
output( "\t.byte 0x64\n\tpopl (%d)\n", STACKOFFSET );
|
|
|
|
/* Restore registers */
|
|
output( "\tpopl %%edx\n" );
|
|
output( "\tpopl %%ecx\n" );
|
|
output( "\tpopl %%ebp\n" );
|
|
output( "\tpopw %%ds\n" );
|
|
output( "\tpopw %%es\n" );
|
|
output( "\tpopw %%fs\n" );
|
|
output( "\tpopw %%gs\n" );
|
|
|
|
/* Return to return stub which will return to caller */
|
|
output( "\tlret $12\n" );
|
|
}
|
|
if (thunk) output_function_size( "__wine_call_from_16_thunk" );
|
|
else if (reg_func) output_function_size( "__wine_call_from_16_regs" );
|
|
else output_function_size( "__wine_call_from_16" );
|
|
}
|
|
|
|
|
|
/*******************************************************************
|
|
* BuildCallTo16Core
|
|
*
|
|
* This routine builds the core routines used in 32->16 thunks:
|
|
*
|
|
* extern DWORD WINAPI wine_call_to_16( FARPROC16 target, DWORD cbArgs, PEXCEPTION_HANDLER handler );
|
|
* extern void WINAPI wine_call_to_16_regs( CONTEXT86 *context, DWORD cbArgs, PEXCEPTION_HANDLER handler );
|
|
*
|
|
* These routines can be called directly from 32-bit code.
|
|
*
|
|
* All routines expect that the 16-bit stack contents (arguments) and the
|
|
* return address (segptr to CallTo16_Ret) were already set up by the
|
|
* caller; nb_args must contain the number of bytes to be conserved. The
|
|
* 16-bit SS:SP will be set accordingly.
|
|
*
|
|
* All other registers are either taken from the CONTEXT86 structure
|
|
* or else set to default values. The target routine address is either
|
|
* given directly or taken from the CONTEXT86.
|
|
*/
|
|
static void BuildCallTo16Core( int reg_func )
|
|
{
|
|
const char *name = reg_func ? "wine_call_to_16_regs" : "wine_call_to_16";
|
|
|
|
/* Function header */
|
|
function_header( name );
|
|
|
|
/* Function entry sequence */
|
|
output( "\tpushl %%ebp\n" );
|
|
output( "\tmovl %%esp, %%ebp\n" );
|
|
|
|
/* Save the 32-bit registers */
|
|
output( "\tpushl %%ebx\n" );
|
|
output( "\tpushl %%esi\n" );
|
|
output( "\tpushl %%edi\n" );
|
|
output( "\t.byte 0x64\n\tmov %%gs,(%d)\n", GS_OFFSET );
|
|
|
|
/* Setup exception frame */
|
|
output( "\t.byte 0x64\n\tpushl (%d)\n", STACKOFFSET );
|
|
output( "\tpushl 16(%%ebp)\n" ); /* handler */
|
|
output( "\t.byte 0x64\n\tpushl (0)\n" );
|
|
output( "\t.byte 0x64\n\tmovl %%esp,(0)\n" );
|
|
|
|
/* Call the actual CallTo16 routine (simulate a lcall) */
|
|
output( "\tpushl %%cs\n" );
|
|
output( "\tcall .L%s\n", name );
|
|
|
|
/* Remove exception frame */
|
|
output( "\t.byte 0x64\n\tpopl (0)\n" );
|
|
output( "\taddl $4, %%esp\n" );
|
|
output( "\t.byte 0x64\n\tpopl (%d)\n", STACKOFFSET );
|
|
|
|
if ( !reg_func )
|
|
{
|
|
/* Convert return value */
|
|
output( "\tandl $0xffff,%%eax\n" );
|
|
output( "\tshll $16,%%edx\n" );
|
|
output( "\torl %%edx,%%eax\n" );
|
|
}
|
|
else
|
|
{
|
|
/*
|
|
* Modify CONTEXT86 structure to contain new values
|
|
*
|
|
* NOTE: We restore only EAX, EBX, EDX, EDX, EBP, and ESP.
|
|
* The segment registers as well as ESI and EDI should
|
|
* not be modified by a well-behaved 16-bit routine in
|
|
* any case. [If necessary, we could restore them as well,
|
|
* at the cost of a somewhat less efficient return path.]
|
|
*/
|
|
|
|
output( "\tmovl %d(%%esp), %%edi\n", STACK32OFFSET(target) - STACK32OFFSET(edi));
|
|
/* everything above edi has been popped already */
|
|
|
|
output( "\tmovl %%eax, %d(%%edi)\n", CONTEXTOFFSET(Eax) );
|
|
output( "\tmovl %%ebx, %d(%%edi)\n", CONTEXTOFFSET(Ebx) );
|
|
output( "\tmovl %%ecx, %d(%%edi)\n", CONTEXTOFFSET(Ecx) );
|
|
output( "\tmovl %%edx, %d(%%edi)\n", CONTEXTOFFSET(Edx) );
|
|
output( "\tmovl %%ebp, %d(%%edi)\n", CONTEXTOFFSET(Ebp) );
|
|
output( "\tmovl %%esi, %d(%%edi)\n", CONTEXTOFFSET(Esp) );
|
|
/* The return glue code saved %esp into %esi */
|
|
}
|
|
|
|
/* Restore the 32-bit registers */
|
|
output( "\tpopl %%edi\n" );
|
|
output( "\tpopl %%esi\n" );
|
|
output( "\tpopl %%ebx\n" );
|
|
|
|
/* Function exit sequence */
|
|
output( "\tpopl %%ebp\n" );
|
|
output( "\tret $12\n" );
|
|
|
|
|
|
/* Start of the actual CallTo16 routine */
|
|
|
|
output( ".L%s:\n", name );
|
|
|
|
/* Switch to the 16-bit stack */
|
|
output( "\tmovl %%esp,%%edx\n" );
|
|
output( "\t.byte 0x64\n\tmovw (%d),%%ss\n", STACKOFFSET + 2);
|
|
output( "\t.byte 0x64\n\tmovw (%d),%%sp\n", STACKOFFSET );
|
|
output( "\t.byte 0x64\n\tmovl %%edx,(%d)\n", STACKOFFSET );
|
|
|
|
/* Make %bp point to the previous stackframe (built by CallFrom16) */
|
|
output( "\tmovzwl %%sp,%%ebp\n" );
|
|
output( "\tleal %d(%%ebp),%%ebp\n", STACK16OFFSET(bp) );
|
|
|
|
/* Add the specified offset to the new sp */
|
|
output( "\tsubw %d(%%edx), %%sp\n", STACK32OFFSET(nb_args) );
|
|
|
|
if (reg_func)
|
|
{
|
|
/* Push the called routine address */
|
|
output( "\tmovl %d(%%edx),%%edx\n", STACK32OFFSET(target) );
|
|
output( "\tpushw %d(%%edx)\n", CONTEXTOFFSET(SegCs) );
|
|
output( "\tpushw %d(%%edx)\n", CONTEXTOFFSET(Eip) );
|
|
|
|
/* Get the registers */
|
|
output( "\tpushw %d(%%edx)\n", CONTEXTOFFSET(SegDs) );
|
|
output( "\tpushl %d(%%edx)\n", CONTEXTOFFSET(SegEs) );
|
|
output( "\tpopl %%es\n" );
|
|
output( "\tpushl %d(%%edx)\n", CONTEXTOFFSET(SegFs) );
|
|
output( "\tpopl %%fs\n" );
|
|
output( "\tpushl %d(%%edx)\n", CONTEXTOFFSET(SegGs) );
|
|
output( "\tpopl %%gs\n" );
|
|
output( "\tmovl %d(%%edx),%%ebp\n", CONTEXTOFFSET(Ebp) );
|
|
output( "\tmovl %d(%%edx),%%esi\n", CONTEXTOFFSET(Esi) );
|
|
output( "\tmovl %d(%%edx),%%edi\n", CONTEXTOFFSET(Edi) );
|
|
output( "\tmovl %d(%%edx),%%eax\n", CONTEXTOFFSET(Eax) );
|
|
output( "\tmovl %d(%%edx),%%ebx\n", CONTEXTOFFSET(Ebx) );
|
|
output( "\tmovl %d(%%edx),%%ecx\n", CONTEXTOFFSET(Ecx) );
|
|
output( "\tmovl %d(%%edx),%%edx\n", CONTEXTOFFSET(Edx) );
|
|
|
|
/* Get the 16-bit ds */
|
|
output( "\tpopw %%ds\n" );
|
|
}
|
|
else /* not a register function */
|
|
{
|
|
/* Push the called routine address */
|
|
output( "\tpushl %d(%%edx)\n", STACK32OFFSET(target) );
|
|
|
|
/* Set %fs and %gs to the value saved by the last CallFrom16 */
|
|
output( "\tpushw %d(%%ebp)\n", STACK16OFFSET(fs)-STACK16OFFSET(bp) );
|
|
output( "\tpopw %%fs\n" );
|
|
output( "\tpushw %d(%%ebp)\n", STACK16OFFSET(gs)-STACK16OFFSET(bp) );
|
|
output( "\tpopw %%gs\n" );
|
|
|
|
/* Set %ds and %es (and %ax just in case) equal to %ss */
|
|
output( "\tmovw %%ss,%%ax\n" );
|
|
output( "\tmovw %%ax,%%ds\n" );
|
|
output( "\tmovw %%ax,%%es\n" );
|
|
}
|
|
|
|
/* Jump to the called routine */
|
|
output( "\t.byte 0x66\n" );
|
|
output( "\tlret\n" );
|
|
|
|
/* Function footer */
|
|
output_function_size( name );
|
|
}
|
|
|
|
|
|
/*******************************************************************
|
|
* BuildRet16Func
|
|
*
|
|
* Build the return code for 16-bit callbacks
|
|
*/
|
|
static void BuildRet16Func(void)
|
|
{
|
|
function_header( "__wine_call_to_16_ret" );
|
|
|
|
/* Save %esp into %esi */
|
|
output( "\tmovl %%esp,%%esi\n" );
|
|
|
|
/* Restore 32-bit segment registers */
|
|
|
|
output( "\t.byte 0x2e\n\tmovl %s", asm_name("CallTo16_DataSelector") );
|
|
output( "-%s,%%edi\n", asm_name("__wine_call16_start") );
|
|
output( "\tmovw %%di,%%ds\n" );
|
|
output( "\tmovw %%di,%%es\n" );
|
|
|
|
output( "\t.byte 0x2e\n\tmov %s", asm_name("CallTo16_TebSelector") );
|
|
output( "-%s,%%fs\n", asm_name("__wine_call16_start") );
|
|
|
|
output( "\t.byte 0x64\n\tmov (%d),%%gs\n", GS_OFFSET );
|
|
|
|
/* Restore the 32-bit stack */
|
|
|
|
output( "\tmovw %%di,%%ss\n" );
|
|
output( "\t.byte 0x64\n\tmovl (%d),%%esp\n", STACKOFFSET );
|
|
|
|
/* Return to caller */
|
|
|
|
output( "\tlret\n" );
|
|
output_function_size( "__wine_call_to_16_ret" );
|
|
}
|
|
|
|
|
|
/*******************************************************************
|
|
* BuildCallTo32CBClient
|
|
*
|
|
* Call a CBClient relay stub from 32-bit code (KERNEL.620).
|
|
*
|
|
* Since the relay stub is itself 32-bit, this should not be a problem;
|
|
* unfortunately, the relay stubs are expected to switch back to a
|
|
* 16-bit stack (and 16-bit code) after completion :-(
|
|
*
|
|
* This would conflict with our 16- vs. 32-bit stack handling, so
|
|
* we simply switch *back* to our 32-bit stack before returning to
|
|
* the caller ...
|
|
*
|
|
* The CBClient relay stub expects to be called with the following
|
|
* 16-bit stack layout, and with ebp and ebx pointing into the 16-bit
|
|
* stack at the designated places:
|
|
*
|
|
* ...
|
|
* (ebp+14) original arguments to the callback routine
|
|
* (ebp+10) far return address to original caller
|
|
* (ebp+6) Thunklet target address
|
|
* (ebp+2) Thunklet relay ID code
|
|
* (ebp) BP (saved by CBClientGlueSL)
|
|
* (ebp-2) SI (saved by CBClientGlueSL)
|
|
* (ebp-4) DI (saved by CBClientGlueSL)
|
|
* (ebp-6) DS (saved by CBClientGlueSL)
|
|
*
|
|
* ... buffer space used by the 16-bit side glue for temp copies
|
|
*
|
|
* (ebx+4) far return address to 16-bit side glue code
|
|
* (ebx) saved 16-bit ss:sp (pointing to ebx+4)
|
|
*
|
|
* The 32-bit side glue code accesses both the original arguments (via ebp)
|
|
* and the temporary copies prepared by the 16-bit side glue (via ebx).
|
|
* After completion, the stub will load ss:sp from the buffer at ebx
|
|
* and perform a far return to 16-bit code.
|
|
*
|
|
* To trick the relay stub into returning to us, we replace the 16-bit
|
|
* return address to the glue code by a cs:ip pair pointing to our
|
|
* return entry point (the original return address is saved first).
|
|
* Our return stub thus called will then reload the 32-bit ss:esp and
|
|
* return to 32-bit code (by using and ss:esp value that we have also
|
|
* pushed onto the 16-bit stack before and a cs:eip values found at
|
|
* that position on the 32-bit stack). The ss:esp to be restored is
|
|
* found relative to the 16-bit stack pointer at:
|
|
*
|
|
* (ebx-4) ss (flat)
|
|
* (ebx-8) sp (32-bit stack pointer)
|
|
*
|
|
* The second variant of this routine, CALL32_CBClientEx, which is used
|
|
* to implement KERNEL.621, has to cope with yet another problem: Here,
|
|
* the 32-bit side directly returns to the caller of the CBClient thunklet,
|
|
* restoring registers saved by CBClientGlueSL and cleaning up the stack.
|
|
* As we have to return to our 32-bit code first, we have to adapt the
|
|
* layout of our temporary area so as to include values for the registers
|
|
* that are to be restored, and later (in the implementation of KERNEL.621)
|
|
* we *really* restore them. The return stub restores DS, DI, SI, and BP
|
|
* from the stack, skips the next 8 bytes (CBClient relay code / target),
|
|
* and then performs a lret NN, where NN is the number of arguments to be
|
|
* removed. Thus, we prepare our temporary area as follows:
|
|
*
|
|
* (ebx+22) 16-bit cs (this segment)
|
|
* (ebx+20) 16-bit ip ('16-bit' return entry point)
|
|
* (ebx+16) 32-bit ss (flat)
|
|
* (ebx+12) 32-bit sp (32-bit stack pointer)
|
|
* (ebx+10) 16-bit bp (points to ebx+24)
|
|
* (ebx+8) 16-bit si (ignored)
|
|
* (ebx+6) 16-bit di (ignored)
|
|
* (ebx+4) 16-bit ds (we actually use the flat DS here)
|
|
* (ebx+2) 16-bit ss (16-bit stack segment)
|
|
* (ebx+0) 16-bit sp (points to ebx+4)
|
|
*
|
|
* Note that we ensure that DS is not changed and remains the flat segment,
|
|
* and the 32-bit stack pointer our own return stub needs fits just
|
|
* perfectly into the 8 bytes that are skipped by the Windows stub.
|
|
* One problem is that we have to determine the number of removed arguments,
|
|
* as these have to be really removed in KERNEL.621. Thus, the BP value
|
|
* that we place in the temporary area to be restored, contains the value
|
|
* that SP would have if no arguments were removed. By comparing the actual
|
|
* value of SP with this value in our return stub we can compute the number
|
|
* of removed arguments. This is then returned to KERNEL.621.
|
|
*
|
|
* The stack layout of this function:
|
|
* (ebp+20) nArgs pointer to variable receiving nr. of args (Ex only)
|
|
* (ebp+16) esi pointer to caller's esi value
|
|
* (ebp+12) arg ebp value to be set for relay stub
|
|
* (ebp+8) func CBClient relay stub address
|
|
* (ebp+4) ret addr
|
|
* (ebp) ebp
|
|
*/
|
|
static void BuildCallTo32CBClient( BOOL isEx )
|
|
{
|
|
function_header( isEx ? "CALL32_CBClientEx" : "CALL32_CBClient" );
|
|
|
|
/* Entry code */
|
|
|
|
output( "\tpushl %%ebp\n" );
|
|
output( "\tmovl %%esp,%%ebp\n" );
|
|
output( "\tpushl %%edi\n" );
|
|
output( "\tpushl %%esi\n" );
|
|
output( "\tpushl %%ebx\n" );
|
|
|
|
/* Get pointer to temporary area and save the 32-bit stack pointer */
|
|
|
|
output( "\tmovl 16(%%ebp), %%ebx\n" );
|
|
output( "\tleal -8(%%esp), %%eax\n" );
|
|
|
|
if ( !isEx )
|
|
output( "\tmovl %%eax, -8(%%ebx)\n" );
|
|
else
|
|
output( "\tmovl %%eax, 12(%%ebx)\n" );
|
|
|
|
/* Set up registers and call CBClient relay stub (simulating a far call) */
|
|
|
|
output( "\tmovl 20(%%ebp), %%esi\n" );
|
|
output( "\tmovl (%%esi), %%esi\n" );
|
|
|
|
output( "\tmovl 8(%%ebp), %%eax\n" );
|
|
output( "\tmovl 12(%%ebp), %%ebp\n" );
|
|
|
|
output( "\tpushl %%cs\n" );
|
|
output( "\tcall *%%eax\n" );
|
|
|
|
/* Return new esi value to caller */
|
|
|
|
output( "\tmovl 32(%%esp), %%edi\n" );
|
|
output( "\tmovl %%esi, (%%edi)\n" );
|
|
|
|
/* Return argument size to caller */
|
|
if ( isEx )
|
|
{
|
|
output( "\tmovl 36(%%esp), %%ebx\n" );
|
|
output( "\tmovl %%ebp, (%%ebx)\n" );
|
|
}
|
|
|
|
/* Restore registers and return */
|
|
|
|
output( "\tpopl %%ebx\n" );
|
|
output( "\tpopl %%esi\n" );
|
|
output( "\tpopl %%edi\n" );
|
|
output( "\tpopl %%ebp\n" );
|
|
output( "\tret\n" );
|
|
output_function_size( isEx ? "CALL32_CBClientEx" : "CALL32_CBClient" );
|
|
|
|
/* '16-bit' return stub */
|
|
|
|
function_header( isEx ? "CALL32_CBClientEx_Ret" : "CALL32_CBClient_Ret" );
|
|
if ( !isEx )
|
|
{
|
|
output( "\tmovzwl %%sp, %%ebx\n" );
|
|
output( "\tlssl %%ss:-16(%%ebx), %%esp\n" );
|
|
}
|
|
else
|
|
{
|
|
output( "\tmovzwl %%bp, %%ebx\n" );
|
|
output( "\tsubw %%bp, %%sp\n" );
|
|
output( "\tmovzwl %%sp, %%ebp\n" );
|
|
output( "\tlssl %%ss:-12(%%ebx), %%esp\n" );
|
|
}
|
|
output( "\tlret\n" );
|
|
output_function_size( isEx ? "CALL32_CBClientEx_Ret" : "CALL32_CBClient_Ret" );
|
|
}
|
|
|
|
|
|
/*******************************************************************
|
|
* BuildCallFrom32Regs
|
|
*
|
|
* Build a 32-bit-to-Wine call-back function for a 'register' function.
|
|
* 'args' is the number of dword arguments.
|
|
*
|
|
* Stack layout:
|
|
* ...
|
|
* (ebp+20) first arg
|
|
* (ebp+16) ret addr to user code
|
|
* (ebp+12) func to call (relative to relay code ret addr)
|
|
* (ebp+8) number of args
|
|
* (ebp+4) ret addr to relay code
|
|
* (ebp+0) saved ebp
|
|
* (ebp-128) buffer area to allow stack frame manipulation
|
|
* (ebp-332) CONTEXT86 struct
|
|
* (ebp-336) padding for stack alignment
|
|
* (ebp-336-n) CONTEXT86 *argument
|
|
* .... other arguments copied from (ebp+12)
|
|
*
|
|
* The entry point routine is called with a CONTEXT* extra argument,
|
|
* following the normal args. In this context structure, EIP_reg
|
|
* contains the return address to user code, and ESP_reg the stack
|
|
* pointer on return (with the return address and arguments already
|
|
* removed).
|
|
*/
|
|
static void BuildCallFrom32Regs(void)
|
|
{
|
|
static const int STACK_SPACE = 128 + sizeof(CONTEXT86);
|
|
|
|
/* Function header */
|
|
|
|
function_header( "__wine_call_from_32_regs" );
|
|
|
|
/* Allocate some buffer space on the stack */
|
|
|
|
output( "\tpushl %%ebp\n" );
|
|
output( "\tmovl %%esp,%%ebp\n ");
|
|
output( "\tleal -%d(%%esp),%%esp\n", STACK_SPACE );
|
|
|
|
/* Build the context structure */
|
|
|
|
output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(Eax) - STACK_SPACE );
|
|
output( "\tpushfl\n" );
|
|
output( "\tpopl %%eax\n" );
|
|
output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(EFlags) - STACK_SPACE );
|
|
output( "\tmovl 0(%%ebp),%%eax\n" );
|
|
output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(Ebp) - STACK_SPACE );
|
|
output( "\tmovl %%ebx,%d(%%ebp)\n", CONTEXTOFFSET(Ebx) - STACK_SPACE );
|
|
output( "\tmovl %%ecx,%d(%%ebp)\n", CONTEXTOFFSET(Ecx) - STACK_SPACE );
|
|
output( "\tmovl %%edx,%d(%%ebp)\n", CONTEXTOFFSET(Edx) - STACK_SPACE );
|
|
output( "\tmovl %%esi,%d(%%ebp)\n", CONTEXTOFFSET(Esi) - STACK_SPACE );
|
|
output( "\tmovl %%edi,%d(%%ebp)\n", CONTEXTOFFSET(Edi) - STACK_SPACE );
|
|
|
|
output( "\txorl %%eax,%%eax\n" );
|
|
output( "\tmovw %%cs,%%ax\n" );
|
|
output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegCs) - STACK_SPACE );
|
|
output( "\tmovw %%es,%%ax\n" );
|
|
output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegEs) - STACK_SPACE );
|
|
output( "\tmovw %%fs,%%ax\n" );
|
|
output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegFs) - STACK_SPACE );
|
|
output( "\tmovw %%gs,%%ax\n" );
|
|
output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegGs) - STACK_SPACE );
|
|
output( "\tmovw %%ss,%%ax\n" );
|
|
output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegSs) - STACK_SPACE );
|
|
output( "\tmovw %%ds,%%ax\n" );
|
|
output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegDs) - STACK_SPACE );
|
|
output( "\tmovw %%ax,%%es\n" ); /* set %es equal to %ds just in case */
|
|
|
|
output( "\tmovl $0x%x,%%eax\n", CONTEXT86_FULL );
|
|
output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(ContextFlags) - STACK_SPACE );
|
|
|
|
output( "\tmovl 16(%%ebp),%%eax\n" ); /* Get %eip at time of call */
|
|
output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(Eip) - STACK_SPACE );
|
|
|
|
/* Transfer the arguments */
|
|
|
|
output( "\tmovl 8(%%ebp),%%ecx\n" ); /* fetch number of args to copy */
|
|
output( "\tleal 4(,%%ecx,4),%%edx\n" ); /* add 4 for context arg */
|
|
output( "\tsubl %%edx,%%esp\n" );
|
|
output( "\tandl $~15,%%esp\n" );
|
|
output( "\tleal 20(%%ebp),%%esi\n" ); /* get %esp at time of call */
|
|
output( "\tmovl %%esp,%%edi\n" );
|
|
output( "\ttest %%ecx,%%ecx\n" );
|
|
output( "\tjz 1f\n" );
|
|
output( "\tcld\n" );
|
|
output( "\trep\n\tmovsl\n" ); /* copy args */
|
|
output( "1:\tleal %d(%%ebp),%%eax\n", -STACK_SPACE ); /* get addr of context struct */
|
|
output( "\tmovl %%eax,(%%edi)\n" ); /* and pass it as extra arg */
|
|
output( "\tmovl %%esi,%d(%%ebp)\n", CONTEXTOFFSET(Esp) - STACK_SPACE );
|
|
|
|
/* Call the entry point */
|
|
|
|
output( "\tmovl 4(%%ebp),%%eax\n" ); /* get relay code addr */
|
|
output( "\taddl 12(%%ebp),%%eax\n" );
|
|
output( "\tcall *%%eax\n" );
|
|
output( "\tleal -%d(%%ebp),%%ecx\n", STACK_SPACE );
|
|
|
|
/* Restore the context structure */
|
|
|
|
output( "2:\tpushl %d(%%ecx)\n", CONTEXTOFFSET(SegEs) );
|
|
output( "\tpopl %%es\n" );
|
|
output( "\tpushl %d(%%ecx)\n", CONTEXTOFFSET(SegFs) );
|
|
output( "\tpopl %%fs\n" );
|
|
output( "\tpushl %d(%%ecx)\n", CONTEXTOFFSET(SegGs) );
|
|
output( "\tpopl %%gs\n" );
|
|
|
|
output( "\tmovl %d(%%ecx),%%edi\n", CONTEXTOFFSET(Edi) );
|
|
output( "\tmovl %d(%%ecx),%%esi\n", CONTEXTOFFSET(Esi) );
|
|
output( "\tmovl %d(%%ecx),%%edx\n", CONTEXTOFFSET(Edx) );
|
|
output( "\tmovl %d(%%ecx),%%ebx\n", CONTEXTOFFSET(Ebx) );
|
|
output( "\tmovl %d(%%ecx),%%eax\n", CONTEXTOFFSET(Eax) );
|
|
output( "\tmovl %d(%%ecx),%%ebp\n", CONTEXTOFFSET(Ebp) );
|
|
|
|
output( "\tpushl %d(%%ecx)\n", CONTEXTOFFSET(SegSs) );
|
|
output( "\tpopl %%ss\n" );
|
|
output( "\tmovl %d(%%ecx),%%esp\n", CONTEXTOFFSET(Esp) );
|
|
|
|
output( "\tpushl %d(%%ecx)\n", CONTEXTOFFSET(EFlags) );
|
|
output( "\tpushl %d(%%ecx)\n", CONTEXTOFFSET(SegCs) );
|
|
output( "\tpushl %d(%%ecx)\n", CONTEXTOFFSET(Eip) );
|
|
output( "\tpushl %d(%%ecx)\n", CONTEXTOFFSET(SegDs) );
|
|
output( "\tmovl %d(%%ecx),%%ecx\n", CONTEXTOFFSET(Ecx) );
|
|
|
|
output( "\tpopl %%ds\n" );
|
|
output( "\tiret\n" );
|
|
output_function_size( "__wine_call_from_32_regs" );
|
|
|
|
function_header( "__wine_call_from_32_restore_regs" );
|
|
output( "\tmovl 4(%%esp),%%ecx\n" );
|
|
output( "\tjmp 2b\n" );
|
|
output_function_size( "__wine_call_from_32_restore_regs" );
|
|
}
|
|
|
|
|
|
/*******************************************************************
|
|
* BuildPendingEventCheck
|
|
*
|
|
* Build a function that checks whether there are any
|
|
* pending DPMI events.
|
|
*
|
|
* Stack layout:
|
|
*
|
|
* (sp+12) long eflags
|
|
* (sp+6) long cs
|
|
* (sp+2) long ip
|
|
* (sp) word fs
|
|
*
|
|
* On entry to function, fs register points to a valid TEB.
|
|
* On exit from function, stack will be popped.
|
|
*/
|
|
static void BuildPendingEventCheck(void)
|
|
{
|
|
/* Function header */
|
|
|
|
function_header( "DPMI_PendingEventCheck" );
|
|
|
|
/* Check for pending events. */
|
|
|
|
output( "\t.byte 0x64\n\ttestl $0xffffffff,(%d)\n",
|
|
STRUCTOFFSET(TEB,GdiTebBatch) + STRUCTOFFSET(WINE_VM86_TEB_INFO,vm86_pending) );
|
|
output( "\tje %s\n", asm_name("DPMI_PendingEventCheck_Cleanup") );
|
|
output( "\t.byte 0x64\n\ttestl $0xffffffff,(%d)\n",
|
|
STRUCTOFFSET(TEB,GdiTebBatch) + STRUCTOFFSET(WINE_VM86_TEB_INFO,dpmi_vif) );
|
|
output( "\tje %s\n", asm_name("DPMI_PendingEventCheck_Cleanup") );
|
|
|
|
/* Process pending events. */
|
|
|
|
output( "\tsti\n" );
|
|
|
|
/* Start cleanup. Restore fs register. */
|
|
|
|
output( "%s\n", asm_globl("DPMI_PendingEventCheck_Cleanup") );
|
|
output( "\tpopw %%fs\n" );
|
|
|
|
/* Return from function. */
|
|
|
|
output( "%s\n", asm_globl("DPMI_PendingEventCheck_Return") );
|
|
output( "\tiret\n" );
|
|
|
|
output_function_size( "DPMI_PendingEventCheck" );
|
|
}
|
|
|
|
|
|
/*******************************************************************
|
|
* BuildRelays16
|
|
*
|
|
* Build all the 16-bit relay callbacks
|
|
*/
|
|
void BuildRelays16(void)
|
|
{
|
|
if (target_cpu != CPU_x86)
|
|
{
|
|
output( "/* File not used with this architecture. Do not edit! */\n\n" );
|
|
return;
|
|
}
|
|
|
|
/* File header */
|
|
|
|
output( "/* File generated automatically. Do not edit! */\n\n" );
|
|
output( "\t.text\n" );
|
|
|
|
output( "%s:\n\n", asm_name("__wine_spec_thunk_text_16") );
|
|
|
|
output( "%s\n", asm_globl("__wine_call16_start") );
|
|
|
|
/* Standard CallFrom16 routine */
|
|
BuildCallFrom16Core( FALSE, FALSE );
|
|
|
|
/* Register CallFrom16 routine */
|
|
BuildCallFrom16Core( TRUE, FALSE );
|
|
|
|
/* C16ThkSL CallFrom16 routine */
|
|
BuildCallFrom16Core( FALSE, TRUE );
|
|
|
|
/* Standard CallTo16 routine */
|
|
BuildCallTo16Core( 0 );
|
|
|
|
/* Register CallTo16 routine */
|
|
BuildCallTo16Core( 1 );
|
|
|
|
/* Standard CallTo16 return stub */
|
|
BuildRet16Func();
|
|
|
|
/* CBClientThunkSL routine */
|
|
BuildCallTo32CBClient( FALSE );
|
|
|
|
/* CBClientThunkSLEx routine */
|
|
BuildCallTo32CBClient( TRUE );
|
|
|
|
/* Pending DPMI events check stub */
|
|
BuildPendingEventCheck();
|
|
|
|
output( "%s\n", asm_globl("__wine_call16_end") );
|
|
output_function_size( "__wine_spec_thunk_text_16" );
|
|
|
|
/* Declare the return address and data selector variables */
|
|
output( "\n\t.data\n\t.align %d\n", get_alignment(4) );
|
|
output( "%s\n\t.long 0\n", asm_globl("CallTo16_DataSelector") );
|
|
output( "%s\n\t.long 0\n", asm_globl("CallTo16_TebSelector") );
|
|
if (UsePIC) output( "wine_ldt_copy_ptr:\t.long %s\n", asm_name("wine_ldt_copy") );
|
|
|
|
output( "\t.text\n" );
|
|
output( "%s:\n\n", asm_name("__wine_spec_thunk_text_32") );
|
|
BuildCallFrom32Regs();
|
|
output_function_size( "__wine_spec_thunk_text_32" );
|
|
|
|
output_gnu_stack_note();
|
|
}
|
|
|
|
|
|
/*******************************************************************
|
|
* build_call_from_regs_x86_64
|
|
*
|
|
* Build the register saving code for a 'register' entry point.
|
|
*
|
|
* Stack layout:
|
|
* ...
|
|
* (rsp+16) first arg
|
|
* (rsp+8) ret addr to user code
|
|
* (rsp) ret addr to relay code
|
|
* (rsp-128) buffer area to allow stack frame manipulation
|
|
*
|
|
* Parameters:
|
|
* %rcx number of args
|
|
* %rdx entry point
|
|
*/
|
|
static void build_call_from_regs_x86_64(void)
|
|
{
|
|
static const int STACK_SPACE = 128 + 0x4d0; /* size of x86_64 context */
|
|
|
|
/* Function header */
|
|
|
|
function_header( "__wine_call_from_regs" );
|
|
|
|
output( "\tsubq $%u,%%rsp\n", STACK_SPACE );
|
|
|
|
/* save registers into the context */
|
|
|
|
output( "\tmovq %%rax,0x78(%%rsp)\n" );
|
|
output( "\tmovq %u(%%rsp),%%rax\n", STACK_SPACE + 16 ); /* saved %rcx on stack */
|
|
output( "\tmovq %%rax,0x80(%%rsp)\n" );
|
|
output( "\tmovq %u(%%rsp),%%rax\n", STACK_SPACE + 24 ); /* saved %rdx on stack */
|
|
output( "\tmovq %%rax,0x88(%%rsp)\n" );
|
|
output( "\tmovq %%rbx,0x90(%%rsp)\n" );
|
|
output( "\tleaq %u(%%rsp),%%rax\n", STACK_SPACE + 16 );
|
|
output( "\tmovq %%rax,0x98(%%rsp)\n" );
|
|
output( "\tmovq %%rbp,0xa0(%%rsp)\n" );
|
|
output( "\tmovq %%rsi,0xa8(%%rsp)\n" );
|
|
output( "\tmovq %%rdi,0xb0(%%rsp)\n" );
|
|
output( "\tmovq %%r8,0xb8(%%rsp)\n" );
|
|
output( "\tmovq %%r9,0xc0(%%rsp)\n" );
|
|
output( "\tmovq %%r10,0xc8(%%rsp)\n" );
|
|
output( "\tmovq %%r11,0xd0(%%rsp)\n" );
|
|
output( "\tmovq %%r12,0xd8(%%rsp)\n" );
|
|
output( "\tmovq %%r13,0xe0(%%rsp)\n" );
|
|
output( "\tmovq %%r14,0xe8(%%rsp)\n" );
|
|
output( "\tmovq %%r15,0xf0(%%rsp)\n" );
|
|
output( "\tmovq %u(%%rsp),%%rax\n", STACK_SPACE + 8 );
|
|
output( "\tmovq %%rax,0xf8(%%rsp)\n" );
|
|
|
|
output( "\tstmxcsr 0x34(%%rsp)\n" );
|
|
output( "\tfxsave 0x100(%%rsp)\n" );
|
|
output( "\tmovdqa %%xmm0,0x1a0(%%rsp)\n" );
|
|
output( "\tmovdqa %%xmm1,0x1b0(%%rsp)\n" );
|
|
output( "\tmovdqa %%xmm2,0x1c0(%%rsp)\n" );
|
|
output( "\tmovdqa %%xmm3,0x1d0(%%rsp)\n" );
|
|
output( "\tmovdqa %%xmm4,0x1e0(%%rsp)\n" );
|
|
output( "\tmovdqa %%xmm5,0x1f0(%%rsp)\n" );
|
|
output( "\tmovdqa %%xmm6,0x200(%%rsp)\n" );
|
|
output( "\tmovdqa %%xmm7,0x210(%%rsp)\n" );
|
|
output( "\tmovdqa %%xmm8,0x220(%%rsp)\n" );
|
|
output( "\tmovdqa %%xmm9,0x230(%%rsp)\n" );
|
|
output( "\tmovdqa %%xmm10,0x240(%%rsp)\n" );
|
|
output( "\tmovdqa %%xmm11,0x250(%%rsp)\n" );
|
|
output( "\tmovdqa %%xmm12,0x260(%%rsp)\n" );
|
|
output( "\tmovdqa %%xmm13,0x270(%%rsp)\n" );
|
|
output( "\tmovdqa %%xmm14,0x280(%%rsp)\n" );
|
|
output( "\tmovdqa %%xmm15,0x290(%%rsp)\n" );
|
|
|
|
output( "\tmovw %%cs,0x38(%%rsp)\n" );
|
|
output( "\tmovw %%ds,0x3a(%%rsp)\n" );
|
|
output( "\tmovw %%es,0x3c(%%rsp)\n" );
|
|
output( "\tmovw %%fs,0x3e(%%rsp)\n" );
|
|
output( "\tmovw %%gs,0x40(%%rsp)\n" );
|
|
output( "\tmovw %%ss,0x42(%%rsp)\n" );
|
|
output( "\tpushfq\n" );
|
|
output( "\tpopq %%rax\n" );
|
|
output( "\tmovl %%eax,0x44(%%rsp)\n" );
|
|
|
|
output( "\tmovl $0x%x,0x30(%%rsp)\n", 0x0010000f );
|
|
|
|
/* transfer the arguments */
|
|
|
|
output( "\tmovq %%r8,%u(%%rsp)\n", STACK_SPACE + 32 );
|
|
output( "\tmovq %%r9,%u(%%rsp)\n", STACK_SPACE + 40 );
|
|
output( "\tmovq $4,%%rax\n" );
|
|
output( "\tleaq %u(%%rsp),%%rsi\n", STACK_SPACE + 16 );
|
|
output( "\tcmpq %%rax,%%rcx\n" );
|
|
output( "\tcmovgq %%rcx,%%rax\n" );
|
|
output( "\tmovq %%rsp,%%rbx\n" );
|
|
output( "\tleaq 16(,%%rax,8),%%rax\n" ); /* add 8 for context arg and 8 for rounding */
|
|
output( "\tandq $~15,%%rax\n" );
|
|
output( "\tsubq %%rax,%%rsp\n" );
|
|
output( "\tmovq %%rsp,%%rdi\n" );
|
|
output( "\tjrcxz 1f\n" );
|
|
output( "\tcld\n" );
|
|
output( "\trep\n\tmovsq\n" );
|
|
output( "1:\tmovq %%rbx,0(%%rdi)\n" ); /* context arg */
|
|
|
|
/* call the entry point */
|
|
|
|
output( "\tmovq %%rdx,%%rax\n" );
|
|
output( "\tmovq 0(%%rsp),%%rcx\n" );
|
|
output( "\tmovq 8(%%rsp),%%rdx\n" );
|
|
output( "\tmovq 16(%%rsp),%%r8\n" );
|
|
output( "\tmovq 24(%%rsp),%%r9\n" );
|
|
output( "\tcallq *%%rax\n" );
|
|
|
|
/* restore the context structure */
|
|
|
|
output( "1:\tmovq 0x80(%%rbx),%%rcx\n" );
|
|
output( "\tmovq 0x88(%%rbx),%%rdx\n" );
|
|
output( "\tmovq 0xa0(%%rbx),%%rbp\n" );
|
|
output( "\tmovq 0xa8(%%rbx),%%rsi\n" );
|
|
output( "\tmovq 0xb0(%%rbx),%%rdi\n" );
|
|
output( "\tmovq 0xb8(%%rbx),%%r8\n" );
|
|
output( "\tmovq 0xc0(%%rbx),%%r9\n" );
|
|
output( "\tmovq 0xc8(%%rbx),%%r10\n" );
|
|
output( "\tmovq 0xd0(%%rbx),%%r11\n" );
|
|
output( "\tmovq 0xd8(%%rbx),%%r12\n" );
|
|
output( "\tmovq 0xe0(%%rbx),%%r13\n" );
|
|
output( "\tmovq 0xe8(%%rbx),%%r14\n" );
|
|
output( "\tmovq 0xf0(%%rbx),%%r15\n" );
|
|
|
|
output( "\tmovdqa 0x1a0(%%rbx),%%xmm0\n" );
|
|
output( "\tmovdqa 0x1b0(%%rbx),%%xmm1\n" );
|
|
output( "\tmovdqa 0x1c0(%%rbx),%%xmm2\n" );
|
|
output( "\tmovdqa 0x1d0(%%rbx),%%xmm3\n" );
|
|
output( "\tmovdqa 0x1e0(%%rbx),%%xmm4\n" );
|
|
output( "\tmovdqa 0x1f0(%%rbx),%%xmm5\n" );
|
|
output( "\tmovdqa 0x200(%%rbx),%%xmm6\n" );
|
|
output( "\tmovdqa 0x210(%%rbx),%%xmm7\n" );
|
|
output( "\tmovdqa 0x220(%%rbx),%%xmm8\n" );
|
|
output( "\tmovdqa 0x230(%%rbx),%%xmm9\n" );
|
|
output( "\tmovdqa 0x240(%%rbx),%%xmm10\n" );
|
|
output( "\tmovdqa 0x250(%%rbx),%%xmm11\n" );
|
|
output( "\tmovdqa 0x260(%%rbx),%%xmm12\n" );
|
|
output( "\tmovdqa 0x270(%%rbx),%%xmm13\n" );
|
|
output( "\tmovdqa 0x280(%%rbx),%%xmm14\n" );
|
|
output( "\tmovdqa 0x290(%%rbx),%%xmm15\n" );
|
|
output( "\tfxrstor 0x100(%%rbx)\n" );
|
|
output( "\tldmxcsr 0x34(%%rbx)\n" );
|
|
|
|
output( "\tmovl 0x44(%%rbx),%%eax\n" );
|
|
output( "\tpushq %%rax\n" );
|
|
output( "\tpopfq\n" );
|
|
|
|
output( "\tmovq 0x98(%%rbx),%%rax\n" ); /* stack pointer */
|
|
output( "\tpushq 0xf8(%%rbx)\n" ); /* return address */
|
|
output( "\tpopq -8(%%rax)\n" );
|
|
output( "\tpushq 0x78(%%rbx)\n" ); /* rax */
|
|
output( "\tpopq -16(%%rax)\n" );
|
|
output( "\tmovq 0x90(%%rbx),%%rbx\n" );
|
|
output( "\tleaq -16(%%rax),%%rsp\n" );
|
|
output( "\tpopq %%rax\n" );
|
|
output( "\tret\n" );
|
|
|
|
output_function_size( "__wine_call_from_regs" );
|
|
|
|
function_header( "__wine_restore_regs" );
|
|
output( "\tmovq %%rcx,%%rbx\n" );
|
|
output( "\tjmp 1b\n" );
|
|
output_function_size( "__wine_restore_regs" );
|
|
}
|
|
|
|
|
|
/*******************************************************************
|
|
* BuildRelays32
|
|
*
|
|
* Build all the 32-bit relay callbacks
|
|
*/
|
|
void BuildRelays32(void)
|
|
{
|
|
switch (target_cpu)
|
|
{
|
|
case CPU_x86:
|
|
output( "/* File generated automatically. Do not edit! */\n\n" );
|
|
output( "\t.text\n" );
|
|
output( "%s:\n\n", asm_name("__wine_spec_thunk_text_32") );
|
|
|
|
/* 32-bit register entry point */
|
|
BuildCallFrom32Regs();
|
|
|
|
output_function_size( "__wine_spec_thunk_text_32" );
|
|
output_gnu_stack_note();
|
|
break;
|
|
|
|
case CPU_x86_64:
|
|
output( "/* File generated automatically. Do not edit! */\n\n" );
|
|
output( "\t.text\n" );
|
|
build_call_from_regs_x86_64();
|
|
output_gnu_stack_note();
|
|
break;
|
|
|
|
default:
|
|
output( "/* File not used with this architecture. Do not edit! */\n\n" );
|
|
return;
|
|
}
|
|
}
|