/*
 * KERNEL32 thunks and other undocumented stuff
 *
 * Copyright 1996, 1997 Alexandre Julliard
 * Copyright 1997, 1998 Marcus Meissner
 * Copyright 1998       Ulrich Weigand
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
 */

23
#include "config.h"
24
#include "wine/port.h"
25

26 27
#include <string.h>
#include <sys/types.h>
28
#include <stdarg.h>
29
#include <stdio.h>
30 31 32
#ifdef HAVE_UNISTD_H
# include <unistd.h>
#endif
33 34 35 36

#include "windef.h"
#include "winbase.h"
#include "winerror.h"
37
#include "winternl.h"
38
#include "wownt32.h"
39 40
#include "wine/winbase16.h"

41
#include "wine/debug.h"
42
#include "wine/library.h"
43
#include "kernel_private.h"
44
#include "kernel16_private.h"
45

46
WINE_DEFAULT_DEBUG_CHANNEL(thunk);
47

48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119
/* Header that every thunk data block starts with.  _loadthunk() compares
 * the 16-bit and the 32-bit copy of this header against each other. */
struct ThunkDataCommon
{
    /* 4-character tag; ThunkConnect32() accepts "SL01" and "LS01" */
    char                   magic[4];         /* 00 */
    /* must be identical on the 16-bit and the 32-bit side */
    DWORD                  checksum;         /* 04 */
};

/* 16-bit side of an "LS01" thunk, as read by ThunkConnect32(). */
struct ThunkDataLS16
{
    struct ThunkDataCommon common;           /* 00 */
    /* segmented pointer to the target table; converted with MapSL() */
    SEGPTR                 targetTable;      /* 08 */
    /* not accessed by the code visible in this part of the file */
    DWORD                  firstTime;        /* 0C */
};

/* 32-bit side of an "LS01" thunk; filled in by ThunkConnect32(). */
struct ThunkDataLS32
{
    struct ThunkDataCommon common;           /* 00 */
    /* linear address of the 16-bit target table (MapSL of LS16->targetTable) */
    DWORD *                targetTable;      /* 08 */
    char                   lateBinding[4];   /* 0C */
    DWORD                  flags;            /* 10 */
    DWORD                  reserved1;        /* 14 */
    DWORD                  reserved2;        /* 18 */
    /* byte offset from the start of this block to the QT_Thunk stub */
    DWORD                  offsetQTThunk;    /* 1C */
    /* byte offset from the start of this block to the FT_Prolog stub */
    DWORD                  offsetFTProlog;   /* 20 */
};

/* 16-bit side of an "SL01" thunk, as read by ThunkConnect32(). */
struct ThunkDataSL16
{
    struct ThunkDataCommon common;            /* 00 */
    DWORD                  flags1;            /* 08 */
    DWORD                  reserved1;         /* 0C */
    /* shared ThunkDataSL; ThunkConnect32() fails while this is still NULL */
    struct ThunkDataSL *   fpData;            /* 10 */
    SEGPTR                 spData;            /* 14 */
    DWORD                  reserved2;         /* 18 */
    char                   lateBinding[4];    /* 1C */
    DWORD                  flags2;            /* 20 */
    DWORD                  reserved3;         /* 24 */
    SEGPTR                 apiDatabase;       /* 28 */
};

/* 32-bit side of an "SL01" thunk; filled in by ThunkConnect32(). */
struct ThunkDataSL32
{
    struct ThunkDataCommon common;            /* 00 */
    DWORD                  reserved1;         /* 08 */
    /* set to the fpData pointer taken from the 16-bit side */
    struct ThunkDataSL *   data;              /* 0C */
    char                   lateBinding[4];    /* 10 */
    DWORD                  flags;             /* 14 */
    DWORD                  reserved2;         /* 18 */
    DWORD                  reserved3;         /* 1C */
    /* byte offset added to locate the per-process target table */
    DWORD                  offsetTargetTable; /* 20 */
};

/* Bookkeeping shared between the 16-bit and the 32-bit half of an "SL01"
 * thunk.  ThunkConnect32() links one SLTargetDB entry per process into
 * targetDB.  The text inside the "#if 0" section is documentation only. */
struct ThunkDataSL
{
#if 0
    This structure differs from the Win95 original,
    but this should not matter since it is strictly internal to
    the thunk handling routines in KRNL386 / KERNEL32.

    For reference, here is the Win95 layout:

    struct ThunkDataCommon common;            /* 00 */
    DWORD                  flags1;            /* 08 */
    SEGPTR                 apiDatabase;       /* 0C */
    WORD                   exePtr;            /* 10 */
    WORD                   segMBA;            /* 12 */
    DWORD                  lenMBATotal;       /* 14 */
    DWORD                  lenMBAUsed;        /* 18 */
    DWORD                  flags2;            /* 1C */
    char                   pszDll16[256];     /* 20 */
    char                   pszDll32[256];     /*120 */

    We do it differently since all our thunk handling is done
    by 32-bit code. Therefore we do not need to provide
    easy access to this data, especially the process target
    table database, for 16-bit code.
#endif

    struct ThunkDataCommon common;
    DWORD                  flags1;
    struct SLApiDB *       apiDB;
    struct SLTargetDB *    targetDB;    /* head of the per-process list */
    DWORD                  flags2;
    char                   pszDll16[256];
    char                   pszDll32[256];
};

/* One node of the singly linked list hanging off ThunkDataSL.targetDB;
 * ThunkConnect32() allocates one on DLL_PROCESS_ATTACH of an SL thunk. */
struct SLTargetDB
{
     struct SLTargetDB *   next;        /* previous list head, or NULL */
     DWORD                 process;     /* GetCurrentProcessId() of the owner */
     DWORD *               targetTable; /* target table used by that process */
};

/* Element type of ThunkDataSL.apiDB.
 * NOTE(review): judging by the field names this is one record per thunked
 * API (argument byte count and the value returned on failure); the code
 * that fills and reads it is not in this part of the file - confirm. */
struct SLApiDB
{
    DWORD                  nrArgBytes;
    DWORD                  errorReturnValue;
};

147 148 149
/* Segmented pointers, initialised to 0 and not assigned anywhere in the
 * code visible here.
 * NOTE(review): judging by the names these are the return addresses used
 * by the CBClient / CBClientEx callback thunks - confirm against the code
 * that sets them. */
SEGPTR CALL32_CBClient_RetAddr = 0;
SEGPTR CALL32_CBClientEx_RetAddr = 0;

150 151 152 153 154
/* On i386 the symbol is provided outside this file; every other
 * architecture gets an empty stand-in so that references to it still
 * compile and link.  Declared with real prototypes: an empty parameter
 * list "()" leaves the arguments unspecified in C. */
#ifdef __i386__
extern void __wine_call_from_16_thunk(void);
#else
static void __wine_call_from_16_thunk(void) { }
#endif
155

156 157 158 159 160 161 162 163 164 165 166 167 168 169 170
/* Push one DWORD: lower ESP in the context by 4 bytes, then store the
 * value at the new top of the 32-bit stack. */
static inline void stack32_push( CONTEXT86 *context, DWORD val )
{
    DWORD new_top = context->Esp - sizeof(DWORD);

    context->Esp = new_top;
    *(DWORD *)new_top = val;
}

/* Pop one DWORD: read the value at the top of the 32-bit stack, then
 * raise ESP in the context by 4 bytes. */
static inline DWORD stack32_pop( CONTEXT86 *context )
{
    DWORD *top = (DWORD *)context->Esp;
    DWORD value = *top;

    context->Esp += sizeof(DWORD);
    return value;
}

171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186
/***********************************************************************
 *                                                                     *
 *                 Win95 internal thunks                               *
 *                                                                     *
 ***********************************************************************/

/***********************************************************************
 *           LogApiThk    (KERNEL.423)
 *
 * Writes the string passed in 'func' to the "thunk" debug channel and
 * does nothing else.
 *
 * PARAMS
 *  func [in] string to log; passed through debugstr_a() before printing
 */
void WINAPI LogApiThk( LPSTR func )
{
    TRACE( "%s\n", debugstr_a(func) );
}

/***********************************************************************
 *           LogApiThkLSF    (KERNEL32.42)
187
 *
188 189
 * NOTE: needs to preserve all registers!
 */
190
void WINAPI __regs_LogApiThkLSF( LPSTR func, CONTEXT86 *context )
191 192 193
{
    TRACE( "%s\n", debugstr_a(func) );
}
194
#ifdef DEFINE_REGS_ENTRYPOINT
195
DEFINE_REGS_ENTRYPOINT( LogApiThkLSF, 4, 4 )
196
#endif
197 198 199

/***********************************************************************
 *           LogApiThkSL    (KERNEL32.44)
200
 *
201 202
 * NOTE: needs to preserve all registers!
 */
203
void WINAPI __regs_LogApiThkSL( LPSTR func, CONTEXT86 *context )
204 205 206
{
    TRACE( "%s\n", debugstr_a(func) );
}
207
#ifdef DEFINE_REGS_ENTRYPOINT
208
DEFINE_REGS_ENTRYPOINT( LogApiThkSL, 4, 4 )
209
#endif
210 211 212

/***********************************************************************
 *           LogCBThkSL    (KERNEL32.47)
213
 *
214 215
 * NOTE: needs to preserve all registers!
 */
216
void WINAPI __regs_LogCBThkSL( LPSTR func, CONTEXT86 *context )
217 218 219
{
    TRACE( "%s\n", debugstr_a(func) );
}
220
#ifdef DEFINE_REGS_ENTRYPOINT
221
DEFINE_REGS_ENTRYPOINT( LogCBThkSL, 4, 4 )
222
#endif
223 224 225

/***********************************************************************
 *	_write_ftprolog					(internal)
 * Generates a FT_Prolog call.
 *
 *  0FB6D1                  movzbl edx,cl
 *  8B1495xxxxxxxx          mov edx,[4*edx + targetTable]
 *  68xxxxxxxx              push FT_Prolog
 *  C3                      ret	(near return, i.e. a jump to FT_Prolog)
 *
 * Writes 16 bytes starting at relayCode; bytes after that are left
 * untouched.
 */
static void _write_ftprolog(LPBYTE relayCode ,DWORD *targetTable) {
	LPBYTE	x = relayCode;

	/* movzbl edx,cl */
	*x++ = 0x0f;
	*x++ = 0xb6;
	*x++ = 0xd1;

	/* mov edx, [4*edx + targetTable] */
	*x++ = 0x8B;
	*x++ = 0x14;
	*x++ = 0x95;
	*(DWORD **)x = targetTable;
	x += 4;

	/* push FT_Prolog */
	*x++ = 0x68;
	*(DWORD *)x = (DWORD)GetProcAddress(kernel32_handle,"FT_Prolog");
	x += 4;

	/* ret */
	*x++ = 0xC3;
	/* fill rest with 0xCC / int 3 */
}

/***********************************************************************
 *	_write_qtthunk					(internal)
 * Generates a QT_Thunk style call.
 *
 *  33C9                    xor ecx, ecx
 *  8A4DFC                  mov cl , [ebp-04]
 *  8B148Dxxxxxxxx          mov edx, [4*ecx + targetTable]
 *  B8yyyyyyyy              mov eax, QT_Thunk
 *  FFE0                    jmp eax
 *
 * Writes 19 bytes starting at relayCode; bytes after that are left
 * untouched.
 */
static void _write_qtthunk(
	LPBYTE relayCode,	/* [in] start of QT_Thunk stub */
	DWORD *targetTable	/* [in] start of thunk (for index lookup) */
) {
	LPBYTE	x = relayCode;

	/* xor ecx,ecx */
	*x++ = 0x33;
	*x++ = 0xC9;

	/* movb cl,[ebp-04] */
	*x++ = 0x8A;
	*x++ = 0x4D;
	*x++ = 0xFC;

	/* mov edx, [4*ecx + targetTable] */
	*x++ = 0x8B;
	*x++ = 0x14;
	*x++ = 0x8D;
	*(DWORD **)x = targetTable;
	x += 4;

	/* mov eax, QT_Thunk */
	*x++ = 0xB8;
	*(DWORD *)x = (DWORD)GetProcAddress(kernel32_handle,"QT_Thunk");
	x += 4;

	/* jmp eax */
	*x++ = 0xFF;
	*x++ = 0xE0;
	/* should fill the rest of the 32 bytes with 0xCC */
}

/***********************************************************************
 *           _loadthunk
 */
275
static LPVOID _loadthunk(LPCSTR module, LPCSTR func, LPCSTR module32,
276 277 278
                         struct ThunkDataCommon *TD32, DWORD checksum)
{
    struct ThunkDataCommon *TD16;
279
    HMODULE16 hmod;
280 281
    int ordinal;

282
    if ((hmod = LoadLibrary16(module)) <= 32)
283 284 285 286 287 288 289
    {
        ERR("(%s, %s, %s): Unable to load '%s', error %d\n",
                   module, func, module32, module, hmod);
        return 0;
    }

    if (   !(ordinal = NE_GetOrdinal(hmod, func))
290
        || !(TD16 = MapSL((SEGPTR)NE_GetEntryPointEx(hmod, ordinal, FALSE))))
291 292 293 294 295 296 297 298 299
    {
        ERR("Unable to find thunk data '%s' in %s, required by %s (conflicting/incorrect DLL versions !?).\n",
                   func, module, module32);
        return 0;
    }

    if (TD32 && memcmp(TD16->magic, TD32->magic, 4))
    {
        ERR("(%s, %s, %s): Bad magic %c%c%c%c (should be %c%c%c%c)\n",
300
                   module, func, module32,
301 302 303 304 305 306 307
                   TD16->magic[0], TD16->magic[1], TD16->magic[2], TD16->magic[3],
                   TD32->magic[0], TD32->magic[1], TD32->magic[2], TD32->magic[3]);
        return 0;
    }

    if (TD32 && TD16->checksum != TD32->checksum)
    {
308
        ERR("(%s, %s, %s): Wrong checksum %08x (should be %08x)\n",
309 310 311 312 313 314
                   module, func, module32, TD16->checksum, TD32->checksum);
        return 0;
    }

    if (!TD32 && checksum && checksum != *(LPDWORD)TD16)
    {
315
        ERR("(%s, %s, %s): Wrong checksum %08x (should be %08x)\n",
316 317 318 319 320 321 322 323 324 325
                   module, func, module32, *(LPDWORD)TD16, checksum);
        return 0;
    }

    return TD16;
}

/***********************************************************************
 *           GetThunkStuff    (KERNEL32.53)
 */
326
LPVOID WINAPI GetThunkStuff(LPCSTR module, LPCSTR func)
327 328 329 330 331 332 333 334 335 336 337 338 339 340
{
    return _loadthunk(module, func, "<kernel>", NULL, 0L);
}

/***********************************************************************
 *           GetThunkBuff    (KERNEL32.52)
 *
 * Convenience wrapper around GetThunkStuff() that returns a pointer to
 * the "ThkBuf" export of the 16bit library SYSTHUNK.DLL.
 */
LPVOID WINAPI GetThunkBuff(void)
{
    LPVOID thkbuf = GetThunkStuff("SYSTHUNK.DLL", "ThkBuf");

    return thkbuf;
}

/***********************************************************************
341
 *		ThunkConnect32		(KERNEL32.@)
342 343
 * Connects a 32bit and a 16bit thunkbuffer.
 */
344
UINT WINAPI ThunkConnect32(
345 346 347 348 349 350 351 352 353 354 355 356 357
	struct ThunkDataCommon *TD,  /* [in/out] thunkbuffer */
	LPSTR thunkfun16,            /* [in] win16 thunkfunction */
	LPSTR module16,              /* [in] name of win16 dll */
	LPSTR module32,              /* [in] name of win32 dll */
	HMODULE hmod32,            /* [in] hmodule of win32 dll */
	DWORD dwReason               /* [in] initialisation argument */
) {
    BOOL directionSL;

    if (!strncmp(TD->magic, "SL01", 4))
    {
        directionSL = TRUE;

358
        TRACE("SL01 thunk %s (%p) <- %s (%s), Reason: %d\n",
359
              module32, TD, module16, thunkfun16, dwReason);
360 361 362 363 364
    }
    else if (!strncmp(TD->magic, "LS01", 4))
    {
        directionSL = FALSE;

365
        TRACE("LS01 thunk %s (%p) -> %s (%s), Reason: %d\n",
366
              module32, TD, module16, thunkfun16, dwReason);
367 368 369
    }
    else
    {
370
        ERR("Invalid magic %c%c%c%c\n",
371 372 373
                   TD->magic[0], TD->magic[1], TD->magic[2], TD->magic[3]);
        return 0;
    }
374

375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403
    switch (dwReason)
    {
        case DLL_PROCESS_ATTACH:
        {
            struct ThunkDataCommon *TD16;
            if (!(TD16 = _loadthunk(module16, thunkfun16, module32, TD, 0L)))
                return 0;

            if (directionSL)
            {
                struct ThunkDataSL32 *SL32 = (struct ThunkDataSL32 *)TD;
                struct ThunkDataSL16 *SL16 = (struct ThunkDataSL16 *)TD16;
                struct SLTargetDB *tdb;

                if (SL16->fpData == NULL)
                {
                    ERR("ThunkConnect16 was not called!\n");
                    return 0;
                }

                SL32->data = SL16->fpData;

                tdb = HeapAlloc(GetProcessHeap(), 0, sizeof(*tdb));
                tdb->process = GetCurrentProcessId();
                tdb->targetTable = (DWORD *)(thunkfun16 + SL32->offsetTargetTable);

                tdb->next = SL32->data->targetDB;   /* FIXME: not thread-safe! */
                SL32->data->targetDB = tdb;

404
                TRACE("Process %08x allocated TargetDB entry for ThunkDataSL %p\n",
405
                      GetCurrentProcessId(), SL32->data);
406 407 408 409 410 411
            }
            else
            {
                struct ThunkDataLS32 *LS32 = (struct ThunkDataLS32 *)TD;
                struct ThunkDataLS16 *LS16 = (struct ThunkDataLS16 *)TD16;

412
                LS32->targetTable = MapSL(LS16->targetTable);
413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429

                /* write QT_Thunk and FT_Prolog stubs */
                _write_qtthunk ((LPBYTE)TD + LS32->offsetQTThunk,  LS32->targetTable);
                _write_ftprolog((LPBYTE)TD + LS32->offsetFTProlog, LS32->targetTable);
            }
            break;
        }

        case DLL_PROCESS_DETACH:
            /* FIXME: cleanup */
            break;
    }

    return 1;
}

/**********************************************************************
430
 * 		QT_Thunk			(KERNEL32.@)
431 432
 *
 * The target address is in EDX.
433
 * The 16bit arguments start at ESP.
434
 * The number of 16bit argument bytes is EBP-ESP-0x40 (64 Byte thunksetup).
435 436 437 438 439 440 441 442 443
 * So the stack layout is 16bit argument bytes and then the 64 byte
 * scratch buffer.
 * The scratch buffer is used as work space by Windows' QT_Thunk
 * function.
 * As the programs unfortunately don't always provide a fixed size
 * scratch buffer (danger, stack corruption ahead !!), we simply resort
 * to copying over the whole EBP-ESP range to the 16bit stack
 * (as there's no way to safely figure out the param count
 * due to this misbehaviour of some programs).
444
 * [ok]
445 446 447 448 449 450
 *
 * See DDJ article 9614c for a very good description of QT_Thunk (also
 * available online !).
 *
 * FIXME: DDJ talks of certain register usage rules; I'm not sure
 * whether we cover this 100%.
451
 */
452
void WINAPI __regs_QT_Thunk( CONTEXT86 *context )
453 454 455 456 457 458
{
    CONTEXT86 context16;
    DWORD argsize;

    memcpy(&context16,context,sizeof(context16));

459 460
    context16.SegFs = wine_get_fs();
    context16.SegGs = wine_get_gs();
461 462
    context16.SegCs = HIWORD(context->Edx);
    context16.Eip   = LOWORD(context->Edx);
463 464
    /* point EBP to the STACK16FRAME on the stack
     * for the call_to_16 to set up the register content on calling */
465
    context16.Ebp   = OFFSETOF(NtCurrentTeb()->WOW32Reserved) + FIELD_OFFSET(STACK16FRAME,bp);
466

467 468 469 470 471 472 473 474 475 476
    /*
     * used to be (problematic):
     * argsize = context->Ebp - context->Esp - 0x40;
     * due to some programs abusing the API, we better assume the full
     * EBP - ESP range for copying instead: */
    argsize = context->Ebp - context->Esp;

    /* ok, too much is insane; let's limit param count a bit again */
    if (argsize > 64)
	argsize = 64; /* 32 WORDs */
477

478
    WOWCallback16Ex( 0, WCB16_REGS, argsize, (void *)context->Esp, (DWORD *)&context16 );
479 480 481
    context->Eax = context16.Eax;
    context->Edx = context16.Edx;
    context->Ecx = context16.Ecx;
482

483 484 485
    /* make sure to update the Win32 ESP, too, in order to throw away
     * the number of parameters that the Win16 function
     * accepted (that it popped from the corresponding Win16 stack) */
486
    context->Esp +=   LOWORD(context16.Esp) -
487
                        ( OFFSETOF(NtCurrentTeb()->WOW32Reserved) - argsize );
488
}
489
#ifdef DEFINE_REGS_ENTRYPOINT
490
DEFINE_REGS_ENTRYPOINT( QT_Thunk, 0, 0 )
491
#endif
492 493 494


/**********************************************************************
495
 * 		FT_Prolog			(KERNEL32.@)
496
 *
497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512
 * The set of FT_... thunk routines is used instead of QT_Thunk,
 * if structures have to be converted from 32-bit to 16-bit
 * (change of member alignment, conversion of members).
 *
 * The thunk function (as created by the thunk compiler) calls
 * FT_Prolog at the beginning, to set up a stack frame and
 * allocate a 64 byte buffer on the stack.
 * The input parameters (target address and some flags) are
 * saved for later use by FT_Thunk.
 *
 * Input:  EDX  16-bit target address (SEGPTR)
 *         CX   bits  0..7   target number (in target table)
 *              bits  8..9   some flags (unclear???)
 *              bits 10..15  number of DWORD arguments
 *
 * Output: A new stackframe is created, and a 64 byte buffer
513
 *         allocated on the stack. The layout of the stack
514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534
 *         on return is as follows:
 *
 *  (ebp+4)  return address to caller of thunk function
 *  (ebp)    old EBP
 *  (ebp-4)  saved EBX register of caller
 *  (ebp-8)  saved ESI register of caller
 *  (ebp-12) saved EDI register of caller
 *  (ebp-16) saved ECX register, containing flags
 *  (ebp-20) bitmap containing parameters that are to be converted
 *           by FT_Thunk; it is initialized to 0 by FT_Prolog and
 *           filled in by the thunk code before calling FT_Thunk
 *  (ebp-24)
 *    ...    (unclear)
 *  (ebp-44)
 *  (ebp-48) saved EAX register of caller (unclear, never restored???)
 *  (ebp-52) saved EDX register, containing 16-bit thunk target
 *  (ebp-56)
 *    ...    (unclear)
 *  (ebp-64)
 *
 *  ESP is EBP-64 after return.
535
 *
536
 */
537
void WINAPI __regs_FT_Prolog( CONTEXT86 *context )
538 539
{
    /* Build stack frame */
540 541
    stack32_push(context, context->Ebp);
    context->Ebp = context->Esp;
542 543

    /* Allocate 64-byte Thunk Buffer */
544 545
    context->Esp -= 64;
    memset((char *)context->Esp, '\0', 64);
546 547 548

    /* Store Flags (ECX) and Target Address (EDX) */
    /* Save other registers to be restored later */
549 550 551 552
    *(DWORD *)(context->Ebp -  4) = context->Ebx;
    *(DWORD *)(context->Ebp -  8) = context->Esi;
    *(DWORD *)(context->Ebp - 12) = context->Edi;
    *(DWORD *)(context->Ebp - 16) = context->Ecx;
553

554 555
    *(DWORD *)(context->Ebp - 48) = context->Eax;
    *(DWORD *)(context->Ebp - 52) = context->Edx;
556
}
557
#ifdef DEFINE_REGS_ENTRYPOINT
558
DEFINE_REGS_ENTRYPOINT( FT_Prolog, 0, 0 )
559
#endif
560 561

/**********************************************************************
562
 * 		FT_Thunk			(KERNEL32.@)
563
 *
564
 * This routine performs the actual call to 16-bit code,
565 566 567 568 569 570 571 572
 * similar to QT_Thunk. The differences are:
 *  - The call target is taken from the buffer created by FT_Prolog
 *  - Those arguments requested by the thunk code (by setting the
 *    corresponding bit in the bitmap at EBP-20) are converted
 *    from 32-bit pointers to segmented pointers (those pointers
 *    are guaranteed to point to structures copied to the stack
 *    by the thunk code, so we always use the 16-bit stack selector
 *    for those addresses).
573
 *
574 575
 *    The bit #i of EBP-20 corresponds here to the DWORD starting at
 *    ESP+4 + 2*i.
576 577
 *
 * FIXME: It is unclear what happens if there are more than 32 WORDs
578 579 580
 *        of arguments, so that the single DWORD bitmap is no longer
 *        sufficient ...
 */
581
void WINAPI __regs_FT_Thunk( CONTEXT86 *context )
582
{
583 584
    DWORD mapESPrelative = *(DWORD *)(context->Ebp - 20);
    DWORD callTarget     = *(DWORD *)(context->Ebp - 52);
585 586 587

    CONTEXT86 context16;
    DWORD i, argsize;
588 589
    DWORD newstack[32];
    LPBYTE oldstack;
590 591 592

    memcpy(&context16,context,sizeof(context16));

593 594
    context16.SegFs = wine_get_fs();
    context16.SegGs = wine_get_gs();
595 596
    context16.SegCs = HIWORD(callTarget);
    context16.Eip   = LOWORD(callTarget);
597
    context16.Ebp   = OFFSETOF(NtCurrentTeb()->WOW32Reserved) + FIELD_OFFSET(STACK16FRAME,bp);
598

599
    argsize  = context->Ebp-context->Esp-0x40;
600
    if (argsize > sizeof(newstack)) argsize = sizeof(newstack);
601
    oldstack = (LPBYTE)context->Esp;
602 603 604 605 606 607

    memcpy( newstack, oldstack, argsize );

    for (i = 0; i < 32; i++)	/* NOTE: What about > 32 arguments? */
	if (mapESPrelative & (1 << i))
	{
608
	    SEGPTR *arg = (SEGPTR *)newstack[i];
609 610
	    *arg = MAKESEGPTR(SELECTOROF(NtCurrentTeb()->WOW32Reserved),
                              OFFSETOF(NtCurrentTeb()->WOW32Reserved) - argsize
611
                              + (*(LPBYTE *)arg - oldstack));
612 613
	}

614
    WOWCallback16Ex( 0, WCB16_REGS, argsize, newstack, (DWORD *)&context16 );
615 616 617
    context->Eax = context16.Eax;
    context->Edx = context16.Edx;
    context->Ecx = context16.Ecx;
618

619
    context->Esp +=   LOWORD(context16.Esp) -
620
                        ( OFFSETOF(NtCurrentTeb()->WOW32Reserved) - argsize );
621 622 623 624

    /* Copy modified buffers back to 32-bit stack */
    memcpy( oldstack, newstack, argsize );
}
625
#ifdef DEFINE_REGS_ENTRYPOINT
626
DEFINE_REGS_ENTRYPOINT( FT_Thunk, 0, 0 )
627
#endif
628

629 630
#ifdef __i386__

/***********************************************************************
 *		FT_Exit0 (KERNEL32.@)
 *		FT_Exit4 (KERNEL32.@)
 *		FT_Exit8 (KERNEL32.@)
 *		FT_Exit12 (KERNEL32.@)
 *		FT_Exit16 (KERNEL32.@)
 *		FT_Exit20 (KERNEL32.@)
 *		FT_Exit24 (KERNEL32.@)
 *		FT_Exit28 (KERNEL32.@)
 *		FT_Exit32 (KERNEL32.@)
 *		FT_Exit36 (KERNEL32.@)
 *		FT_Exit40 (KERNEL32.@)
 *		FT_Exit44 (KERNEL32.@)
 *		FT_Exit48 (KERNEL32.@)
 *		FT_Exit52 (KERNEL32.@)
 *		FT_Exit56 (KERNEL32.@)
 *
 * One of the FT_ExitNN functions is called at the end of the thunk code.
 * It removes the stack frame created by FT_Prolog, moves the function
 * return from EBX to EAX (yes, FT_Thunk did use EAX for the return
 * value, but the thunk code has moved it from EAX to EBX in the
 * meantime ... :-), restores the caller's EBX, ESI, and EDI registers,
 * and performs a return to the CALLER of the thunk code (while removing
 * the given number of arguments from the caller's stack).
 */

/* Common tail: return value to EAX, reload the registers FT_Prolog saved
 * at ebp-4 / ebp-8 / ebp-12, then tear down the frame. */
#define FT_EXIT_RESTORE_REGS \
    "movl %ebx,%eax\n\t" \
    "movl -4(%ebp),%ebx\n\t" \
    "movl -8(%ebp),%esi\n\t" \
    "movl -12(%ebp),%edi\n\t" \
    "leave\n\t"

/* FT_Exit<n>: common tail followed by "ret $n" to pop n argument bytes */
#define DEFINE_FT_Exit(n) \
    __ASM_GLOBAL_FUNC( FT_Exit ## n, FT_EXIT_RESTORE_REGS "ret $" #n )

DEFINE_FT_Exit(0)
DEFINE_FT_Exit(4)
DEFINE_FT_Exit(8)
DEFINE_FT_Exit(12)
DEFINE_FT_Exit(16)
DEFINE_FT_Exit(20)
DEFINE_FT_Exit(24)
DEFINE_FT_Exit(28)
DEFINE_FT_Exit(32)
DEFINE_FT_Exit(36)
DEFINE_FT_Exit(40)
DEFINE_FT_Exit(44)
DEFINE_FT_Exit(48)
DEFINE_FT_Exit(52)
DEFINE_FT_Exit(56)

#endif /* __i386__ */
683 684 685 686


/***********************************************************************
 * 		ThunkInitLS 	(KERNEL32.43)
 * A thunkbuffer link routine
 * The thunkbuf looks like:
 *
 *	00: DWORD	length		? don't know exactly
 *	04: SEGPTR	ptr		? where does it point to?
 * The pointer ptr is written into the first DWORD of 'thunk'.
 * (probably correctly implemented)
 * [ok probably]
 * RETURNS
 *	segmented pointer to thunk?
 *	0 if the thunk buffer could not be loaded (a non-zero 'len' must
 *	match its first DWORD) or if its ptr field is 0; 'thunk' is left
 *	untouched in that case.
 */
DWORD WINAPI ThunkInitLS(
	LPDWORD thunk,	/* [in] win32 thunk */
	LPCSTR thkbuf,	/* [in] thkbuffer name in win16 dll */
	DWORD len,	/* [in] thkbuffer length */
	LPCSTR dll16,	/* [in] name of win16 dll */
	LPCSTR dll32	/* [in] name of win32 dll (FIXME: not used?) */
) {
	LPDWORD		addr;

	if (!(addr = _loadthunk( dll16, thkbuf, dll32, NULL, len )))
		return 0;

	/* addr[1] is the SEGPTR at offset 04 of the thunk buffer */
	if (!addr[1])
		return 0;
	*thunk = addr[1];

	return addr[1];
}

/***********************************************************************
 * 		Common32ThkLS 	(KERNEL32.45)
719
 *
720
 * This is another 32->16 thunk, independent of the QT_Thunk/FT_Thunk
721
 * style thunks. The basic difference is that the parameter conversion
722 723 724 725
 * is done completely on the *16-bit* side here. Thus we do not call
 * the 16-bit target directly, but call a common entry point instead.
 * This entry function then calls the target according to the target
 * number passed in the DI register.
726
 *
727 728 729 730 731 732 733 734 735 736 737 738
 * Input:  EAX    SEGPTR to the common 16-bit entry point
 *         CX     offset in thunk table (target number * 4)
 *         DX     error return value if execution fails (unclear???)
 *         EDX.HI number of DWORD parameters
 *
 * (Note that we need to move the thunk table offset from CX to DI !)
 *
 * The called 16-bit stub expects its stack to look like this:
 *     ...
 *   (esp+40)  32-bit arguments
 *     ...
 *   (esp+8)   32 byte of stack space available as buffer
739 740
 *   (esp)     8 byte return address for use with 0x66 lret
 *
741 742
 * The called 16-bit stub uses a 0x66 lret to return to 32-bit code,
 * and uses the EAX register to return a DWORD return value.
743
 * Thus we need to use a special assembly glue routine
744 745
 * (CallRegisterLongProc instead of CallRegisterShortProc).
 *
746
 * Finally, we return to the caller, popping the arguments off
747 748
 * the stack.  The number of arguments to be popped is returned
 * in the BL register by the called 16-bit routine.
749 750
 *
 */
751
void WINAPI __regs_Common32ThkLS( CONTEXT86 *context )
752 753 754 755 756 757
{
    CONTEXT86 context16;
    DWORD argsize;

    memcpy(&context16,context,sizeof(context16));

758 759
    context16.SegFs = wine_get_fs();
    context16.SegGs = wine_get_gs();
760 761 762
    context16.Edi   = LOWORD(context->Ecx);
    context16.SegCs = HIWORD(context->Eax);
    context16.Eip   = LOWORD(context->Eax);
763
    context16.Ebp   = OFFSETOF(NtCurrentTeb()->WOW32Reserved) + FIELD_OFFSET(STACK16FRAME,bp);
764

765
    argsize = HIWORD(context->Edx) * 4;
766 767

    /* FIXME: hack for stupid USER32 CallbackGlueLS routine */
768
    if (context->Edx == context->Eip)
769 770
        argsize = 6 * 4;

771 772 773 774 775
    /* Note: the first 32 bytes we copy are just garbage from the 32-bit stack, in order to reserve
     *       the space. It is safe to do that since the register function prefix has reserved
     *       a lot more space than that below context->Esp.
     */
    WOWCallback16Ex( 0, WCB16_REGS, argsize + 32, (LPBYTE)context->Esp - 32, (DWORD *)&context16 );
776
    context->Eax = context16.Eax;
777 778

    /* Clean up caller's stack frame */
779
    context->Esp += LOBYTE(context16.Ebx);
780
}
781
#ifdef DEFINE_REGS_ENTRYPOINT
782
DEFINE_REGS_ENTRYPOINT( Common32ThkLS, 0, 0 )
783
#endif
784 785 786 787 788 789 790

/***********************************************************************
 *		OT_32ThkLSF	(KERNEL32.40)
 *
 * YET Another 32->16 thunk. The difference to Common32ThkLS is that
 * argument processing is done on both the 32-bit and the 16-bit side:
 * The 32-bit side prepares arguments, copying them onto the stack.
791 792
 *
 * When this routine is called, the first word on the stack is the
793 794 795
 * number of argument bytes prepared by the 32-bit code, and EDX
 * contains the 16-bit target address.
 *
796
 * The called 16-bit routine is another relaycode, doing further
797 798 799 800 801 802 803
 * argument processing and then calling the real 16-bit target
 * whose address is stored at [bp-04].
 *
 * The call proceeds using a normal CallRegisterShortProc.
 * After return from the 16-bit relaycode, the arguments need
 * to be copied *back* to the 32-bit stack, since the 32-bit
 * relaycode processes output parameters.
804
 *
805 806 807 808 809 810 811
 * Note that we copy twice the number of arguments, since some of the
 * 16-bit relaycodes in SYSTHUNK.DLL directly access the original
 * arguments of the caller!
 *
 * (Note that this function seems only to be used for
 *  OLECLI32 -> OLECLI and OLESVR32 -> OLESVR thunking.)
 */
812
void WINAPI __regs_OT_32ThkLSF( CONTEXT86 *context )
{
    CONTEXT86 context16;
    DWORD argsize;

    /* Start the 16-bit context as a copy of the 32-bit caller's registers */
    memcpy(&context16,context,sizeof(context16));

    context16.SegFs = wine_get_fs();
    context16.SegGs = wine_get_gs();
    /* EDX holds the 16-bit target as selector:offset */
    context16.SegCs = HIWORD(context->Edx);
    context16.Eip   = LOWORD(context->Edx);
    context16.Ebp   = OFFSETOF(NtCurrentTeb()->WOW32Reserved) + FIELD_OFFSET(STACK16FRAME,bp);

    /* Twice the byte count found in the first stack word, plus 2
       (presumably for the count word itself -- TODO confirm) */
    argsize = 2 * *(WORD *)context->Esp + 2;

    WOWCallback16Ex( 0, WCB16_REGS, argsize, (void *)context->Esp, (DWORD *)&context16 );
    context->Eax = context16.Eax;
    context->Edx = context16.Edx;

    /* Copy modified buffers back to 32-bit stack */
    memcpy( (LPBYTE)context->Esp,
            (LPBYTE)CURRENT_STACK16 - argsize, argsize );

    /* Advance ESP by however far the 16-bit SP ended up above the
       start of the argument area that was copied to the 16-bit stack */
    context->Esp +=   LOWORD(context16.Esp) -
                        ( OFFSETOF(NtCurrentTeb()->WOW32Reserved) - argsize );
}
#ifdef DEFINE_REGS_ENTRYPOINT
DEFINE_REGS_ENTRYPOINT( OT_32ThkLSF, 0, 0 )
#endif

/***********************************************************************
 *		ThunkInitLSF		(KERNEL32.41)
 * A thunk setup routine.
 * Expects a pointer to a preinitialized thunkbuffer in the first argument
 * looking like:
 *|	00..03:		unknown	(pointer, check _41, _43, _46)
 *|	04: EB1E		jmp +0x20
 *|
 *|	06..23:		unknown (space for replacement code, check .90)
 *|
 *|	24:>E800000000		call offset 29
 *|	29:>58			pop eax		   ( target of call )
 *|	2A: 2D25000000		sub eax,0x00000025 ( now points to offset 4 )
 *|	2F: BAxxxxxxxx		mov edx,xxxxxxxx
 *|	34: 68yyyyyyyy		push KERNEL32.90
 *|	39: C3			ret
 *|
 *|	3A: EB1E		jmp +0x20
 *|	3E ... 59:	unknown (space for replacement code?)
 *|	5A: E8xxxxxxxx		call <32bitoffset xxxxxxxx>
 *|	5F: 5A			pop edx
 *|	60: 81EA25xxxxxx	sub edx, 0x25xxxxxx
 *|	66: 52			push edx
 *|	67: 68xxxxxxxx		push xxxxxxxx
 *|	6C: 68yyyyyyyy		push KERNEL32.89
 *|	71: C3			ret
 *|	72: end?
 * This function is meant to check that the code is there (not yet
 * implemented) and replaces the yyyyyyyy entries by the function pointers.
 * The thunkbuf looks like:
 *
 *|	00: DWORD	length		? don't know exactly
 *|	04: SEGPTR	ptr		? where does it point to?
 * The segmented pointer ptr is written into the first DWORD of 'thunk'.
 * [ok probably]
 * RETURNS
 *	unclear, pointer to win16 thkbuffer?
 */
LPVOID WINAPI ThunkInitLSF(
	LPBYTE thunk,	/* [in] win32 thunk */
	LPCSTR thkbuf,	/* [in] thkbuffer name in win16 dll */
	DWORD len,	/* [in] length of thkbuffer */
	LPCSTR dll16,	/* [in] name of win16 dll */
	LPCSTR dll32	/* [in] name of win32 dll */
) {
	LPDWORD		addr,addr2;

	/* FIXME: add checks for valid code ... */
	/* write pointers to kernel32.89 and kernel32.90 (+ordinal base of 1) */
	/* 0x35 and 0x6D are the operand bytes of the two 'push yyyyyyyy'
	 * instructions at offsets 0x34 and 0x6C of the thunk buffer */
	*(DWORD*)(thunk+0x35) = (DWORD)GetProcAddress(kernel32_handle,(LPSTR)90);
	*(DWORD*)(thunk+0x6D) = (DWORD)GetProcAddress(kernel32_handle,(LPSTR)89);

	if (!(addr = _loadthunk( dll16, thkbuf, dll32, NULL, len )))
		return 0;

	/* second DWORD of the 16-bit thunk buffer is a SEGPTR; map it to linear */
	addr2 = MapSL(addr[1]);
	/* only store it into the thunk when the high word is non-zero */
	if (HIWORD(addr2))
		*(DWORD*)thunk = (DWORD)addr2;

	return addr2;
}

/***********************************************************************
 *		FT_PrologPrime			(KERNEL32.89)
 *
 * This function is called from the relay code installed by
 * ThunkInitLSF. It replaces the location from where it was
 * called by a standard FT_Prolog call stub (which is 'primed'
 * by inserting the correct target table pointer).
 * Finally, it calls that stub.
 *
 * Input:  ECX    target number + flags (passed through to FT_Prolog)
 *        (ESP)   offset of location where target table pointer
 *                is stored, relative to the start of the relay code
 *        (ESP+4) pointer to start of relay code
 *                (this is where the FT_Prolog call stub gets written to)
 *
 * Note: The two DWORD arguments get popped off the stack.
 *
 */
void WINAPI __regs_FT_PrologPrime( CONTEXT86 *context )
{
    DWORD  targetTableOffset;
    LPBYTE relayCode;

    /* Compensate for the fact that the Wine register relay code thought
       we were being called, although we were in fact jumped to */
    context->Esp -= 4;

    /* Write FT_Prolog call stub */
    /* The two stack arguments are popped in order: offset first, then
       the relay code address; the target table pointer is read from
       relayCode + offset */
    targetTableOffset = stack32_pop(context);
    relayCode = (LPBYTE)stack32_pop(context);
    _write_ftprolog( relayCode, *(DWORD **)(relayCode+targetTableOffset) );

    /* Jump to the call stub just created */
    context->Eip = (DWORD)relayCode;
}
#ifdef DEFINE_REGS_ENTRYPOINT
DEFINE_REGS_ENTRYPOINT( FT_PrologPrime, 0, 0 )
#endif

/***********************************************************************
 *		QT_ThunkPrime			(KERNEL32.90)
 *
 * This function corresponds to FT_PrologPrime, but installs a
 * call stub for QT_Thunk instead.
 *
 * Input: (EBP-4) target number (passed through to QT_Thunk)
 *         EDX    target table pointer location offset
 *         EAX    start of relay code
 *
 */
void WINAPI __regs_QT_ThunkPrime( CONTEXT86 *context )
{
    DWORD  targetTableOffset;
    LPBYTE relayCode;

    /* Compensate for the fact that the Wine register relay code thought
       we were being called, although we were in fact jumped to */
    context->Esp -= 4;

    /* Write QT_Thunk call stub */
    /* Unlike FT_PrologPrime, the inputs arrive in registers:
       EDX = offset of the target table pointer, EAX = relay code start */
    targetTableOffset = context->Edx;
    relayCode = (LPBYTE)context->Eax;
    _write_qtthunk( relayCode, *(DWORD **)(relayCode+targetTableOffset) );

    /* Jump to the call stub just created */
    context->Eip = (DWORD)relayCode;
}
#ifdef DEFINE_REGS_ENTRYPOINT
DEFINE_REGS_ENTRYPOINT( QT_ThunkPrime, 0, 0 )
#endif

/***********************************************************************
 *		ThunkInitSL (KERNEL32.46)
 * Another thunkbuf link routine.
 * The start of the thunkbuf looks like this:
 * 	00: DWORD	length
 *	04: SEGPTR	address for thunkbuffer pointer
 * [ok probably]
 *
 * RETURNS
 *  Nothing.
 */
VOID WINAPI ThunkInitSL(
	LPBYTE thunk,		/* [in] start of thunkbuffer */
	LPCSTR thkbuf,		/* [in] name/ordinal of thunkbuffer in win16 dll */
	DWORD len,		/* [in] length of thunkbuffer */
	LPCSTR dll16,		/* [in] name of win16 dll containing the thkbuf */
	LPCSTR dll32		/* [in] win32 dll. FIXME: strange, unused */
) {
	LPDWORD		addr;
	LPDWORD		slot;

	if (!(addr = _loadthunk( dll16, thkbuf, dll32, NULL, len )))
		return;

	/* addr[1] is a SEGPTR to the location that receives the linear
	 * address of the 32-bit thunk buffer */
	slot = MapSL(addr[1]);

	/* Same validity test ThunkInitLSF applies to this mapped pointer:
	 * do not store through it unless its high word is non-zero */
	if (!HIWORD(slot))
		return;

	*slot = (DWORD)thunk;
}

/**********************************************************************
 *           SSInit		(KERNEL.700)
 * RETURNS
 *	TRUE for success.
 */
BOOL WINAPI SSInit16(void)
{
    /* No work is done here; success is always reported */
    return TRUE;
}

/**********************************************************************
 *           SSOnBigStack	(KERNEL32.87)
 * Check if thunking is initialized (ss selector set up etc.)
 * We do that differently, so just return TRUE.
 * [ok]
 * RETURNS
 *	TRUE for success.
 */
BOOL WINAPI SSOnBigStack(void)
{
    /* Nothing is actually checked; only a trace is emitted */
    TRACE("Yes, thunking is initialized\n");
    return TRUE;
}

/**********************************************************************
 *           SSConfirmSmallStack     (KERNEL.704)
 *
 * Abort if not on small stack.
 *
 * This must be a register routine as it has to preserve *all* registers.
 */
void WINAPI SSConfirmSmallStack( CONTEXT86 *context )
{
    /* Intentionally empty: 'context' is neither read nor modified. */
    /* We are always on the small stack while in 16-bit code ... */
}

/**********************************************************************
 *           SSCall (KERNEL32.88)
 * One of the real thunking functions. This one seems to be for 32<->32
 * thunks. It should probably be capable of crossing process boundaries.
 *
 * And YES, I've seen nr=48 (somewhere in the Win95 32<->16 OLE coupling)
 * [ok]
 *
 * RETURNS
 *  Thunked function result.
 */
DWORD WINAPIV SSCall(
	DWORD nr,	/* [in] number of argument bytes */
	DWORD flags,	/* [in] FIXME: flags ? */
	FARPROC fun,	/* [in] function to call */
	...		/* [in/out] arguments */
) {
    DWORD args[12];   /* at most 48 argument bytes are supported below */
    DWORD i, count, ret;
    va_list valist;

    /* Fetch the DWORD arguments through the variadic interface instead of
       computing their address from &fun, which depends on the stack layout.
       Never read more than the 12 DWORDs the dispatch below can forward. */
    count = nr / 4;
    if (count > sizeof(args)/sizeof(args[0])) count = sizeof(args)/sizeof(args[0]);

    va_start( valist, fun );
    for (i = 0; i < count; i++)
        args[i] = va_arg( valist, DWORD );
    va_end( valist );

    if(TRACE_ON(thunk))
    {
      DPRINTF("(%d,0x%08x,%p,[",nr,flags,fun);
      for (i=0;i<count;i++)
          DPRINTF("0x%08x,",args[i]);
      DPRINTF("])\n");
    }

    /* Dispatch on the exact byte count; each case forwards nr/4 DWORDs */
    switch (nr) {
    case 0:	ret = fun();
		break;
    case 4:	ret = fun(args[0]);
		break;
    case 8:	ret = fun(args[0],args[1]);
		break;
    case 12:	ret = fun(args[0],args[1],args[2]);
		break;
    case 16:	ret = fun(args[0],args[1],args[2],args[3]);
		break;
    case 20:	ret = fun(args[0],args[1],args[2],args[3],args[4]);
		break;
    case 24:	ret = fun(args[0],args[1],args[2],args[3],args[4],args[5]);
		break;
    case 28:	ret = fun(args[0],args[1],args[2],args[3],args[4],args[5],args[6]);
		break;
    case 32:	ret = fun(args[0],args[1],args[2],args[3],args[4],args[5],args[6],args[7]);
		break;
    case 36:	ret = fun(args[0],args[1],args[2],args[3],args[4],args[5],args[6],args[7],args[8]);
		break;
    case 40:	ret = fun(args[0],args[1],args[2],args[3],args[4],args[5],args[6],args[7],args[8],args[9]);
		break;
    case 44:	ret = fun(args[0],args[1],args[2],args[3],args[4],args[5],args[6],args[7],args[8],args[9],args[10]);
		break;
    case 48:	ret = fun(args[0],args[1],args[2],args[3],args[4],args[5],args[6],args[7],args[8],args[9],args[10],args[11]);
		break;
    default:
	/* byte counts above 48 or not a multiple of 4 are not forwarded */
	WARN("Unsupported nr of arguments, %d\n",nr);
	ret = 0;
	break;

    }
    TRACE(" returning %d ...\n",ret);
    return ret;
}

/**********************************************************************
 *           W32S_BackTo32                      (KERNEL32.51)
 */
void WINAPI __regs_W32S_BackTo32( CONTEXT86 *context )
{
    LPDWORD stack = (LPDWORD)context->Esp;
    FARPROC proc = (FARPROC)context->Eip;

    /* Call the routine found in EIP with the ten DWORDs stack[1]..stack[10];
       stack[0] is skipped here and popped into EIP afterwards */
    context->Eax = proc( stack[1], stack[2], stack[3], stack[4], stack[5],
                               stack[6], stack[7], stack[8], stack[9], stack[10] );

    context->Eip = stack32_pop(context);
}
#ifdef DEFINE_REGS_ENTRYPOINT
DEFINE_REGS_ENTRYPOINT( W32S_BackTo32, 0, 0 )
#endif

/**********************************************************************
 *			AllocSLCallback		(KERNEL32.@)
 *
 * Allocate a 16->32 callback.
 *
 * NOTES
 * Win95 uses some struct chains for callbacks. It allocates them
 * in blocks of 100 entries, size 32 bytes each, layout:
 * blockstart:
 *| 	0:	PTR	nextblockstart
 *|	4:	entry	*first;
 *|	8:	WORD	sel ( start points to blockstart)
 *|	A:	WORD	unknown
 * 100xentry:
 *|	00..17:		Code
 *|	18:	PDB	*owning_process;
 *|	1C:	PTR	blockstart
 *
 * We ignore this for now. (Just a note for further developers)
 * FIXME: use this method, so we don't waste selectors...
 *
 * Following code is then generated by AllocSLCallback. The code is 16 bit, so
 * the 0x66 prefix switches from word->long registers.
 *
 *|	665A		pop	edx
 *|	6668x arg2 x 	pushl	<arg2>
 *|	6652		push	edx
 *|	EAx arg1 x	jmpf	<arg1>
 *
 * returns the start address of this thunk.
 *
 * Note that they look very similar to the ones allocated by THUNK_Alloc.
 * RETURNS
 *	A segmented pointer to the start of the thunk
 */
DWORD WINAPI
AllocSLCallback(
	DWORD finalizer,	/* [in] Finalizer function */
	DWORD callback		/* [in] Callback function */
) {
	LPBYTE	x,thunk;
	WORD	sel;

	/* Fail cleanly instead of writing through a NULL pointer */
	if (!(thunk = HeapAlloc( GetProcessHeap(), 0, 32 )))
		return 0;

	x=thunk;
	*x++=0x66;*x++=0x5a;				/* popl edx */
	*x++=0x66;*x++=0x68;*(DWORD*)x=finalizer;x+=4;	/* pushl finalizer */
	*x++=0x66;*x++=0x52;				/* pushl edx */
	*x++=0xea;*(DWORD*)x=callback;x+=4;		/* jmpf callback */

	/* NOTE(review): the Win95 layout puts the owning process at offset
	 * 0x18; this stores the process id at decimal 18 -- confirm intent */
	*(DWORD*)(thunk+18) = GetCurrentProcessId();

	sel = SELECTOR_AllocBlock( thunk, 32, WINE_LDT_FLAGS_CODE );
	if (!sel)
	{
		/* a zero selector yields a null SEGPTR (presumably allocation
		 * failure -- TODO confirm); don't leak the thunk in that case */
		HeapFree( GetProcessHeap(), 0, thunk );
		return 0;
	}

	/* MAKESEGPTR avoids left-shifting a WORD promoted to signed int */
	return MAKESEGPTR( sel, 0 );
}

/**********************************************************************
 * 		FreeSLCallback		(KERNEL32.@)
 * Frees the specified 16->32 callback
 *
 * RETURNS
 *  Nothing.
 */
void WINAPI
FreeSLCallback(
	DWORD x	/* [in] 16 bit callback (segmented pointer?) */
) {
	/* Not implemented: nothing is freed, the call is only logged */
	FIXME("(0x%08x): stub\n",x);
}


/**********************************************************************
 * 		GetTEBSelectorFS	(KERNEL.475)
 * 	Set the 16-bit %fs to the 32-bit %fs (current TEB selector)
 */
void WINAPI GetTEBSelectorFS16(void)
{
    /* Store the current %fs value into the fs slot of the current
       16-bit stack frame */
    CURRENT_STACK16->fs = wine_get_fs();
}

/**********************************************************************
 * 		IsPeFormat		(KERNEL.431)
 *
 * Determine if a file is a PE format executable.
 *
 * RETURNS
 *  TRUE, if it is.
 *  FALSE if the file could not be opened or is not a PE file.
 *
 * NOTES
 *  If fn is given as NULL then the function expects hf16 to be valid.
 */
BOOL16 WINAPI IsPeFormat16(
	LPSTR	fn,	/* [in] Filename to the executable */
	HFILE16 hf16)	/* [in] An open file handle */
{
    BOOL ret = FALSE;
    IMAGE_DOS_HEADER mzh;
    OFSTRUCT ofs;
    DWORD xmagic;

    /* A filename, when given, takes precedence over the passed-in handle */
    if (fn) hf16 = OpenFile16(fn,&ofs,OF_READ);
    if (hf16 == HFILE_ERROR16) return FALSE;

    /* Read and validate the DOS (MZ) header at the start of the file */
    _llseek16(hf16,0,SEEK_SET);
    if (sizeof(mzh)!=_lread16(hf16,&mzh,sizeof(mzh))) goto done;
    if (mzh.e_magic!=IMAGE_DOS_SIGNATURE) goto done;

    /* e_lfanew comes from the file; if the seek is rejected, do not go on
       to read a signature from whatever position the file is left at */
    if (_llseek16(hf16,mzh.e_lfanew,SEEK_SET) == -1) goto done;
    if (sizeof(DWORD)!=_lread16(hf16,&xmagic,sizeof(DWORD))) goto done;
    ret = (xmagic == IMAGE_NT_SIGNATURE);
 done:
    /* The handle is closed on every path, including a caller-supplied one */
    _lclose16(hf16);
    return ret;
}


/***********************************************************************
 *           K32Thk1632Prolog			(KERNEL32.@)
 */
void WINAPI __regs_K32Thk1632Prolog( CONTEXT86 *context )
{
   /* EIP is the return address of the 5-byte call; step back to the
      start of the calling stub */
   LPBYTE code = (LPBYTE)context->Eip - 5;

   /* Arrrgh! SYSTHUNK.DLL just has to re-implement another method
      of 16->32 thunks instead of using one of the standard methods!
      This means that SYSTHUNK.DLL itself switches to a 32-bit stack,
      and does a far call to the 32-bit code segment of OLECLI32/OLESVR32.
      Unfortunately, our CallTo/CallFrom mechanism is therefore completely
      bypassed, which means it will crash the next time the 32-bit OLE
      code thunks down again to 16-bit (this *will* happen!).

      The following hack tries to recognize this situation.
      This is possible since the called stubs in OLECLI32/OLESVR32 all
      look exactly the same:
        00   E8xxxxxxxx    call K32Thk1632Prolog
        05   FF55FC        call [ebp-04]
        08   E8xxxxxxxx    call K32Thk1632Epilog
        0D   66CB          retf

      If we recognize this situation, we try to simulate the actions
      of our CallTo/CallFrom mechanism by copying the 16-bit stack
      to our 32-bit stack, creating a proper STACK16FRAME and
      updating cur_stack. */

   if (   code[5] == 0xFF && code[6] == 0x55 && code[7] == 0xFC
       && code[13] == 0x66 && code[14] == 0xCB)
   {
      DWORD argSize = context->Ebp - context->Esp;
      char *stack16 = (char *)context->Esp - 4;
      STACK16FRAME *frame16 = (STACK16FRAME *)stack16 - 1;
      STACK32FRAME *frame32 = (STACK32FRAME *)NtCurrentTeb()->WOW32Reserved;
      char *stack32 = (char *)frame32 - argSize;
      WORD  stackSel  = SELECTOROF(frame32->frame16);
      DWORD stackBase = GetSelectorBase(stackSel);

      TRACE("before SYSTHUNK hack: EBP: %08x ESP: %08x cur_stack: %p\n",
            context->Ebp, context->Esp, NtCurrentTeb()->WOW32Reserved);

      /* Build a fresh 16-bit frame just below the current stack contents */
      memset(frame16, '\0', sizeof(STACK16FRAME));
      frame16->frame32 = frame32;
      frame16->ebp = context->Ebp;

      /* Move the arguments below the saved 32-bit frame and make the new
         16-bit frame (expressed as selector:offset) the current stack */
      memcpy(stack32, stack16, argSize);
      NtCurrentTeb()->WOW32Reserved = (void *)MAKESEGPTR(stackSel, (DWORD)frame16 - stackBase);

      context->Esp = (DWORD)stack32 + 4;
      context->Ebp = context->Esp + argSize;

      TRACE("after  SYSTHUNK hack: EBP: %08x ESP: %08x cur_stack: %p\n",
            context->Ebp, context->Esp, NtCurrentTeb()->WOW32Reserved);
   }

    /* entry_point is never used again once the entry point has
       been called.  Thus we re-use it to hold the Win16Lock count */
   ReleaseThunkLock(&CURRENT_STACK16->entry_point);
}
#ifdef DEFINE_REGS_ENTRYPOINT
DEFINE_REGS_ENTRYPOINT( K32Thk1632Prolog, 0, 0 )
#endif

/***********************************************************************
 *           K32Thk1632Epilog			(KERNEL32.@)
 */
void WINAPI __regs_K32Thk1632Epilog( CONTEXT86 *context )
{
   /* EIP is the return address of the epilog call, 13 bytes into the
      stub; step back to the start of the stub */
   LPBYTE code = (LPBYTE)context->Eip - 13;

   /* Re-acquire the lock using the count that K32Thk1632Prolog saved
      in the entry_point field */
   RestoreThunkLock(CURRENT_STACK16->entry_point);

   /* We undo the SYSTHUNK hack if necessary. See K32Thk1632Prolog. */

   if (   code[5] == 0xFF && code[6] == 0x55 && code[7] == 0xFC
       && code[13] == 0x66 && code[14] == 0xCB)
   {
      STACK16FRAME *frame16 = MapSL((SEGPTR)NtCurrentTeb()->WOW32Reserved);
      char *stack16 = (char *)(frame16 + 1);
      DWORD argSize = frame16->ebp - (DWORD)stack16;
      char *stack32 = (char *)frame16->frame32 - argSize;

      /* how far ESP has moved above the start of the copied argument area */
      DWORD nArgsPopped = context->Esp - (DWORD)stack32;

      TRACE("before SYSTHUNK hack: EBP: %08x ESP: %08x cur_stack: %p\n",
            context->Ebp, context->Esp, NtCurrentTeb()->WOW32Reserved);

      /* Restore the 32-bit frame saved by the prolog as the current stack */
      NtCurrentTeb()->WOW32Reserved = frame16->frame32;

      context->Esp = (DWORD)stack16 + nArgsPopped;
      context->Ebp = frame16->ebp;

      TRACE("after  SYSTHUNK hack: EBP: %08x ESP: %08x cur_stack: %p\n",
            context->Ebp, context->Esp, NtCurrentTeb()->WOW32Reserved);
   }
}
#ifdef DEFINE_REGS_ENTRYPOINT
DEFINE_REGS_ENTRYPOINT( K32Thk1632Epilog, 0, 0 )
#endif

/*********************************************************************
 *                   PK16FNF [KERNEL32.91]
 *
 *  This routine fills in the supplied 13-byte (8.3 plus terminator)
 *  string buffer with the 8.3 filename of a recently loaded 16-bit
 *  module.  It is unknown exactly what modules trigger this
 *  mechanism or what purpose this serves.  Win98 Explorer (and
 *  probably also Win95 with IE 4 shell integration) calls this
 *  several times during initialization.
 *
 *  FIXME: find out what this really does and make it work.
 */
void WINAPI PK16FNF(LPSTR strPtr)
{
       FIXME("(%p): stub\n", strPtr);

       /* fill in a fake filename that'll be easy to recognize */
       /* 12 characters plus the terminator: exactly the 13 bytes the
          caller is documented to supply */
       strcpy(strPtr, "WINESTUB.FIX");
}

/***********************************************************************
 * 16->32 Flat Thunk routines:
 */

/***********************************************************************
 *              ThunkConnect16          (KERNEL.651)
 * Connects a 32bit and a 16bit thunkbuffer.
 */
UINT WINAPI ThunkConnect16(
        LPSTR module16,              /* [in] name of win16 dll */
        LPSTR module32,              /* [in] name of win32 dll */
        HINSTANCE16 hInst16,         /* [in] hInst of win16 dll */
        DWORD dwReason,              /* [in] initialisation argument */
        struct ThunkDataCommon *TD,  /* [in/out] thunkbuffer */
        LPSTR thunkfun32,            /* [in] win32 thunkfunction */
        WORD cs                      /* [in] CS of win16 dll */
) {
    BOOL directionSL;

    /* The 4-byte magic selects the thunk direction; anything else fails */
    if (!strncmp(TD->magic, "SL01", 4))
    {
        directionSL = TRUE;

        TRACE("SL01 thunk %s (%p) -> %s (%s), Reason: %d\n",
              module16, TD, module32, thunkfun32, dwReason);
    }
    else if (!strncmp(TD->magic, "LS01", 4))
    {
        directionSL = FALSE;

        TRACE("LS01 thunk %s (%p) <- %s (%s), Reason: %d\n",
              module16, TD, module32, thunkfun32, dwReason);
    }
    else
    {
        ERR("Invalid magic %c%c%c%c\n",
            TD->magic[0], TD->magic[1], TD->magic[2], TD->magic[3]);
        return 0;
    }

    switch (dwReason)
    {
        case DLL_PROCESS_ATTACH:
            if (directionSL)
            {
                struct ThunkDataSL16 *SL16 = (struct ThunkDataSL16 *)TD;
                struct ThunkDataSL   *SL   = SL16->fpData;

                /* First attach: build the 32-bit side descriptor once and
                   remember it in the 16-bit thunk data */
                if (SL == NULL)
                {
                    SL = HeapAlloc(GetProcessHeap(), 0, sizeof(*SL));
                    if (SL == NULL)
                    {
                        /* report failure the same way as an invalid magic
                           rather than writing through a NULL pointer */
                        ERR("Out of memory allocating ThunkDataSL\n");
                        return 0;
                    }

                    SL->common   = SL16->common;
                    SL->flags1   = SL16->flags1;
                    SL->flags2   = SL16->flags2;

                    SL->apiDB    = MapSL(SL16->apiDatabase);
                    SL->targetDB = NULL;

                    lstrcpynA(SL->pszDll16, module16, 255);
                    lstrcpynA(SL->pszDll32, module32, 255);

                    /* We should create a SEGPTR to the ThunkDataSL,
                       but since the contents are not in the original format,
                       any access to this by 16-bit code would crash anyway. */
                    SL16->spData = 0;
                    SL16->fpData = SL;
                }


                if (SL->flags2 & 0x80000000)
                {
                    TRACE("Preloading 32-bit library\n");
                    LoadLibraryA(module32);
                }
            }
            else
            {
                /* nothing to do */
            }
            break;

        case DLL_PROCESS_DETACH:
            /* FIXME: cleanup */
            break;
    }

    return 1;
}


/***********************************************************************
 *           C16ThkSL                           (KERNEL.630)
 */

void WINAPI C16ThkSL(CONTEXT86 *context)
{
    /* EAX is a segmented pointer to the buffer that receives the stub */
    LPBYTE stub = MapSL(context->Eax), x = stub;
    WORD cs = wine_get_cs();
    WORD ds = wine_get_ds();

    /* We produce the following code:
     *
     *   mov ax, __FLATDS
     *   mov es, ax
     *   movzx ecx, cx
     *   mov edx, es:[ecx + $EDX]
     *   push bp
     *   push edx
     *   push dx
     *   push edx
     *   call __FLATCS:__wine_call_from_16_thunk
     */

    *x++ = 0xB8; *(WORD *)x = ds; x += sizeof(WORD);
    *x++ = 0x8E; *x++ = 0xC0;
    *x++ = 0x66; *x++ = 0x0F; *x++ = 0xB7; *x++ = 0xC9;
    *x++ = 0x67; *x++ = 0x66; *x++ = 0x26; *x++ = 0x8B;
                 *x++ = 0x91; *(DWORD *)x = context->Edx; x += sizeof(DWORD);

    *x++ = 0x55;
    *x++ = 0x66; *x++ = 0x52;
    *x++ = 0x52;
    *x++ = 0x66; *x++ = 0x52;
    *x++ = 0x66; *x++ = 0x9A;
    *(void **)x = __wine_call_from_16_thunk; x += sizeof(void *);
    *(WORD *)x = cs; x += sizeof(WORD);

    /* Jump to the stub code just created */
    context->Eip = LOWORD(context->Eax);
    context->SegCs  = HIWORD(context->Eax);

    /* Since C16ThkSL got called by a jmp, we need to leave the
       original return address on the stack */
    context->Esp -= 4;
}

/***********************************************************************
 *           C16ThkSL01                         (KERNEL.631)
 */

void WINAPI C16ThkSL01(CONTEXT86 *context)
{
    LPBYTE stub = MapSL(context->Eax), x = stub;

    /* Two modes, selected by EAX: a non-null stub pointer means "write the
       call stub"; otherwise this is a call made through such a stub (which
       clears EAX and loads EDX with the ThunkDataSL pointer). */
    if (stub)
    {
        struct ThunkDataSL16 *SL16 = MapSL(context->Edx);
        struct ThunkDataSL *td = SL16->fpData;

        DWORD procAddress = (DWORD)GetProcAddress16(GetModuleHandle16("KERNEL"), (LPCSTR)631);
        WORD cs = wine_get_cs();

        if (!td)
        {
            ERR("ThunkConnect16 was not called!\n");
            return;
        }

        TRACE("Creating stub for ThunkDataSL %p\n", td);


        /* We produce the following code:
         *
         *   xor eax, eax
         *   mov edx, $td
         *   call C16ThkSL01
         *   push bp
         *   push edx
         *   push dx
         *   push edx
         *   call __FLATCS:__wine_call_from_16_thunk
         */

        *x++ = 0x66; *x++ = 0x33; *x++ = 0xC0;
        *x++ = 0x66; *x++ = 0xBA; *(void **)x = td; x += sizeof(void *);
        *x++ = 0x9A; *(DWORD *)x = procAddress; x += sizeof(DWORD);

        *x++ = 0x55;
        *x++ = 0x66; *x++ = 0x52;
        *x++ = 0x52;
        *x++ = 0x66; *x++ = 0x52;
        *x++ = 0x66; *x++ = 0x9A;
        *(void **)x = __wine_call_from_16_thunk; x += sizeof(void *);
        *(WORD *)x = cs; x += sizeof(WORD);

        /* Jump to the stub code just created */
        context->Eip = LOWORD(context->Eax);
        context->SegCs  = HIWORD(context->Eax);

        /* Since C16ThkSL01 got called by a jmp, we need to leave the
           original return address on the stack */
        context->Esp -= 4;
    }
    else
    {
        struct ThunkDataSL *td = (struct ThunkDataSL *)context->Edx;
        DWORD targetNr = LOWORD(context->Ecx) / 4;
        struct SLTargetDB *tdb;

        TRACE("Process %08x calling target %d of ThunkDataSL %p\n",
              GetCurrentProcessId(), targetNr, td);

        /* Look for this process's entry in the target database */
        for (tdb = td->targetDB; tdb; tdb = tdb->next)
            if (tdb->process == GetCurrentProcessId())
                break;

        /* Not found: load the 32-bit DLL and search again */
        if (!tdb)
        {
            TRACE("Loading 32-bit library %s\n", td->pszDll32);
            LoadLibraryA(td->pszDll32);

            for (tdb = td->targetDB; tdb; tdb = tdb->next)
                if (tdb->process == GetCurrentProcessId())
                    break;
        }

        if (tdb)
        {
            context->Edx = tdb->targetTable[targetNr];

            TRACE("Call target is %08x\n", context->Edx);
        }
        else
        {
            /* Still no entry: hand back the API's error return value in
               DX:AX, resume at the address taken from stack words 2 and 3,
               and drop the arguments plus 4 bytes from the stack */
            WORD *stack = MapSL( MAKESEGPTR(context->SegSs, LOWORD(context->Esp)) );
            context->Edx = (context->Edx & ~0xffff) | HIWORD(td->apiDB[targetNr].errorReturnValue);
            context->Eax = (context->Eax & ~0xffff) | LOWORD(td->apiDB[targetNr].errorReturnValue);
            context->Eip = stack[2];
            context->SegCs  = stack[3];
            context->Esp += td->apiDB[targetNr].nrArgBytes + 4;

            ERR("Process %08x did not ThunkConnect32 %s to %s\n",
                GetCurrentProcessId(), td->pszDll32, td->pszDll16);
        }
    }
}


/***********************************************************************
 * 16<->32 Thunklet/Callback API:
 */

#include "pshpack1.h"
/* One thunklet: a small code stub (push target, push relay, jmp glue)
 * followed by bookkeeping data. The field order is the layout of the
 * generated code, so it must not be rearranged. */
typedef struct _THUNKLET
{
    BYTE        prefix_target;  /* 0x90 for LS thunklets, 0x66 for SL ones */
    BYTE        pushl_target;   /* 0x68: push imm32 opcode */
    DWORD       target;         /* operand of the push: the thunk target */

    BYTE        prefix_relay;   /* same prefix byte as prefix_target */
    BYTE        pushl_relay;    /* 0x68: push imm32 opcode */
    DWORD       relay;          /* operand of the push: the relay value */

    BYTE        jmp_glue;       /* 0xE9 for LS thunklets, 0xEA for SL ones */
    DWORD       glue;           /* jump operand; LS stores it relative to &type */

    BYTE        type;           /* THUNKLET_TYPE_LS or THUNKLET_TYPE_SL */
    HINSTANCE16 owner;          /* hInstance of the owning task, or 0 */
    struct _THUNKLET *next;     /* next entry in the ThunkletAnchor list */
} THUNKLET;
#include "poppack.h"

#define THUNKLET_TYPE_LS  1
#define THUNKLET_TYPE_SL  2

static HANDLE  ThunkletHeap = 0;
1621
static WORD ThunkletCodeSel;
1622 1623 1624 1625 1626 1627 1628 1629
static THUNKLET *ThunkletAnchor = NULL;

static FARPROC ThunkletSysthunkGlueLS = 0;
static SEGPTR    ThunkletSysthunkGlueSL = 0;

static FARPROC ThunkletCallbackGlueLS = 0;
static SEGPTR    ThunkletCallbackGlueSL = 0;

1630 1631

/* map a thunk allocated on ThunkletHeap to a 16-bit pointer */
static inline SEGPTR get_segptr( void *thunk )
1633
{
1634
    if (!thunk) return 0;
1635 1636 1637
    return MAKESEGPTR( ThunkletCodeSel, (char *)thunk - (char *)ThunkletHeap );
}

/***********************************************************************
 *           THUNK_Init
 */
static BOOL THUNK_Init(void)
1642 1643 1644
{
    LPBYTE thunk;

1645
    ThunkletHeap = HeapCreate( 0, 0x10000, 0x10000 );
1646 1647
    if (!ThunkletHeap) return FALSE;

1648
    ThunkletCodeSel = SELECTOR_AllocBlock( ThunkletHeap, 0x10000, WINE_LDT_FLAGS_CODE );
1649

1650 1651
    thunk = HeapAlloc( ThunkletHeap, 0, 5 );
    if (!thunk) return FALSE;
1652

1653 1654 1655 1656
    ThunkletSysthunkGlueLS = (FARPROC)thunk;
    *thunk++ = 0x58;                             /* popl eax */
    *thunk++ = 0xC3;                             /* ret      */

1657
    ThunkletSysthunkGlueSL = get_segptr( thunk );
1658 1659 1660 1661 1662 1663 1664 1665 1666 1667 1668 1669 1670 1671 1672 1673 1674 1675 1676
    *thunk++ = 0x66; *thunk++ = 0x58;            /* popl eax */
    *thunk++ = 0xCB;                             /* lret     */

    return TRUE;
}

/***********************************************************************
 *     SetThunkletCallbackGlue             (KERNEL.560)
 */
void WINAPI SetThunkletCallbackGlue16( FARPROC glueLS, SEGPTR glueSL )
{
    /* Remember both glue addresses in the file-level variables:
       the segmented one and the linear one. */
    ThunkletCallbackGlueSL = glueSL;
    ThunkletCallbackGlueLS = glueLS;
}


/***********************************************************************
 *     THUNK_FindThunklet
 */
static THUNKLET *THUNK_FindThunklet( DWORD target, DWORD relay,
                                     DWORD glue, BYTE type )
{
    THUNKLET *thunk;

    /* Walk the thunklet list for an entry with the same type, target,
       relay and glue. LS thunklets store glue relative to the address of
       their own 'type' field, so the comparison is adjusted per entry. */
    for (thunk = ThunkletAnchor; thunk; thunk = thunk->next)
        if (    thunk->type   == type
             && thunk->target == target
             && thunk->relay  == relay
             && ( type == THUNKLET_TYPE_LS ?
                    ( thunk->glue == glue - (DWORD)&thunk->type )
                  : ( thunk->glue == glue ) ) )
            return thunk;

     return NULL;
}

/***********************************************************************
 *     THUNK_AllocLSThunklet
 */
static FARPROC THUNK_AllocLSThunklet( SEGPTR target, DWORD relay,
                                      FARPROC glue, HTASK16 owner )
1699 1700 1701 1702 1703
{
    THUNKLET *thunk = THUNK_FindThunklet( (DWORD)target, relay, (DWORD)glue,
                                          THUNKLET_TYPE_LS );
    if (!thunk)
    {
1704
        TDB *pTask = GlobalLock16( owner );
1705

1706
        if (!ThunkletHeap) THUNK_Init();
1707 1708 1709 1710 1711 1712 1713 1714
        if ( !(thunk = HeapAlloc( ThunkletHeap, 0, sizeof(THUNKLET) )) )
            return 0;

        thunk->prefix_target = thunk->prefix_relay = 0x90;
        thunk->pushl_target  = thunk->pushl_relay  = 0x68;
        thunk->jmp_glue = 0xE9;

        thunk->target  = (DWORD)target;
1715
        thunk->relay   = relay;
1716 1717 1718 1719 1720 1721 1722 1723 1724 1725 1726 1727 1728 1729 1730
        thunk->glue    = (DWORD)glue - (DWORD)&thunk->type;

        thunk->type    = THUNKLET_TYPE_LS;
        thunk->owner   = pTask? pTask->hInstance : 0;

        thunk->next    = ThunkletAnchor;
        ThunkletAnchor = thunk;
    }

    return (FARPROC)thunk;
}

/***********************************************************************
 *     THUNK_AllocSLThunklet
 */
1731 1732
static SEGPTR THUNK_AllocSLThunklet( FARPROC target, DWORD relay,
                                     SEGPTR glue, HTASK16 owner )
1733 1734 1735 1736 1737
{
    THUNKLET *thunk = THUNK_FindThunklet( (DWORD)target, relay, (DWORD)glue,
                                          THUNKLET_TYPE_SL );
    if (!thunk)
    {
1738
        TDB *pTask = GlobalLock16( owner );
1739

1740
        if (!ThunkletHeap) THUNK_Init();
1741 1742 1743 1744 1745 1746 1747 1748
        if ( !(thunk = HeapAlloc( ThunkletHeap, 0, sizeof(THUNKLET) )) )
            return 0;

        thunk->prefix_target = thunk->prefix_relay = 0x66;
        thunk->pushl_target  = thunk->pushl_relay  = 0x68;
        thunk->jmp_glue = 0xEA;

        thunk->target  = (DWORD)target;
1749
        thunk->relay   = relay;
1750 1751 1752 1753 1754 1755 1756 1757 1758
        thunk->glue    = (DWORD)glue;

        thunk->type    = THUNKLET_TYPE_SL;
        thunk->owner   = pTask? pTask->hInstance : 0;

        thunk->next    = ThunkletAnchor;
        ThunkletAnchor = thunk;
    }

1759
    return get_segptr( thunk );
1760 1761 1762 1763 1764
}

/**********************************************************************
 *     IsLSThunklet
 */
1765
static BOOL16 IsLSThunklet( THUNKLET *thunk )
1766 1767 1768 1769 1770 1771 1772 1773 1774 1775 1776 1777 1778 1779 1780 1781 1782 1783 1784 1785 1786
{
    return    thunk->prefix_target == 0x90 && thunk->pushl_target == 0x68
           && thunk->prefix_relay  == 0x90 && thunk->pushl_relay  == 0x68
           && thunk->jmp_glue == 0xE9 && thunk->type == THUNKLET_TYPE_LS;
}

/**********************************************************************
 *     IsSLThunklet                        (KERNEL.612)
 *
 * Check whether the memory at 'thunk' carries the opcode bytes and type
 * tag that THUNK_AllocSLThunklet writes into an SL thunklet.
 */
BOOL16 WINAPI IsSLThunklet16( THUNKLET *thunk )
{
    if (thunk->prefix_target != 0x66 || thunk->pushl_target != 0x68) return FALSE;
    if (thunk->prefix_relay  != 0x66 || thunk->pushl_relay  != 0x68) return FALSE;
    return thunk->jmp_glue == 0xEA && thunk->type == THUNKLET_TYPE_SL;
}



/***********************************************************************
 *     AllocLSThunkletSysthunk             (KERNEL.607)
 */
1787
FARPROC WINAPI AllocLSThunkletSysthunk16( SEGPTR target,
1788 1789
                                          FARPROC relay, DWORD dummy )
{
1790
    if (!ThunkletSysthunkGlueLS) THUNK_Init();
1791
    return THUNK_AllocLSThunklet( (SEGPTR)relay, (DWORD)target,
1792 1793 1794 1795 1796 1797
                                  ThunkletSysthunkGlueLS, GetCurrentTask() );
}

/***********************************************************************
 *     AllocSLThunkletSysthunk             (KERNEL.608)
 */
1798
SEGPTR WINAPI AllocSLThunkletSysthunk16( FARPROC target,
1799 1800
                                       SEGPTR relay, DWORD dummy )
{
1801
    if (!ThunkletSysthunkGlueSL) THUNK_Init();
1802
    return THUNK_AllocSLThunklet( (FARPROC)relay, (DWORD)target,
1803 1804 1805 1806 1807 1808 1809
                                  ThunkletSysthunkGlueSL, GetCurrentTask() );
}


/***********************************************************************
 *     AllocLSThunkletCallbackEx           (KERNEL.567)
 */
1810
FARPROC WINAPI AllocLSThunkletCallbackEx16( SEGPTR target,
1811 1812
                                            DWORD relay, HTASK16 task )
{
1813
    THUNKLET *thunk = MapSL( target );
1814 1815
    if ( !thunk ) return NULL;

1816
    if (   IsSLThunklet16( thunk ) && thunk->relay == relay
1817 1818 1819
        && thunk->glue == (DWORD)ThunkletCallbackGlueSL )
        return (FARPROC)thunk->target;

1820
    return THUNK_AllocLSThunklet( target, relay,
1821 1822 1823 1824 1825 1826
                                  ThunkletCallbackGlueLS, task );
}

/***********************************************************************
 *     AllocSLThunkletCallbackEx           (KERNEL.568)
 */
1827
SEGPTR WINAPI AllocSLThunkletCallbackEx16( FARPROC target,
1828 1829 1830 1831 1832
                                         DWORD relay, HTASK16 task )
{
    THUNKLET *thunk = (THUNKLET *)target;
    if ( !thunk ) return 0;

1833
    if (   IsLSThunklet( thunk ) && thunk->relay == relay
1834 1835 1836
        && thunk->glue == (DWORD)ThunkletCallbackGlueLS - (DWORD)&thunk->type )
        return (SEGPTR)thunk->target;

1837
    return THUNK_AllocSLThunklet( target, relay,
1838 1839 1840 1841
                                  ThunkletCallbackGlueSL, task );
}

/***********************************************************************
 *     AllocLSThunkletCallback             (KERNEL.561)
 *     AllocLSThunkletCallback_dup         (KERNEL.606)
 *
 * Same as AllocLSThunkletCallbackEx16 with the current task as owner.
 */
FARPROC WINAPI AllocLSThunkletCallback16( SEGPTR target, DWORD relay )
{
    HTASK16 owner = GetCurrentTask();

    return AllocLSThunkletCallbackEx16( target, relay, owner );
}

/***********************************************************************
 *     AllocSLThunkletCallback             (KERNEL.562)
 *     AllocSLThunkletCallback_dup         (KERNEL.605)
 *
 * Same as AllocSLThunkletCallbackEx16 with the current task as owner.
 */
SEGPTR WINAPI AllocSLThunkletCallback16( FARPROC target, DWORD relay )
{
    HTASK16 owner = GetCurrentTask();

    return AllocSLThunkletCallbackEx16( target, relay, owner );
}

/***********************************************************************
 *     FindLSThunkletCallback              (KERNEL.563)
 *     FindLSThunkletCallback_dup          (KERNEL.609)
 *
 * Lookup-only counterpart of AllocLSThunkletCallbackEx16: unwrap 'target'
 * if it is an SL callback thunklet with the same relay, else search the
 * thunklet list for an existing LS callback thunklet.  Nothing is
 * allocated; NULL is returned when no match exists.
 */
FARPROC WINAPI FindLSThunkletCallback( SEGPTR target, DWORD relay )
{
    THUNKLET *candidate = MapSL( target );

    if (candidate
        && IsSLThunklet16( candidate )
        && candidate->relay == relay
        && candidate->glue == (DWORD)ThunkletCallbackGlueSL)
    {
        return (FARPROC)candidate->target;
    }

    return (FARPROC)THUNK_FindThunklet( (DWORD)target, relay,
                                        (DWORD)ThunkletCallbackGlueLS,
                                        THUNKLET_TYPE_LS );
}

/***********************************************************************
 *     FindSLThunkletCallback              (KERNEL.564)
 *     FindSLThunkletCallback_dup          (KERNEL.610)
 *
 * Lookup-only counterpart of AllocSLThunkletCallbackEx16: unwrap 'target'
 * if it is an LS callback thunklet with the same relay, else search the
 * thunklet list for an existing SL callback thunklet.  Nothing is
 * allocated; the search result is converted with get_segptr().
 */
SEGPTR WINAPI FindSLThunkletCallback( FARPROC target, DWORD relay )
{
    THUNKLET *candidate = (THUNKLET *)target;

    if (candidate
        && IsLSThunklet( candidate )
        && candidate->relay == relay
        && candidate->glue == (DWORD)ThunkletCallbackGlueLS - (DWORD)&candidate->type)
    {
        return (SEGPTR)candidate->target;
    }

    candidate = THUNK_FindThunklet( (DWORD)target, relay,
                                    (DWORD)ThunkletCallbackGlueSL,
                                    THUNKLET_TYPE_SL );
    return get_segptr( candidate );
}


/***********************************************************************
 *     FreeThunklet            (KERNEL.611)
 *
 * Not implemented: both arguments are ignored, nothing is freed and
 * FALSE is always returned.
 */
BOOL16 WINAPI FreeThunklet16( DWORD unused1, DWORD unused2 )
{
    const BOOL16 freed = FALSE;

    return freed;
}


/***********************************************************************
 * Callback Client API
 *
 * Callback clients are identified by a small integer ID that indexes
 * the two relay tables below.
 */

/* IDs in [N_CBC_FIXED, N_CBC_TOTAL) are the ones RegisterCBClient16
 * searches when asked for a free ID (-1), and the only ones
 * UnRegisterCBClient16 will release; lower IDs must be requested
 * explicitly. */
#define N_CBC_FIXED    20
#define N_CBC_VARIABLE 10
#define N_CBC_TOTAL    (N_CBC_FIXED + N_CBC_VARIABLE)

/* Per-ID relay tables: 16-bit side (segmented pointer to a table of
 * SEGPTR entries) and 32-bit side (pointer to a table of FARPROCs).
 * A zero 16-bit entry marks the ID as free. */
static SEGPTR CBClientRelay16[ N_CBC_TOTAL ];
static FARPROC *CBClientRelay32[ N_CBC_TOTAL ];

/***********************************************************************
 *     RegisterCBClient                    (KERNEL.619)
 */
1917
INT16 WINAPI RegisterCBClient16( INT16 wCBCId,
1918 1919 1920 1921 1922 1923 1924 1925 1926 1927 1928 1929 1930 1931 1932 1933 1934 1935 1936 1937 1938 1939 1940
                                 SEGPTR relay16, FARPROC *relay32 )
{
    /* Search for free Callback ID */
    if ( wCBCId == -1 )
        for ( wCBCId = N_CBC_FIXED; wCBCId < N_CBC_TOTAL; wCBCId++ )
            if ( !CBClientRelay16[ wCBCId ] )
                break;

    /* Register Callback ID */
    if ( wCBCId > 0 && wCBCId < N_CBC_TOTAL )
    {
        CBClientRelay16[ wCBCId ] = relay16;
        CBClientRelay32[ wCBCId ] = relay32;
    }
    else
        wCBCId = 0;

    return wCBCId;
}

/***********************************************************************
 *     UnRegisterCBClient                  (KERNEL.622)
 */
1941
INT16 WINAPI UnRegisterCBClient16( INT16 wCBCId,
1942 1943
                                   SEGPTR relay16, FARPROC *relay32 )
{
1944 1945
    if (    wCBCId >= N_CBC_FIXED && wCBCId < N_CBC_TOTAL
         && CBClientRelay16[ wCBCId ] == relay16
1946 1947 1948 1949 1950 1951 1952 1953 1954 1955 1956 1957 1958 1959 1960 1961 1962 1963
         && CBClientRelay32[ wCBCId ] == relay32 )
    {
        CBClientRelay16[ wCBCId ] = 0;
        CBClientRelay32[ wCBCId ] = 0;
    }
    else
        wCBCId = 0;

    return wCBCId;
}


/***********************************************************************
 *     InitCBClient                        (KERNEL.623)
 *
 * Install the callback glue pair: the caller supplies the LS glue, and
 * the SL glue is KERNEL ordinal 604 (CBClientGlueSL).
 */
void WINAPI InitCBClient16( FARPROC glueLS )
{
    SEGPTR glueSL = (SEGPTR)GetProcAddress16( GetModuleHandle16( "KERNEL" ),
                                              (LPCSTR)604 );

    SetThunkletCallbackGlue16( glueLS, glueSL );
}

/***********************************************************************
 *     CBClientGlueSL                      (KERNEL.604)
 *
 * Register-context entry point: saves bp/si/di/ds in a new 12-byte area
 * on the 16-bit stack, then redirects execution to an entry of the
 * 16-bit relay table registered for the callback client.
 */
void WINAPI CBClientGlueSL( CONTEXT86 *context )
{
    /* Create stack frame */
    SEGPTR frameSeg = stack16_push( 12 );
    LPWORD frame = MapSL( frameSeg );
    SEGPTR *relayTable;
    SEGPTR entry;

    /* Saved registers; CBClientThunkSLEx restores them from here */
    frame[0] = (WORD)context->SegDs;
    frame[1] = (WORD)context->Edi;
    frame[2] = (WORD)context->Esi;
    frame[3] = (WORD)context->Ebp;

    context->Ebp   = OFFSETOF( frameSeg ) + 6;
    context->Esp   = OFFSETOF( frameSeg ) - 4;
    context->SegGs = 0;

    /* Jump to 16-bit relay code: word 5 selects the client table,
     * word 4 the entry within it */
    relayTable = MapSL( CBClientRelay16[ frame[5] ] );
    entry = relayTable[ frame[4] ];
    context->SegCs = SELECTOROF( entry );
    context->Eip   = OFFSETOF  ( entry );
}

/***********************************************************************
 *     CBClientThunkSL                      (KERNEL.620)
 */
1998
extern DWORD CALL32_CBClient( FARPROC proc, LPWORD args, WORD *stackLin, DWORD *esi );
1999 2000 2001 2002
void WINAPI CBClientThunkSL( CONTEXT86 *context )
{
    /* Call 32-bit relay code */

2003
    LPWORD args = MapSL( MAKESEGPTR( context->SegSs, LOWORD(context->Ebp) ) );
2004 2005
    FARPROC proc = CBClientRelay32[ args[2] ][ args[1] ];

2006 2007 2008 2009 2010 2011 2012 2013 2014 2015 2016 2017
    /* fill temporary area for the asm code (see comments in winebuild) */
    SEGPTR stack = stack16_push( 12 );
    LPWORD stackLin = MapSL(stack);
    /* stackLin[0] and stackLin[1] reserved for the 32-bit stack ptr */
    stackLin[2] = wine_get_ss();
    stackLin[3] = 0;
    stackLin[4] = OFFSETOF(stack) + 12;
    stackLin[5] = SELECTOROF(stack);
    stackLin[6] = OFFSETOF(CALL32_CBClientEx_RetAddr);  /* overwrite return address */
    stackLin[7] = SELECTOROF(CALL32_CBClientEx_RetAddr);
    context->Eax = CALL32_CBClient( proc, args, stackLin + 4, &context->Esi );
    stack16_pop( 12 );
2018 2019 2020 2021 2022
}

/***********************************************************************
 *     CBClientThunkSLEx                    (KERNEL.621)
 */
2023
extern DWORD CALL32_CBClientEx( FARPROC proc, LPWORD args, WORD *stackLin, DWORD *esi, INT *nArgs );
2024 2025 2026 2027
void WINAPI CBClientThunkSLEx( CONTEXT86 *context )
{
    /* Call 32-bit relay code */

2028
    LPWORD args = MapSL( MAKESEGPTR( context->SegSs, LOWORD(context->Ebp) ) );
2029 2030 2031 2032
    FARPROC proc = CBClientRelay32[ args[2] ][ args[1] ];
    INT nArgs;
    LPWORD stackLin;

2033 2034 2035 2036 2037 2038 2039 2040 2041 2042 2043 2044 2045 2046 2047
    /* fill temporary area for the asm code (see comments in winebuild) */
    SEGPTR stack = stack16_push( 24 );
    stackLin = MapSL(stack);
    stackLin[0] = OFFSETOF(stack) + 4;
    stackLin[1] = SELECTOROF(stack);
    stackLin[2] = wine_get_ds();
    stackLin[5] = OFFSETOF(stack) + 24;
    /* stackLin[6] and stackLin[7] reserved for the 32-bit stack ptr */
    stackLin[8] = wine_get_ss();
    stackLin[9] = 0;
    stackLin[10] = OFFSETOF(CALL32_CBClientEx_RetAddr);
    stackLin[11] = SELECTOROF(CALL32_CBClientEx_RetAddr);

    context->Eax = CALL32_CBClientEx( proc, args, stackLin, &context->Esi, &nArgs );
    stack16_pop( 24 );
2048 2049 2050

    /* Restore registers saved by CBClientGlueSL */
    stackLin = (LPWORD)((LPBYTE)CURRENT_STACK16 + sizeof(STACK16FRAME) - 4);
2051
    context->Ebp = (context->Ebp & ~0xffff) | stackLin[3];
2052 2053
    context->Esi = (context->Esi & ~0xffff) | stackLin[2];
    context->Edi = (context->Edi & ~0xffff) | stackLin[1];
2054 2055
    context->SegDs = stackLin[0];
    context->Esp += 16+nArgs;
2056 2057

    /* Return to caller of CBClient thunklet */
2058 2059
    context->SegCs = stackLin[9];
    context->Eip   = stackLin[8];
2060 2061 2062 2063
}


/***********************************************************************
2064
 *           Get16DLLAddress       (KERNEL32.@)
2065 2066 2067 2068 2069
 *
 * This function is used by a Win32s DLL if it wants to call a Win16 function.
 * A 16:16 segmented pointer to the function is returned.
 * Written without any docu.
 */
2070
SEGPTR WINAPI Get16DLLAddress(HMODULE16 handle, LPSTR func_name)
2071 2072 2073 2074 2075 2076 2077
{
    static WORD code_sel32;
    FARPROC16 proc_16;
    LPBYTE thunk;

    if (!code_sel32)
    {
2078
        if (!ThunkletHeap) THUNK_Init();
2079
        code_sel32 = SELECTOR_AllocBlock( ThunkletHeap, 0x10000,
2080 2081 2082 2083 2084 2085 2086 2087 2088 2089 2090 2091 2092 2093 2094
                                          WINE_LDT_FLAGS_CODE | WINE_LDT_FLAGS_32BIT );
        if (!code_sel32) return 0;
    }
    if (!(thunk = HeapAlloc( ThunkletHeap, 0, 32 ))) return 0;

    if (!handle) handle = GetModuleHandle16("WIN32S16");
    proc_16 = GetProcAddress16(handle, func_name);

    /* movl proc_16, $edx */
    *thunk++ = 0xba;
    *(FARPROC16 *)thunk = proc_16;
    thunk += sizeof(FARPROC16);

     /* jmpl QT_Thunk */
    *thunk++ = 0xea;
2095
    *(FARPROC *)thunk = GetProcAddress(kernel32_handle,"QT_Thunk");
2096
    thunk += sizeof(FARPROC16);
2097
    *(WORD *)thunk = wine_get_cs();
2098 2099

    return MAKESEGPTR( code_sel32, (char *)thunk - (char *)ThunkletHeap );
2100 2101 2102 2103 2104 2105 2106
}


/***********************************************************************
 *		GetWin16DOSEnv			(KERNEL32.34)
 * Returns some internal value.... probably the default environment database?
 */
2107
DWORD WINAPI GetWin16DOSEnv(void)
2108 2109 2110 2111 2112 2113 2114 2115 2116 2117 2118 2119 2120 2121 2122 2123 2124 2125 2126
{
	FIXME("stub, returning 0\n");
	return 0;
}

/**********************************************************************
 *           GetPK16SysVar    (KERNEL32.92)
 *
 * Stub: logs a FIXME and returns the address of a static, zero-initialised
 * 128-byte buffer (the same buffer on every call).
 */
LPVOID WINAPI GetPK16SysVar(void)
{
    static BYTE PK16SysVar[128];
    LPVOID ret = PK16SysVar;

    FIXME("()\n");
    return ret;
}

/**********************************************************************
 *           CommonUnimpStub    (KERNEL32.17)
 */
2127
void WINAPI __regs_CommonUnimpStub( CONTEXT86 *context )
2128
{
2129
    FIXME("generic stub: %s\n", ((LPSTR)context->Eax ? (LPSTR)context->Eax : "?"));
2130

2131
    switch ((context->Ecx >> 4) & 0x0f)
2132
    {
2133 2134 2135 2136 2137
    case 15:  context->Eax = -1;   break;
    case 14:  context->Eax = 0x78; break;
    case 13:  context->Eax = 0x32; break;
    case 1:   context->Eax = 1;    break;
    default:  context->Eax = 0;    break;
2138 2139
    }

2140
    context->Esp += (context->Ecx & 0x0f) * 4;
2141
}
2142
#ifdef DEFINE_REGS_ENTRYPOINT
2143
DEFINE_REGS_ENTRYPOINT( CommonUnimpStub, 0, 0 )
2144
#endif
2145 2146 2147 2148 2149 2150 2151 2152 2153 2154 2155

/**********************************************************************
 *           HouseCleanLogicallyDeadHandles    (KERNEL32.33)
 *
 * Intentionally empty: takes no arguments, returns nothing and has no
 * effect.
 */
void WINAPI HouseCleanLogicallyDeadHandles(void)
{
    /* Whatever this is supposed to do, our handles probably
       don't need it :-) */
}

/**********************************************************************
 *		@ (KERNEL32.100)
 *
 * Stub: logs its three arguments and reports success.
 */
BOOL WINAPI _KERNEL32_100(HANDLE threadid,DWORD exitcode,DWORD x)
{
    const BOOL ok = TRUE;

    FIXME("(%p,%d,0x%08x): stub\n",threadid,exitcode,x);
    return ok;
}

/**********************************************************************
 *		@ (KERNEL32.99)
 *
 * Checks whether the clock has to be switched from daylight
 * savings time to standard time or vice versa.
 *
 * Stub: logs its argument and always returns 1.
 */
DWORD WINAPI _KERNEL32_99(DWORD x)
{
    const DWORD ret = 1;

    FIXME("(0x%08x): stub\n",x);
    return ret;
}


/**********************************************************************
 *	     Catch    (KERNEL.55)
 *
 * Real prototype is:
 *   INT16 WINAPI Catch( LPCATCHBUF lpbuf );
 *
 * Saves the 16-bit execution state from 'context' into the 9-word catch
 * buffer and makes the call return 0 in ax.
 *
 * Buffer layout (same as Windows):
 *   lpbuf[0] = ip      lpbuf[3] = bp      lpbuf[6] = ds
 *   lpbuf[1] = cs      lpbuf[4] = si      lpbuf[7] = unused
 *   lpbuf[2] = sp      lpbuf[5] = di      lpbuf[8] = ss
 *
 * The stack segment is recorded, but Throw16 only compares it against
 * the current ss and does not switch stacks.
 */
void WINAPI Catch16( LPCATCHBUF lpbuf, CONTEXT86 *context )
{
    /* return address */
    lpbuf[1] = context->SegCs;
    lpbuf[0] = LOWORD(context->Eip);

    /* Windows pushes 4 more words before saving sp */
    lpbuf[2] = LOWORD(context->Esp) - 4 * sizeof(WORD);
    lpbuf[8] = context->SegSs;

    /* remaining registers */
    lpbuf[3] = LOWORD(context->Ebp);
    lpbuf[4] = LOWORD(context->Esi);
    lpbuf[5] = LOWORD(context->Edi);
    lpbuf[6] = context->SegDs;
    lpbuf[7] = 0;

    context->Eax &= ~0xffff;  /* Return 0 */
}


/**********************************************************************
 *	     Throw    (KERNEL.56)
 *
 * Real prototype is:
 *   INT16 WINAPI Throw( LPCATCHBUF lpbuf, INT16 retval );
 *
 * Restores the 16-bit state saved by Catch16 from 'lpbuf' into 'context'
 * with 'retval' in ax, after unwinding the 32-bit frames that lie
 * between the current position and the saved stack pointer.
 */
void WINAPI Throw16( LPCATCHBUF lpbuf, INT16 retval, CONTEXT86 *context )
{
    STACK16FRAME *cur16 = CURRENT_STACK16;
    STACK32FRAME *f32;

    context->Eax = (context->Eax & ~0xffff) | (WORD)retval;

    /* Find the frame32 corresponding to the frame16 we are jumping to */
    for (f32 = cur16->frame32;
         f32 && f32->frame16;
         f32 = ((STACK16FRAME *)MapSL(f32->frame16))->frame32)
    {
        if (OFFSETOF(f32->frame16) < OFFSETOF(NtCurrentTeb()->WOW32Reserved))
            break;  /* Something strange is going on */
        if (OFFSETOF(f32->frame16) > lpbuf[2])
        {
            /* We found the right frame */
            cur16->frame32 = f32;
            break;
        }
    }
    RtlUnwind( &cur16->frame32->frame, NULL, NULL, 0 );

    /* Reload the registers recorded by Catch16 */
    context->Eip    = lpbuf[0];
    context->SegCs  = lpbuf[1];
    context->Esp    = lpbuf[2] + 4 * sizeof(WORD) - sizeof(WORD) /*extra arg*/;
    context->Ebp    = lpbuf[3];
    context->Esi    = lpbuf[4];
    context->Edi    = lpbuf[5];
    context->SegDs  = lpbuf[6];

    if (lpbuf[8] != context->SegSs)
        ERR("Switching stack segment with Throw() not supported; expect crash now\n" );
}