// // visit_vector_type // void Stub_Attribute_Generator:: visit_vector_type (const OASIS_PDL_Vector_Type & v) { // Declaration and implementation of the setter/getter methods // specific to structure types this->hfile_ << stub_return_t (&v) << " " << this->member_name_ << " (void);" << "const " << stub_return_t (&v) << " " << this->member_name_ << " (void) const;"; // Implementation of the setter/getter methods for structure types. this->cppfile_ << function_header (this->member_name_) << "const " << stub_return_t (&v) << " " << this->probe_->name () << "::" << this->member_name_ << " (void) const" << "{" << "return this->" << this->member_name_ << "_;" << "}" << function_header (this->member_name_) << stub_return_t (&v) << " " << this->probe_->name () << "::" << this->member_name_ << " (void)" << "{" << "return this->" << this->member_name_ << "_;" << "}"; }
// // visit_probe // void Stub_Dump_Generator::visit_probe (const OASIS_PDL_Probe & p) { // Make sure we know the base probe type. const std::string base_probe = p.has_base_probe () ? ("::" + p.base_probe ()->fq_name ("::")) : "::OASIS::Software_Probe"; const std::string & name = p.name (); this->hfile_ << std::endl << "public:" << std::endl << "/// Stub_Dump the software probe's data." << std::endl << "virtual void dump (std::ostream & output);" << std::endl; // Implementation of the dump method. this->cppfile_ << function_header ("dump") << "void " << name << "::" << "dump (std::ostream & output) {" << base_probe << "::dump (output);"; if (!p.members ().empty ()) { Stub_Dump_Variable_Generator var_gen (this->hfile_, this->cppfile_); var_gen.parent_is_probe (true); std::vector <OASIS_PDL_Complex_Type_Member *>::const_iterator iter = p.members ().begin (), iter_end = p.members ().end (); for (; iter != iter_end; ++ iter) { var_gen.name ((*iter)->name ()); // Call accept on the actual child type (*iter)->type ()->accept (var_gen); } } this->cppfile_ << "}"; }
// // visit_struct // void Package_Data_Generator::visit_struct (const OASIS_PDL_Struct & s) { this->hfile_ << "/// Package the software probe's data." << std::endl << "int package_data (::OASIS::Software_Probe_Data_Packager * p);" << std::endl; this->cppfile_ << function_header ("package_data") << "int " << s.fq_name ("::") << "Impl::package_data (::OASIS::Software_Probe_Data_Packager * p) {"; this->var_suffix_ = ""; std::for_each (s.members ().begin (), s.members ().end (), boost::bind (&OASIS_PDL_Complex_Type_Member::accept, _1, boost::ref (*this))); this->cppfile_ << "return 0;" << "}"; }
// // visit_probe // void Package_Data_Generator::visit_probe (const OASIS_PDL_Probe & p) { const std::string name = p.name (); // Make sure we know the base probe type. std::string base_probe = p.has_base_probe () ? ("::" + p.base_probe ()->fq_name ("::") + "Impl") : "::OASIS::Software_Probe_Impl"; this->hfile_ << std::endl << "/// Package the software probe's data." << std::endl << "protected:" << std::endl << "virtual int package_data (::OASIS::Software_Probe_Data_Packager * p);" << std::endl; // Implement the package data method. this->cppfile_ << function_header ("package_data") << "int " << name << "Impl::package_data (::OASIS::Software_Probe_Data_Packager * p) {" << "if (0 != " << base_probe << "::package_data (p))" << std::endl << " ACE_ERROR_RETURN ((LM_ERROR," << std::endl << "ACE_TEXT (\"%T (%t) - %M - failed to package data\\n\"))," << std::endl << "-1);"; this->var_suffix_ = "_"; std::for_each (p.members ().begin (), p.members ().end (), boost::bind (&OASIS_PDL_Complex_Type_Member::accept, _1, boost::ref (*this))); this->cppfile_ << "return 0;" << "}"; }
/******************************************************************* * BuildCallTo32CBClient * * Call a CBClient relay stub from 32-bit code (KERNEL.620). * * Since the relay stub is itself 32-bit, this should not be a problem; * unfortunately, the relay stubs are expected to switch back to a * 16-bit stack (and 16-bit code) after completion :-( * * This would conflict with our 16- vs. 32-bit stack handling, so * we simply switch *back* to our 32-bit stack before returning to * the caller ... * * The CBClient relay stub expects to be called with the following * 16-bit stack layout, and with ebp and ebx pointing into the 16-bit * stack at the designated places: * * ... * (ebp+14) original arguments to the callback routine * (ebp+10) far return address to original caller * (ebp+6) Thunklet target address * (ebp+2) Thunklet relay ID code * (ebp) BP (saved by CBClientGlueSL) * (ebp-2) SI (saved by CBClientGlueSL) * (ebp-4) DI (saved by CBClientGlueSL) * (ebp-6) DS (saved by CBClientGlueSL) * * ... buffer space used by the 16-bit side glue for temp copies * * (ebx+4) far return address to 16-bit side glue code * (ebx) saved 16-bit ss:sp (pointing to ebx+4) * * The 32-bit side glue code accesses both the original arguments (via ebp) * and the temporary copies prepared by the 16-bit side glue (via ebx). * After completion, the stub will load ss:sp from the buffer at ebx * and perform a far return to 16-bit code. * * To trick the relay stub into returning to us, we replace the 16-bit * return address to the glue code by a cs:ip pair pointing to our * return entry point (the original return address is saved first). * Our return stub thus called will then reload the 32-bit ss:esp and * return to 32-bit code (by using and ss:esp value that we have also * pushed onto the 16-bit stack before and a cs:eip values found at * that position on the 32-bit stack). The ss:esp to be restored is * found relative to the 16-bit stack pointer at: * * (ebx-4) ss (flat) * (ebx-8) sp (32-bit stack pointer) * * The second variant of this routine, CALL32_CBClientEx, which is used * to implement KERNEL.621, has to cope with yet another problem: Here, * the 32-bit side directly returns to the caller of the CBClient thunklet, * restoring registers saved by CBClientGlueSL and cleaning up the stack. * As we have to return to our 32-bit code first, we have to adapt the * layout of our temporary area so as to include values for the registers * that are to be restored, and later (in the implementation of KERNEL.621) * we *really* restore them. The return stub restores DS, DI, SI, and BP * from the stack, skips the next 8 bytes (CBClient relay code / target), * and then performs a lret NN, where NN is the number of arguments to be * removed. Thus, we prepare our temporary area as follows: * * (ebx+22) 16-bit cs (this segment) * (ebx+20) 16-bit ip ('16-bit' return entry point) * (ebx+16) 32-bit ss (flat) * (ebx+12) 32-bit sp (32-bit stack pointer) * (ebx+10) 16-bit bp (points to ebx+24) * (ebx+8) 16-bit si (ignored) * (ebx+6) 16-bit di (ignored) * (ebx+4) 16-bit ds (we actually use the flat DS here) * (ebx+2) 16-bit ss (16-bit stack segment) * (ebx+0) 16-bit sp (points to ebx+4) * * Note that we ensure that DS is not changed and remains the flat segment, * and the 32-bit stack pointer our own return stub needs fits just * perfectly into the 8 bytes that are skipped by the Windows stub. * One problem is that we have to determine the number of removed arguments, * as these have to be really removed in KERNEL.621. Thus, the BP value * that we place in the temporary area to be restored, contains the value * that SP would have if no arguments were removed. By comparing the actual * value of SP with this value in our return stub we can compute the number * of removed arguments. This is then returned to KERNEL.621. * * The stack layout of this function: * (ebp+20) nArgs pointer to variable receiving nr. of args (Ex only) * (ebp+16) esi pointer to caller's esi value * (ebp+12) arg ebp value to be set for relay stub * (ebp+8) func CBClient relay stub address * (ebp+4) ret addr * (ebp) ebp */ static void BuildCallTo32CBClient( int isEx ) { function_header( isEx ? "CALL32_CBClientEx" : "CALL32_CBClient" ); /* Entry code */ output_cfi( ".cfi_startproc" ); output( "\tpushl %%ebp\n" ); output_cfi( ".cfi_adjust_cfa_offset 4" ); output_cfi( ".cfi_rel_offset %%ebp,0" ); output( "\tmovl %%esp,%%ebp\n" ); output_cfi( ".cfi_def_cfa_register %%ebp" ); output( "\tpushl %%edi\n" ); output_cfi( ".cfi_rel_offset %%edi,-4" ); output( "\tpushl %%esi\n" ); output_cfi( ".cfi_rel_offset %%esi,-8" ); output( "\tpushl %%ebx\n" ); output_cfi( ".cfi_rel_offset %%ebx,-12" ); /* Get pointer to temporary area and save the 32-bit stack pointer */ output( "\tmovl 16(%%ebp), %%ebx\n" ); output( "\tleal -8(%%esp), %%eax\n" ); if ( !isEx ) output( "\tmovl %%eax, -8(%%ebx)\n" ); else output( "\tmovl %%eax, 12(%%ebx)\n" ); /* Set up registers and call CBClient relay stub (simulating a far call) */ output( "\tmovl 20(%%ebp), %%esi\n" ); output( "\tmovl (%%esi), %%esi\n" ); output( "\tmovl 8(%%ebp), %%eax\n" ); output( "\tmovl 12(%%ebp), %%ebp\n" ); output( "\tpushl %%cs\n" ); output( "\tcall *%%eax\n" ); /* Return new esi value to caller */ output( "\tmovl 32(%%esp), %%edi\n" ); output( "\tmovl %%esi, (%%edi)\n" ); /* Return argument size to caller */ if ( isEx ) { output( "\tmovl 36(%%esp), %%ebx\n" ); output( "\tmovl %%ebp, (%%ebx)\n" ); } /* Restore registers and return */ output( "\tpopl %%ebx\n" ); output_cfi( ".cfi_same_value %%ebx" ); output( "\tpopl %%esi\n" ); output_cfi( ".cfi_same_value %%esi" ); output( "\tpopl %%edi\n" ); output_cfi( ".cfi_same_value %%edi" ); output( "\tpopl %%ebp\n" ); output_cfi( ".cfi_def_cfa %%esp,4" ); output_cfi( ".cfi_same_value %%ebp" ); output( "\tret\n" ); output_cfi( ".cfi_endproc" ); output_function_size( isEx ? "CALL32_CBClientEx" : "CALL32_CBClient" ); /* '16-bit' return stub */ function_header( isEx ? "CALL32_CBClientEx_Ret" : "CALL32_CBClient_Ret" ); if ( !isEx ) { output( "\tmovzwl %%sp, %%ebx\n" ); output( "\tlssl %%ss:-16(%%ebx), %%esp\n" ); } else { output( "\tmovzwl %%bp, %%ebx\n" ); output( "\tsubw %%bp, %%sp\n" ); output( "\tmovzwl %%sp, %%ebp\n" ); output( "\tlssl %%ss:-12(%%ebx), %%esp\n" ); } output( "\tlret\n" ); output_function_size( isEx ? "CALL32_CBClientEx_Ret" : "CALL32_CBClient_Ret" ); }
/******************************************************************* * BuildCallTo16Core * * This routine builds the core routines used in 32->16 thunks: * * extern DWORD WINAPI wine_call_to_16( FARPROC16 target, DWORD cbArgs, PEXCEPTION_HANDLER handler ); * extern void WINAPI wine_call_to_16_regs( CONTEXT86 *context, DWORD cbArgs, PEXCEPTION_HANDLER handler ); * * These routines can be called directly from 32-bit code. * * All routines expect that the 16-bit stack contents (arguments) and the * return address (segptr to CallTo16_Ret) were already set up by the * caller; nb_args must contain the number of bytes to be conserved. The * 16-bit SS:SP will be set accordingly. * * All other registers are either taken from the CONTEXT86 structure * or else set to default values. The target routine address is either * given directly or taken from the CONTEXT86. */ static void BuildCallTo16Core( int reg_func ) { const char *name = reg_func ? "wine_call_to_16_regs" : "wine_call_to_16"; /* Function header */ function_header( name ); /* Function entry sequence */ output_cfi( ".cfi_startproc" ); output( "\tpushl %%ebp\n" ); output_cfi( ".cfi_adjust_cfa_offset 4" ); output_cfi( ".cfi_rel_offset %%ebp,0" ); output( "\tmovl %%esp, %%ebp\n" ); output_cfi( ".cfi_def_cfa_register %%ebp" ); /* Save the 32-bit registers */ output( "\tpushl %%ebx\n" ); output_cfi( ".cfi_rel_offset %%ebx,-4" ); output( "\tpushl %%esi\n" ); output_cfi( ".cfi_rel_offset %%esi,-8" ); output( "\tpushl %%edi\n" ); output_cfi( ".cfi_rel_offset %%edi,-12" ); output( "\t.byte 0x64\n\tmov %%gs,(%d)\n", GS_OFFSET ); /* Setup exception frame */ output( "\t.byte 0x64\n\tpushl (%d)\n", STACKOFFSET ); output( "\tpushl 16(%%ebp)\n" ); /* handler */ output( "\t.byte 0x64\n\tpushl (0)\n" ); output( "\t.byte 0x64\n\tmovl %%esp,(0)\n" ); /* Call the actual CallTo16 routine (simulate a lcall) */ output( "\tpushl %%cs\n" ); output( "\tcall .L%s\n", name ); /* Remove exception frame */ output( "\t.byte 0x64\n\tpopl (0)\n" ); output( "\taddl $4, %%esp\n" ); output( "\t.byte 0x64\n\tpopl (%d)\n", STACKOFFSET ); if ( !reg_func ) { /* Convert return value */ output( "\tandl $0xffff,%%eax\n" ); output( "\tshll $16,%%edx\n" ); output( "\torl %%edx,%%eax\n" ); } else { /* * Modify CONTEXT86 structure to contain new values * * NOTE: We restore only EAX, EBX, EDX, EDX, EBP, and ESP. * The segment registers as well as ESI and EDI should * not be modified by a well-behaved 16-bit routine in * any case. [If necessary, we could restore them as well, * at the cost of a somewhat less efficient return path.] */ output( "\tmovl 0x14(%%esp),%%edi\n" ); /* FIELD_OFFSET(STACK32FRAME,target) - FIELD_OFFSET(STACK32FRAME,edi) */ /* everything above edi has been popped already */ output( "\tmovl %%eax,0xb0(%%edi)\n"); /* Eax */ output( "\tmovl %%ebx,0xa4(%%edi)\n"); /* Ebx */ output( "\tmovl %%ecx,0xac(%%edi)\n"); /* Ecx */ output( "\tmovl %%edx,0xa8(%%edi)\n"); /* Edx */ output( "\tmovl %%ebp,0xb4(%%edi)\n"); /* Ebp */ output( "\tmovl %%esi,0xc4(%%edi)\n"); /* Esp */ /* The return glue code saved %esp into %esi */ } /* Restore the 32-bit registers */ output( "\tpopl %%edi\n" ); output_cfi( ".cfi_same_value %%edi" ); output( "\tpopl %%esi\n" ); output_cfi( ".cfi_same_value %%esi" ); output( "\tpopl %%ebx\n" ); output_cfi( ".cfi_same_value %%ebx" ); /* Function exit sequence */ output( "\tpopl %%ebp\n" ); output_cfi( ".cfi_def_cfa %%esp,4" ); output_cfi( ".cfi_same_value %%ebp" ); output( "\tret $12\n" ); output_cfi( ".cfi_endproc" ); /* Start of the actual CallTo16 routine */ output( ".L%s:\n", name ); /* Switch to the 16-bit stack */ output( "\tmovl %%esp,%%edx\n" ); output( "\t.byte 0x64\n\tmovw (%d),%%ss\n", STACKOFFSET + 2); output( "\t.byte 0x64\n\tmovw (%d),%%sp\n", STACKOFFSET ); output( "\t.byte 0x64\n\tmovl %%edx,(%d)\n", STACKOFFSET ); /* Make %bp point to the previous stackframe (built by CallFrom16) */ output( "\tmovzwl %%sp,%%ebp\n" ); output( "\tleal 0x2a(%%ebp),%%ebp\n"); /* FIELD_OFFSET(STACK16FRAME,bp) */ /* Add the specified offset to the new sp */ output( "\tsubw 0x2c(%%edx), %%sp\n"); /* FIELD_OFFSET(STACK32FRAME,nb_args) */ if (reg_func) { /* Push the called routine address */ output( "\tmovl 0x28(%%edx),%%edx\n"); /* FIELD_OFFSET(STACK32FRAME,target) */ output( "\tpushw 0xbc(%%edx)\n"); /* SegCs */ output( "\tpushw 0xb8(%%edx)\n"); /* Eip */ /* Get the registers */ output( "\tpushw 0x98(%%edx)\n"); /* SegDs */ output( "\tpushl 0x94(%%edx)\n"); /* SegEs */ output( "\tpopl %%es\n" ); output( "\tpushl 0x90(%%edx)\n"); /* SegFs */ output( "\tpopl %%fs\n" ); output( "\tpushl 0x8c(%%edx)\n"); /* SegGs */ output( "\tpopl %%gs\n" ); output( "\tmovl 0xb4(%%edx),%%ebp\n"); /* Ebp */ output( "\tmovl 0xa0(%%edx),%%esi\n"); /* Esi */ output( "\tmovl 0x9c(%%edx),%%edi\n"); /* Edi */ output( "\tmovl 0xb0(%%edx),%%eax\n"); /* Eax */ output( "\tmovl 0xa4(%%edx),%%ebx\n"); /* Ebx */ output( "\tmovl 0xac(%%edx),%%ecx\n"); /* Ecx */ output( "\tmovl 0xa8(%%edx),%%edx\n"); /* Edx */ /* Get the 16-bit ds */ output( "\tpopw %%ds\n" ); } else /* not a register function */ { /* Push the called routine address */ output( "\tpushl 0x28(%%edx)\n"); /* FIELD_OFFSET(STACK32FRAME,target) */ /* Set %fs and %gs to the value saved by the last CallFrom16 */ output( "\tpushw -22(%%ebp)\n" ); /* FIELD_OFFSET(STACK16FRAME,fs)-FIELD_OFFSET(STACK16FRAME,bp) */ output( "\tpopw %%fs\n" ); output( "\tpushw -20(%%ebp)\n" ); /* FIELD_OFFSET(STACK16FRAME,gs)-FIELD_OFFSET(STACK16FRAME,bp) */ output( "\tpopw %%gs\n" ); /* Set %ds and %es (and %ax just in case) equal to %ss */ output( "\tmovw %%ss,%%ax\n" ); output( "\tmovw %%ax,%%ds\n" ); output( "\tmovw %%ax,%%es\n" ); } /* Jump to the called routine */ output( "\t.byte 0x66\n" ); output( "\tlret\n" ); /* Function footer */ output_function_size( name ); }
/******************************************************************* * BuildCallFrom16Core * * This routine builds the core routines used in 16->32 thunks: * CallFrom16Word, CallFrom16Long, CallFrom16Register, and CallFrom16Thunk. * * These routines are intended to be called via a far call (with 32-bit * operand size) from 16-bit code. The 16-bit code stub must push %bp, * the 32-bit entry point to be called, and the argument conversion * routine to be used (see stack layout below). * * The core routine completes the STACK16FRAME on the 16-bit stack and * switches to the 32-bit stack. Then, the argument conversion routine * is called; it gets passed the 32-bit entry point and a pointer to the * 16-bit arguments (on the 16-bit stack) as parameters. (You can either * use conversion routines automatically generated by BuildCallFrom16, * or write your own for special purposes.) * * The conversion routine must call the 32-bit entry point, passing it * the converted arguments, and return its return value to the core. * After the conversion routine has returned, the core switches back * to the 16-bit stack, converts the return value to the DX:AX format * (CallFrom16Long), and returns to the 16-bit call stub. All parameters, * including %bp, are popped off the stack. * * The 16-bit call stub now returns to the caller, popping the 16-bit * arguments if necessary (pascal calling convention). * * In the case of a 'register' function, CallFrom16Register fills a * CONTEXT86 structure with the values all registers had at the point * the first instruction of the 16-bit call stub was about to be * executed. A pointer to this CONTEXT86 is passed as third parameter * to the argument conversion routine, which typically passes it on * to the called 32-bit entry point. * * CallFrom16Thunk is a special variant used by the implementation of * the Win95 16->32 thunk functions C16ThkSL and C16ThkSL01 and is * implemented as follows: * On entry, the EBX register is set up to contain a flat pointer to the * 16-bit stack such that EBX+22 points to the first argument. * Then, the entry point is called, while EBP is set up to point * to the return address (on the 32-bit stack). * The called function returns with CX set to the number of bytes * to be popped of the caller's stack. * * Stack layout upon entry to the core routine (STACK16FRAME): * ... ... * (sp+24) word first 16-bit arg * (sp+22) word cs * (sp+20) word ip * (sp+18) word bp * (sp+14) long 32-bit entry point (reused for Win16 mutex recursion count) * (sp+12) word ip of actual entry point (necessary for relay debugging) * (sp+8) long relay (argument conversion) function entry point * (sp+4) long cs of 16-bit entry point * (sp) long ip of 16-bit entry point * * Added on the stack: * (sp-2) word saved gs * (sp-4) word saved fs * (sp-6) word saved es * (sp-8) word saved ds * (sp-12) long saved ebp * (sp-16) long saved ecx * (sp-20) long saved edx * (sp-24) long saved previous stack */ static void BuildCallFrom16Core( int reg_func, int thunk ) { /* Function header */ if (thunk) function_header( "__wine_call_from_16_thunk" ); else if (reg_func) function_header( "__wine_call_from_16_regs" ); else function_header( "__wine_call_from_16" ); /* Create STACK16FRAME (except STACK32FRAME link) */ output( "\tpushw %%gs\n" ); output( "\tpushw %%fs\n" ); output( "\tpushw %%es\n" ); output( "\tpushw %%ds\n" ); output( "\tpushl %%ebp\n" ); output( "\tpushl %%ecx\n" ); output( "\tpushl %%edx\n" ); /* Save original EFlags register */ if (reg_func) output( "\tpushfl\n" ); if ( UsePIC ) { output( "\tcall 1f\n" ); output( "1:\tpopl %%ecx\n" ); output( "\t.byte 0x2e\n\tmovl %s-1b(%%ecx),%%edx\n", asm_name("CallTo16_DataSelector") ); } else output( "\t.byte 0x2e\n\tmovl %s,%%edx\n", asm_name("CallTo16_DataSelector") ); /* Load 32-bit segment registers */ output( "\tmovw %%dx, %%ds\n" ); output( "\tmovw %%dx, %%es\n" ); if ( UsePIC ) output( "\tmovw %s-1b(%%ecx), %%fs\n", asm_name("CallTo16_TebSelector") ); else output( "\tmovw %s, %%fs\n", asm_name("CallTo16_TebSelector") ); output( "\t.byte 0x64\n\tmov (%d),%%gs\n", GS_OFFSET ); /* Translate STACK16FRAME base to flat offset in %edx */ output( "\tmovw %%ss, %%dx\n" ); output( "\tandl $0xfff8, %%edx\n" ); output( "\tshrl $1, %%edx\n" ); if (UsePIC) { output( "\taddl wine_ldt_copy_ptr-1b(%%ecx),%%edx\n" ); output( "\tmovl (%%edx), %%edx\n" ); } else output( "\tmovl %s(%%edx), %%edx\n", asm_name("wine_ldt_copy") ); output( "\tmovzwl %%sp, %%ebp\n" ); output( "\tleal %d(%%ebp,%%edx), %%edx\n", reg_func ? 0 : -4 ); /* Get saved flags into %ecx */ if (reg_func) output( "\tpopl %%ecx\n" ); /* Get the 32-bit stack pointer from the TEB and complete STACK16FRAME */ output( "\t.byte 0x64\n\tmovl (%d), %%ebp\n", STACKOFFSET ); output( "\tpushl %%ebp\n" ); /* Switch stacks */ output( "\t.byte 0x64\n\tmovw %%ss, (%d)\n", STACKOFFSET + 2 ); output( "\t.byte 0x64\n\tmovw %%sp, (%d)\n", STACKOFFSET ); output( "\tpushl %%ds\n" ); output( "\tpopl %%ss\n" ); output( "\tmovl %%ebp, %%esp\n" ); output( "\taddl $0x20,%%ebp\n"); /* FIELD_OFFSET(STACK32FRAME,ebp) */ /* At this point: STACK16FRAME is completely set up DS, ES, SS: flat data segment FS: current TEB ESP: points to last STACK32FRAME EBP: points to ebp member of last STACK32FRAME EDX: points to current STACK16FRAME ECX: contains saved flags all other registers: unchanged */ /* Special case: C16ThkSL stub */ if ( thunk ) { /* Set up registers as expected and call thunk */ output( "\tleal 0x1a(%%edx),%%ebx\n" ); /* sizeof(STACK16FRAME)-22 */ output( "\tleal -4(%%esp), %%ebp\n" ); output( "\tcall *0x26(%%edx)\n"); /* FIELD_OFFSET(STACK16FRAME,entry_point) */ /* Switch stack back */ output( "\t.byte 0x64\n\tmovw (%d), %%ss\n", STACKOFFSET+2 ); output( "\t.byte 0x64\n\tmovzwl (%d), %%esp\n", STACKOFFSET ); output( "\t.byte 0x64\n\tpopl (%d)\n", STACKOFFSET ); /* Restore registers and return directly to caller */ output( "\taddl $8, %%esp\n" ); output( "\tpopl %%ebp\n" ); output( "\tpopw %%ds\n" ); output( "\tpopw %%es\n" ); output( "\tpopw %%fs\n" ); output( "\tpopw %%gs\n" ); output( "\taddl $20, %%esp\n" ); output( "\txorb %%ch, %%ch\n" ); output( "\tpopl %%ebx\n" ); output( "\taddw %%cx, %%sp\n" ); output( "\tpush %%ebx\n" ); output( "\t.byte 0x66\n" ); output( "\tlret\n" ); output_function_size( "__wine_call_from_16_thunk" ); return; } /* Build register CONTEXT */ if ( reg_func ) { output( "\tsubl $0x2cc,%%esp\n" ); /* sizeof(CONTEXT86) */ output( "\tmovl %%ecx,0xc0(%%esp)\n" ); /* EFlags */ output( "\tmovl %%eax,0xb0(%%esp)\n" ); /* Eax */ output( "\tmovl %%ebx,0xa4(%%esp)\n" ); /* Ebx */ output( "\tmovl %%esi,0xa0(%%esp)\n" ); /* Esi */ output( "\tmovl %%edi,0x9c(%%esp)\n" ); /* Edi */ output( "\tmovl 0x0c(%%edx),%%eax\n"); /* FIELD_OFFSET(STACK16FRAME,ebp) */ output( "\tmovl %%eax,0xb4(%%esp)\n" ); /* Ebp */ output( "\tmovl 0x08(%%edx),%%eax\n"); /* FIELD_OFFSET(STACK16FRAME,ecx) */ output( "\tmovl %%eax,0xac(%%esp)\n" ); /* Ecx */ output( "\tmovl 0x04(%%edx),%%eax\n"); /* FIELD_OFFSET(STACK16FRAME,edx) */ output( "\tmovl %%eax,0xa8(%%esp)\n" ); /* Edx */ output( "\tmovzwl 0x10(%%edx),%%eax\n"); /* FIELD_OFFSET(STACK16FRAME,ds) */ output( "\tmovl %%eax,0x98(%%esp)\n" ); /* SegDs */ output( "\tmovzwl 0x12(%%edx),%%eax\n"); /* FIELD_OFFSET(STACK16FRAME,es) */ output( "\tmovl %%eax,0x94(%%esp)\n" ); /* SegEs */ output( "\tmovzwl 0x14(%%edx),%%eax\n"); /* FIELD_OFFSET(STACK16FRAME,fs) */ output( "\tmovl %%eax,0x90(%%esp)\n" ); /* SegFs */ output( "\tmovzwl 0x16(%%edx),%%eax\n"); /* FIELD_OFFSET(STACK16FRAME,gs) */ output( "\tmovl %%eax,0x8c(%%esp)\n" ); /* SegGs */ output( "\tmovzwl 0x2e(%%edx),%%eax\n"); /* FIELD_OFFSET(STACK16FRAME,cs) */ output( "\tmovl %%eax,0xbc(%%esp)\n" ); /* SegCs */ output( "\tmovzwl 0x2c(%%edx),%%eax\n"); /* FIELD_OFFSET(STACK16FRAME,ip) */ output( "\tmovl %%eax,0xb8(%%esp)\n" ); /* Eip */ output( "\t.byte 0x64\n\tmovzwl (%d), %%eax\n", STACKOFFSET+2 ); output( "\tmovl %%eax,0xc8(%%esp)\n" ); /* SegSs */ output( "\t.byte 0x64\n\tmovzwl (%d), %%eax\n", STACKOFFSET ); output( "\taddl $0x2c,%%eax\n"); /* FIELD_OFFSET(STACK16FRAME,ip) */ output( "\tmovl %%eax,0xc4(%%esp)\n" ); /* Esp */ #if 0 output( "\tfsave 0x1c(%%esp)\n" ); /* FloatSave */ #endif /* Push address of CONTEXT86 structure -- popped by the relay routine */ output( "\tmovl %%esp,%%eax\n" ); output( "\tandl $~15,%%esp\n" ); output( "\tsubl $4,%%esp\n" ); output( "\tpushl %%eax\n" ); } else { output( "\tsubl $8,%%esp\n" ); output( "\tandl $~15,%%esp\n" ); output( "\taddl $8,%%esp\n" ); } /* Call relay routine (which will call the API entry point) */ output( "\tleal 0x30(%%edx),%%eax\n" ); /* sizeof(STACK16FRAME) */ output( "\tpushl %%eax\n" ); output( "\tpushl 0x26(%%edx)\n"); /* FIELD_OFFSET(STACK16FRAME,entry_point) */ output( "\tcall *0x20(%%edx)\n"); /* FIELD_OFFSET(STACK16FRAME,relay) */ if ( reg_func ) { output( "\tleal -748(%%ebp),%%ebx\n" ); /* sizeof(CONTEXT) + FIELD_OFFSET(STACK32FRAME,ebp) */ /* Switch stack back */ output( "\t.byte 0x64\n\tmovw (%d), %%ss\n", STACKOFFSET+2 ); output( "\t.byte 0x64\n\tmovzwl (%d), %%esp\n", STACKOFFSET ); output( "\t.byte 0x64\n\tpopl (%d)\n", STACKOFFSET ); /* Get return address to CallFrom16 stub */ output( "\taddw $0x14,%%sp\n" ); /* FIELD_OFFSET(STACK16FRAME,callfrom_ip)-4 */ output( "\tpopl %%eax\n" ); output( "\tpopl %%edx\n" ); /* Restore all registers from CONTEXT */ output( "\tmovw 0xc8(%%ebx),%%ss\n"); /* SegSs */ output( "\tmovl 0xc4(%%ebx),%%esp\n"); /* Esp */ output( "\taddl $4, %%esp\n" ); /* room for final return address */ output( "\tpushw 0xbc(%%ebx)\n"); /* SegCs */ output( "\tpushw 0xb8(%%ebx)\n"); /* Eip */ output( "\tpushl %%edx\n" ); output( "\tpushl %%eax\n" ); output( "\tpushl 0xc0(%%ebx)\n"); /* EFlags */ output( "\tpushl 0x98(%%ebx)\n"); /* SegDs */ output( "\tpushl 0x94(%%ebx)\n"); /* SegEs */ output( "\tpopl %%es\n" ); output( "\tpushl 0x90(%%ebx)\n"); /* SegFs */ output( "\tpopl %%fs\n" ); output( "\tpushl 0x8c(%%ebx)\n"); /* SegGs */ output( "\tpopl %%gs\n" ); output( "\tmovl 0xb4(%%ebx),%%ebp\n"); /* Ebp */ output( "\tmovl 0xa0(%%ebx),%%esi\n"); /* Esi */ output( "\tmovl 0x9c(%%ebx),%%edi\n"); /* Edi */ output( "\tmovl 0xb0(%%ebx),%%eax\n"); /* Eax */ output( "\tmovl 0xa8(%%ebx),%%edx\n"); /* Edx */ output( "\tmovl 0xac(%%ebx),%%ecx\n"); /* Ecx */ output( "\tmovl 0xa4(%%ebx),%%ebx\n"); /* Ebx */ output( "\tpopl %%ds\n" ); output( "\tpopfl\n" ); output( "\tlret\n" ); output_function_size( "__wine_call_from_16_regs" ); } else { /* Switch stack back */ output( "\t.byte 0x64\n\tmovw (%d), %%ss\n", STACKOFFSET+2 ); output( "\t.byte 0x64\n\tmovzwl (%d), %%esp\n", STACKOFFSET ); output( "\t.byte 0x64\n\tpopl (%d)\n", STACKOFFSET ); /* Restore registers */ output( "\tpopl %%edx\n" ); output( "\tpopl %%ecx\n" ); output( "\tpopl %%ebp\n" ); output( "\tpopw %%ds\n" ); output( "\tpopw %%es\n" ); output( "\tpopw %%fs\n" ); output( "\tpopw %%gs\n" ); /* Return to return stub which will return to caller */ output( "\tlret $12\n" ); output_function_size( "__wine_call_from_16" ); } }
/******************************************************************* * BuildCallFrom32Regs * * Build a 32-bit-to-Wine call-back function for a 'register' function. * 'args' is the number of dword arguments. * * Stack layout: * ... * (ebp+20) first arg * (ebp+16) ret addr to user code * (ebp+12) func to call * (ebp+8) number of args * (ebp+4) ret addr to relay code * (ebp+0) saved ebp * (ebp-128) buffer area to allow stack frame manipulation * (ebp-332) CONTEXT86 struct * (ebp-336) CONTEXT86 *argument * .... other arguments copied from (ebp+12) * * The entry point routine is called with a CONTEXT* extra argument, * following the normal args. In this context structure, EIP_reg * contains the return address to user code, and ESP_reg the stack * pointer on return (with the return address and arguments already * removed). */ static void BuildCallFrom32Regs( FILE *outfile ) { static const int STACK_SPACE = 128 + sizeof(CONTEXT86); /* Function header */ function_header( outfile, "__wine_call_from_32_regs" ); /* Allocate some buffer space on the stack */ fprintf( outfile, "\tpushl %%ebp\n" ); fprintf( outfile, "\tmovl %%esp,%%ebp\n "); fprintf( outfile, "\tleal -%d(%%esp), %%esp\n", STACK_SPACE ); /* Build the context structure */ fprintf( outfile, "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(Eax) - STACK_SPACE ); fprintf( outfile, "\tpushfl\n" ); fprintf( outfile, "\tpopl %%eax\n" ); fprintf( outfile, "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(EFlags) - STACK_SPACE ); fprintf( outfile, "\tmovl 0(%%ebp),%%eax\n" ); fprintf( outfile, "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(Ebp) - STACK_SPACE ); fprintf( outfile, "\tmovl %%ebx,%d(%%ebp)\n", CONTEXTOFFSET(Ebx) - STACK_SPACE ); fprintf( outfile, "\tmovl %%ecx,%d(%%ebp)\n", CONTEXTOFFSET(Ecx) - STACK_SPACE ); fprintf( outfile, "\tmovl %%edx,%d(%%ebp)\n", CONTEXTOFFSET(Edx) - STACK_SPACE ); fprintf( outfile, "\tmovl %%esi,%d(%%ebp)\n", CONTEXTOFFSET(Esi) - STACK_SPACE ); fprintf( outfile, "\tmovl %%edi,%d(%%ebp)\n", CONTEXTOFFSET(Edi) - STACK_SPACE ); fprintf( outfile, "\txorl %%eax,%%eax\n" ); fprintf( outfile, "\tmovw %%cs,%%ax\n" ); fprintf( outfile, "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegCs) - STACK_SPACE ); fprintf( outfile, "\tmovw %%es,%%ax\n" ); fprintf( outfile, "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegEs) - STACK_SPACE ); fprintf( outfile, "\tmovw %%fs,%%ax\n" ); fprintf( outfile, "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegFs) - STACK_SPACE ); fprintf( outfile, "\tmovw %%gs,%%ax\n" ); fprintf( outfile, "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegGs) - STACK_SPACE ); fprintf( outfile, "\tmovw %%ss,%%ax\n" ); fprintf( outfile, "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegSs) - STACK_SPACE ); fprintf( outfile, "\tmovw %%ds,%%ax\n" ); fprintf( outfile, "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegDs) - STACK_SPACE ); fprintf( outfile, "\tmovw %%ax,%%es\n" ); /* set %es equal to %ds just in case */ fprintf( outfile, "\tmovl $0x%x,%%eax\n", CONTEXT86_FULL ); fprintf( outfile, "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(ContextFlags) - STACK_SPACE ); fprintf( outfile, "\tmovl 16(%%ebp),%%eax\n" ); /* Get %eip at time of call */ fprintf( outfile, "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(Eip) - STACK_SPACE ); /* Transfer the arguments */ fprintf( outfile, "\tmovl 8(%%ebp),%%ecx\n" ); /* fetch number of args to copy */ fprintf( outfile, "\tleal 4(,%%ecx,4),%%edx\n" ); /* add context arg */ fprintf( outfile, "\tsubl %%edx,%%esp\n" ); /* update stack pointer to create room for the copy of the args */ fprintf( outfile, "\tandl $~15,%%esp\n" ); /* and align it */ fprintf( outfile, "\tleal 20(%%ebp),%%esi\n" ); /* get %esp at time of call to get original args */ fprintf( outfile, "\tmovl %%esp,%%edi\n" ); /* get destination for args */ fprintf( outfile, "\ttest %%ecx,%%ecx\n" ); /* check if we have any args to copy */ fprintf( outfile, "\tjz 1f\n" ); fprintf( outfile, "\tcld\n" ); fprintf( outfile, "\trep\n\tmovsl\n" ); /* copy args */ fprintf( outfile, "1:\tleal %d(%%ebp),%%eax\n", -STACK_SPACE ); /* Get CONTEXT location */ fprintf( outfile, "\tmovl %%eax,(%%edi)\n" ); /* Put pointer to it as parameter */ fprintf( outfile, "\tmovl %%esi,%d(%%ebp)\n", CONTEXTOFFSET(Esp) - STACK_SPACE ); /* Call the entry point */ fprintf( outfile, "\tmovl 4(%%ebp),%%eax\n" ); /* get relay code addr */ fprintf( outfile, "\taddl 12(%%ebp),%%eax\n" ); /* add offset to function to call, since it's passed int as a relative address instead of absolute */ fprintf( outfile, "\tcall *%%eax\n" ); fprintf( outfile, "\tleal -%d(%%ebp),%%ebx\n", STACK_SPACE ); /* Stick pointer to the CONTEXT86 in ebx for ease of reading */ /* Restore all registers from CONTEXT */ fprintf( outfile, "2:\tpushl %d(%%ebx)\n", CONTEXTOFFSET(SegEs) ); fprintf( outfile, "\tpopl %%es\n" ); fprintf( outfile, "\tpushl %d(%%ebx)\n", CONTEXTOFFSET(SegFs) ); fprintf( outfile, "\tpopl %%fs\n" ); fprintf( outfile, "\tpushl %d(%%ebx)\n", CONTEXTOFFSET(SegGs) ); fprintf( outfile, "\tpopl %%gs\n" ); fprintf( outfile, "\tmovl %d(%%ebx),%%edi\n", CONTEXTOFFSET(Edi) ); fprintf( outfile, "\tmovl %d(%%ebx),%%esi\n", CONTEXTOFFSET(Esi) ); fprintf( outfile, "\tmovl %d(%%ebx),%%edx\n", CONTEXTOFFSET(Edx) ); fprintf( outfile, "\tmovl %d(%%ebx),%%ecx\n", CONTEXTOFFSET(Ecx) ); fprintf( outfile, "\tmovl %d(%%ebx),%%eax\n", CONTEXTOFFSET(Eax) ); fprintf( outfile, "\tmovl %d(%%ebx),%%ebp\n", CONTEXTOFFSET(Ebp) ); fprintf( outfile, "\tpushl %d(%%ebx)\n", CONTEXTOFFSET(SegSs) ); fprintf( outfile, "\tpopl %%ss\n" ); fprintf( outfile, "\tmovl %d(%%ebx),%%esp\n", CONTEXTOFFSET(Esp) ); fprintf( outfile, "\tpushl %d(%%ebx)\n", CONTEXTOFFSET(EFlags) ); fprintf( outfile, "\tpushl %d(%%ebx)\n", CONTEXTOFFSET(SegCs) ); fprintf( outfile, "\tpushl %d(%%ebx)\n", CONTEXTOFFSET(Eip) ); fprintf( outfile, "\tpushl %d(%%ebx)\n", CONTEXTOFFSET(SegDs) ); fprintf( outfile, "\tmovl %d(%%ebx),%%ebx\n", CONTEXTOFFSET(Ebx) ); fprintf( outfile, "\tpopl %%ds\n" ); fprintf( outfile, "\tiret\n" ); /* This entrypoint is called from dlls/ntdll/signal_i386.c as the cleanup after handling an exception, since it also needs thread state restored from a CONTEXT86 structure on the stack. However, the stack layout's different than __wine_call_from_32_regs, so we need to do a different adjustment to find the CONTEXT86 structure */ function_header( outfile, "__wine_ret_to_32_regs" ); /* don't use ebp for offsets, as we'll get a stack fault when we set %ss if it's a different value from the current one; ebx is safe, as we don't reset %ds until right at the end */ fprintf( outfile, "\tleal 4(%%esp),%%ebx\n" ); fprintf( outfile, "\tjmp 2b\n" ); }
/******************************************************************* * BuildCallTo16Core * * This routine builds the core routines used in 32->16 thunks: * * extern void WINAPI wine_call_to_16_word( SEGPTR target, int nb_args ); * extern void WINAPI wine_call_to_16_long( SEGPTR target, int nb_args ); * extern void WINAPI wine_call_to_16_regs_short( const CONTEXT86 *context, int nb_args ); * extern void WINAPI wine_call_to_16_regs_long ( const CONTEXT86 *context, int nb_args ); * * These routines can be called directly from 32-bit code. * * All routines expect that the 16-bit stack contents (arguments) were * already set up by the caller; nb_args must contain the number of bytes * to be conserved. The 16-bit SS:SP will be set accordinly. * * All other registers are either taken from the CONTEXT86 structure * or else set to default values. The target routine address is either * given directly or taken from the CONTEXT86. * * If you want to call a 16-bit routine taking only standard argument types * (WORD and LONG), you can also have an appropriate argument conversion * stub automatically generated (see BuildCallTo16); you'd then call this * stub, which in turn would prepare the 16-bit stack and call the appropiate * core routine. * */ static void BuildCallTo16Core( FILE *outfile, int short_ret, int reg_func ) { char *name = reg_func == 2 ? "regs_long" : reg_func == 1 ? "regs_short" : short_ret? "word" : "long"; /* Function header */ if (reg_func == 2) function_header( outfile, "wine_call_to_16_regs_long" ); else if (reg_func == 1) function_header( outfile, "wine_call_to_16_regs_short" ); else if (short_ret) function_header( outfile, "wine_call_to_16_word" ); else function_header( outfile, "wine_call_to_16_long" ); /* Function entry sequence */ fprintf( outfile, "\tpushl %%ebp\n" ); fprintf( outfile, "\tmovl %%esp, %%ebp\n" ); /* Save the 32-bit registers */ fprintf( outfile, "\tpushl %%ebx\n" ); fprintf( outfile, "\tpushl %%ecx\n" ); fprintf( outfile, "\tpushl %%edx\n" ); fprintf( outfile, "\tpushl %%esi\n" ); fprintf( outfile, "\tpushl %%edi\n" ); if ( UsePIC ) { fprintf( outfile, "\tcall 1f\n" ); fprintf( outfile, "1:\tpopl %%ebx\n" ); } /* Enter Win16 Mutex */ fprintf( outfile, "\tcall " PREFIX "_EnterWin16Lock\n" ); /* Print debugging info */ if (debugging) { /* Push flags, number of arguments, and target */ fprintf( outfile, "\tpushl $%d\n", reg_func ); fprintf( outfile, "\tpushl 12(%%ebp)\n" ); fprintf( outfile, "\tpushl 8(%%ebp)\n" ); fprintf( outfile, "\tcall " PREFIX "RELAY_DebugCallTo16\n" ); fprintf( outfile, "\taddl $12, %%esp\n" ); } /* Get return address */ if ( UsePIC ) fprintf( outfile, "\tmovl " PREFIX "CallTo16_RetAddr-1b(%%ebx), %%ecx\n" ); else fprintf( outfile, "\tmovl " PREFIX "CallTo16_RetAddr, %%ecx\n" ); /* Call the actual CallTo16 routine (simulate a lcall) */ fprintf( outfile, "\tpushl %%cs\n" ); fprintf( outfile, "\tcall .Lwine_call_to_16_%s\n", name ); if ( !reg_func ) { /* Convert and push return value */ if ( short_ret ) { fprintf( outfile, "\tmovzwl %%ax, %%eax\n" ); fprintf( outfile, "\tpushl %%eax\n" ); } else { fprintf( outfile, "\tshll $16,%%edx\n" ); fprintf( outfile, "\tmovw %%ax,%%dx\n" ); fprintf( outfile, "\tpushl %%edx\n" ); } } else { /* * Modify CONTEXT86 structure to contain new values * * NOTE: We restore only EAX, EBX, EDX, EDX, EBP, and ESP. * The segment registers as well as ESI and EDI should * not be modified by a well-behaved 16-bit routine in * any case. [If necessary, we could restore them as well, * at the cost of a somewhat less efficient return path.] */ fprintf( outfile, "\tmovl %d(%%esp), %%edi\n", STACK32OFFSET(target)-12 ); fprintf( outfile, "\tmovl %%eax, %d(%%edi)\n", CONTEXTOFFSET(Eax) ); fprintf( outfile, "\tmovl %%ebx, %d(%%edi)\n", CONTEXTOFFSET(Ebx) ); fprintf( outfile, "\tmovl %%ecx, %d(%%edi)\n", CONTEXTOFFSET(Ecx) ); fprintf( outfile, "\tmovl %%edx, %d(%%edi)\n", CONTEXTOFFSET(Edx) ); fprintf( outfile, "\tmovl %%ebp, %d(%%edi)\n", CONTEXTOFFSET(Ebp) ); fprintf( outfile, "\tmovl %%esi, %d(%%edi)\n", CONTEXTOFFSET(Esp) ); /* The return glue code saved %esp into %esi */ fprintf( outfile, "\tpushl %%edi\n" ); } /* Print debugging info */ if (debugging) { fprintf( outfile, "\tpushl $%d\n", reg_func ); fprintf( outfile, "\tcall " PREFIX "RELAY_DebugCallTo16Ret\n" ); fprintf( outfile, "\taddl $4, %%esp\n" ); } /* Leave Win16 Mutex */ fprintf( outfile, "\tcall " PREFIX "_LeaveWin16Lock\n" ); /* Get return value */ fprintf( outfile, "\tpopl %%eax\n" ); /* Restore the 32-bit registers */ fprintf( outfile, "\tpopl %%edi\n" ); fprintf( outfile, "\tpopl %%esi\n" ); fprintf( outfile, "\tpopl %%edx\n" ); fprintf( outfile, "\tpopl %%ecx\n" ); fprintf( outfile, "\tpopl %%ebx\n" ); /* Function exit sequence */ fprintf( outfile, "\tpopl %%ebp\n" ); fprintf( outfile, "\tret $8\n" ); /* Start of the actual CallTo16 routine */ fprintf( outfile, ".Lwine_call_to_16_%s:\n", name ); /* Complete STACK32FRAME */ fprintf( outfile, "\t.byte 0x64\n\tpushl (%d)\n", STACKOFFSET ); fprintf( outfile, "\tmovl %%esp,%%edx\n" ); /* Switch to the 16-bit stack */ #ifdef __svr4__ fprintf( outfile,"\tdata16\n"); #endif fprintf( outfile, "\t.byte 0x64\n\tmovw (%d),%%ss\n", STACKOFFSET + 2); fprintf( outfile, "\t.byte 0x64\n\tmovw (%d),%%sp\n", STACKOFFSET ); fprintf( outfile, "\t.byte 0x64\n\tmovl %%edx,(%d)\n", STACKOFFSET ); /* Make %bp point to the previous stackframe (built by CallFrom16) */ fprintf( outfile, "\tmovzwl %%sp,%%ebp\n" ); fprintf( outfile, "\tleal %d(%%ebp),%%ebp\n", STACK16OFFSET(bp) ); /* Add the specified offset to the new sp */ fprintf( outfile, "\tsubw %d(%%edx), %%sp\n", STACK32OFFSET(nb_args) ); /* Push the return address * With sreg suffix, we push 16:16 address (normal lret) * With lreg suffix, we push 16:32 address (0x66 lret, for KERNEL32_45) */ if (reg_func != 2) fprintf( outfile, "\tpushl %%ecx\n" ); else { fprintf( outfile, "\tshldl $16, %%ecx, %%eax\n" ); fprintf( outfile, "\tpushw $0\n" ); fprintf( outfile, "\tpushw %%ax\n" ); fprintf( outfile, "\tpushw $0\n" ); fprintf( outfile, "\tpushw %%cx\n" ); } if (reg_func) { /* Push the called routine address */ fprintf( outfile, "\tmovl %d(%%edx),%%edx\n", STACK32OFFSET(target) ); fprintf( outfile, "\tpushw %d(%%edx)\n", CONTEXTOFFSET(SegCs) ); fprintf( outfile, "\tpushw %d(%%edx)\n", CONTEXTOFFSET(Eip) ); /* Get the registers */ fprintf( outfile, "\tpushw %d(%%edx)\n", CONTEXTOFFSET(SegDs) ); fprintf( outfile, "\tmovl %d(%%edx),%%eax\n", CONTEXTOFFSET(SegEs) ); fprintf( outfile, "\tmovw %%ax,%%es\n" ); fprintf( outfile, "\tmovl %d(%%edx),%%eax\n", CONTEXTOFFSET(SegFs) ); fprintf( outfile, "\tmovw %%ax,%%fs\n" ); fprintf( outfile, "\tmovl %d(%%edx),%%ebp\n", CONTEXTOFFSET(Ebp) ); fprintf( outfile, "\tmovl %d(%%edx),%%esi\n", CONTEXTOFFSET(Esi) ); fprintf( outfile, "\tmovl %d(%%edx),%%edi\n", CONTEXTOFFSET(Edi) ); fprintf( outfile, "\tmovl %d(%%edx),%%eax\n", CONTEXTOFFSET(Eax) ); fprintf( outfile, "\tmovl %d(%%edx),%%ebx\n", CONTEXTOFFSET(Ebx) ); fprintf( outfile, "\tmovl %d(%%edx),%%ecx\n", CONTEXTOFFSET(Ecx) ); fprintf( outfile, "\tmovl %d(%%edx),%%edx\n", CONTEXTOFFSET(Edx) ); /* Get the 16-bit ds */ fprintf( outfile, "\tpopw %%ds\n" ); } else /* not a register function */ { /* Push the called routine address */ fprintf( outfile, "\tpushl %d(%%edx)\n", STACK32OFFSET(target) ); /* Set %fs to the value saved by the last CallFrom16 */ fprintf( outfile, "\tmovw %d(%%ebp),%%ax\n", STACK16OFFSET(fs)-STACK16OFFSET(bp) ); fprintf( outfile, "\tmovw %%ax,%%fs\n" ); /* Set %ds and %es (and %ax just in case) equal to %ss */ fprintf( outfile, "\tmovw %%ss,%%ax\n" ); fprintf( outfile, "\tmovw %%ax,%%ds\n" ); fprintf( outfile, "\tmovw %%ax,%%es\n" ); } /* Jump to the called routine */ fprintf( outfile, "\t.byte 0x66\n" ); fprintf( outfile, "\tlret\n" ); }
/******************************************************************* * BuildCallFrom16Core * * This routine builds the core routines used in 16->32 thunks: * CallFrom16Word, CallFrom16Long, CallFrom16Register, and CallFrom16Thunk. * * These routines are intended to be called via a far call (with 32-bit * operand size) from 16-bit code. The 16-bit code stub must push %bp, * the 32-bit entry point to be called, and the argument conversion * routine to be used (see stack layout below). * * The core routine completes the STACK16FRAME on the 16-bit stack and * switches to the 32-bit stack. Then, the argument conversion routine * is called; it gets passed the 32-bit entry point and a pointer to the * 16-bit arguments (on the 16-bit stack) as parameters. (You can either * use conversion routines automatically generated by BuildCallFrom16, * or write your own for special purposes.) * * The conversion routine must call the 32-bit entry point, passing it * the converted arguments, and return its return value to the core. * After the conversion routine has returned, the core switches back * to the 16-bit stack, converts the return value to the DX:AX format * (CallFrom16Long), and returns to the 16-bit call stub. All parameters, * including %bp, are popped off the stack. * * The 16-bit call stub now returns to the caller, popping the 16-bit * arguments if necessary (pascal calling convention). * * In the case of a 'register' function, CallFrom16Register fills a * CONTEXT86 structure with the values all registers had at the point * the first instruction of the 16-bit call stub was about to be * executed. A pointer to this CONTEXT86 is passed as third parameter * to the argument conversion routine, which typically passes it on * to the called 32-bit entry point. * * CallFrom16Thunk is a special variant used by the implementation of * the Win95 16->32 thunk functions C16ThkSL and C16ThkSL01 and is * implemented as follows: * On entry, the EBX register is set up to contain a flat pointer to the * 16-bit stack such that EBX+22 points to the first argument. * Then, the entry point is called, while EBP is set up to point * to the return address (on the 32-bit stack). * The called function returns with CX set to the number of bytes * to be popped of the caller's stack. * * Stack layout upon entry to the core routine (STACK16FRAME): * ... ... * (sp+24) word first 16-bit arg * (sp+22) word cs * (sp+20) word ip * (sp+18) word bp * (sp+14) long 32-bit entry point (reused for Win16 mutex recursion count) * (sp+12) word ip of actual entry point (necessary for relay debugging) * (sp+8) long relay (argument conversion) function entry point * (sp+4) long cs of 16-bit entry point * (sp) long ip of 16-bit entry point * * Added on the stack: * (sp-2) word saved gs * (sp-4) word saved fs * (sp-6) word saved es * (sp-8) word saved ds * (sp-12) long saved ebp * (sp-16) long saved ecx * (sp-20) long saved edx * (sp-24) long saved previous stack */ static void BuildCallFrom16Core( FILE *outfile, int reg_func, int thunk, int short_ret ) { /* Function header */ if (thunk) function_header( outfile, "__wine_call_from_16_thunk" ); else if (reg_func) function_header( outfile, "__wine_call_from_16_regs" ); else if (short_ret) function_header( outfile, "__wine_call_from_16_word" ); else function_header( outfile, "__wine_call_from_16_long" ); /* Create STACK16FRAME (except STACK32FRAME link) */ fprintf( outfile, "\tpushw %%gs\n" ); fprintf( outfile, "\tpushw %%fs\n" ); fprintf( outfile, "\tpushw %%es\n" ); fprintf( outfile, "\tpushw %%ds\n" ); fprintf( outfile, "\tpushl %%ebp\n" ); fprintf( outfile, "\tpushl %%ecx\n" ); fprintf( outfile, "\tpushl %%edx\n" ); /* Save original EFlags register */ fprintf( outfile, "\tpushfl\n" ); if ( UsePIC ) { /* Get Global Offset Table into %ecx */ fprintf( outfile, "\tcall 1f\n" ); fprintf( outfile, "1:\tpopl %%ecx\n" ); } if (UsePIC) fprintf( outfile, "\t.byte 0x2e\n\tmovl " PREFIX "CallTo16_DataSelector-1b(%%ecx),%%edx\n" ); else fprintf( outfile, "\t.byte 0x2e\n\tmovl " PREFIX "CallTo16_DataSelector,%%edx\n" ); /* Load 32-bit segment registers */ #ifdef __svr4__ fprintf( outfile, "\tdata16\n"); #endif fprintf( outfile, "\tmovw %%dx, %%ds\n" ); #ifdef __svr4__ fprintf( outfile, "\tdata16\n"); #endif fprintf( outfile, "\tmovw %%dx, %%es\n" ); if ( UsePIC ) fprintf( outfile, "\tmovw " PREFIX "SYSLEVEL_Win16CurrentTeb-1b(%%ecx), %%fs\n" ); else fprintf( outfile, "\tmovw " PREFIX "SYSLEVEL_Win16CurrentTeb, %%fs\n" ); /* Get address of wine_ldt_copy array into %ecx */ if ( UsePIC ) fprintf( outfile, "\tmovl wine_ldt_copy_ptr-1b(%%ecx), %%ecx\n" ); else fprintf( outfile, "\tmovl $" PREFIX "wine_ldt_copy, %%ecx\n" ); /* Translate STACK16FRAME base to flat offset in %edx */ fprintf( outfile, "\tmovw %%ss, %%dx\n" ); fprintf( outfile, "\tandl $0xfff8, %%edx\n" ); fprintf( outfile, "\tshrl $1, %%edx\n" ); fprintf( outfile, "\tmovl (%%ecx,%%edx), %%edx\n" ); fprintf( outfile, "\tmovzwl %%sp, %%ebp\n" ); fprintf( outfile, "\tleal (%%ebp,%%edx), %%edx\n" ); /* Get saved flags into %ecx */ fprintf( outfile, "\tpopl %%ecx\n" ); /* Get the 32-bit stack pointer from the TEB and complete STACK16FRAME */ fprintf( outfile, "\t.byte 0x64\n\tmovl (%d), %%ebp\n", STACKOFFSET ); fprintf( outfile, "\tpushl %%ebp\n" ); /* Switch stacks */ #ifdef __svr4__ fprintf( outfile,"\tdata16\n"); #endif fprintf( outfile, "\t.byte 0x64\n\tmovw %%ss, (%d)\n", STACKOFFSET + 2 ); fprintf( outfile, "\t.byte 0x64\n\tmovw %%sp, (%d)\n", STACKOFFSET ); fprintf( outfile, "\tpushl %%ds\n" ); fprintf( outfile, "\tpopl %%ss\n" ); fprintf( outfile, "\tmovl %%ebp, %%esp\n" ); fprintf( outfile, "\taddl $%d, %%ebp\n", STRUCTOFFSET(STACK32FRAME, ebp) ); /* At this point: STACK16FRAME is completely set up DS, ES, SS: flat data segment FS: current TEB ESP: points to last STACK32FRAME EBP: points to ebp member of last STACK32FRAME EDX: points to current STACK16FRAME ECX: contains saved flags all other registers: unchanged */ /* Special case: C16ThkSL stub */ if ( thunk ) { /* Set up registers as expected and call thunk */ fprintf( outfile, "\tleal %lu(%%edx), %%ebx\n", sizeof(STACK16FRAME)-22 ); fprintf( outfile, "\tleal -4(%%esp), %%ebp\n" ); fprintf( outfile, "\tcall *%d(%%edx)\n", STACK16OFFSET(entry_point) ); /* Switch stack back */ fprintf( outfile, "\t.byte 0x64\n\tmovw (%d), %%ss\n", STACKOFFSET+2 ); fprintf( outfile, "\t.byte 0x64\n\tmovzwl (%d), %%esp\n", STACKOFFSET ); fprintf( outfile, "\t.byte 0x64\n\tpopl (%d)\n", STACKOFFSET ); /* Restore registers and return directly to caller */ fprintf( outfile, "\taddl $8, %%esp\n" ); fprintf( outfile, "\tpopl %%ebp\n" ); fprintf( outfile, "\tpopw %%ds\n" ); fprintf( outfile, "\tpopw %%es\n" ); fprintf( outfile, "\tpopw %%fs\n" ); fprintf( outfile, "\tpopw %%gs\n" ); fprintf( outfile, "\taddl $20, %%esp\n" ); fprintf( outfile, "\txorb %%ch, %%ch\n" ); fprintf( outfile, "\tpopl %%ebx\n" ); fprintf( outfile, "\taddw %%cx, %%sp\n" ); fprintf( outfile, "\tpush %%ebx\n" ); fprintf( outfile, "\t.byte 0x66\n" ); fprintf( outfile, "\tlret\n" ); return; } /* Build register CONTEXT */ if ( reg_func ) { fprintf( outfile, "\tsubl $%lu, %%esp\n", sizeof(CONTEXT86) ); fprintf( outfile, "\tmovl %%ecx, %d(%%esp)\n", CONTEXTOFFSET(EFlags) ); fprintf( outfile, "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(Eax) ); fprintf( outfile, "\tmovl %%ebx, %d(%%esp)\n", CONTEXTOFFSET(Ebx) ); fprintf( outfile, "\tmovl %%esi, %d(%%esp)\n", CONTEXTOFFSET(Esi) ); fprintf( outfile, "\tmovl %%edi, %d(%%esp)\n", CONTEXTOFFSET(Edi) ); fprintf( outfile, "\tmovl %d(%%edx), %%eax\n", STACK16OFFSET(ebp) ); fprintf( outfile, "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(Ebp) ); fprintf( outfile, "\tmovl %d(%%edx), %%eax\n", STACK16OFFSET(ecx) ); fprintf( outfile, "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(Ecx) ); fprintf( outfile, "\tmovl %d(%%edx), %%eax\n", STACK16OFFSET(edx) ); fprintf( outfile, "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(Edx) ); fprintf( outfile, "\tmovzwl %d(%%edx), %%eax\n", STACK16OFFSET(ds) ); fprintf( outfile, "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(SegDs) ); fprintf( outfile, "\tmovzwl %d(%%edx), %%eax\n", STACK16OFFSET(es) ); fprintf( outfile, "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(SegEs) ); fprintf( outfile, "\tmovzwl %d(%%edx), %%eax\n", STACK16OFFSET(fs) ); fprintf( outfile, "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(SegFs) ); fprintf( outfile, "\tmovzwl %d(%%edx), %%eax\n", STACK16OFFSET(gs) ); fprintf( outfile, "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(SegGs) ); fprintf( outfile, "\tmovzwl %d(%%edx), %%eax\n", STACK16OFFSET(cs) ); fprintf( outfile, "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(SegCs) ); fprintf( outfile, "\tmovzwl %d(%%edx), %%eax\n", STACK16OFFSET(ip) ); fprintf( outfile, "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(Eip) ); fprintf( outfile, "\t.byte 0x64\n\tmovzwl (%d), %%eax\n", STACKOFFSET+2 ); fprintf( outfile, "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(SegSs) ); fprintf( outfile, "\t.byte 0x64\n\tmovzwl (%d), %%eax\n", STACKOFFSET ); fprintf( outfile, "\taddl $%d, %%eax\n", STACK16OFFSET(ip) ); fprintf( outfile, "\tmovl %%eax, %d(%%esp)\n", CONTEXTOFFSET(Esp) ); #if 0 fprintf( outfile, "\tfsave %d(%%esp)\n", CONTEXTOFFSET(FloatSave) ); #endif /* Push address of CONTEXT86 structure -- popped by the relay routine */ fprintf( outfile, "\tpushl %%esp\n" ); } /* Print debug info before call */ if ( debugging ) { fprintf( outfile, "\tpushl %%edx\n" ); if ( reg_func ) fprintf( outfile, "\tleal -%lu(%%ebp), %%eax\n\tpushl %%eax\n", sizeof(CONTEXT) + STRUCTOFFSET(STACK32FRAME, ebp) ); else fprintf( outfile, "\tpushl $0\n" ); fprintf( outfile, "\tcall " PREFIX "RELAY_DebugCallFrom16\n "); fprintf( outfile, "\tpopl %%edx\n" ); fprintf( outfile, "\tpopl %%edx\n" ); } /* Call relay routine (which will call the API entry point) */ fprintf( outfile, "\tleal %lu(%%edx), %%eax\n", sizeof(STACK16FRAME) ); fprintf( outfile, "\tpushl %%eax\n" ); fprintf( outfile, "\tpushl %d(%%edx)\n", STACK16OFFSET(entry_point) ); fprintf( outfile, "\tcall *%d(%%edx)\n", STACK16OFFSET(relay) ); /* Print debug info after call */ if ( debugging ) { fprintf( outfile, "\tpushl %%eax\n" ); if ( reg_func ) fprintf( outfile, "\tleal -%lu(%%ebp), %%eax\n\tpushl %%eax\n", sizeof(CONTEXT) + STRUCTOFFSET(STACK32FRAME, ebp) ); else fprintf( outfile, "\tpushl $0\n" ); fprintf( outfile, "\tcall " PREFIX "RELAY_DebugCallFrom16Ret\n "); fprintf( outfile, "\tpopl %%eax\n" ); fprintf( outfile, "\tpopl %%eax\n" ); } if ( reg_func ) { fprintf( outfile, "\tmovl %%esp, %%ebx\n" ); /* Switch stack back */ fprintf( outfile, "\t.byte 0x64\n\tmovw (%d), %%ss\n", STACKOFFSET+2 ); fprintf( outfile, "\t.byte 0x64\n\tmovzwl (%d), %%esp\n", STACKOFFSET ); fprintf( outfile, "\t.byte 0x64\n\tpopl (%d)\n", STACKOFFSET ); /* Get return address to CallFrom16 stub */ fprintf( outfile, "\taddw $%d, %%sp\n", STACK16OFFSET(callfrom_ip)-4 ); fprintf( outfile, "\tpopl %%eax\n" ); fprintf( outfile, "\tpopl %%edx\n" ); /* Restore all registers from CONTEXT */ fprintf( outfile, "\tmovw %d(%%ebx), %%ss\n", CONTEXTOFFSET(SegSs) ); fprintf( outfile, "\tmovl %d(%%ebx), %%esp\n", CONTEXTOFFSET(Esp) ); fprintf( outfile, "\taddl $4, %%esp\n" ); /* room for final return address */ fprintf( outfile, "\tpushw %d(%%ebx)\n", CONTEXTOFFSET(SegCs) ); fprintf( outfile, "\tpushw %d(%%ebx)\n", CONTEXTOFFSET(Eip) ); fprintf( outfile, "\tpushl %%edx\n" ); fprintf( outfile, "\tpushl %%eax\n" ); fprintf( outfile, "\tpushl %d(%%ebx)\n", CONTEXTOFFSET(EFlags) ); fprintf( outfile, "\tpushl %d(%%ebx)\n", CONTEXTOFFSET(SegDs) ); fprintf( outfile, "\tmovw %d(%%ebx), %%es\n", CONTEXTOFFSET(SegEs) ); fprintf( outfile, "\tmovw %d(%%ebx), %%fs\n", CONTEXTOFFSET(SegFs) ); fprintf( outfile, "\tmovw %d(%%ebx), %%gs\n", CONTEXTOFFSET(SegGs) ); fprintf( outfile, "\tmovl %d(%%ebx), %%ebp\n", CONTEXTOFFSET(Ebp) ); fprintf( outfile, "\tmovl %d(%%ebx), %%esi\n", CONTEXTOFFSET(Esi) ); fprintf( outfile, "\tmovl %d(%%ebx), %%edi\n", CONTEXTOFFSET(Edi) ); fprintf( outfile, "\tmovl %d(%%ebx), %%eax\n", CONTEXTOFFSET(Eax) ); fprintf( outfile, "\tmovl %d(%%ebx), %%edx\n", CONTEXTOFFSET(Edx) ); fprintf( outfile, "\tmovl %d(%%ebx), %%ecx\n", CONTEXTOFFSET(Ecx) ); fprintf( outfile, "\tmovl %d(%%ebx), %%ebx\n", CONTEXTOFFSET(Ebx) ); fprintf( outfile, "\tpopl %%ds\n" ); fprintf( outfile, "\tpopfl\n" ); fprintf( outfile, "\tlret\n" ); } else { /* Switch stack back */ fprintf( outfile, "\t.byte 0x64\n\tmovw (%d), %%ss\n", STACKOFFSET+2 ); fprintf( outfile, "\t.byte 0x64\n\tmovzwl (%d), %%esp\n", STACKOFFSET ); fprintf( outfile, "\t.byte 0x64\n\tpopl (%d)\n", STACKOFFSET ); /* Restore registers */ fprintf( outfile, "\tpopl %%edx\n" ); fprintf( outfile, "\tpopl %%ecx\n" ); fprintf( outfile, "\tpopl %%ebp\n" ); fprintf( outfile, "\tpopw %%ds\n" ); fprintf( outfile, "\tpopw %%es\n" ); fprintf( outfile, "\tpopw %%fs\n" ); fprintf( outfile, "\tpopw %%gs\n" ); /* Prepare return value and set flags accordingly */ if ( !short_ret ) fprintf( outfile, "\tshldl $16, %%eax, %%edx\n" ); fprintf( outfile, "\torl %%eax, %%eax\n" ); /* Return to return stub which will return to caller */ fprintf( outfile, "\tlret $12\n" ); } }
/******************************************************************* * BuildCallFrom32Regs * * Build a 32-bit-to-Wine call-back function for a 'register' function. * 'args' is the number of dword arguments. * * Stack layout: * ... * (ebp+16) first arg * (ebp+12) ret addr to user code * (ebp+8) eax saved by relay code * (ebp+4) ret addr to relay code * (ebp+0) saved ebp * (ebp-128) buffer area to allow stack frame manipulation * (ebp-332) CONTEXT86 struct * (ebp-336) padding for stack alignment * (ebp-336-n) CONTEXT86 *argument * .... other arguments copied from (ebp+12) * * The entry point routine is called with a CONTEXT* extra argument, * following the normal args. In this context structure, EIP_reg * contains the return address to user code, and ESP_reg the stack * pointer on return (with the return address and arguments already * removed). */ static void BuildCallFrom32Regs(void) { static const int STACK_SPACE = 128 + sizeof(CONTEXT86); /* Function header */ function_header( "__wine_call_from_32_regs" ); /* Allocate some buffer space on the stack */ output( "\tpushl %%ebp\n" ); output( "\tmovl %%esp,%%ebp\n "); output( "\tleal -%d(%%esp), %%esp\n", STACK_SPACE + 4 /* for context arg */); /* Build the context structure */ output( "\tpushfl\n" ); output( "\tpopl %%eax\n" ); output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(EFlags) - STACK_SPACE ); output( "\tmovl 0(%%ebp),%%eax\n" ); output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(Ebp) - STACK_SPACE ); output( "\tmovl 8(%%ebp),%%eax\n" ); output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(Eax) - STACK_SPACE ); output( "\tmovl %%ebx,%d(%%ebp)\n", CONTEXTOFFSET(Ebx) - STACK_SPACE ); output( "\tmovl %%ecx,%d(%%ebp)\n", CONTEXTOFFSET(Ecx) - STACK_SPACE ); output( "\tmovl %%edx,%d(%%ebp)\n", CONTEXTOFFSET(Edx) - STACK_SPACE ); output( "\tmovl %%esi,%d(%%ebp)\n", CONTEXTOFFSET(Esi) - STACK_SPACE ); output( "\tmovl %%edi,%d(%%ebp)\n", CONTEXTOFFSET(Edi) - STACK_SPACE ); output( "\txorl %%eax,%%eax\n" ); output( "\tmovw %%cs,%%ax\n" ); output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegCs) - STACK_SPACE ); output( "\tmovw %%es,%%ax\n" ); output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegEs) - STACK_SPACE ); output( "\tmovw %%fs,%%ax\n" ); output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegFs) - STACK_SPACE ); output( "\tmovw %%gs,%%ax\n" ); output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegGs) - STACK_SPACE ); output( "\tmovw %%ss,%%ax\n" ); output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegSs) - STACK_SPACE ); output( "\tmovw %%ds,%%ax\n" ); output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(SegDs) - STACK_SPACE ); output( "\tmovw %%ax,%%es\n" ); /* set %es equal to %ds just in case */ output( "\tmovl $0x%x,%%eax\n", CONTEXT86_FULL ); output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(ContextFlags) - STACK_SPACE ); output( "\tmovl 12(%%ebp),%%eax\n" ); /* Get %eip at time of call */ output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(Eip) - STACK_SPACE ); /* Transfer the arguments */ output( "\tmovl 4(%%ebp),%%ebx\n" ); /* get relay code addr */ output( "\tmovzbl 4(%%ebx),%%ecx\n" ); /* fetch number of args to copy */ output( "\tsubl %%ecx,%%esp\n" ); output( "\tandl $~15,%%esp\n" ); output( "\tleal 16(%%ebp),%%esi\n" ); /* get %esp at time of call */ output( "\tmovl %%esp,%%edi\n" ); output( "\tshrl $2,%%ecx\n" ); output( "\tjz 1f\n" ); output( "\tcld\n" ); output( "\trep\n\tmovsl\n" ); /* copy args */ output( "1:\tleal %d(%%ebp),%%eax\n", -STACK_SPACE ); /* get addr of context struct */ output( "\tmovl %%eax,(%%edi)\n" ); /* and pass it as extra arg */ output( "\tmovzbl 5(%%ebx),%%eax\n" ); /* fetch number of args to remove */ output( "\tleal 16(%%ebp,%%eax),%%eax\n" ); output( "\tmovl %%eax,%d(%%ebp)\n", CONTEXTOFFSET(Esp) - STACK_SPACE ); /* Call the entry point */ output( "\taddl (%%ebx),%%ebx\n" ); output( "\tcall *%%ebx\n" ); output( "\tleal -%d(%%ebp),%%ecx\n", STACK_SPACE ); /* Restore the context structure */ output( "2:\tpushl %d(%%ecx)\n", CONTEXTOFFSET(SegEs) ); output( "\tpopl %%es\n" ); output( "\tpushl %d(%%ecx)\n", CONTEXTOFFSET(SegFs) ); output( "\tpopl %%fs\n" ); output( "\tpushl %d(%%ecx)\n", CONTEXTOFFSET(SegGs) ); output( "\tpopl %%gs\n" ); output( "\tmovl %d(%%ecx),%%edi\n", CONTEXTOFFSET(Edi) ); output( "\tmovl %d(%%ecx),%%esi\n", CONTEXTOFFSET(Esi) ); output( "\tmovl %d(%%ecx),%%edx\n", CONTEXTOFFSET(Edx) ); output( "\tmovl %d(%%ecx),%%ebx\n", CONTEXTOFFSET(Ebx) ); output( "\tmovl %d(%%ecx),%%eax\n", CONTEXTOFFSET(Eax) ); output( "\tmovl %d(%%ecx),%%ebp\n", CONTEXTOFFSET(Ebp) ); output( "\tpushl %d(%%ecx)\n", CONTEXTOFFSET(SegSs) ); output( "\tpopl %%ss\n" ); output( "\tmovl %d(%%ecx),%%esp\n", CONTEXTOFFSET(Esp) ); output( "\tpushl %d(%%ecx)\n", CONTEXTOFFSET(EFlags) ); output( "\tpushl %d(%%ecx)\n", CONTEXTOFFSET(SegCs) ); output( "\tpushl %d(%%ecx)\n", CONTEXTOFFSET(Eip) ); output( "\tpushl %d(%%ecx)\n", CONTEXTOFFSET(SegDs) ); output( "\tmovl %d(%%ecx),%%ecx\n", CONTEXTOFFSET(Ecx) ); output( "\tpopl %%ds\n" ); output( "\tiret\n" ); output_function_size( "__wine_call_from_32_regs" ); function_header( "__wine_call_from_32_restore_regs" ); output( "\tmovl 4(%%esp),%%ecx\n" ); output( "\tjmp 2b\n" ); output_function_size( "__wine_call_from_32_restore_regs" ); }
/******************************************************************* * BuildCallTo16Core * * This routine builds the core routines used in 32->16 thunks: * * extern DWORD WINAPI wine_call_to_16( FARPROC16 target, DWORD cbArgs, PEXCEPTION_HANDLER handler ); * extern void WINAPI wine_call_to_16_regs( CONTEXT86 *context, DWORD cbArgs, PEXCEPTION_HANDLER handler ); * * These routines can be called directly from 32-bit code. * * All routines expect that the 16-bit stack contents (arguments) and the * return address (segptr to CallTo16_Ret) were already set up by the * caller; nb_args must contain the number of bytes to be conserved. The * 16-bit SS:SP will be set accordingly. * * All other registers are either taken from the CONTEXT86 structure * or else set to default values. The target routine address is either * given directly or taken from the CONTEXT86. */ static void BuildCallTo16Core( int reg_func ) { const char *name = reg_func ? "wine_call_to_16_regs" : "wine_call_to_16"; /* Function header */ function_header( name ); /* Function entry sequence */ output( "\tpushl %%ebp\n" ); output( "\tmovl %%esp, %%ebp\n" ); /* Save the 32-bit registers */ output( "\tpushl %%ebx\n" ); output( "\tpushl %%esi\n" ); output( "\tpushl %%edi\n" ); output( "\t.byte 0x64\n\tmov %%gs,(%d)\n", GS_OFFSET ); /* Setup exception frame */ output( "\t.byte 0x64\n\tpushl (%d)\n", STACKOFFSET ); output( "\tpushl 16(%%ebp)\n" ); /* handler */ output( "\t.byte 0x64\n\tpushl (0)\n" ); output( "\t.byte 0x64\n\tmovl %%esp,(0)\n" ); /* Call the actual CallTo16 routine (simulate a lcall) */ output( "\tpushl %%cs\n" ); output( "\tcall .L%s\n", name ); /* Remove exception frame */ output( "\t.byte 0x64\n\tpopl (0)\n" ); output( "\taddl $4, %%esp\n" ); output( "\t.byte 0x64\n\tpopl (%d)\n", STACKOFFSET ); if ( !reg_func ) { /* Convert return value */ output( "\tandl $0xffff,%%eax\n" ); output( "\tshll $16,%%edx\n" ); output( "\torl %%edx,%%eax\n" ); } else { /* * Modify CONTEXT86 structure to contain new values * * NOTE: We restore only EAX, EBX, EDX, EDX, EBP, and ESP. * The segment registers as well as ESI and EDI should * not be modified by a well-behaved 16-bit routine in * any case. [If necessary, we could restore them as well, * at the cost of a somewhat less efficient return path.] */ output( "\tmovl %d(%%esp), %%edi\n", STACK32OFFSET(target) - STACK32OFFSET(edi)); /* everything above edi has been popped already */ output( "\tmovl %%eax, %d(%%edi)\n", CONTEXTOFFSET(Eax) ); output( "\tmovl %%ebx, %d(%%edi)\n", CONTEXTOFFSET(Ebx) ); output( "\tmovl %%ecx, %d(%%edi)\n", CONTEXTOFFSET(Ecx) ); output( "\tmovl %%edx, %d(%%edi)\n", CONTEXTOFFSET(Edx) ); output( "\tmovl %%ebp, %d(%%edi)\n", CONTEXTOFFSET(Ebp) ); output( "\tmovl %%esi, %d(%%edi)\n", CONTEXTOFFSET(Esp) ); /* The return glue code saved %esp into %esi */ } /* Restore the 32-bit registers */ output( "\tpopl %%edi\n" ); output( "\tpopl %%esi\n" ); output( "\tpopl %%ebx\n" ); /* Function exit sequence */ output( "\tpopl %%ebp\n" ); output( "\tret $12\n" ); /* Start of the actual CallTo16 routine */ output( ".L%s:\n", name ); /* Switch to the 16-bit stack */ output( "\tmovl %%esp,%%edx\n" ); output( "\t.byte 0x64\n\tmovw (%d),%%ss\n", STACKOFFSET + 2); output( "\t.byte 0x64\n\tmovw (%d),%%sp\n", STACKOFFSET ); output( "\t.byte 0x64\n\tmovl %%edx,(%d)\n", STACKOFFSET ); /* Make %bp point to the previous stackframe (built by CallFrom16) */ output( "\tmovzwl %%sp,%%ebp\n" ); output( "\tleal %d(%%ebp),%%ebp\n", STACK16OFFSET(bp) ); /* Add the specified offset to the new sp */ output( "\tsubw %d(%%edx), %%sp\n", STACK32OFFSET(nb_args) ); if (reg_func) { /* Push the called routine address */ output( "\tmovl %d(%%edx),%%edx\n", STACK32OFFSET(target) ); output( "\tpushw %d(%%edx)\n", CONTEXTOFFSET(SegCs) ); output( "\tpushw %d(%%edx)\n", CONTEXTOFFSET(Eip) ); /* Get the registers */ output( "\tpushw %d(%%edx)\n", CONTEXTOFFSET(SegDs) ); output( "\tpushl %d(%%edx)\n", CONTEXTOFFSET(SegEs) ); output( "\tpopl %%es\n" ); output( "\tpushl %d(%%edx)\n", CONTEXTOFFSET(SegFs) ); output( "\tpopl %%fs\n" ); output( "\tpushl %d(%%edx)\n", CONTEXTOFFSET(SegGs) ); output( "\tpopl %%gs\n" ); output( "\tmovl %d(%%edx),%%ebp\n", CONTEXTOFFSET(Ebp) ); output( "\tmovl %d(%%edx),%%esi\n", CONTEXTOFFSET(Esi) ); output( "\tmovl %d(%%edx),%%edi\n", CONTEXTOFFSET(Edi) ); output( "\tmovl %d(%%edx),%%eax\n", CONTEXTOFFSET(Eax) ); output( "\tmovl %d(%%edx),%%ebx\n", CONTEXTOFFSET(Ebx) ); output( "\tmovl %d(%%edx),%%ecx\n", CONTEXTOFFSET(Ecx) ); output( "\tmovl %d(%%edx),%%edx\n", CONTEXTOFFSET(Edx) ); /* Get the 16-bit ds */ output( "\tpopw %%ds\n" ); } else /* not a register function */ { /* Push the called routine address */ output( "\tpushl %d(%%edx)\n", STACK32OFFSET(target) ); /* Set %fs and %gs to the value saved by the last CallFrom16 */ output( "\tpushw %d(%%ebp)\n", STACK16OFFSET(fs)-STACK16OFFSET(bp) ); output( "\tpopw %%fs\n" ); output( "\tpushw %d(%%ebp)\n", STACK16OFFSET(gs)-STACK16OFFSET(bp) ); output( "\tpopw %%gs\n" ); /* Set %ds and %es (and %ax just in case) equal to %ss */ output( "\tmovw %%ss,%%ax\n" ); output( "\tmovw %%ax,%%ds\n" ); output( "\tmovw %%ax,%%es\n" ); } /* Jump to the called routine */ output( "\t.byte 0x66\n" ); output( "\tlret\n" ); /* Function footer */ output_function_size( name ); }