/* * This software is part of the SBCL system. See the README file for * more information. * * This software is derived from the CMU CL system, which was * written at Carnegie Mellon University and released into the * public domain. The software is in the public domain and is * provided with absolutely no warranty. See the COPYING and CREDITS * files for more information. */ #include #include "sbcl.h" #include "arch.h" #include "globals.h" #include "validate.h" #include "os.h" #include "lispregs.h" #include "signal.h" #include "interrupt.h" #include "interr.h" #include "breakpoint.h" #include "alloc.h" #if defined(LISP_FEATURE_GENCGC) #include "gencgc-alloc-region.h" #endif /* The header files may not define PT_DAR/PT_DSISR. This definition is correct for all versions of ppc linux >= 2.0.30 As of DR2.1u4, MkLinux doesn't pass these registers to signal handlers correctly; a patch is necessary in order to (partially) correct this. Even with the patch, the DSISR may not have its 'write' bit set correctly (it tends not to be set if the fault was caused by something other than a protection violation.) Caveat callers. */ #if defined (LISP_FEATURE_DARWIN) || defined(LISP_FEATURE_LINUX) #ifndef PT_DAR #define PT_DAR 41 #endif #ifndef PT_DSISR #define PT_DSISR 42 #endif #endif void arch_init() { } os_vm_address_t arch_get_bad_addr(int sig, siginfo_t *code, os_context_t *context) { os_vm_address_t addr; #if defined(LISP_FEATURE_NETBSD) addr = (os_vm_address_t) (code->si_addr); #else addr = (os_vm_address_t) (*os_context_register_addr(context,PT_DAR)); #endif return addr; } void arch_skip_instruction(os_context_t *context) { char** pcptr; pcptr = (char**) os_context_pc_addr(context); *pcptr += 4; } unsigned char * arch_internal_error_arguments(os_context_t *context) { return (unsigned char *)(*os_context_pc_addr(context)+4); } boolean arch_pseudo_atomic_atomic(os_context_t *context) { /* FIXME: this foreign_function_call_active test is dubious at * best. If a foreign call is made in a pseudo atomic section * (?) or more likely a pseudo atomic section is in a foreign * call then an interrupt is executed immediately. Maybe it * has to do with C code not maintaining pseudo atomic * properly. MG - 2005-08-10 * * The foreign_function_call_active used to live at each call-site * to arch_pseudo_atomic_atomic, but this seems clearer. * --NS 2007-05-15 */ return (!foreign_function_call_active) && ((*os_context_register_addr(context,reg_ALLOC)) & 4); } void arch_set_pseudo_atomic_interrupted(os_context_t *context) { *os_context_register_addr(context,reg_ALLOC) |= 1; } void arch_clear_pseudo_atomic_interrupted(os_context_t *context) { *os_context_register_addr(context,reg_ALLOC) &= ~1; } unsigned int arch_install_breakpoint(void *pc) { unsigned int *ptr = (unsigned int *)pc; unsigned int result = *ptr; *ptr = (3<<26) | (5 << 21) | trap_Breakpoint; os_flush_icache((os_vm_address_t) pc, sizeof(unsigned int)); return result; } void arch_remove_breakpoint(void *pc, unsigned int orig_inst) { *(unsigned int *)pc = orig_inst; os_flush_icache((os_vm_address_t) pc, sizeof(unsigned int)); } /* * Perform the instruction that we overwrote with a breakpoint. As we * don't have a single-step facility, this means we have to: * - put the instruction back * - put a second breakpoint at the following instruction, * set after_breakpoint and continue execution. * * When the second breakpoint is hit (very shortly thereafter, we hope) * sigtrap_handler gets called again, but follows the AfterBreakpoint * arm, which * - puts a bpt back in the first breakpoint place (running across a * breakpoint shouldn't cause it to be uninstalled) * - replaces the second bpt with the instruction it was meant to be * - carries on * * Clear? */ static unsigned int *skipped_break_addr, displaced_after_inst; static sigset_t orig_sigmask; void arch_do_displaced_inst(os_context_t *context, unsigned int orig_inst) { /* not sure how we ensure that we get the breakpoint reinstalled * after doing this -dan */ unsigned int *pc = (unsigned int *)(*os_context_pc_addr(context)); orig_sigmask = *os_context_sigmask_addr(context); sigaddset_blockable(os_context_sigmask_addr(context)); *pc = orig_inst; os_flush_icache((os_vm_address_t) pc, sizeof(unsigned int)); skipped_break_addr = pc; /* FIXME: we should apparently be installing the after-breakpoint * here, but would need to find the next instruction address for * it first. alpha-arch.c shows how to do it. --NS 2007-04-02 */ } #ifdef LISP_FEATURE_GENCGC /* * Return non-zero if the current instruction is an allocation trap */ static int allocation_trap_p(os_context_t * context) { int result; unsigned int *pc; unsigned inst; unsigned opcode; unsigned src; unsigned dst; result = 0; /* * First, the instruction has to be a TWLGE temp, NL3, which has the * format. * | 6| 5| 5 | 5 | 10|1| width * |31|5 |dst|src| 4|0| field */ pc = (unsigned int *) (*os_context_pc_addr(context)); inst = *pc; #if 0 fprintf(stderr, "allocation_trap_p at %p: inst = 0x%08x\n", pc, inst); #endif opcode = inst >> 26; src = (inst >> 11) & 0x1f; dst = (inst >> 16) & 0x1f; if ((opcode == 31) && (src == reg_NL3) && (5 == ((inst >> 21) & 0x1f)) && (4 == ((inst >> 1) & 0x3ff))) { /* * We got the instruction. Now, look back to make sure it was * proceeded by what we expected. 2 instructions back should be * an ADD or ADDI instruction. */ unsigned int add_inst; add_inst = pc[-3]; #if 0 fprintf(stderr, " add inst at %p: inst = 0x%08x\n", pc - 3, add_inst); #endif opcode = add_inst >> 26; if ((opcode == 31) && (266 == ((add_inst >> 1) & 0x1ff))) { return 1; } else if ((opcode == 14)) { return 1; } else { fprintf(stderr, "Whoa! Got allocation trap but could not find ADD or ADDI instruction: 0x%08x in the proper place\n", add_inst); } } return 0; } extern struct alloc_region boxed_region; void handle_allocation_trap(os_context_t * context) { unsigned int *pc; unsigned int inst; unsigned int target, target_ptr, end_addr; unsigned int opcode; int size; boolean were_in_lisp; char *memory; target = 0; size = 0; #if 0 fprintf(stderr, "In handle_allocation_trap\n"); #endif /* I don't think it's possible for us NOT to be in lisp when we get * here. Remove this later? */ were_in_lisp = !foreign_function_call_active; if (were_in_lisp) { fake_foreign_function_call(context); } else { fprintf(stderr, "**** Whoa! allocation trap and we weren't in lisp!\n"); } /* * Look at current instruction: TWNE temp, NL3. We're here because * temp > NL3 and temp is the end of the allocation, and NL3 is * current-region-end-addr. * * We need to adjust temp and alloc-tn. */ pc = (unsigned int *) (*os_context_pc_addr(context)); inst = pc[0]; end_addr = (inst >> 11) & 0x1f; target = (inst >> 16) & 0x1f; target_ptr = *os_context_register_addr(context, target); #if 0 fprintf(stderr, "handle_allocation_trap at %p:\n", pc); fprintf(stderr, "boxed_region.free_pointer: %p\n", boxed_region.free_pointer); fprintf(stderr, "boxed_region.end_addr: %p\n", boxed_region.end_addr); fprintf(stderr, "target reg: %d, end_addr reg: %d\n", target, end_addr); fprintf(stderr, "target: %x\n", *os_context_register_addr(context, target)); fprintf(stderr, "end_addr: %x\n", *os_context_register_addr(context, end_addr)); #endif #if 0 fprintf(stderr, "handle_allocation_trap at %p:\n", pc); fprintf(stderr, " trap inst = 0x%08x\n", inst); fprintf(stderr, " target reg = %s\n", lisp_register_names[target]); #endif /* * Go back and look at the add/addi instruction. The second src arg * is the size of the allocation. Get it and call alloc to allocate * new space. */ inst = pc[-3]; opcode = inst >> 26; #if 0 fprintf(stderr, " add inst = 0x%08x, opcode = %d\n", inst, opcode); #endif if (opcode == 14) { /* * ADDI temp-tn, alloc-tn, size * * Extract the size */ size = (inst & 0xffff); } else if (opcode == 31) { /* * ADD temp-tn, alloc-tn, size-tn * * Extract the size */ int reg; reg = (inst >> 11) & 0x1f; #if 0 fprintf(stderr, " add, reg = %s\n", lisp_register_names[reg]); #endif size = *os_context_register_addr(context, reg); } #if 0 fprintf(stderr, "Alloc %d to %s\n", size, lisp_register_names[target]); #endif #if INLINE_ALLOC_DEBUG if ((((unsigned long)boxed_region.end_addr + size) / PAGE_SIZE) == (((unsigned long)boxed_region.end_addr) / PAGE_SIZE)) { fprintf(stderr,"*** possibly bogus trap allocation of %d bytes at %p\n", size, target_ptr); fprintf(stderr, " dynamic_space_free_pointer: %p, boxed_region.end_addr %p\n", dynamic_space_free_pointer, boxed_region.end_addr); } #endif #if 0 fprintf(stderr, "Ready to alloc\n"); fprintf(stderr, "free_pointer = 0x%08x\n", dynamic_space_free_pointer); #endif /* * alloc-tn was incremented by size. Need to decrement it by size * to restore its original value. This is not true on GENCGC * anymore. d_s_f_p and reg_alloc get out of sync, but the p_a * bits stay intact and we set it to the proper value when it * needs to be. Keep this comment here for the moment in case * somebody tries to figure out what happened here. */ /* dynamic_space_free_pointer = (lispobj *) ((long) dynamic_space_free_pointer - size); */ #if 0 fprintf(stderr, "free_pointer = 0x%08x new\n", dynamic_space_free_pointer); #endif memory = (char *) alloc(size); #if 0 fprintf(stderr, "alloc returned %p\n", memory); fprintf(stderr, "free_pointer = 0x%08x\n", dynamic_space_free_pointer); #endif /* * The allocation macro wants the result to point to the end of the * object! */ memory += size; #if 0 fprintf(stderr, "object end at %p\n", memory); #endif *os_context_register_addr(context, target) = (unsigned long) memory; *os_context_register_addr(context, reg_ALLOC) = (unsigned long) dynamic_space_free_pointer | (*os_context_register_addr(context, reg_ALLOC) & LOWTAG_MASK); if (were_in_lisp) { undo_fake_foreign_function_call(context); } } #endif void arch_handle_breakpoint(os_context_t *context) { handle_breakpoint(context); } void arch_handle_fun_end_breakpoint(os_context_t *context) { *os_context_pc_addr(context) =(int)handle_fun_end_breakpoint(context); } void arch_handle_after_breakpoint(os_context_t *context) { *skipped_break_addr = trap_Breakpoint; skipped_break_addr = NULL; *(unsigned int *)*os_context_pc_addr(context) = displaced_after_inst; *os_context_sigmask_addr(context)= orig_sigmask; os_flush_icache((os_vm_address_t) *os_context_pc_addr(context), sizeof(unsigned int)); } void arch_handle_single_step_trap(os_context_t *context, int trap) { unsigned int code = *((u32 *)(*os_context_pc_addr(context))); int register_offset = code >> 5 & 0x1f; handle_single_step_trap(context, trap, register_offset); arch_skip_instruction(context); } static void sigtrap_handler(int signal, siginfo_t *siginfo, void *void_context) { unsigned int code; os_context_t *context = void_context; #ifdef LISP_FEATURE_LINUX os_restore_fp_control(context); #endif code=*((u32 *)(*os_context_pc_addr(context))); if (code == ((3 << 26) | (0x18 << 21) | (reg_NL3 << 16))) { arch_clear_pseudo_atomic_interrupted(context); arch_skip_instruction(context); /* interrupt or GC was requested in PA; now we're done with the PA section we may as well get around to it */ interrupt_handle_pending(context); return; } #ifdef LISP_FEATURE_GENCGC /* Is this an allocation trap? */ if (allocation_trap_p(context)) { handle_allocation_trap(context); arch_skip_instruction(context); return; } #endif if ((code >> 16) == ((3 << 10) | (6 << 5))) { /* twllei reg_ZERO,N will always trap if reg_ZERO = 0 */ int trap = code & 0x1f; handle_trap(context,trap); return; } if (((code >> 26) == 3) && (((code >> 21) & 31) == 24)) { interrupt_internal_error(context, 0); return; } interrupt_handle_now(signal, (siginfo_t *)code, context); } void arch_install_interrupt_handlers() { undoably_install_low_level_interrupt_handler(SIGILL, sigtrap_handler); undoably_install_low_level_interrupt_handler(SIGTRAP, sigtrap_handler); } void ppc_flush_icache(os_vm_address_t address, os_vm_size_t length) { os_vm_address_t end = (os_vm_address_t) ((int)(address+length+(32-1)) &~(32-1)); extern void ppc_flush_cache_line(os_vm_address_t); while (address < end) { ppc_flush_cache_line(address); address += 32; } } #ifdef LISP_FEATURE_LINKAGE_TABLE /* Linkage tables for PowerPC * * Linkage entry size is 16, because we need at least 4 instructions to * implement a jump. */ /* * Define the registers to use in the linkage jump table. Can be the * same. Some care must be exercised when choosing these. It has to be * a register that is not otherwise being used. reg_NFP is a good * choice. call_into_c trashes reg_NFP without preserving it, so we can * trash it in the linkage jump table. */ #define LINKAGE_TEMP_REG reg_NFP #define LINKAGE_ADDR_REG reg_NFP /* * Insert the necessary jump instructions at the given address. */ void arch_write_linkage_table_jmp(void* reloc_addr, void *target_addr) { /* * Make JMP to function entry. * * The instruction sequence is: * * addis 13, 0, (hi part of addr) * ori 13, 13, (low part of addr) * mtctr 13 * bctr * */ int* inst_ptr; unsigned long hi; /* Top 16 bits of address */ unsigned long lo; /* Low 16 bits of address */ unsigned int inst; inst_ptr = (int*) reloc_addr; /* * Split the target address into hi and lo parts for the sethi * instruction. hi is the top 22 bits. lo is the low 10 bits. */ hi = (unsigned long) target_addr; lo = hi & 0xffff; hi >>= 16; /* * addis 13, 0, (hi part) */ inst = (15 << 26) | (LINKAGE_TEMP_REG << 21) | (0 << 16) | hi; *inst_ptr++ = inst; /* * ori 13, 13, (lo part) */ inst = (24 << 26) | (LINKAGE_TEMP_REG << 21) | (LINKAGE_TEMP_REG << 16) | lo; *inst_ptr++ = inst; /* * mtctr 13 */ inst = (31 << 26) | (LINKAGE_TEMP_REG << 21) | (9 << 16) | (467 << 1); *inst_ptr++ = inst; /* * bctr */ inst = (19 << 26) | (20 << 21) | (528 << 1); *inst_ptr++ = inst; *inst_ptr++ = inst; os_flush_icache((os_vm_address_t) reloc_addr, (char*) inst_ptr - (char*) reloc_addr); } void arch_write_linkage_table_ref(void * reloc_addr, void *target_addr) { *(unsigned long *)reloc_addr = (unsigned long)target_addr; } #endif