📄 ivt.s
字号:
/* * arch/ia64/kernel/ivt.S * * Copyright (C) 1998-2000 Hewlett-Packard Co * Copyright (C) 1998, 1999 Stephane Eranian <eranian@hpl.hp.com> * Copyright (C) 1998-2000 David Mosberger <davidm@hpl.hp.com> * * 00/08/23 Asit Mallick <asit.k.mallick@intel.com> TLB handling for SMP * 00/12/20 David Mosberger-Tang <davidm@hpl.hp.com> DTLB/ITLB handler now uses virtual PT. *//* * This file defines the interrupt vector table used by the CPU. * It does not include one entry per possible cause of interruption. * * External interrupts only use 1 entry. All others are internal interrupts * * The first 20 entries of the table contain 64 bundles each while the * remaining 48 entries contain only 16 bundles each. * * The 64 bundles are used to allow inlining the whole handler for critical * interrupts like TLB misses. * * For each entry, the comment is as follows: * * // 0x1c00 Entry 7 (size 64 bundles) Data Key Miss (12,51) * entry offset ----/ / / / / * entry number ---------/ / / / * size of the entry -------------/ / / * vector name -------------------------------------/ / * related interrupts (what is the real interrupt?) ----------/ * * The table is 32KB in size and must be aligned on 32KB boundary. * (The CPU ignores the 15 lower bits of the address) * * Table is based upon EAS2.6 (Oct 1999) */#include <linux/config.h>#include <asm/break.h>#include <asm/offsets.h>#include <asm/pgtable.h>#include <asm/processor.h>#include <asm/ptrace.h>#include <asm/system.h>#include <asm/unistd.h>#define MINSTATE_VIRT /* needed by minstate.h */#include "minstate.h"#define FAULT(n) \ mov r31=pr; \ mov r19=n;; /* prepare to save predicates */ \ br.sptk.many dispatch_to_fault_handler/* * As we don't (hopefully) use the space available, we need to fill it with * nops. the parameter may be used for debugging and is representing the entry * number */ #define BREAK_BUNDLE(a) break.m (a); \ break.i (a); \ break.i (a)/* * 4 breaks bundles all together */#define BREAK_BUNDLE4(a); BREAK_BUNDLE(a); BREAK_BUNDLE(a); BREAK_BUNDLE(a); BREAK_BUNDLE(a)/* * 8 bundles all together (too lazy to use only 4 at a time !) */#define BREAK_BUNDLE8(a); BREAK_BUNDLE4(a); BREAK_BUNDLE4(a) .psr abi64 .psr lsb .lsb .section __ivt_section,"ax" .align 32768 // align on 32KB boundary .global ia64_ivtia64_ivt://///////////////////////////////////////////////////////////////////////////////////////// 0x0000 Entry 0 (size 64 bundles) VHPT Translation (8,20,47) /* * The VHPT vector is invoked when the TLB entry for the virtual page table * is missing. This happens only as a result of a previous * (the "original") TLB miss, which may either be caused by an instruction * fetch or a data access (or non-access). * * What we do here is normal TLB miss handing for the _original_ miss, followed * by inserting the TLB entry for the virtual page table page that the VHPT * walker was attempting to access. The latter gets inserted as long * as both L1 and L2 have valid mappings for the faulting address. * The TLB entry for the original miss gets inserted only if * the L3 entry indicates that the page is present. * * do_page_fault gets invoked in the following cases: * - the faulting virtual address uses unimplemented address bits * - the faulting virtual address has no L1, L2, or L3 mapping */ mov r16=cr.ifa // get address that caused the TLB miss ;; rsm psr.dt // use physical addressing for data mov r31=pr // save the predicate registers mov r19=ar.k7 // get page table base address shl r21=r16,3 // shift bit 60 into sign bit shr.u r17=r16,61 // get the region number into r17 ;; cmp.eq p6,p7=5,r17 // is IFA pointing into to region 5? shr.u r18=r16,PGDIR_SHIFT // get bits 33-63 of the faulting address ;;(p7) dep r17=r17,r19,(PAGE_SHIFT-3),3 // put region number bits in place srlz.d // ensure "rsm psr.dt" has taken effect(p6) movl r19=__pa(SWAPPER_PGD_ADDR) // region 5 is rooted at swapper_pg_dir(p6) shr.u r21=r21,PGDIR_SHIFT+PAGE_SHIFT(p7) shr.u r21=r21,PGDIR_SHIFT+PAGE_SHIFT-3 ;;(p6) dep r17=r18,r19,3,(PAGE_SHIFT-3) // r17=PTA + IFA(33,42)*8(p7) dep r17=r18,r17,3,(PAGE_SHIFT-6) // r17=PTA + (((IFA(61,63) << 7) | IFA(33,39))*8) cmp.eq p7,p6=0,r21 // unused address bits all zeroes? shr.u r18=r16,PMD_SHIFT // shift L2 index into position ;; ld8 r17=[r17] // fetch the L1 entry (may be 0) ;;(p7) cmp.eq p6,p7=r17,r0 // was L1 entry NULL? dep r17=r18,r17,3,(PAGE_SHIFT-3) // compute address of L2 page table entry ;;(p7) ld8 r20=[r17] // fetch the L2 entry (may be 0) shr.u r19=r16,PAGE_SHIFT // shift L3 index into position ;;(p7) cmp.eq.or.andcm p6,p7=r20,r0 // was L2 entry NULL? dep r21=r19,r20,3,(PAGE_SHIFT-3) // compute address of L3 page table entry ;;(p7) ld8 r18=[r21] // read the L3 PTE mov r19=cr.isr // cr.isr bit 0 tells us if this is an insn miss ;;(p7) tbit.z p6,p7=r18,_PAGE_P_BIT // page present bit cleared? mov r22=cr.iha // get the VHPT address that caused the TLB miss ;; // avoid RAW on p7(p7) tbit.nz.unc p10,p11=r19,32 // is it an instruction TLB miss? dep r23=0,r20,0,PAGE_SHIFT // clear low bits to get page address ;;(p10) itc.i r18 // insert the instruction TLB entry(p11) itc.d r18 // insert the data TLB entry(p6) br.spnt.many page_fault // handle bad address/page not present (page fault) mov cr.ifa=r22 // Now compute and insert the TLB entry for the virtual page table. // We never execute in a page table page so there is no need to set // the exception deferral bit. adds r24=__DIRTY_BITS_NO_ED|_PAGE_PL_0|_PAGE_AR_RW,r23 ;;(p7) itc.d r24 ;;#ifdef CONFIG_SMP // // Re-check L2 and L3 pagetable. If they changed, we may have received // a ptc.g between reading the pagetable and the "itc". If so, // flush the entry we inserted and retry. // ld8 r25=[r21] // read L3 PTE again ld8 r26=[r17] // read L2 entry again ;; cmp.ne p6,p7=r26,r20 // did L2 entry change mov r27=PAGE_SHIFT<<2 ;;(p6) ptc.l r22,r27 // purge PTE page translation(p7) cmp.ne.or.andcm p6,p7=r25,r18 // did L3 PTE change ;;(p6) ptc.l r16,r27 // purge translation#endif mov pr=r31,-1 // restore predicate registers rfi ;; .align 1024/////////////////////////////////////////////////////////////////////////////////////////// 0x0400 Entry 1 (size 64 bundles) ITLB (21) /* * The ITLB handler accesses the L3 PTE via the virtually mapped linear * page table. If a nested TLB miss occurs, we switch into physical * mode, walk the page table, and then re-execute the L3 PTE read * and go on normally after that. */itlb_fault: mov r16=cr.ifa // get virtual address mov r29=b0 // save b0 mov r31=pr // save predicates mov r17=cr.iha // get virtual address of L3 PTE movl r30=1f // load nested fault continuation point ;;1: ld8 r18=[r17] // read L3 PTE ;; tbit.z p6,p0=r18,_PAGE_P_BIT // page present bit cleared?(p6) br.cond.spnt.many page_fault ;; itc.i r18 ;;#ifdef CONFIG_SMP ld8 r19=[r17] // read L3 PTE again and see if same mov r20=PAGE_SHIFT<<2 // setup page size for purge ;; cmp.ne p7,p0=r18,r19 ;;(p7) ptc.l r16,r20#endif mov pr=r31,-1 rfi ;; .align 1024/////////////////////////////////////////////////////////////////////////////////////////// 0x0800 Entry 2 (size 64 bundles) DTLB (9,48) /* * The DTLB handler accesses the L3 PTE via the virtually mapped linear * page table. If a nested TLB miss occurs, we switch into physical * mode, walk the page table, and then re-execute the L3 PTE read * and go on normally after that. */dtlb_fault: mov r16=cr.ifa // get virtual address mov r29=b0 // save b0 mov r31=pr // save predicates mov r17=cr.iha // get virtual address of L3 PTE movl r30=1f // load nested fault continuation point ;;1: ld8 r18=[r17] // read L3 PTE ;; tbit.z p6,p0=r18,_PAGE_P_BIT // page present bit cleared?(p6) br.cond.spnt.many page_fault ;; itc.d r18 ;;#ifdef CONFIG_SMP ld8 r19=[r17] // read L3 PTE again and see if same mov r20=PAGE_SHIFT<<2 // setup page size for purge ;; cmp.ne p7,p0=r18,r19 ;;(p7) ptc.l r16,r20#endif mov pr=r31,-1 rfi ;; .align 1024/////////////////////////////////////////////////////////////////////////////////////////// 0x0c00 Entry 3 (size 64 bundles) Alt ITLB (19) mov r16=cr.ifa // get address that caused the TLB miss movl r17=__DIRTY_BITS|_PAGE_PL_0|_PAGE_AR_RWX mov r21=cr.ipsr mov r31=pr ;;#ifdef CONFIG_DISABLE_VHPT shr.u r22=r16,61 // get the region number into r21 ;; cmp.gt p8,p0=6,r22 // user mode ;;(p8) thash r17=r16 ;;(p8) mov cr.iha=r17(p8) br.cond.dptk.many itlb_fault#endif extr.u r23=r21,IA64_PSR_CPL0_BIT,2 // extract psr.cpl shr.u r18=r16,57 // move address bit 61 to bit 4 dep r19=0,r16,IA64_MAX_PHYS_BITS,(64-IA64_MAX_PHYS_BITS) // clear ed & reserved bits ;; andcm r18=0x10,r18 // bit 4=~address-bit(61) cmp.ne p8,p0=r0,r23 // psr.cpl != 0? dep r19=r17,r19,0,12 // insert PTE control bits into r19 ;; or r19=r19,r18 // set bit 4 (uncached) if the access was to region 6(p8) br.cond.spnt.many page_fault ;; itc.i r19 // insert the TLB entry mov pr=r31,-1 rfi ;; .align 1024/////////////////////////////////////////////////////////////////////////////////////////// 0x1000 Entry 4 (size 64 bundles) Alt DTLB (7,46) mov r16=cr.ifa // get address that caused the TLB miss movl r17=__DIRTY_BITS|_PAGE_PL_0|_PAGE_AR_RWX mov r20=cr.isr mov r21=cr.ipsr mov r31=pr ;;#ifdef CONFIG_DISABLE_VHPT shr.u r22=r16,61 // get the region number into r21 ;; cmp.gt p8,p0=6,r22 // access to region 0-5 ;;(p8) thash r17=r16 ;;(p8) mov cr.iha=r17(p8) br.cond.dptk.many dtlb_fault#endif extr.u r23=r21,IA64_PSR_CPL0_BIT,2 // extract psr.cpl tbit.nz p6,p7=r20,IA64_ISR_SP_BIT // is speculation bit on? shr.u r18=r16,57 // move address bit 61 to bit 4 dep r19=0,r16,IA64_MAX_PHYS_BITS,(64-IA64_MAX_PHYS_BITS) // clear ed & reserved bits ;; andcm r18=0x10,r18 // bit 4=~address-bit(61) cmp.ne p8,p0=r0,r23(p8) br.cond.spnt.many page_fault dep r21=-1,r21,IA64_PSR_ED_BIT,1 dep r19=r17,r19,0,12 // insert PTE control bits into r19 ;; or r19=r19,r18 // set bit 4 (uncached) if the access was to region 6(p6) mov cr.ipsr=r21 ;;(p7) itc.d r19 // insert the TLB entry mov pr=r31,-1 rfi ;; //----------------------------------------------------------------------------------- // call do_page_fault (predicates are in r31, psr.dt may be off, r16 is faulting address)page_fault: ssm psr.dt ;; srlz.i ;; SAVE_MIN_WITH_COVER // // Copy control registers to temporary registers, then turn on psr bits, // then copy the temporary regs to the output regs. We have to do this // because the "alloc" can cause a mandatory store which could lead to // an "Alt DTLB" fault which we can handle only if psr.ic is on. // mov r8=cr.ifa mov r9=cr.isr adds r3=8,r2 // set up second base pointer ;; ssm psr.ic ;; srlz.i // guarantee that interrupt collection is enabled ;;(p15) ssm psr.i // restore psr.i movl r14=ia64_leave_kernel ;; alloc r15=ar.pfs,0,0,3,0 // must be first in insn group mov out0=r8 mov out1=r9 ;; SAVE_REST mov rp=r14 ;; adds out2=16,r12 // out2 = pointer to pt_regs br.call.sptk.many b6=ia64_do_page_fault // ignore return address ;; .align 1024/////////////////////////////////////////////////////////////////////////////////////////// 0x1400 Entry 5 (size 64 bundles) Data nested TLB (6,45) // // In the absence of kernel bugs, we get here when the virtually mapped linear page // table is accessed non-speculatively (e.g., in the Dirty-bit, Instruction // Access-bit, or Data Access-bit faults). If the DTLB entry for the virtual page // table is missing, a nested TLB miss fault is triggered and control is transferred // to this point. When this happens, we lookup the pte for the faulting address // by walking the page table in physical mode and return to the continuation point // passed in register r30 (or call page_fault if the address is not mapped). // // Input: r16: faulting address // r29: saved b0 // r30: continuation address // r31: saved pr // // Output: r17: physical address of L3 PTE of faulting address // r29: saved b0 // r30: continuation address // r31: saved pr // // Clobbered: b0, r18, r19, r21, psr.dt (cleared) // rsm psr.dt // switch to using physical data addressing mov r19=ar.k7 // get the page table base address shl r21=r16,3 // shift bit 60 into sign bit ;; shr.u r17=r16,61 // get the region number into r17 ;; cmp.eq p6,p7=5,r17 // is faulting address in region 5? shr.u r18=r16,PGDIR_SHIFT // get bits 33-63 of faulting address ;;(p7) dep r17=r17,r19,(PAGE_SHIFT-3),3 // put region number bits in place srlz.d(p6) movl r19=__pa(SWAPPER_PGD_ADDR) // region 5 is rooted at swapper_pg_dir(p6) shr.u r21=r21,PGDIR_SHIFT+PAGE_SHIFT(p7) shr.u r21=r21,PGDIR_SHIFT+PAGE_SHIFT-3 ;;(p6) dep r17=r18,r19,3,(PAGE_SHIFT-3) // r17=PTA + IFA(33,42)*8(p7) dep r17=r18,r17,3,(PAGE_SHIFT-6) // r17=PTA + (((IFA(61,63) << 7) | IFA(33,39))*8) cmp.eq p7,p6=0,r21 // unused address bits all zeroes? shr.u r18=r16,PMD_SHIFT // shift L2 index into position ;; ld8 r17=[r17] // fetch the L1 entry (may be 0) mov b0=r30 ;;(p7) cmp.eq p6,p7=r17,r0 // was L1 entry NULL? dep r17=r18,r17,3,(PAGE_SHIFT-3) // compute address of L2 page table entry ;;(p7) ld8 r17=[r17] // fetch the L2 entry (may be 0) shr.u r19=r16,PAGE_SHIFT // shift L3 index into position ;;(p7) cmp.eq.or.andcm p6,p7=r17,r0 // was L2 entry NULL? dep r17=r19,r17,3,(PAGE_SHIFT-3) // compute address of L3 page table entry ;;(p6) br.cond.spnt.many page_fault br.sptk.many b0 // return to continuation point ;; .align 1024/////////////////////////////////////////////////////////////////////////////////////////// 0x1800 Entry 6 (size 64 bundles) Instruction Key Miss (24) FAULT(6) .align 1024/////////////////////////////////////////////////////////////////////////////////////////// 0x1c00 Entry 7 (size 64 bundles) Data Key Miss (12,51) FAULT(7) .align 1024/////////////////////////////////////////////////////////////////////////////////////////// 0x2000 Entry 8 (size 64 bundles) Dirty-bit (54) // // What we do here is to simply turn on the dirty bit in the PTE. We need // to update both the page-table and the TLB entry. To efficiently access // the PTE, we address it through the virtual page table. Most likely, the // TLB entry for the relevant virtual page table page is still present in // the TLB so we can normally do this without additional TLB misses. // In case the necessary virtual page table TLB entry isn't present, we take // a nested TLB miss hit where we look up the physical address of the L3 PTE // and then continue at label 1 below. // mov r16=cr.ifa // get the address that caused the fault movl r30=1f // load continuation point in case of nested fault ;; thash r17=r16 // compute virtual address of L3 PTE mov r29=b0 // save b0 in case of nested fault mov r31=pr // save pr#ifdef CONFIG_SMP mov r28=ar.ccv // save ar.ccv ;;1: ld8 r18=[r17] ;; // avoid RAW on r18
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -