📄 hashtable.s
字号:
#define SET_V(r) ori r,r,PTE_V#define CLR_V(r,t) li t,PTE_V; andc r,r,t#endif /* CONFIG_PPC64BRIDGE */#define HASH_LEFT 31-(LG_PTEG_SIZE+Hash_bits-1)#define HASH_RIGHT 31-LG_PTEG_SIZE_GLOBAL(create_hpte) /* Convert linux-style PTE (r5) to low word of PPC-style PTE (r8) */ rlwinm r8,r5,32-10,31,31 /* _PAGE_RW -> PP lsb */ rlwinm r0,r5,32-7,31,31 /* _PAGE_DIRTY -> PP lsb */ and r8,r8,r0 /* writable if _RW & _DIRTY */ rlwimi r5,r5,32-1,30,30 /* _PAGE_USER -> PP msb */ rlwimi r5,r5,32-2,31,31 /* _PAGE_USER -> PP lsb */ ori r8,r8,0xe14 /* clear out reserved bits and M */ andc r8,r5,r8 /* PP = user? (rw&dirty? 2: 3): 0 */#ifdef CONFIG_SMP ori r8,r8,_PAGE_COHERENT /* set M (coherence required) */#endif#ifdef CONFIG_POWER4 /* * XXX hack hack hack - translate 32-bit "physical" addresses * in the linux page tables to 42-bit real addresses in such * a fashion that we can get at the I/O we need to access. * -- paulus */ cmpwi r8,0 rlwinm r0,r8,16,16,30 bge 57f cmplwi r0,0xfe00 li r0,0x3fd bne 56f li r0,0x3ff56: sldi r0,r0,32 or r8,r8,r057:#endif /* Construct the high word of the PPC-style PTE (r5) */#ifndef CONFIG_PPC64BRIDGE rlwinm r5,r3,7,1,24 /* put VSID in 0x7fffff80 bits */ rlwimi r5,r4,10,26,31 /* put in API (abbrev page index) */#else /* CONFIG_PPC64BRIDGE */ clrlwi r3,r3,8 /* reduce vsid to 24 bits */ sldi r5,r3,12 /* shift vsid into position */ rlwimi r5,r4,16,20,24 /* put in API (abbrev page index) */#endif /* CONFIG_PPC64BRIDGE */ SET_V(r5) /* set V (valid) bit */ /* Get the address of the primary PTE group in the hash table (r3) */ .globl hash_page_patch_Ahash_page_patch_A: addis r0,r7,Hash_base@h /* base address of hash table */ rlwimi r0,r3,LG_PTEG_SIZE,HASH_LEFT,HASH_RIGHT /* VSID -> hash */ rlwinm r3,r4,20+LG_PTEG_SIZE,HASH_LEFT,HASH_RIGHT /* PI -> hash */ xor r3,r3,r0 /* make primary hash */ li r0,8 /* PTEs/group */ /* * Test the _PAGE_HASHPTE bit in the old linux PTE, and skip the search * if it is clear, meaning that the HPTE isn't there already... */ andi. r6,r6,_PAGE_HASHPTE beq+ 10f /* no PTE: go look for an empty slot */ tlbie r4 addis r4,r7,htab_hash_searches@ha lwz r6,htab_hash_searches@l(r4) addi r6,r6,1 /* count how many searches we do */ stw r6,htab_hash_searches@l(r4) /* Search the primary PTEG for a PTE whose 1st (d)word matches r5 */ mtctr r0 addi r4,r3,-PTE_SIZE1: LDPTEu r6,PTE_SIZE(r4) /* get next PTE */ CMPPTE 0,r6,r5 bdnzf 2,1b /* loop while ctr != 0 && !cr0.eq */ beq+ found_slot /* Search the secondary PTEG for a matching PTE */ ori r5,r5,PTE_H /* set H (secondary hash) bit */ .globl hash_page_patch_Bhash_page_patch_B: xoris r4,r3,Hash_msk>>16 /* compute secondary hash */ xori r4,r4,(-PTEG_SIZE & 0xffff) addi r4,r4,-PTE_SIZE mtctr r02: LDPTEu r6,PTE_SIZE(r4) CMPPTE 0,r6,r5 bdnzf 2,2b beq+ found_slot xori r5,r5,PTE_H /* clear H bit again */ /* Search the primary PTEG for an empty slot */10: mtctr r0 addi r4,r3,-PTE_SIZE /* search primary PTEG */1: LDPTEu r6,PTE_SIZE(r4) /* get next PTE */ TST_V(r6) /* test valid bit */ bdnzf 2,1b /* loop while ctr != 0 && !cr0.eq */ beq+ found_empty /* update counter of times that the primary PTEG is full */ addis r4,r7,primary_pteg_full@ha lwz r6,primary_pteg_full@l(r4) addi r6,r6,1 stw r6,primary_pteg_full@l(r4) /* Search the secondary PTEG for an empty slot */ ori r5,r5,PTE_H /* set H (secondary hash) bit */ .globl hash_page_patch_Chash_page_patch_C: xoris r4,r3,Hash_msk>>16 /* compute secondary hash */ xori r4,r4,(-PTEG_SIZE & 0xffff) addi r4,r4,-PTE_SIZE mtctr r02: LDPTEu r6,PTE_SIZE(r4) TST_V(r6) bdnzf 2,2b beq+ found_empty xori r5,r5,PTE_H /* clear H bit again */ /* * Choose an arbitrary slot in the primary PTEG to overwrite. * Since both the primary and secondary PTEGs are full, and we * have no information that the PTEs in the primary PTEG are * more important or useful than those in the secondary PTEG, * and we know there is a definite (although small) speed * advantage to putting the PTE in the primary PTEG, we always * put the PTE in the primary PTEG. */ addis r4,r7,next_slot@ha lwz r6,next_slot@l(r4) addi r6,r6,PTE_SIZE andi. r6,r6,7*PTE_SIZE#ifdef CONFIG_POWER4 /* * Since we don't have BATs on POWER4, we rely on always having * PTEs in the hash table to map the hash table and the code * that manipulates it in virtual mode, namely flush_hash_page and * flush_hash_segments. Otherwise we can get a DSI inside those * routines which leads to a deadlock on the hash_table_lock on * SMP machines. We avoid this by never overwriting the first * PTE of each PTEG if it is already valid. * -- paulus. */ bne 102f li r6,PTE_SIZE102:#endif /* CONFIG_POWER4 */ stw r6,next_slot@l(r4) add r4,r3,r6 /* update counter of evicted pages */ addis r6,r7,htab_evicts@ha lwz r3,htab_evicts@l(r6) addi r3,r3,1 stw r3,htab_evicts@l(r6)#ifndef CONFIG_SMP /* Store PTE in PTEG */found_empty: STPTE r5,0(r4)found_slot: STPTE r8,PTE_SIZE/2(r4)#else /* CONFIG_SMP *//* * Between the tlbie above and updating the hash table entry below, * another CPU could read the hash table entry and put it in its TLB. * There are 3 cases: * 1. using an empty slot * 2. updating an earlier entry to change permissions (i.e. enable write) * 3. taking over the PTE for an unrelated address * * In each case it doesn't really matter if the other CPUs have the old * PTE in their TLB. So we don't need to bother with another tlbie here, * which is convenient as we've overwritten the register that had the * address. :-) The tlbie above is mainly to make sure that this CPU comes * and gets the new PTE from the hash table. * * We do however have to make sure that the PTE is never in an invalid * state with the V bit set. */found_empty:found_slot: CLR_V(r5,r0) /* clear V (valid) bit in PTE */ STPTE r5,0(r4) sync TLBSYNC STPTE r8,PTE_SIZE/2(r4) /* put in correct RPN, WIMG, PP bits */ sync SET_V(r5) STPTE r5,0(r4) /* finally set V bit in PTE */#endif /* CONFIG_SMP */ sync /* make sure pte updates get to memory */ blr .comm next_slot,4 .comm primary_pteg_full,4 .comm htab_hash_searches,4/* * Flush the entry for a particular page from the hash table. * * flush_hash_page(unsigned context, unsigned long va, pte_t *ptep) * * We assume that there is a hash table in use (Hash != 0). */_GLOBAL(flush_hash_page) /* Convert context and va to VSID */ mulli r3,r3,897*16 /* multiply context by context skew */ rlwinm r0,r4,4,28,31 /* get ESID (top 4 bits of va) */ mulli r0,r0,0x111 /* multiply by ESID skew */ add r3,r3,r0 /* note code below trims to 24 bits */ /* * We disable interrupts here, even on UP, because we want * the _PAGE_HASHPTE bit to be a reliable indication of * whether the HPTE exists. -- paulus */ mfmsr r10 rlwinm r0,r10,0,17,15 /* clear bit 16 (MSR_EE) */ SYNC mtmsr r0 SYNC#ifdef CONFIG_SMP lis r9,hash_table_lock@h ori r9,r9,hash_table_lock@l lwz r8,PROCESSOR(r2) oris r8,r8,910: lwarx r7,0,r9 cmpi 0,r7,0 bne- 11f stwcx. r8,0,r9 beq+ 12f11: lwz r7,0(r9) cmpi 0,r7,0 beq 10b b 11b12: isync#endif /* * Check the _PAGE_HASHPTE bit in the linux PTE. If it is * already clear, we're done. If not, clear it (atomically) * and proceed. -- paulus. */1: lwarx r6,0,r5 /* fetch the pte */ andi. r0,r6,_PAGE_HASHPTE beq 9f /* done if HASHPTE is already clear */ rlwinm r6,r6,0,31,29 /* clear HASHPTE bit */ stwcx. r6,0,r5 /* update the pte */ bne- 1b /* Construct the high word of the PPC-style PTE (r5) */#ifndef CONFIG_PPC64BRIDGE rlwinm r5,r3,7,1,24 /* put VSID in 0x7fffff80 bits */ rlwimi r5,r4,10,26,31 /* put in API (abbrev page index) */#else /* CONFIG_PPC64BRIDGE */ clrlwi r3,r3,8 /* reduce vsid to 24 bits */ sldi r5,r3,12 /* shift vsid into position */ rlwimi r5,r4,16,20,24 /* put in API (abbrev page index) */#endif /* CONFIG_PPC64BRIDGE */ SET_V(r5) /* set V (valid) bit */ /* Get the address of the primary PTE group in the hash table (r3) */ .globl flush_hash_patch_Aflush_hash_patch_A: lis r8,Hash_base@h /* base address of hash table */ rlwimi r8,r3,LG_PTEG_SIZE,HASH_LEFT,HASH_RIGHT /* VSID -> hash */ rlwinm r3,r4,20+LG_PTEG_SIZE,HASH_LEFT,HASH_RIGHT /* PI -> hash */ xor r3,r3,r8 /* make primary hash */ li r8,8 /* PTEs/group */ /* Search the primary PTEG for a PTE whose 1st (d)word matches r5 */ mtctr r8 addi r7,r3,-PTE_SIZE1: LDPTEu r0,PTE_SIZE(r7) /* get next PTE */ CMPPTE 0,r0,r5 bdnzf 2,1b /* loop while ctr != 0 && !cr0.eq */ beq+ 3f /* Search the secondary PTEG for a matching PTE */ ori r5,r5,PTE_H /* set H (secondary hash) bit */ .globl flush_hash_patch_Bflush_hash_patch_B: xoris r7,r3,Hash_msk>>16 /* compute secondary hash */ xori r7,r7,(-PTEG_SIZE & 0xffff) addi r7,r7,-PTE_SIZE mtctr r82: LDPTEu r0,PTE_SIZE(r7) CMPPTE 0,r0,r5 bdnzf 2,2b bne- 4f /* should never fail to find it */3: li r0,0 STPTE r0,0(r7) /* invalidate entry */4: sync tlbie r4 /* in hw tlb too */ sync#ifdef CONFIG_SMP TLBSYNC9: li r0,0 stw r0,0(r9) /* clear hash_table_lock */#endif9: mtmsr r10 SYNC blr
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -