plan9fox/sys/src/9/teg2/l.s


/*
* tegra 2 SoC machine assist
* dual arm cortex-a9 processors
*
* ARM v7 arch. ref. man. §B1.3.3 says that we don't need barriers
* around writes to CPSR.
*
* LDREX/STREX use an exclusive monitor, which is part of the data cache unit
* for the L1 cache, so they won't work right if the L1 cache is disabled.
*/
#include "arm.s"
#define LDREX(fp,t) WORD $(0xe<<28|0x01900f9f | (fp)<<16 | (t)<<12)
/* `The order of operands is from left to right in dataflow order' - asm man */
#define STREX(f,tp,r) WORD $(0xe<<28|0x01800f90 | (tp)<<16 | (r)<<12 | (f)<<0)
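/*
* for reference: these expand to the v7 exclusive-access instructions.
* e.g., LDREX(0,3) encodes `ldrex r3, [r0]' and STREX(2,0,4) encodes
* `strex r4, r2, [r0]' (r2 stored to (r0), status returned in r4).
*/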
#define MAXMB (KiB-1) /* last MB has vectors */
#define TMPSTACK (DRAMSIZE - 64*MiB) /* used only during cpu startup */
/* tas/cas strex debugging limits; started at 10000 */
#define MAXSC 100000
GLOBL testmem(SB), $4
/*
* Entered here from Das U-Boot or another Plan 9 kernel with MMU disabled.
* Until the MMU is enabled it is OK to call functions provided
* they are within ±32MiB relative and do not require any
* local variables or more than one argument (i.e. there is
* no stack).
*/
TEXT _start(SB), 1, $-4
CPSMODE(PsrMsvc)
CPSID /* interrupts off */
CPSAE
SETEND(0) /* little-endian */
BARRIERS
CLREX
SETZSB
MOVW CPSR, R0
ORR $PsrDfiq, R0
MOVW R0, CPSR
/* invalidate i-cache and branch-target cache */
MTCP CpSC, 0, PC, C(CpCACHE), C(CpCACHEinvi), CpCACHEall
BARRIERS
/* put cpus other than 0 to sleep until cpu 0 is ready */
CPUID(R1)
BEQ cpuinit
/* not cpu 0 */
PUTC('Z')
PUTC('Z')
BARRIERS
dowfi:
WFI
MOVW cpus_proceed(SB), R1
CMP $0, R1
BEQ dowfi
BL cpureset(SB)
B dowfi
cpuinit:
DELAY(printloopret, 1)
PUTC('\r')
DELAY(printloopnl, 1)
PUTC('\n')
DELAY(printloops, 1)
PUTC('P')
/* disable the PL310 L2 cache on cpu0 */
MOVW $(PHYSL2BAG+0x100), R1
MOVW $0, R2
MOVW R2, (R1)
BARRIERS
/* invalidate it */
MOVW $((1<<16)-1), R2
MOVW R2, 0x77c(R1)
BARRIERS
/*
* disable my MMU & caches
*/
MFCP CpSC, 0, R1, C(CpCONTROL), C(0), CpMainctl
ORR $CpCsbo, R1
BIC $(CpCsbz|CpCmmu|CpCdcache|CpCicache|CpCpredict), R1
MTCP CpSC, 0, R1, C(CpCONTROL), C(0), CpMainctl
BARRIERS
/* cortex-a9 model-specific initial configuration */
MOVW $0, R1
MTCP CpSC, 0, R1, C(CpCONTROL), C(0), CpAuxctl
BARRIERS
PUTC('l')
DELAY(printloop3, 1)
MOVW $testmem-KZERO(SB), R0
BL memdiag(SB)
PUTC('a')
/* clear Mach for cpu 0 */
MOVW $PADDR(MACHADDR), R4 /* address of Mach for cpu 0 */
MOVW $0, R0
_machZ:
MOVW R0, (R4)
ADD $4, R4
CMP.S $PADDR(L1+L1X(0)), R4 /* end at top-level page table */
BNE _machZ
/*
* set up the MMU page table for cpu 0
*/
PUTC('n')
/* clear all PTEs first, to provide a default */
// MOVW $PADDR(L1+L1X(0)), R4 /* address of PTE for 0 */
_ptenv0:
ZEROPTE()
CMP.S $PADDR(L1+16*KiB), R4
BNE _ptenv0
DELAY(printloop4, 2)
PUTC(' ')
/*
* set up double map of PHYSDRAM, KZERO to PHYSDRAM for first few MBs,
* but only if KZERO and PHYSDRAM differ.
*/
MOVW $PTEDRAM, R2 /* PTE bits */
MOVW $PHYSDRAM, R3 /* pa */
CMP $KZERO, R3
BEQ no2map
MOVW $PADDR(L1+L1X(PHYSDRAM)), R4 /* address of PTE for PHYSDRAM */
MOVW $DOUBLEMAPMBS, R5
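/*
* FILLPTE() (from arm.s) is expected to fill one 1MB section entry:
* compare the open-coded loop at _ptrdbl in cpureset below, which ORs
* the PTE bits (R2) with the pa (R3), stores at (R4), then advances
* R4 by 4 and R3 by MiB.
*/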
_ptdbl:
FILLPTE()
SUB.S $1, R5
BNE _ptdbl
no2map:
/*
* back up and fill in PTEs for memory at KZERO.
* trimslice has 1 bank of 1GB at PHYSDRAM.
* Map the maximum.
*/
PUTC('9')
MOVW $PTEDRAM, R2 /* PTE bits */
MOVW $PHYSDRAM, R3
MOVW $PADDR(L1+L1X(KZERO)), R4 /* start with PTE for KZERO */
MOVW $MAXMB, R5 /* inner loop count (MBs) */
_ptekrw: /* set PTEs */
FILLPTE()
SUB.S $1, R5 /* decrement inner loop count */
BNE _ptekrw
/*
* back up and fill in PTEs for MMIO
*/
PUTC(' ')
MOVW $PTEIO, R2 /* PTE bits */
MOVW $PHYSIO, R3
MOVW $PADDR(L1+L1X(VIRTIO)), R4 /* start with PTE for VIRTIO */
_ptenv2:
FILLPTE()
CMP.S $PADDR(L1+L1X(PHYSIOEND)), R4
BNE _ptenv2
/* mmu.c sets up the trap vectors later */
MOVW $(PHYSDRAM | TMPSTACK), SP
/*
* learn l1 cache characteristics (on cpu 0 only).
*/
MOVW $(1-1), R0 /* l1 */
SLL $1, R0 /* R0 = (cache - 1) << 1 */
MTCP CpSC, CpIDcssel, R0, C(CpID), C(CpIDid), 0 /* select l1 cache */
BARRIERS
MFCP CpSC, CpIDcsize, R0, C(CpID), C(CpIDid), 0 /* get sets & ways */
MOVW $CACHECONF, R8
/* get log2linelen into l1setsh */
MOVW R0, R1
AND $3, R1
ADD $4, R1
/* l1 & l2 must have same cache line size, thus same set shift */
MOVW R1, 4(R8) /* +4 = l1setsh */
MOVW R1, 12(R8) /* +12 = l2setsh */
/* get nways in R1 */
SRA $3, R0, R1
AND $((1<<10)-1), R1
ADD $1, R1
/* get log2(nways) in R2 (assume nways is 2^n) */
MOVW $(BI2BY*BY2WD - 1), R2
CLZ(1, 1)
SUB.S R1, R2 /* R2 = 31 - clz(nways) */
ADD.EQ $1, R2
// MOVW R2, R3 /* print log2(nways): 2 */
MOVW $32, R1
SUB R2, R1 /* R1 = 32 - log2(nways) */
MOVW R1, 0(R8) /* +0 = l1waysh */
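/*
* worked example (illustrative): with 32-byte lines and 4 ways, as on
* a typical cortex-a9 l1 d-cache, the line-size field is 1, so
* l1setsh = 1+4 = 5 (log2 of 32); the ways field is 3, so nways = 4,
* log2(nways) = 2 and l1waysh = 32-2 = 30.
*/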
BARRIERS
MOVW $testmem-KZERO(SB), R0
BL memdiag(SB)
/*
* the mpcore manual says invalidate d-cache, scu, pl310 in that order,
* but says nothing about when to disable them.
*
* invalidate my caches before enabling
*/
BL cachedinv(SB)
MTCP CpSC, 0, PC, C(CpCACHE), C(CpCACHEinvi), CpCACHEall
BARRIERS
PUTC('f')
/*
* the mpcore manual says enable scu, d-cache, pl310, smp mode
* in that order. we have to reverse the last two; see main().
*/
BL scuon(SB)
/*
* turn my L1 cache on; need it for tas below.
*/
MFCP CpSC, 0, R1, C(CpCONTROL), C(0), CpMainctl
ORR $(CpCdcache|CpCicache|CpCalign|CpCpredict), R1
MTCP CpSC, 0, R1, C(CpCONTROL), C(0), CpMainctl
BARRIERS
/* cortex-a9 model-specific configuration */
MOVW $CpACl1pref, R1
MTCP CpSC, 0, R1, C(CpCONTROL), C(0), CpAuxctl
BARRIERS
/* we're supposed to wait until l1 & l2 are on before calling smpon */
PUTC('r')
/* set the domain access control */
MOVW $Client, R0
BL dacput(SB)
DELAY(printloop5, 2)
PUTC('o')
BL mmuinvalidate(SB)
MOVW $0, R0
BL pidput(SB)
/* set the translation table base */
MOVW $PADDR(L1), R0
BL ttbput(SB)
PUTC('m')
/*
* the little dance to turn the MMU on
*/
BL cacheuwbinv(SB)
BL mmuinvalidate(SB)
BL mmuenable(SB)
PUTC(' ')
/* warp the PC into the virtual map */
MOVW $KZERO, R0
BL _r15warp(SB)
/*
* cpu 0 is now running at KZERO+something!
*/
BARRIERS
MOVW $setR12(SB), R12 /* reload kernel SB */
MOVW $(KZERO | TMPSTACK), SP
BL cacheuwbinv(SB)
PUTC('B')
MOVW $PHYSDRAM, R3 /* pa */
CMP $KZERO, R3
BEQ no2unmap
/* undo double map of PHYSDRAM, KZERO & first few MBs */
MOVW $(L1+L1X(PHYSDRAM)), R4 /* addr. of PTE for PHYSDRAM */
MOVW $0, R0
MOVW $DOUBLEMAPMBS, R5
_ptudbl:
ZEROPTE()
SUB.S $1, R5
BNE _ptudbl
no2unmap:
BL cachedwb(SB)
BL mmuinvalidate(SB)
/*
* call main in C
* pass Mach to main and set up the stack in it
*/
MOVW $MACHADDR, R0 /* cpu 0 Mach */
MOVW R0, R(MACH) /* m = MACHADDR */
ADD $(MACHSIZE-4), R0, SP /* leave space for link register */
PUTC('e')
BL main(SB) /* main(m) */
limbo:
BL idlehands(SB)
B limbo
BL _div(SB) /* hack to load _div, etc. */
/*
* called on cpu(s) other than 0, to start them, from _vrst
* (reset vector) in lexception.s, with interrupts disabled
* and in SVC mode, running in the zero segment (pc is in lower 256MB).
* SB is set for the zero segment.
*/
TEXT cpureset(SB), 1, $-4
CLREX
MOVW CPSR, R0
ORR $PsrDfiq, R0
MOVW R0, CPSR
MOVW $(PHYSDRAM | TMPSTACK), SP /* stack for cache ops */
/* paranoia: turn my mmu and caches off. */
MFCP CpSC, 0, R0, C(CpCONTROL), C(0), CpMainctl
ORR $CpCsbo, R0
BIC $(CpCsbz|CpCmmu|CpCdcache|CpCicache|CpCpredict), R0
MTCP CpSC, 0, R0, C(CpCONTROL), C(0), CpMainctl
BARRIERS
/* cortex-a9 model-specific initial configuration */
MOVW $0, R1
MTCP CpSC, 0, R1, C(CpCONTROL), C(0), CpAuxctl
ISB
/* invalidate my caches before enabling */
BL cachedinv(SB)
MTCP CpSC, 0, PC, C(CpCACHE), C(CpCACHEinvi), CpCACHEall
BARRIERS
/*
* turn my L1 cache on; need it (and mmu) for tas below.
* need branch prediction to make delay() timing right.
*/
MFCP CpSC, 0, R0, C(CpCONTROL), C(0), CpMainctl
ORR $(CpCdcache|CpCicache|CpCalign|CpCpredict), R0
MTCP CpSC, 0, R0, C(CpCONTROL), C(0), CpMainctl
BARRIERS
/* enable l1 caches coherency, at minimum for ldrex/strex. */
BL smpon(SB)
BARRIERS
/*
* we used to write to PHYSEVP here; now we do it in C, which offers
* more assurance that we're up and won't go off the rails.
*/
/* set the domain access control */
MOVW $Client, R0
BL dacput(SB)
BL setmach(SB)
/*
* redo double map of PHYSDRAM, KZERO in this cpu's ptes.
* mmuinit will undo this later.
*/
MOVW $PHYSDRAM, R3
CMP $KZERO, R3
BEQ noun2map
/* launchinit set m->mmul1 to a copy of cpu0's l1 page table */
MOVW 12(R(MACH)), R0 /* m->mmul1 (virtual addr) */
BL k2paddr(SB) /* R0 = PADDR(m->mmul1) */
ADD $L1X(PHYSDRAM), R0, R4 /* R4 = address of PHYSDRAM's PTE */
MOVW $PTEDRAM, R2 /* PTE bits */
MOVW $DOUBLEMAPMBS, R5
_ptrdbl:
ORR R3, R2, R1 /* first identity-map 0 to 0, etc. */
MOVW R1, (R4)
ADD $4, R4 /* bump PTE address */
ADD $MiB, R3 /* bump pa */
SUB.S $1, R5
BNE _ptrdbl
noun2map:
MOVW $0, R0
BL pidput(SB)
/* set the translation table base to PADDR(m->mmul1) */
MOVW 12(R(MACH)), R0 /* m->mmul1 */
BL k2paddr(SB) /* R0 = PADDR(m->mmul1) */
BL ttbput(SB)
/*
* the little dance to turn the MMU on
*/
BL cacheuwbinv(SB)
BL mmuinvalidate(SB)
BL mmuenable(SB)
/*
* mmu is now on, with l1 pt at m->mmul1.
*/
/* warp the PC into the virtual map */
MOVW $KZERO, R0
BL _r15warp(SB)
/*
* now running at KZERO+something!
*/
BARRIERS
MOVW $setR12(SB), R12 /* reload kernel's SB */
MOVW $(KZERO | TMPSTACK), SP /* stack for cache ops */
BL setmach(SB)
ADD $(MACHSIZE-4), R(MACH), SP /* leave space for link register */
BL cpustart(SB)
/*
* converts virtual address in R0 to a physical address.
*/
TEXT k2paddr(SB), 1, $-4
BIC $KSEGM, R0
ADD $PHYSDRAM, R0
RET
/*
* converts physical address in R0 to a virtual address.
*/
TEXT p2kaddr(SB), 1, $-4
BIC $KSEGM, R0
ORR $KZERO, R0
RET
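/*
* e.g. (illustrative, with PHYSDRAM segment-aligned): k2paddr(KZERO+off)
* yields PHYSDRAM+off and p2kaddr(PHYSDRAM+off) yields KZERO+off;
* only the segment bits (KSEGM) change.
*/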
/*
* converts address in R0 to the current segment, as defined by the PC.
* clobbers R1.
*/
TEXT addr2pcseg(SB), 1, $-4
BIC $KSEGM, R0
MOVW PC, R1
AND $KSEGM, R1 /* segment PC is in */
ORR R1, R0
RET
/* sets R(MACH), preserves other registers */
TEXT setmach(SB), 1, $-4
MOVM.DB.W [R14], (R13)
MOVM.DB.W [R0-R2], (R13)
CPUID(R2)
SLL $2, R2 /* convert to word index */
MOVW $machaddr(SB), R0
BL addr2pcseg(SB)
ADD R2, R0 /* R0 = &machaddr[cpuid] */
MOVW (R0), R0 /* R0 = machaddr[cpuid] */
CMP $0, R0
MOVW.EQ $MACHADDR, R0 /* paranoia: use MACHADDR if 0 */
BL addr2pcseg(SB)
MOVW R0, R(MACH) /* m = machaddr[cpuid] */
MOVM.IA.W (R13), [R0-R2]
MOVM.IA.W (R13), [R14]
RET
/*
* memory diagnostic
* tests word at (R0); modifies R7 and R8
*/
TEXT memdiag(SB), 1, $-4
MOVW $0xabcdef89, R7
MOVW R7, (R0)
MOVW (R0), R8
CMP R7, R8
BNE mbuggery /* broken memory */
BARRIERS
MOVW (R0), R8
CMP R7, R8
BNE mbuggery /* broken memory */
MOVW $0, R7
MOVW R7, (R0)
BARRIERS
RET
/* modifies R0, R3-R6 */
TEXT printhex(SB), 1, $-4
MOVW R0, R3
PUTC('0')
PUTC('x')
MOVW $(32-4), R5 /* bits to shift right */
nextdig:
SRA R5, R3, R4
AND $0xf, R4
ADD $'0', R4
CMP.S $'9', R4
BLE nothex /* if R4 <= '9', jump */
ADD $('a'-('9'+1)), R4
nothex:
PUTC(R4)
SUB.S $4, R5
BGE nextdig
PUTC('\r')
PUTC('\n')
DELAY(proct, 50)
RET
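/* e.g., with 0x89abcdef in R0, printhex emits `0x89abcdef', CR, LF */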
mbuggery:
PUTC('?')
PUTC('m')
mtopanic:
MOVW $membmsg(SB), R0
MOVW R14, R1 /* get R14's segment ... */
AND $KSEGM, R1
BIC $KSEGM, R0 /* strip segment from address */
ORR R1, R0 /* combine them */
BL panic(SB)
mbugloop:
WFI
B mbugloop
DATA membmsg+0(SB)/8,$"memory b"
DATA membmsg+8(SB)/6,$"roken\z"
GLOBL membmsg(SB), $14
TEXT _r15warp(SB), 1, $-4
BIC $KSEGM, R14 /* link reg, will become PC */
ORR R0, R14
BIC $KSEGM, SP
ORR R0, SP
RET
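/*
* R14 (the return address) and SP are rewritten above, so the RET
* itself lands in the new segment; callers then reload SB (and set up
* R(MACH)) for that segment, as the code above does.
*/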
/*
* `single-element' cache operations.
* in arm arch v7, they operate on all architected cache levels, so separate
* l2 functions are usually unnecessary.
*/
TEXT cachedwbse(SB), $-4 /* D writeback SE */
MOVW R0, R2
MOVW CPSR, R3
CPSID /* splhi */
BARRIERS /* force outstanding stores to cache */
MOVW R2, R0
MOVW 4(FP), R1
ADD R0, R1 /* R1 is end address */
BIC $(CACHELINESZ-1), R0 /* cache line start */
_dwbse:
MTCP CpSC, 0, R0, C(CpCACHE), C(CpCACHEwb), CpCACHEse
ADD $CACHELINESZ, R0
CMP.S R0, R1
BGT _dwbse
B _wait
TEXT cachedwbinvse(SB), $-4 /* D writeback+invalidate SE */
MOVW R0, R2
MOVW CPSR, R3
CPSID /* splhi */
BARRIERS /* force outstanding stores to cache */
MOVW R2, R0
MOVW 4(FP), R1
ADD R0, R1 /* R1 is end address */
BIC $(CACHELINESZ-1), R0 /* cache line start */
_dwbinvse:
MTCP CpSC, 0, R0, C(CpCACHE), C(CpCACHEwbi), CpCACHEse
ADD $CACHELINESZ, R0
CMP.S R0, R1
BGT _dwbinvse
_wait: /* drain write buffer */
BARRIERS
MOVW R3, CPSR /* splx */
RET
TEXT cachedinvse(SB), $-4 /* D invalidate SE */
MOVW R0, R2
MOVW CPSR, R3
CPSID /* splhi */
BARRIERS /* force outstanding stores to cache */
MOVW R2, R0
MOVW 4(FP), R1
ADD R0, R1 /* R1 is end address */
/*
* if start & end addresses are not on cache-line boundaries,
* flush first & last cache lines before invalidating.
*/
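/*
* e.g. (illustrative), with 32-byte lines: invalidating 0x40 bytes at
* 0x1004 first writes back the lines at 0x1000 and 0x1040, so dirty
* bytes outside [0x1004, 0x1044) reach memory before those lines are
* invalidated.
*/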
AND.S $(CACHELINESZ-1), R0, R4
BEQ stok
BIC $(CACHELINESZ-1), R0, R4 /* cache line start */
MTCP CpSC, 0, R4, C(CpCACHE), C(CpCACHEwb), CpCACHEse
stok:
AND.S $(CACHELINESZ-1), R1, R4
BEQ endok
BIC $(CACHELINESZ-1), R1, R4 /* cache line start */
MTCP CpSC, 0, R4, C(CpCACHE), C(CpCACHEwb), CpCACHEse
endok:
BIC $(CACHELINESZ-1), R0 /* cache line start */
_dinvse:
MTCP CpSC, 0, R0, C(CpCACHE), C(CpCACHEinvd), CpCACHEse
ADD $CACHELINESZ, R0
CMP.S R0, R1
BGT _dinvse
B _wait
/*
* enable mmu and high vectors
*/
TEXT mmuenable(SB), 1, $-4
MFCP CpSC, 0, R0, C(CpCONTROL), C(0), CpMainctl
ORR $CpCmmu, R0
MTCP CpSC, 0, R0, C(CpCONTROL), C(0), CpMainctl
BARRIERS
RET
TEXT mmudisable(SB), 1, $-4
MFCP CpSC, 0, R0, C(CpCONTROL), C(0), CpMainctl
BIC $CpCmmu, R0
MTCP CpSC, 0, R0, C(CpCONTROL), C(0), CpMainctl
BARRIERS
RET
/*
* If one of these MCR instructions crashes or hangs the machine,
* check your Level 1 page table (at TTB) closely.
*/
TEXT mmuinvalidate(SB), $-4 /* invalidate all */
MOVW CPSR, R2
CPSID /* interrupts off */
BARRIERS
MTCP CpSC, 0, PC, C(CpTLB), C(CpTLBinvu), CpTLBinv
BARRIERS
MOVW R2, CPSR /* interrupts restored */
RET
TEXT mmuinvalidateaddr(SB), $-4 /* invalidate single entry */
MTCP CpSC, 0, R0, C(CpTLB), C(CpTLBinvu), CpTLBinvse
BARRIERS
RET
TEXT cpidget(SB), 1, $-4 /* main ID */
MFCP CpSC, 0, R0, C(CpID), C(CpIDidct), CpIDid
RET
TEXT cpctget(SB), 1, $-4 /* cache type */
MFCP CpSC, 0, R0, C(CpID), C(CpIDidct), CpIDct
RET
TEXT controlget(SB), 1, $-4 /* system control (sctlr) */
MFCP CpSC, 0, R0, C(CpCONTROL), C(0), CpMainctl
RET
TEXT ttbget(SB), 1, $-4 /* translation table base */
MFCP CpSC, 0, R0, C(CpTTB), C(0), CpTTB0
RET
TEXT ttbput(SB), 1, $-4 /* translation table base */
MOVW CPSR, R2
CPSID
MOVW R0, R1
BARRIERS /* finish prior accesses before changing ttb */
MTCP CpSC, 0, R1, C(CpTTB), C(0), CpTTB0
MTCP CpSC, 0, R1, C(CpTTB), C(0), CpTTB1 /* non-secure too */
MOVW $0, R0
MTCP CpSC, 0, R0, C(CpTTB), C(0), CpTTBctl
BARRIERS
MOVW R2, CPSR
RET
TEXT dacget(SB), 1, $-4 /* domain access control */
MFCP CpSC, 0, R0, C(CpDAC), C(0)
RET
TEXT dacput(SB), 1, $-4 /* domain access control */
MOVW R0, R1
BARRIERS
MTCP CpSC, 0, R1, C(CpDAC), C(0)
ISB
RET
TEXT fsrget(SB), 1, $-4 /* fault status */
MFCP CpSC, 0, R0, C(CpFSR), C(0), CpDFSR
RET
TEXT farget(SB), 1, $-4 /* fault address */
MFCP CpSC, 0, R0, C(CpFAR), C(0), CpDFAR
RET
TEXT getpsr(SB), 1, $-4
MOVW CPSR, R0
RET
TEXT getscr(SB), 1, $-4 /* secure configuration */
MFCP CpSC, 0, R0, C(CpCONTROL), C(CpCONTROLscr), CpSCRscr
RET
TEXT pidget(SB), 1, $-4 /* address translation pid */
MFCP CpSC, 0, R0, C(CpPID), C(0x0)
RET
TEXT pidput(SB), 1, $-4 /* address translation pid */
MTCP CpSC, 0, R0, C(CpPID), C(0), 0 /* pid, v7a deprecated */
MTCP CpSC, 0, R0, C(CpPID), C(0), 1 /* context id, errata 754322 */
ISB
RET
/*
* access to yet more coprocessor registers
*/
TEXT getauxctl(SB), 1, $-4 /* get cortex-a9 aux. ctl. */
MFCP CpSC, 0, R0, C(CpCONTROL), C(0), CpAuxctl
RET
TEXT putauxctl(SB), 1, $-4 /* put cortex-a9 aux. ctl. */
BARRIERS
MTCP CpSC, 0, R0, C(CpCONTROL), C(0), CpAuxctl
BARRIERS
RET
TEXT getclvlid(SB), 1, $-4
MFCP CpSC, CpIDcsize, R0, C(CpID), C(CpIDidct), CpIDclvlid
RET
TEXT getcyc(SB), 1, $-4
MFCP CpSC, 0, R0, C(CpCLD), C(CpCLDcyc), 0
RET
TEXT getdebug(SB), 1, $-4 /* get cortex-a9 debug enable register */
MFCP CpSC, 0, R0, C(1), C(1), 1
RET
TEXT getpc(SB), 1, $-4
MOVW PC, R0
RET
TEXT getsb(SB), 1, $-4
MOVW R12, R0
RET
TEXT setsp(SB), 1, $-4
MOVW R0, SP
RET
TEXT splhi(SB), 1, $-4
MOVW CPSR, R0 /* return old CPSR */
CPSID /* turn off interrupts */
CMP.S $0, R(MACH)
MOVW.NE R14, 4(R(MACH)) /* save caller pc in m->splpc */
RET
TEXT spllo(SB), 1, $-4 /* start marker for devkprof.c */
MOVW CPSR, R0 /* return old CPSR */
MOVW $0, R1
CMP.S R1, R(MACH)
MOVW.NE R1, 4(R(MACH)) /* clear m->splpc */
CPSIE
RET
TEXT splx(SB), 1, $-4
MOVW CPSR, R3 /* must return old CPSR */
CPSID
CMP.S $0, R(MACH)
MOVW.NE R14, 4(R(MACH)) /* save caller pc in m->splpc */
MOVW R0, CPSR /* reset interrupt level */
MOVW R3, R0 /* must return old CPSR */
RET
TEXT spldone(SB), 1, $0 /* end marker for devkprof.c */
RET
TEXT islo(SB), 1, $-4
MOVW CPSR, R0
AND $(PsrDirq), R0
EOR $(PsrDirq), R0
RET
TEXT clz(SB), $-4
CLZ(0, 0) /* 0 is R0 */
RET
TEXT setlabel(SB), 1, $-4
MOVW SP, 0(R0)
MOVW R14, 4(R0) /* pc */
MOVW $0, R0
RET
TEXT gotolabel(SB), 1, $-4
MOVW 0(R0), SP
MOVW 4(R0), R14 /* pc */
MOVW $1, R0
RET
TEXT getcallerpc(SB), 1, $-4
MOVW 0(SP), R0
RET
TEXT wfi(SB), $-4
MOVW CPSR, R1
/*
* an interrupt should break us out of wfi. masking interrupts
* slows interrupt response slightly but prevents recursion.
*/
// CPSIE
CPSID
BARRIERS
WFI
MOVW R1, CPSR
RET
TEXT coherence(SB), $-4
BARRIERS
RET
GLOBL cpus_proceed+0(SB), $4
#include "cache.v7.s"
TEXT cas(SB),0,$12
TEXT cmpswap(SB),0,$12 /* r0 holds p */
MOVW ov+4(FP), R1
MOVW nv+8(FP), R2
spin:
/* LDREX 0(R0),R3 */
LDREX(0,3)
CMP.S R3, R1
BNE fail
/* STREX 0(R0),R2,R4 */
STREX(2,0,4)
CMP.S $0, R4
BNE spin
MOVW $1, R0
DMB
RET
fail:
CLREX /* give up exclusive access, as in lockbusy below */
MOVW $0, R0
RET
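/*
* a rough C sketch of cmpswap's semantics (illustrative, not the
* original source):
*
*	int cmpswap(long *p, long ov, long nv)
*	{
*		if(*p != ov)
*			return 0;
*		*p = nv;		(atomically, via ldrex/strex)
*		return 1;
*	}
*/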
TEXT tas(SB), $-4 /* _tas(ulong *) */
TEXT _tas(SB), $-4
/* returns old (R0) after modifying (R0) */
MOVW R0,R5
DMB
MOVW $1,R2 /* new value of (R0) */
MOVW $MAXSC, R8
tas1:
LDREX(5,7) /* LDREX 0(R5),R7 */
CMP.S $0, R7 /* old value non-zero (lock taken)? */
BNE lockbusy /* we lose */
SUB.S $1, R8
BEQ lockloop2
STREX(2,5,4) /* STREX R2,(R5),R4 */
CMP.S $0, R4
BNE tas1 /* strex failed? try again */
DMB
B tas0
lockloop2:
PUTC('?')
PUTC('l')
PUTC('t')
BL abort(SB)
lockbusy:
CLREX
tas0:
MOVW R7, R0 /* return old value */
RET
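/*
* a rough C sketch of tas (illustrative, not the original source):
*
*	ulong tas(ulong *p)
*	{
*		ulong old;
*
*		old = *p;		(ldrex)
*		if(old == 0)
*			*p = 1;		(strex, retried up to MAXSC times)
*		return old;
*	}
*/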