URL https://opencores.org/ocsvn/openrisc_2011-10-31/openrisc_2011-10-31/trunk

Subversion Repositories openrisc_2011-10-31

[/] [openrisc/] [trunk/] [gnu-src/] [newlib-1.18.0/] [libgloss/] [mips/] [vr5xxx.S] - Blame information for rev 252

Go to most recent revision | Details | Compare with Previous | View Log


/*
 * vr5xxx.S -- CPU specific support routines
 *
 * Copyright (c) 1999 Cygnus Solutions
 *
 * The authors hereby grant permission to use, copy, modify, distribute,
 * and license this software and its documentation for any purpose, provided
 * that existing copyright notices are retained in all copies and that this
 * notice is included verbatim in any distributions. No written agreement,
 * license, or royalty fee is required for any of the authorized uses.
 * Modifications to this software may be copyrighted by their authors
 * and need not follow the licensing terms described here, provided that
 * the new terms are clearly indicated on the first page of each file where
 * they apply.
 */
 
/* This file cloned from vr4300.S by dlindsay@cygnus.com
 * and recoded to suit Vr5432 and Vr5000.
 * Should be no worse for Vr43{00,05,10}.
 * Specifically, __cpu_flush() has been changed (a) to allow for the hardware
 * difference (in set associativity) between the Vr5432 and Vr5000,
 * and (b) to flush the optional secondary cache of the Vr5000.
 */
 
/* Processor Revision Identifier (PRID) Register: Implementation Numbers */
#define IMPL_VR5432     0x54
 
/* Cache Constants not determinable dynamically */
#define VR5000_2NDLINE 32       /* secondary cache line size */
#define VR5432_LINE 32          /* I,Dcache line sizes */
#define VR5432_SIZE (16*1024)   /* I,Dcache half-size */
 
 
#ifndef __mips64
        .set mips3
#endif
#ifdef __mips16
/* This file contains 32 bit assembly code.  */
        .set nomips16
#endif
 
#include "regs.S"
 
        .text
        .align  2
 
        # Taken from "R4300 Preliminary RISC Processor Specification
        # Revision 2.0 January 1995" page 39: "The Count
        # register... increments at a constant rate... at one-half the
        # PClock speed."
        # We can use this fact to provide small polled delays.
        #
        # __cpu_timer_poll -- busy-wait, by polling the CP0 Count register,
        # until at least the requested number of PClock ticks has elapsed.
        # Only a0 and v0 are written; no memory is touched.
        .globl  __cpu_timer_poll
        .ent    __cpu_timer_poll
__cpu_timer_poll:
        .set    noreorder
        # in:   a0 = (unsigned int) number of PClock ticks to wait for
        # out:  void

        # The Vr4300 counter updates at half PClock, so divide by 2 to
        # get counter delta.  bnezl is a branch-likely: the srl in its
        # delay slot is executed only when the branch is taken.
        bnezl   a0, 1f          # continue if delta non-zero
        srl     a0, a0, 1       # divide ticks by 2             {DELAY SLOT}
        # a0 was zero: perform a quick return to the caller:
        j       ra
        nop                     #                               {DELAY SLOT}
1:
        mfc0    v0, C0_COUNT    # get current counter value
        nop                     # two nops after mfc0 before v0 is used
        nop
        # We cannot just do the simple test, of adding our delta onto
        # the current value (ignoring overflow) and then checking for
        # equality. The counter is incrementing every two PClocks,
        # which means the counter value can change between
        # instructions, making it hard to sample at the exact value
        # desired.

        # However, we do know that our entry delta value is less than
        # half the number space (since we divide by 2 on entry). This
        # means we can use a difference in signs to indicate timer
        # overflow.
        addu    a0, v0, a0      # a0 = end value = now + delta (ignore overflow)
        # We now have our end value (which will have been
        # sign-extended to fill the 64bit register value).
2:
        # get current counter value:
        mfc0    v0, C0_COUNT
        nop
        nop
        # This is an unsigned 32bit subtraction; the result is then
        # tested as a signed value by bgtzl, so the loop continues while
        # the end value is still ahead of the counter.
        subu    v0, a0, v0      # delta = (end - now)
        bgtzl   v0, 2b          # looping back is most likely
        nop                     #                               {DELAY SLOT}
        # We have now been delayed (in the foreground) for AT LEAST
        # the required number of counter ticks.
        j       ra              # return to caller
        nop                     #                               {DELAY SLOT}
        .set    reorder
        .end    __cpu_timer_poll
 
        # Flush the processor caches to memory:
        #
        # __cpu_flush -- write back and invalidate the primary data cache,
        # write back and invalidate the secondary cache when CONFIG reports
        # one (non-Vr5432 parts only), and invalidate the primary
        # instruction cache.  All operations are index-based over a
        # K0BASE-relative address range.
        # in:   void
        # out:  void
        # uses: a0-a3, t0-t3 as scratch; no stack and no loads or stores

        .globl  __cpu_flush
        .ent    __cpu_flush
__cpu_flush:
        .set    noreorder
        # NOTE: The Vr4300 and Vr5432 *CANNOT* have any secondary cache.
        # On those, SC (bit 17 of CONFIG register) is hard-wired to 1,
        # except that email from Dennis_Han@el.nec.com says that old
        # versions of the Vr5432 incorrectly hard-wired this bit to 0.
        # The Vr5000 has an optional direct-mapped secondary cache,
        # and the SC bit correctly indicates this.

        # So, for the 4300 and 5432 we want to just
        # flush the primary Data and Instruction caches.
        # For the 5000 it is desired to flush the secondary cache too.
        # There is an operation difference worth noting.
        # The 4300 and 5000 primary caches use VA bit 14 to choose cache set,
        # whereas 5432 primary caches use VA bit 0.

        # This code interprets the relevant Config register bits as
        # much as possible, except for the 5432.
        # The code therefore has some portability.
        # However, the associativity issues mean you should not just assume
        # that this code works anywhere. Also, the secondary cache set
        # size is hardwired, since the 5000 series does not define codes
        # for variant sizes.

        # Note: this version of the code flushes D$ before I$.
        #   It is difficult to construct a case where that matters,
        #   but it cannot hurt.

        mfc0    a0, C0_PRID     # a0 = Processor Revision register
        nop                     # dlindsay: unclear why the nops, but
        nop                     # vr4300.S had such so I do too.
        srl     a2, a0, PR_IMP  # want bits 8..15
        # The Implementation field is 8 bits wide, so the mask is 0xff.
        # (An earlier 0x255 mask dropped field bits and let PRID bit 17
        # through, so unrelated implementation numbers could match.)
        andi    a2, a2, 0xff    # mask: now a2 = Implementation # field
        li      a1, IMPL_VR5432
        beq     a1, a2, 8f      # use Vr5432-specific flush algorithm
        nop                     # (delay slot)

        # Non-Vr5432 version of the code.
        # (The distinctions being: CONFIG is truthful about secondary cache,
        # and we act as if the primary Icache and Dcache are direct mapped.)

        mfc0    t0, C0_CONFIG   # t0 = CONFIG register
        nop
        nop
        li      a1, 1           # a1=1, a useful constant

        srl     a2, t0, CR_IC   # want IC field of CONFIG
        andi    a2, a2, 0x7     # mask: now a2= code for Icache size
        add     a2, a2, 12      # +12
        sllv    a2, a1, a2      # a2=primary instruction cache size in bytes

        srl     a3, t0, CR_DC   # DC field of CONFIG
        andi    a3, a3, 0x7     # mask: now a3= code for Dcache size
        add     a3, a3, 12      # +12
        sllv    a3, a1, a3      # a3=primary data cache size in bytes

        li      t2, (1 << CR_IB) # t2=mask over IB boolean
        and     t2, t2, t0      # test IB field of CONFIG register value
        beqz    t2, 1f          #
        li      a1, 16          # 16 bytes (branch shadow: always loaded.)
        li      a1, 32          # non-zero, then 32bytes
1:

        li      t2, (1 << CR_DB) # t2=mask over DB boolean
        and     t2, t2, t0      # test DB field of CONFIG register value
        beqz    t2, 2f          #
        li      a0, 16          # 16bytes (branch shadow: always loaded.)
        li      a0, 32          # non-zero, then 32bytes
2:
        lui     t1, ((K0BASE >> 16) & 0xFFFF)
        ori     t1, t1, (K0BASE & 0xFFFF)

        # At this point,
        # a0 = primary Dcache line size in bytes
        # a1 = primary Icache line size in bytes
        # a2 = primary Icache size in bytes
        # a3 = primary Dcache size in bytes
        # t0 = CONFIG value
        # t1 = a round unmapped cached base address (we are in kernel mode)
        # t2,t3 scratch

        addi    t3, t1, 0       # t3=t1=start address for any cache
        add     t2, t3, a3      # t2=end address+1 of Dcache
        sub     t2, t2, a0      # t2=address of last line in Dcache
3:
        # The compare uses the address just operated on, and the increment
        # sits in the delay slot, so the last line is processed before the
        # loop falls through.
        cache   INDEX_WRITEBACK_INVALIDATE_D,0(t3)
        bne     t3, t2, 3b      #
        addu    t3, a0          # (delay slot) increment by Dcache line size


        # Now check CONFIG to see if there is a secondary cache
        lui     t2, (1 << (CR_SC-16)) # t2=mask over SC boolean
        and     t2, t2, t0      # test SC in CONFIG
        bnez    t2, 6f          # SC set: no secondary cache, skip to I-cache
        nop                     # (delay slot) kept explicit under noreorder

        # There is a secondary cache. Find out its sizes.
        # Each lui below sits in a branch delay slot and is therefore always
        # executed; a3 ends up holding the value loaded by the slot of the
        # branch that is actually taken.

        srl     t3, t0, CR_SS   # want SS field of CONFIG
        andi    t3, t3, 0x3     # mask: now t3= code for cache size.
        beqz    t3, 4f
        lui     a3, ((512*1024)>>16)    # a3= 512K, code was 0
        addu    t3, -1                  # decrement code
        beqz    t3, 4f
        lui     a3, ((1024*1024)>>16)   # a3= 1 M, code  1
        addu    t3, -1                  # decrement code
        beqz    t3, 4f
        lui     a3, ((2*1024*1024)>>16) # a3= 2 M, code 2
        j       6f                      # no secondary cache, code 3
        nop                             # (delay slot) keep the li at 4: out of the slot

4:      # a3 = secondary cache size in bytes
        li      a0, VR5000_2NDLINE      # no codes assigned for other than 32

        # At this point,
        # a0 = secondary cache line size in bytes
        # a1 = primary Icache line size in bytes
        # a2 = primary Icache size in bytes
        # a3 = secondary cache size in bytes
        # t1 = a round unmapped cached base address (we are in kernel mode)
        # t2,t3 scratch

        addi    t3, t1, 0       # t3=t1=start address for any cache
        add     t2, t3, a3      # t2=end address+1 of secondary cache
        sub     t2, t2, a0      # t2=address of last line in secondary cache
5:
        cache   INDEX_WRITEBACK_INVALIDATE_SD,0(t3)
        bne     t3, t2, 5b
        addu    t3, a0          # (delay slot) increment by line size


6:      # Any optional secondary cache done.  Now do I-cache and return.

        # At this point,
        # a1 = primary Icache line size in bytes
        # a2 = primary Icache size in bytes
        # t1 = a round unmapped cached base address (we are in kernel mode)
        # t2,t3 scratch

        add     t2, t1, a2      # t2=end address+1 of Icache
        sub     t2, t2, a1      # t2=address of last line in Icache
7:
        cache   INDEX_INVALIDATE_I,0(t1)
        bne     t1, t2, 7b
        addu    t1, a1          # (delay slot) increment by Icache line size

        j       ra      # return to the caller
        nop             # (delay slot)

8:

# Vr5432 version of the cpu_flush code.
# (The distinctions being: CONFIG can not be trusted about secondary
# cache (which does not exist). The primary caches use Virtual Address Bit 0
# to control set selection.)

# Code does not consult CONFIG about cache sizes: knows the hardwired sizes.
# Since both I and D have the same size and line size, uses a merged loop.

        li      a0, VR5432_LINE
        li      a1, VR5432_SIZE
        lui     t1, ((K0BASE >> 16) & 0xFFFF)
        ori     t1, t1, (K0BASE & 0xFFFF)

        # a0 = cache line size in bytes
        # a1 = 1/2 cache size in bytes
        # t1 = a round unmapped cached base address (we are in kernel mode)

        add     t2, t1, a1      # t2=end address+1
        sub     t2, t2, a0      # t2=address of last line (same for I and D)

9:
        # Offsets 0 and 1 differ only in address bit 0, which selects the set.
        cache   INDEX_WRITEBACK_INVALIDATE_D,0(t1)      # set 0
        cache   INDEX_WRITEBACK_INVALIDATE_D,1(t1)      # set 1
        cache   INDEX_INVALIDATE_I,0(t1)        # set 0
        cache   INDEX_INVALIDATE_I,1(t1)        # set 1
        bne     t1, t2, 9b
        addu    t1, a0          # (delay slot) increment by line size

        j       ra      # return to the caller
        nop             # (delay slot)
        .set    reorder
        .end    __cpu_flush
 
        # NOTE: This variable should *NOT* be addressed relative to
        # the $gp register since this code is executed before $gp is
        # initialised... hence we leave it in the text area. This will
        # cause problems if this routine is ever ROMmed:

        # __buserr_cnt: 32-bit counter.  Incremented by __buserr, cleared
        # by __default_buserr_handler and returned by __buserr_count.
        .globl  __buserr_cnt
__buserr_cnt:
        .word   0
        # __k1_save: 8-byte slot, aligned to 8 bytes, in which __buserr
        # parks k1 with sd/ld while it borrows that register.
        .align  3
__k1_save:
        .word   0
        .word   0
        .align  2
 
        # __buserr -- exception handler body reached from the stub in
        # __exception_code.  When the Cause register reports exception
        # code 7 it counts the event in __buserr_cnt, advances EPC by one
        # instruction and returns with eret.  Any other exception code is
        # passed on by jumping to the vector contents saved in __previous.
        # Runs with noat, touching only k0 and k1 (k1 is saved and
        # restored through __k1_save).
        .ent __buserr
        .globl __buserr
__buserr:
        .set noat
        .set noreorder
        # k0 and k1 available for use:
        mfc0    k0,C0_CAUSE
        nop
        nop
        andi    k0,k0,0x7c      # keep Cause bits 2..6 (exception code field)
        sub     k0,k0,7 << 2    # zero when the exception code is 7
        beq     k0,$0,__buserr_do
        nop
        # call the previous handler
        la      k0,__previous
        jr      k0
        nop
        #
__buserr_do:
        # The cause was checked above: only exception code 7 gets here.
        # Save k1 so that it can be used as a second scratch register.
        la      k0,__k1_save
        sd      k1,0(k0)
        #
        la      k1,__buserr_cnt
        lw      k0,0(k1)        # increment counter
        addu    k0,1
        sw      k0,0(k1)
        #
        la      k0,__k1_save
        ld      k1,0(k0)        # restore k1
        #
        # NOTE(review): EPC is advanced by 4 unconditionally; the branch
        # delay bit of Cause is not examined here -- confirm that a fault
        # in a branch delay slot cannot occur or is acceptable.
        mfc0    k0,C0_EPC
        nop
        nop
        addu    k0,k0,4         # skip offending instruction
        mtc0    k0,C0_EPC       # update EPC
        nop
        nop
        eret
#        j       k0
#        rfe
        .set reorder
        .set at
        .end __buserr
 
        # __exception_code .. __exception_code_end: template stub that
        # __default_buserr_handler copies, word by word, over the exception
        # vector.  It loads the absolute address of __buserr into k0 and
        # jumps there, so it works from whatever address it is copied to.
__exception_code:
        .set noreorder
        lui     k0,%hi(__buserr)
        daddiu  k0,k0,%lo(__buserr)
        jr      k0
        nop                     # (delay slot)
        .set reorder
__exception_code_end:
 
        # __previous: buffer, the same size as the stub above, that holds
        # the words which were at the exception vector before the stub was
        # installed.  __buserr jumps here for exceptions it does not
        # handle, and __restore_buserr_handler copies it back to the vector.
        .data
__previous:
        .space  (__exception_code_end - __exception_code)
        # This subtracting of two addresses is working
        # but is not guaranteed to continue working.
        # The assembler reserves the right to put these
        # two labels into different frags, and then
        # cannot take their difference.

        .text
 
        # __default_buserr_handler -- install the __exception_code stub at
        # the exception vector, saving the words it replaces in __previous,
        # then clear __buserr_cnt.  Writes a0-a3 and v0.
        # NOTE(review): no cache maintenance is done here after the vector
        # is rewritten -- confirm whether callers are expected to invoke
        # __cpu_flush afterwards.
        .ent    __default_buserr_handler
        .globl  __default_buserr_handler
__default_buserr_handler:
        .set noreorder
        # attach our simple bus error handler:
        # in:  void
        # out: void
        mfc0    a0,C0_SR
        nop
        li      a1,SR_BEV
        and     a1,a1,a0        # a1 = non-zero when SR_BEV is set in Status
        beq     a1,$0,baseaddr
        lui     a0,0x8000       # delay slot: always executed, base for BEV clear
        lui     a0,0xbfc0       # BEV set: base becomes 0xbfc00200
        daddiu  a0,a0,0x0200
baseaddr:
        daddiu  a0,a0,0x0180    # add vector offset 0x180 to the chosen base
        # a0 = base vector table address
        la      a1,__exception_code_end
        la      a2,__exception_code
        subu    a1,a1,a2        # a1 = stub size in bytes (loop byte count)
        la      a3,__previous
        # there must be a better way of doing this????
        # Each pass saves one vector word into __previous and overwrites
        # it with the matching stub word.  The count is tested only after
        # the subtract, so a1 must start as a non-zero multiple of 4.
copyloop:
        lw      v0,0(a0)
        sw      v0,0(a3)
        lw      v0,0(a2)
        sw      v0,0(a0)
        daddiu  a0,a0,4
        daddiu  a2,a2,4
        daddiu  a3,a3,4
        subu    a1,a1,4
        bne     a1,$0,copyloop
        nop
        la      a0,__buserr_cnt
        sw      $0,0(a0)        # start counting from zero
        j       ra
        nop
        .set reorder
        .end    __default_buserr_handler
 
        # __restore_buserr_handler -- copy the words saved in __previous
        # back over the exception vector, undoing what
        # __default_buserr_handler installed.  Writes a0, a1, a3 and v0.
        # NOTE(review): __previous only holds meaningful data after
        # __default_buserr_handler has run -- confirm callers respect that
        # ordering.
        .ent    __restore_buserr_handler
        .globl  __restore_buserr_handler
__restore_buserr_handler:
        .set noreorder
        # restore original (monitor) bus error handler
        # in:  void
        # out: void
        mfc0    a0,C0_SR
        nop
        li      a1,SR_BEV
        and     a1,a1,a0        # a1 = non-zero when SR_BEV is set in Status
        beq     a1,$0,res_baseaddr
        lui     a0,0x8000       # delay slot: always executed, base for BEV clear
        lui     a0,0xbfc0       # BEV set: base becomes 0xbfc00200
        daddiu  a0,a0,0x0200
res_baseaddr:
        daddiu  a0,a0,0x0180    # add vector offset 0x180 to the chosen base
        # a0 = base vector table address
        la      a1,__exception_code_end
        la      a3,__exception_code
        subu    a1,a1,a3        # a1 = stub size in bytes (loop byte count)
        la      a3,__previous   # a3 is reused: now the source of the copy
        # there must be a better way of doing this????
res_copyloop:
        lw      v0,0(a3)
        sw      v0,0(a0)
        daddiu  a0,a0,4
        daddiu  a3,a3,4
        subu    a1,a1,4
        bne     a1,$0,res_copyloop
        nop
        j       ra
        nop
        .set reorder
        .end    __restore_buserr_handler
 
        # __buserr_count -- return the current value of __buserr_cnt.
        .ent    __buserr_count
        .globl  __buserr_count
__buserr_count:
        .set noreorder
        # read the bus error counter maintained by __buserr
        # in:  void
        # out: unsigned int __buserr_cnt
        la      v0,__buserr_cnt
        lw      v0,0(v0)        # v0 = counter value (the return value)
        j       ra
        nop
        .set reorder
        .end    __buserr_count
 
/* EOF vr5xxx.S */

Browse

Tools

Subversion Repositories openrisc_2011-10-31

[/] [openrisc/] [trunk/] [gnu-src/] [newlib-1.18.0/] [libgloss/] [mips/] [vr5xxx.S] - Blame information for rev 252

Line No.	Rev	Author	Line
1	207	jeremybenn	`/*`
2			`* vr5xxx.S -- CPU specific support routines`
3			`*`
4			`* Copyright (c) 1999 Cygnus Solutions`
5			`*`
6			`* The authors hereby grant permission to use, copy, modify, distribute,`
7			`* and license this software and its documentation for any purpose, provided`
8			`* that existing copyright notices are retained in all copies and that this`
9			`* notice is included verbatim in any distributions. No written agreement,`
10			`* license, or royalty fee is required for any of the authorized uses.`
11			`* Modifications to this software may be copyrighted by their authors`
12			`* and need not follow the licensing terms described here, provided that`
13			`* the new terms are clearly indicated on the first page of each file where`
14			`* they apply.`
15			`*/`
16
17			`/* This file cloned from vr4300.S by dlindsay@cygnus.com`
18			`* and recoded to suit Vr5432 and Vr5000.`
19			`* Should be no worse for Vr43{00,05,10}.`
20			`* Specifically, __cpu_flush() has been changed (a) to allow for the hardware`
21			`* difference (in set associativity) between the Vr5432 and Vr5000,`
22			`* and (b) to flush the optional secondary cache of the Vr5000.`
23			`*/`
24
25			`/* Processor Revision Identifier (PRID) Register: Implementation Numbers */`
26			`#define IMPL_VR5432 0x54`
27
28			`/* Cache Constants not determinable dynamically */`
29			`#define VR5000_2NDLINE 32 /* secondary cache line size */`
30			`#define VR5432_LINE 32 /* I,Dcache line sizes */`
31			`#define VR5432_SIZE (16*1024) /* I,Dcache half-size */`
32
33
34			`#ifndef __mips64`
35			`.set mips3`
36			`#endif`
37			`#ifdef __mips16`
38			`/* This file contains 32 bit assembly code. */`
39			`.set nomips16`
40			`#endif`
41
42			`#include "regs.S"`
43
44			`.text`
45			`.align 2`
46
47			`# Taken from "R4300 Preliminary RISC Processor Specification`
48			`# Revision 2.0 January 1995" page 39: "The Count`
49			`# register... increments at a constant rate... at one-half the`
50			`# PClock speed."`
51			`# We can use this fact to provide small polled delays.`
52			`.globl __cpu_timer_poll`
53			`.ent __cpu_timer_poll`
54			`__cpu_timer_poll:`
55			`.set noreorder`
56			`# in: a0 = (unsigned int) number of PClock ticks to wait for`
57			`# out: void`
58
59			`# The Vr4300 counter updates at half PClock, so divide by 2 to`
60			`# get counter delta:`
61			`bnezl a0, 1f # continue if delta non-zero`
62			`srl a0, a0, 1 # divide ticks by 2 {DELAY SLOT}`
63			`# perform a quick return to the caller:`
64			`j ra`
65			`nop # {DELAY SLOT}`
66			`1:`
67			`mfc0 v0, C0_COUNT # get current counter value`
68			`nop`
69			`nop`
70			`# We cannot just do the simple test, of adding our delta onto`
71			`# the current value (ignoring overflow) and then checking for`
72			`# equality. The counter is incrementing every two PClocks,`
73			`# which means the counter value can change between`
74			`# instructions, making it hard to sample at the exact value`
75			`# desired.`
76
77			`# However, we do know that our entry delta value is less than`
78			`# half the number space (since we divide by 2 on entry). This`
79			`# means we can use a difference in signs to indicate timer`
80			`# overflow.`
81			`addu a0, v0, a0 # unsigned add (ignore overflow)`
82			`# We know have our end value (which will have been`
83			`# sign-extended to fill the 64bit register value).`
84			`2:`
85			`# get current counter value:`
86			`mfc0 v0, C0_COUNT`
87			`nop`
88			`nop`
89			`# This is an unsigned 32bit subtraction:`
90			`subu v0, a0, v0 # delta = (end - now) {DELAY SLOT}`
91			`bgtzl v0, 2b # looping back is most likely`
92			`nop`
93			`# We have now been delayed (in the foreground) for AT LEAST`
94			`# the required number of counter ticks.`
95			`j ra # return to caller`
96			`nop # {DELAY SLOT}`
97			`.set reorder`
98			`.end __cpu_timer_poll`
99
100			`# Flush the processor caches to memory:`
101
102			`.globl __cpu_flush`
103			`.ent __cpu_flush`
104			`__cpu_flush:`
105			`.set noreorder`
106			`# NOTE: The Vr4300 and Vr5432 CANNOT have any secondary cache.`
107			`# On those, SC (bit 17 of CONFIG register) is hard-wired to 1,`
108			`# except that email from Dennis_Han@el.nec.com says that old`
109			`# versions of the Vr5432 incorrectly hard-wired this bit to 0.`
110			`# The Vr5000 has an optional direct-mapped secondary cache,`
111			`# and the SC bit correctly indicates this.`
112
113			`# So, for the 4300 and 5432 we want to just`
114			`# flush the primary Data and Instruction caches.`
115			`# For the 5000 it is desired to flush the secondary cache too.`
116			`# There is an operation difference worth noting.`
117			`# The 4300 and 5000 primary caches use VA bit 14 to choose cache set,`
118			`# whereas 5432 primary caches use VA bit 0.`
119
120			`# This code interprets the relevant Config register bits as`
121			`# much as possible, except for the 5432.`
122			`# The code therefore has some portability.`
123			`# However, the associativity issues mean you should not just assume`
124			`# that this code works anywhere. Also, the secondary cache set`
125			`# size is hardwired, since the 5000 series does not define codes`
126			`# for variant sizes.`
127
128			`# Note: this version of the code flushes D$ before I$.`
129			`# It is difficult to construct a case where that matters,`
130			`# but it cant hurt.`
131
132			`mfc0 a0, C0_PRID # a0 = Processor Revision register`
133			`nop # dlindsay: unclear why the nops, but`
134			`nop # vr4300.S had such so I do too.`
135			`srl a2, a0, PR_IMP # want bits 8..15`
136			`andi a2, a2, 0x255 # mask: now a2 = Implementation # field`
137			`li a1, IMPL_VR5432`
138			`beq a1, a2, 8f # use Vr5432-specific flush algorithm`
139			`nop`
140
141			`# Non-Vr5432 version of the code.`
142			`# (The distinctions being: CONFIG is truthful about secondary cache,`
143			`# and we act as if the primary Icache and Dcache are direct mapped.)`
144
145			`mfc0 t0, C0_CONFIG # t0 = CONFIG register`
146			`nop`
147			`nop`
148			`li a1, 1 # a1=1, a useful constant`
149
150			`srl a2, t0, CR_IC # want IC field of CONFIG`
151			`andi a2, a2, 0x7 # mask: now a2= code for Icache size`
152			`add a2, a2, 12 # +12`
153			`sllv a2, a1, a2 # a2=primary instruction cache size in bytes`
154
155			`srl a3, t0, CR_DC # DC field of CONFIG`
156			`andi a3, a3, 0x7 # mask: now a3= code for Dcache size`
157			`add a3, a3, 12 # +12`
158			`sllv a3, a1, a3 # a3=primary data cache size in bytes`
159
160			`li t2, (1 << CR_IB) # t2=mask over IB boolean`
161			`and t2, t2, t0 # test IB field of CONFIG register value`
162			`beqz t2, 1f #`
163			`li a1, 16 # 16 bytes (branch shadow: always loaded.)`
164			`li a1, 32 # non-zero, then 32bytes`
165			`1:`
166
167			`li t2, (1 << CR_DB) # t2=mask over DB boolean`
168			`and t2, t2, t0 # test BD field of CONFIG register value`
169			`beqz t2, 2f #`
170			`li a0, 16 # 16bytes (branch shadow: always loaded.)`
171			`li a0, 32 # non-zero, then 32bytes`
172			`2:`
173			`lui t1, ((K0BASE >> 16) & 0xFFFF)`
174			`ori t1, t1, (K0BASE & 0xFFFF)`
175
176			`# At this point,`
177			`# a0 = primary Dcache line size in bytes`
178			`# a1 = primary Icache line size in bytes`
179			`# a2 = primary Icache size in bytes`
180			`# a3 = primary Dcache size in bytes`
181			`# t0 = CONFIG value`
182			`# t1 = a round unmapped cached base address (we are in kernel mode)`
183			`# t2,t3 scratch`
184
185			`addi t3, t1, 0 # t3=t1=start address for any cache`
186			`add t2, t3, a3 # t2=end adress+1 of Dcache`
187			`sub t2, t2, a0 # t2=address of last line in Dcache`
188			`3:`
189			`cache INDEX_WRITEBACK_INVALIDATE_D,0(t3)`
190			`bne t3, t2, 3b #`
191			`addu t3, a0 # (delay slot) increment by Dcache line size`
192
193
194			`# Now check CONFIG to see if there is a secondary cache`
195			`lui t2, (1 << (CR_SC-16)) # t2=mask over SC boolean`
196			`and t2, t2, t0 # test SC in CONFIG`
197			`bnez t2, 6f`
198
199			`# There is a secondary cache. Find out its sizes.`
200
201			`srl t3, t0, CR_SS # want SS field of CONFIG`
202			`andi t3, t3, 0x3 # mask: now t3= code for cache size.`
203			`beqz t3, 4f`
204			`lui a3, ((512*1024)>>16) # a3= 512K, code was 0`
205			`addu t3, -1 # decrement code`
206			`beqz t3, 4f`
207			`lui a3, ((1024*1024)>>16) # a3= 1 M, code 1`
208			`addu t3, -1 # decrement code`
209			`beqz t3, 4f`
210			`lui a3, ((2*1024*1024)>>16) # a3= 2 M, code 2`
211			`j 6f # no secondary cache, code 3`
212
213			`4: # a3 = secondary cache size in bytes`
214			`li a0, VR5000_2NDLINE # no codes assigned for other than 32`
215
216			`# At this point,`
217			`# a0 = secondary cache line size in bytes`
218			`# a1 = primary Icache line size in bytes`
219			`# a2 = primary Icache size in bytes`
220			`# a3 = secondary cache size in bytes`
221			`# t1 = a round unmapped cached base address (we are in kernel mode)`
222			`# t2,t3 scratch`
223
224			`addi t3, t1, 0 # t3=t1=start address for any cache`
225			`add t2, t3, a3 # t2=end address+1 of secondary cache`
226			`sub t2, t2, a0 # t2=address of last line in secondary cache`
227			`5:`
228			`cache INDEX_WRITEBACK_INVALIDATE_SD,0(t3)`
229			`bne t3, t2, 5b`
230			`addu t3, a0 # (delay slot) increment by line size`
231
232
233			`6: # Any optional secondary cache done. Now do I-cache and return.`
234
235			`# At this point,`
236			`# a1 = primary Icache line size in bytes`
237			`# a2 = primary Icache size in bytes`
238			`# t1 = a round unmapped cached base address (we are in kernel mode)`
239			`# t2,t3 scratch`
240
241			`add t2, t1, a2 # t2=end adress+1 of Icache`
242			`sub t2, t2, a1 # t2=address of last line in Icache`
243			`7:`
244			`cache INDEX_INVALIDATE_I,0(t1)`
245			`bne t1, t2, 7b`
246			`addu t1, a1 # (delay slot) increment by Icache line size`
247
248			`j ra # return to the caller`
249			`nop`
250
251			`8:`
252
253			`# Vr5432 version of the cpu_flush code.`
254			`# (The distinctions being: CONFIG can not be trusted about secondary`
255			`# cache (which does not exist). The primary caches use Virtual Address Bit 0`
256			`# to control set selection.`
257
258			`# Code does not consult CONFIG about cache sizes: knows the hardwired sizes.`
259			`# Since both I and D have the same size and line size, uses a merged loop.`
260
261			`li a0, VR5432_LINE`
262			`li a1, VR5432_SIZE`
263			`lui t1, ((K0BASE >> 16) & 0xFFFF)`
264			`ori t1, t1, (K0BASE & 0xFFFF)`
265
266			`# a0 = cache line size in bytes`
267			`# a1 = 1/2 cache size in bytes`
268			`# t1 = a round unmapped cached base address (we are in kernel mode)`
269
270			`add t2, t1, a1 # t2=end address+1`
271			`sub t2, t2, a0 # t2=address of last line in Icache`
272
273			`9:`
274			`cache INDEX_WRITEBACK_INVALIDATE_D,0(t1) # set 0`
275			`cache INDEX_WRITEBACK_INVALIDATE_D,1(t1) # set 1`
276			`cache INDEX_INVALIDATE_I,0(t1) # set 0`
277			`cache INDEX_INVALIDATE_I,1(t1) # set 1`
278			`bne t1, t2, 9b`
279			`addu t1, a0`
280
281			`j ra # return to the caller`
282			`nop`
283			`.set reorder`
284			`.end __cpu_flush`
285
286			`# NOTE: This variable should NOT be addressed relative to`
287			`# the $gp register since this code is executed before $gp is`
288			`# initialised... hence we leave it in the text area. This will`
289			`# cause problems if this routine is ever ROMmed:`
290
291			`.globl __buserr_cnt`
292			`__buserr_cnt:`
293			`.word 0`
294			`.align 3`
295			`__k1_save:`
296			`.word 0`
297			`.word 0`
298			`.align 2`
299
300			`.ent __buserr`
301			`.globl __buserr`
302			`__buserr:`
303			`.set noat`
304			`.set noreorder`
305			`# k0 and k1 available for use:`
306			`mfc0 k0,C0_CAUSE`
307			`nop`
308			`nop`
309			`andi k0,k0,0x7c`
310			`sub k0,k0,7 << 2`
311			`beq k0,$0,__buserr_do`
312			`nop`
313			`# call the previous handler`
314			`la k0,__previous`
315			`jr k0`
316			`nop`
317			`#`
318			`__buserr_do:`
319			`# TODO: check that the cause is indeed a bus error`
320			`# - if not then just jump to the previous handler`
321			`la k0,__k1_save`
322			`sd k1,0(k0)`
323			`#`
324			`la k1,__buserr_cnt`
325			`lw k0,0(k1) # increment counter`
326			`addu k0,1`
327			`sw k0,0(k1)`
328			`#`
329			`la k0,__k1_save`
330			`ld k1,0(k0)`
331			`#`
332			`mfc0 k0,C0_EPC`
333			`nop`
334			`nop`
335			`addu k0,k0,4 # skip offending instruction`
336			`mtc0 k0,C0_EPC # update EPC`
337			`nop`
338			`nop`
339			`eret`
340			`# j k0`
341			`# rfe`
342			`.set reorder`
343			`.set at`
344			`.end __buserr`
345
346			`__exception_code:`
347			`.set noreorder`
348			`lui k0,%hi(__buserr)`
349			`daddiu k0,k0,%lo(__buserr)`
350			`jr k0`
351			`nop`
352			`.set reorder`
353			`__exception_code_end:`
354
355			`.data`
356			`__previous:`
357			`.space (__exception_code_end - __exception_code)`
358			`# This subtracting two addresses is working`
359			`# but is not garenteed to continue working.`
360			`# The assemble reserves the right to put these`
361			`# two labels into different frags, and then`
362			`# cant take their difference.`
363
364			`.text`
365
366			`.ent __default_buserr_handler`
367			`.globl __default_buserr_handler`
368			`__default_buserr_handler:`
369			`.set noreorder`
370			`# attach our simple bus error handler:`
371			`# in: void`
372			`# out: void`
373			`mfc0 a0,C0_SR`
374			`nop`
375			`li a1,SR_BEV`
376			`and a1,a1,a0`
377			`beq a1,$0,baseaddr`
378			`lui a0,0x8000 # delay slot`
379			`lui a0,0xbfc0`
380			`daddiu a0,a0,0x0200`
381			`baseaddr:`
382			`daddiu a0,a0,0x0180`
383			`# a0 = base vector table address`
384			`la a1,__exception_code_end`
385			`la a2,__exception_code`
386			`subu a1,a1,a2`
387			`la a3,__previous`
388			`# there must be a better way of doing this????`
389			`copyloop:`
390			`lw v0,0(a0)`
391			`sw v0,0(a3)`
392			`lw v0,0(a2)`
393			`sw v0,0(a0)`
394			`daddiu a0,a0,4`
395			`daddiu a2,a2,4`
396			`daddiu a3,a3,4`
397			`subu a1,a1,4`
398			`bne a1,$0,copyloop`
399			`nop`
400			`la a0,__buserr_cnt`
401			`sw $0,0(a0)`
402			`j ra`
403			`nop`
404			`.set reorder`
405			`.end __default_buserr_handler`
406
407			`.ent __restore_buserr_handler`
408			`.globl __restore_buserr_handler`
409			`__restore_buserr_handler:`
410			`.set noreorder`
411			`# restore original (monitor) bus error handler`
412			`# in: void`
413			`# out: void`
414			`mfc0 a0,C0_SR`
415			`nop`
416			`li a1,SR_BEV`
417			`and a1,a1,a0`
418			`beq a1,$0,res_baseaddr`
419			`lui a0,0x8000 # delay slot`
420			`lui a0,0xbfc0`
421			`daddiu a0,a0,0x0200`
422			`res_baseaddr:`
423			`daddiu a0,a0,0x0180`
424			`# a0 = base vector table address`
425			`la a1,__exception_code_end`
426			`la a3,__exception_code`
427			`subu a1,a1,a3`
428			`la a3,__previous`
429			`# there must be a better way of doing this????`
430			`res_copyloop:`
431			`lw v0,0(a3)`
432			`sw v0,0(a0)`
433			`daddiu a0,a0,4`
434			`daddiu a3,a3,4`
435			`subu a1,a1,4`
436			`bne a1,$0,res_copyloop`
437			`nop`
438			`j ra`
439			`nop`
440			`.set reorder`
441			`.end __restore_buserr_handler`
442
443			`.ent __buserr_count`
444			`.globl __buserr_count`
445			`__buserr_count:`
446			`.set noreorder`
447			`# restore original (monitor) bus error handler`
448			`# in: void`
449			`# out: unsigned int __buserr_cnt`
450			`la v0,__buserr_cnt`
451			`lw v0,0(v0)`
452			`j ra`
453			`nop`
454			`.set reorder`
455			`.end __buserr_count`
456
457			`/* EOF vr5xxx.S */`