68fd9ee3e8ae13bb41d95934216219ead70777d2
[pandora-kernel.git] / arch / sparc / include / asm / trap_block.h
1 #ifndef _SPARC_TRAP_BLOCK_H
2 #define _SPARC_TRAP_BLOCK_H
3
4 #include <asm/hypervisor.h>
5 #include <asm/asi.h>
6
7 #ifndef __ASSEMBLY__
8
9 /* Trap handling code needs to get at a few critical values upon
10  * trap entry and to process TSB misses.  These cannot be in the
11  * per_cpu() area as we really need to lock them into the TLB and
12  * thus make them part of the main kernel image.  As a result we
13  * try to make this as small as possible.
14  *
15  * This is padded out and aligned to 64-bytes to avoid false sharing
16  * on SMP.
17  */
18
19 /* If you modify the size of this structure, please update
20  * TRAP_BLOCK_SZ_SHIFT below.
21  */
22 struct thread_info;
23 struct trap_per_cpu {
24 /* D-cache line 1: Basic thread information, cpu and device mondo queues */
25         struct thread_info      *thread;
26         unsigned long           pgd_paddr;
27         unsigned long           cpu_mondo_pa;
28         unsigned long           dev_mondo_pa;
29
30 /* D-cache line 2: Error Mondo Queue and kernel buffer pointers */
31         unsigned long           resum_mondo_pa;
32         unsigned long           resum_kernel_buf_pa;
33         unsigned long           nonresum_mondo_pa;
34         unsigned long           nonresum_kernel_buf_pa;
35
36 /* Dcache lines 3, 4, 5, and 6: Hypervisor Fault Status */
37         struct hv_fault_status  fault_info;
38
39 /* Dcache line 7: Physical addresses of CPU send mondo block and CPU list.  */
40         unsigned long           cpu_mondo_block_pa;
41         unsigned long           cpu_list_pa;
42         unsigned long           tsb_huge;
43         unsigned long           tsb_huge_temp;
44
45 /* Dcache line 8: IRQ work list, and keep trap_block a power-of-2 in size.  */
46         unsigned long           irq_worklist_pa;
47         unsigned int            cpu_mondo_qmask;
48         unsigned int            dev_mondo_qmask;
49         unsigned int            resum_qmask;
50         unsigned int            nonresum_qmask;
51         unsigned long           __unused;
52 } __attribute__((aligned(64)));
53 extern struct trap_per_cpu trap_block[NR_CPUS];
54 extern void init_cur_cpu_trap(struct thread_info *);
55 extern void setup_tba(void);
56 extern int ncpus_probed;
57
58 extern unsigned long real_hard_smp_processor_id(void);
59
60 struct cpuid_patch_entry {
61         unsigned int    addr;
62         unsigned int    cheetah_safari[4];
63         unsigned int    cheetah_jbus[4];
64         unsigned int    starfire[4];
65         unsigned int    sun4v[4];
66 };
67 extern struct cpuid_patch_entry __cpuid_patch, __cpuid_patch_end;
68
69 struct sun4v_1insn_patch_entry {
70         unsigned int    addr;
71         unsigned int    insn;
72 };
73 extern struct sun4v_1insn_patch_entry __sun4v_1insn_patch,
74         __sun4v_1insn_patch_end;
75
76 struct sun4v_2insn_patch_entry {
77         unsigned int    addr;
78         unsigned int    insns[2];
79 };
80 extern struct sun4v_2insn_patch_entry __sun4v_2insn_patch,
81         __sun4v_2insn_patch_end;
82
83
84 #endif /* !(__ASSEMBLY__) */
85
86 #define TRAP_PER_CPU_THREAD             0x00
87 #define TRAP_PER_CPU_PGD_PADDR          0x08
88 #define TRAP_PER_CPU_CPU_MONDO_PA       0x10
89 #define TRAP_PER_CPU_DEV_MONDO_PA       0x18
90 #define TRAP_PER_CPU_RESUM_MONDO_PA     0x20
91 #define TRAP_PER_CPU_RESUM_KBUF_PA      0x28
92 #define TRAP_PER_CPU_NONRESUM_MONDO_PA  0x30
93 #define TRAP_PER_CPU_NONRESUM_KBUF_PA   0x38
94 #define TRAP_PER_CPU_FAULT_INFO         0x40
95 #define TRAP_PER_CPU_CPU_MONDO_BLOCK_PA 0xc0
96 #define TRAP_PER_CPU_CPU_LIST_PA        0xc8
97 #define TRAP_PER_CPU_TSB_HUGE           0xd0
98 #define TRAP_PER_CPU_TSB_HUGE_TEMP      0xd8
99 #define TRAP_PER_CPU_IRQ_WORKLIST_PA    0xe0
100 #define TRAP_PER_CPU_CPU_MONDO_QMASK    0xe8
101 #define TRAP_PER_CPU_DEV_MONDO_QMASK    0xec
102 #define TRAP_PER_CPU_RESUM_QMASK        0xf0
103 #define TRAP_PER_CPU_NONRESUM_QMASK     0xf4
104
105 #define TRAP_BLOCK_SZ_SHIFT             8
106
107 #include <asm/scratchpad.h>
108
109 #define __GET_CPUID(REG)                                \
110         /* Spitfire implementation (default). */        \
111 661:    ldxa            [%g0] ASI_UPA_CONFIG, REG;      \
112         srlx            REG, 17, REG;                   \
113          and            REG, 0x1f, REG;                 \
114         nop;                                            \
115         .section        .cpuid_patch, "ax";             \
116         /* Instruction location. */                     \
117         .word           661b;                           \
118         /* Cheetah Safari implementation. */            \
119         ldxa            [%g0] ASI_SAFARI_CONFIG, REG;   \
120         srlx            REG, 17, REG;                   \
121         and             REG, 0x3ff, REG;                \
122         nop;                                            \
123         /* Cheetah JBUS implementation. */              \
124         ldxa            [%g0] ASI_JBUS_CONFIG, REG;     \
125         srlx            REG, 17, REG;                   \
126         and             REG, 0x1f, REG;                 \
127         nop;                                            \
128         /* Starfire implementation. */                  \
129         sethi           %hi(0x1fff40000d0 >> 9), REG;   \
130         sllx            REG, 9, REG;                    \
131         or              REG, 0xd0, REG;                 \
132         lduwa           [REG] ASI_PHYS_BYPASS_EC_E, REG;\
133         /* sun4v implementation. */                     \
134         mov             SCRATCHPAD_CPUID, REG;          \
135         ldxa            [REG] ASI_SCRATCHPAD, REG;      \
136         nop;                                            \
137         nop;                                            \
138         .previous;
139
140 #ifdef CONFIG_SMP
141
142 #define TRAP_LOAD_TRAP_BLOCK(DEST, TMP)         \
143         __GET_CPUID(TMP)                        \
144         sethi   %hi(trap_block), DEST;          \
145         sllx    TMP, TRAP_BLOCK_SZ_SHIFT, TMP;  \
146         or      DEST, %lo(trap_block), DEST;    \
147         add     DEST, TMP, DEST;                \
148
149 /* Clobbers TMP, current address space PGD phys address into DEST.  */
150 #define TRAP_LOAD_PGD_PHYS(DEST, TMP)           \
151         TRAP_LOAD_TRAP_BLOCK(DEST, TMP)         \
152         ldx     [DEST + TRAP_PER_CPU_PGD_PADDR], DEST;
153
154 /* Clobbers TMP, loads local processor's IRQ work area into DEST.  */
155 #define TRAP_LOAD_IRQ_WORK_PA(DEST, TMP)        \
156         TRAP_LOAD_TRAP_BLOCK(DEST, TMP)         \
157         add     DEST, TRAP_PER_CPU_IRQ_WORKLIST_PA, DEST;
158
159 /* Clobbers TMP, loads DEST with current thread info pointer.  */
160 #define TRAP_LOAD_THREAD_REG(DEST, TMP)         \
161         TRAP_LOAD_TRAP_BLOCK(DEST, TMP)         \
162         ldx     [DEST + TRAP_PER_CPU_THREAD], DEST;
163
164 /* Given the current thread info pointer in THR, load the per-cpu
165  * area base of the current processor into DEST.  REG1, REG2, and REG3 are
166  * clobbered.
167  *
168  * You absolutely cannot use DEST as a temporary in this code.  The
169  * reason is that traps can happen during execution, and return from
170  * trap will load the fully resolved DEST per-cpu base.  This can corrupt
171  * the calculations done by the macro mid-stream.
172  */
173 #define LOAD_PER_CPU_BASE(DEST, THR, REG1, REG2, REG3)  \
174         lduh    [THR + TI_CPU], REG1;                   \
175         sethi   %hi(__per_cpu_shift), REG3;             \
176         sethi   %hi(__per_cpu_base), REG2;              \
177         ldx     [REG3 + %lo(__per_cpu_shift)], REG3;    \
178         ldx     [REG2 + %lo(__per_cpu_base)], REG2;     \
179         sllx    REG1, REG3, REG3;                       \
180         add     REG3, REG2, DEST;
181
182 #else
183
184 #define TRAP_LOAD_TRAP_BLOCK(DEST, TMP)         \
185         sethi   %hi(trap_block), DEST;          \
186         or      DEST, %lo(trap_block), DEST;    \
187
188 /* Uniprocessor versions, we know the cpuid is zero.  */
189 #define TRAP_LOAD_PGD_PHYS(DEST, TMP)           \
190         TRAP_LOAD_TRAP_BLOCK(DEST, TMP)         \
191         ldx     [DEST + TRAP_PER_CPU_PGD_PADDR], DEST;
192
193 /* Clobbers TMP, loads local processor's IRQ work area into DEST.  */
194 #define TRAP_LOAD_IRQ_WORK_PA(DEST, TMP)        \
195         TRAP_LOAD_TRAP_BLOCK(DEST, TMP)         \
196         add     DEST, TRAP_PER_CPU_IRQ_WORKLIST_PA, DEST;
197
198 #define TRAP_LOAD_THREAD_REG(DEST, TMP)         \
199         TRAP_LOAD_TRAP_BLOCK(DEST, TMP)         \
200         ldx     [DEST + TRAP_PER_CPU_THREAD], DEST;
201
202 /* No per-cpu areas on uniprocessor, so no need to load DEST.  */
203 #define LOAD_PER_CPU_BASE(DEST, THR, REG1, REG2, REG3)
204
205 #endif /* !(CONFIG_SMP) */
206
207 #endif /* _SPARC_TRAP_BLOCK_H */