Chris Metcalf | 867e359 | 2010-05-28 23:09:12 -0400 | [diff] [blame] | 1 | /* |
| 2 | * Copyright 2010 Tilera Corporation. All Rights Reserved. |
| 3 | * |
| 4 | * This program is free software; you can redistribute it and/or |
| 5 | * modify it under the terms of the GNU General Public License |
| 6 | * as published by the Free Software Foundation, version 2. |
| 7 | * |
| 8 | * This program is distributed in the hope that it will be useful, but |
| 9 | * WITHOUT ANY WARRANTY; without even the implied warranty of |
| 10 | * MERCHANTABILITY OR FITNESS FOR A PARTICULAR PURPOSE, GOOD TITLE or |
| 11 | * NON INFRINGEMENT. See the GNU General Public License for |
| 12 | * more details. |
| 13 | */ |
| 14 | |
| 15 | #ifndef _ASM_TILE_PROCESSOR_H |
| 16 | #define _ASM_TILE_PROCESSOR_H |
| 17 | |
| 18 | #ifndef __ASSEMBLY__ |
| 19 | |
| 20 | /* |
| 21 | * NOTE: we don't include <linux/ptrace.h> or <linux/percpu.h> as one |
| 22 | * normally would, due to #include dependencies. |
| 23 | */ |
Chris Metcalf | 9f9c038 | 2010-06-25 17:00:56 -0400 | [diff] [blame] | 24 | #include <linux/types.h> |
Chris Metcalf | 867e359 | 2010-05-28 23:09:12 -0400 | [diff] [blame] | 25 | #include <asm/ptrace.h> |
| 26 | #include <asm/percpu.h> |
| 27 | |
| 28 | #include <arch/chip.h> |
| 29 | #include <arch/spr_def.h> |
| 30 | |
| 31 | struct task_struct; |
| 32 | struct thread_struct; |
Chris Metcalf | 867e359 | 2010-05-28 23:09:12 -0400 | [diff] [blame] | 33 | |
| 34 | typedef struct { |
| 35 | unsigned long seg; |
| 36 | } mm_segment_t; |
| 37 | |
| 38 | /* |
| 39 | * Default implementation of macro that returns current |
| 40 | * instruction pointer ("program counter"). |
| 41 | */ |
| 42 | void *current_text_addr(void); |
| 43 | |
| 44 | #if CHIP_HAS_TILE_DMA() |
| 45 | /* Capture the state of a suspended DMA. */ |
| 46 | struct tile_dma_state { |
| 47 | int enabled; |
| 48 | unsigned long src; |
| 49 | unsigned long dest; |
| 50 | unsigned long strides; |
| 51 | unsigned long chunk_size; |
| 52 | unsigned long src_chunk; |
| 53 | unsigned long dest_chunk; |
| 54 | unsigned long byte; |
| 55 | unsigned long status; |
| 56 | }; |
| 57 | |
| 58 | /* |
| 59 | * A mask of the DMA status register for selecting only the 'running' |
| 60 | * and 'done' bits. |
| 61 | */ |
| 62 | #define DMA_STATUS_MASK \ |
| 63 | (SPR_DMA_STATUS__RUNNING_MASK | SPR_DMA_STATUS__DONE_MASK) |
| 64 | #endif |
| 65 | |
| 66 | /* |
| 67 | * Track asynchronous TLB events (faults and access violations) |
| 68 | * that occur while we are in kernel mode from DMA or the SN processor. |
| 69 | */ |
| 70 | struct async_tlb { |
| 71 | short fault_num; /* original fault number; 0 if none */ |
| 72 | char is_fault; /* was it a fault (vs an access violation) */ |
| 73 | char is_write; /* for fault: was it caused by a write? */ |
| 74 | unsigned long address; /* what address faulted? */ |
| 75 | }; |
| 76 | |
Chris Metcalf | 9f9c038 | 2010-06-25 17:00:56 -0400 | [diff] [blame] | 77 | #ifdef CONFIG_HARDWALL |
| 78 | struct hardwall_info; |
| 79 | #endif |
Chris Metcalf | 867e359 | 2010-05-28 23:09:12 -0400 | [diff] [blame] | 80 | |
| 81 | struct thread_struct { |
| 82 | /* kernel stack pointer */ |
| 83 | unsigned long ksp; |
| 84 | /* kernel PC */ |
| 85 | unsigned long pc; |
| 86 | /* starting user stack pointer (for page migration) */ |
| 87 | unsigned long usp0; |
| 88 | /* pid of process that created this one */ |
| 89 | pid_t creator_pid; |
| 90 | #if CHIP_HAS_TILE_DMA() |
| 91 | /* DMA info for suspended threads (byte == 0 means no DMA state) */ |
| 92 | struct tile_dma_state tile_dma_state; |
| 93 | #endif |
| 94 | /* User EX_CONTEXT registers */ |
| 95 | unsigned long ex_context[2]; |
| 96 | /* User SYSTEM_SAVE registers */ |
| 97 | unsigned long system_save[4]; |
| 98 | /* User interrupt mask */ |
| 99 | unsigned long long interrupt_mask; |
| 100 | /* User interrupt-control 0 state */ |
| 101 | unsigned long intctrl_0; |
| 102 | #if CHIP_HAS_PROC_STATUS_SPR() |
| 103 | /* Any other miscellaneous processor state bits */ |
| 104 | unsigned long proc_status; |
| 105 | #endif |
Chris Metcalf | 9f9c038 | 2010-06-25 17:00:56 -0400 | [diff] [blame] | 106 | #ifdef CONFIG_HARDWALL |
| 107 | /* Is this task tied to an activated hardwall? */ |
| 108 | struct hardwall_info *hardwall; |
| 109 | /* Chains this task into the list at hardwall->list. */ |
| 110 | struct list_head hardwall_list; |
| 111 | #endif |
Chris Metcalf | 867e359 | 2010-05-28 23:09:12 -0400 | [diff] [blame] | 112 | #if CHIP_HAS_TILE_DMA() |
| 113 | /* Async DMA TLB fault information */ |
| 114 | struct async_tlb dma_async_tlb; |
| 115 | #endif |
| 116 | #if CHIP_HAS_SN_PROC() |
| 117 | /* Was static network processor when we were switched out? */ |
| 118 | int sn_proc_running; |
| 119 | /* Async SNI TLB fault information */ |
| 120 | struct async_tlb sn_async_tlb; |
| 121 | #endif |
| 122 | }; |
| 123 | |
| 124 | #endif /* !__ASSEMBLY__ */ |
| 125 | |
| 126 | /* |
| 127 | * Start with "sp" this many bytes below the top of the kernel stack. |
| 128 | * This preserves the invariant that a called function may write to *sp. |
| 129 | */ |
| 130 | #define STACK_TOP_DELTA 8 |
| 131 | |
| 132 | /* |
| 133 | * When entering the kernel via a fault, start with the top of the |
| 134 | * pt_regs structure this many bytes below the top of the page. |
| 135 | * This aligns the pt_regs structure optimally for cache-line access. |
| 136 | */ |
| 137 | #ifdef __tilegx__ |
| 138 | #define KSTK_PTREGS_GAP 48 |
| 139 | #else |
| 140 | #define KSTK_PTREGS_GAP 56 |
| 141 | #endif |
| 142 | |
| 143 | #ifndef __ASSEMBLY__ |
| 144 | |
| 145 | #ifdef __tilegx__ |
| 146 | #define TASK_SIZE_MAX (MEM_LOW_END + 1) |
| 147 | #else |
| 148 | #define TASK_SIZE_MAX PAGE_OFFSET |
| 149 | #endif |
| 150 | |
| 151 | /* TASK_SIZE and related variables are always checked in "current" context. */ |
| 152 | #ifdef CONFIG_COMPAT |
| 153 | #define COMPAT_TASK_SIZE (1UL << 31) |
| 154 | #define TASK_SIZE ((current_thread_info()->status & TS_COMPAT) ?\ |
| 155 | COMPAT_TASK_SIZE : TASK_SIZE_MAX) |
| 156 | #else |
| 157 | #define TASK_SIZE TASK_SIZE_MAX |
| 158 | #endif |
| 159 | |
| 160 | /* We provide a minimal "vdso" a la x86; just the sigreturn code for now. */ |
| 161 | #define VDSO_BASE (TASK_SIZE - PAGE_SIZE) |
| 162 | |
| 163 | #define STACK_TOP VDSO_BASE |
| 164 | |
| 165 | /* STACK_TOP_MAX is used temporarily in execve and should not check COMPAT. */ |
| 166 | #define STACK_TOP_MAX TASK_SIZE_MAX |
| 167 | |
| 168 | /* |
| 169 | * This decides where the kernel will search for a free chunk of vm |
| 170 | * space during mmap's, if it is using bottom-up mapping. |
| 171 | */ |
| 172 | #define TASK_UNMAPPED_BASE (PAGE_ALIGN(TASK_SIZE / 3)) |
| 173 | |
| 174 | #define HAVE_ARCH_PICK_MMAP_LAYOUT |
| 175 | |
| 176 | #define INIT_THREAD { \ |
| 177 | .ksp = (unsigned long)init_stack + THREAD_SIZE - STACK_TOP_DELTA, \ |
| 178 | .interrupt_mask = -1ULL \ |
| 179 | } |
| 180 | |
| 181 | /* Kernel stack top for the task that first boots on this cpu. */ |
| 182 | DECLARE_PER_CPU(unsigned long, boot_sp); |
| 183 | |
| 184 | /* PC to boot from on this cpu. */ |
| 185 | DECLARE_PER_CPU(unsigned long, boot_pc); |
| 186 | |
| 187 | /* Do necessary setup to start up a newly executed thread. */ |
| 188 | static inline void start_thread(struct pt_regs *regs, |
| 189 | unsigned long pc, unsigned long usp) |
| 190 | { |
| 191 | regs->pc = pc; |
| 192 | regs->sp = usp; |
| 193 | } |
| 194 | |
| 195 | /* Free all resources held by a thread. */ |
| 196 | static inline void release_thread(struct task_struct *dead_task) |
| 197 | { |
| 198 | /* Nothing for now */ |
| 199 | } |
| 200 | |
| 201 | /* Prepare to copy thread state - unlazy all lazy status. */ |
| 202 | #define prepare_to_copy(tsk) do { } while (0) |
| 203 | |
| 204 | extern int kernel_thread(int (*fn)(void *), void *arg, unsigned long flags); |
| 205 | |
Chris Metcalf | 867e359 | 2010-05-28 23:09:12 -0400 | [diff] [blame] | 206 | |
| 207 | /* |
| 208 | * Return saved (kernel) PC of a blocked thread. |
| 209 | * Only used in a printk() in kernel/sched.c, so don't work too hard. |
| 210 | */ |
| 211 | #define thread_saved_pc(t) ((t)->thread.pc) |
| 212 | |
| 213 | unsigned long get_wchan(struct task_struct *p); |
| 214 | |
| 215 | /* Return initial ksp value for given task. */ |
| 216 | #define task_ksp0(task) ((unsigned long)(task)->stack + THREAD_SIZE) |
| 217 | |
| 218 | /* Return some info about the user process TASK. */ |
| 219 | #define KSTK_TOP(task) (task_ksp0(task) - STACK_TOP_DELTA) |
| 220 | #define task_pt_regs(task) \ |
| 221 | ((struct pt_regs *)(task_ksp0(task) - KSTK_PTREGS_GAP) - 1) |
| 222 | #define task_sp(task) (task_pt_regs(task)->sp) |
| 223 | #define task_pc(task) (task_pt_regs(task)->pc) |
| 224 | /* Aliases for pc and sp (used in fs/proc/array.c) */ |
| 225 | #define KSTK_EIP(task) task_pc(task) |
| 226 | #define KSTK_ESP(task) task_sp(task) |
| 227 | |
| 228 | /* Standard format for printing registers and other word-size data. */ |
| 229 | #ifdef __tilegx__ |
| 230 | # define REGFMT "0x%016lx" |
| 231 | #else |
| 232 | # define REGFMT "0x%08lx" |
| 233 | #endif |
| 234 | |
| 235 | /* |
| 236 | * Do some slow action (e.g. read a slow SPR). |
| 237 | * Note that this must also have compiler-barrier semantics since |
| 238 | * it may be used in a busy loop reading memory. |
| 239 | */ |
| 240 | static inline void cpu_relax(void) |
| 241 | { |
| 242 | __insn_mfspr(SPR_PASS); |
| 243 | barrier(); |
| 244 | } |
| 245 | |
| 246 | struct siginfo; |
| 247 | extern void arch_coredump_signal(struct siginfo *, struct pt_regs *); |
| 248 | #define arch_coredump_signal arch_coredump_signal |
| 249 | |
Chris Metcalf | 9f9c038 | 2010-06-25 17:00:56 -0400 | [diff] [blame] | 250 | /* Info on this processor (see fs/proc/cpuinfo.c) */ |
| 251 | struct seq_operations; |
| 252 | extern const struct seq_operations cpuinfo_op; |
| 253 | |
Chris Metcalf | 867e359 | 2010-05-28 23:09:12 -0400 | [diff] [blame] | 254 | /* Provide information about the chip model. */ |
| 255 | extern char chip_model[64]; |
| 256 | |
| 257 | /* Data on which physical memory controller corresponds to which NUMA node. */ |
| 258 | extern int node_controller[]; |
| 259 | |
| 260 | |
| 261 | /* Do we dump information to the console when a user application crashes? */ |
| 262 | extern int show_crashinfo; |
| 263 | |
| 264 | #if CHIP_HAS_CBOX_HOME_MAP() |
| 265 | /* Does the heap allocator return hash-for-home pages by default? */ |
| 266 | extern int hash_default; |
| 267 | |
| 268 | /* Should kernel stack pages be hash-for-home? */ |
| 269 | extern int kstack_hash; |
| 270 | #else |
| 271 | #define hash_default 0 |
| 272 | #define kstack_hash 0 |
| 273 | #endif |
| 274 | |
| 275 | /* Are we using huge pages in the TLB for kernel data? */ |
| 276 | extern int kdata_huge; |
| 277 | |
| 278 | /* |
| 279 | * Note that with OLOC the prefetch will return an unused read word to |
| 280 | * the issuing tile, which will cause some MDN traffic. Benchmarking |
| 281 | * should be done to see whether this outweighs prefetching. |
| 282 | */ |
| 283 | #define ARCH_HAS_PREFETCH |
| 284 | #define ARCH_HAS_PREFETCHW |
| 285 | #define ARCH_HAS_SPINLOCK_PREFETCH |
| 286 | |
| 287 | #define prefetch(ptr) __builtin_prefetch((ptr), 0, 3) |
| 288 | #define prefetchw(ptr) __builtin_prefetch((ptr), 1, 3) |
| 289 | |
| 290 | #ifdef CONFIG_SMP |
| 291 | #define spin_lock_prefetch(ptr) prefetchw(ptr) |
| 292 | #else |
| 293 | /* Nothing to prefetch. */ |
| 294 | #define spin_lock_prefetch(lock) do { } while (0) |
| 295 | #endif |
| 296 | |
| 297 | #else /* __ASSEMBLY__ */ |
| 298 | |
| 299 | /* Do some slow action (e.g. read a slow SPR). */ |
| 300 | #define CPU_RELAX mfspr zero, SPR_PASS |
| 301 | |
| 302 | #endif /* !__ASSEMBLY__ */ |
| 303 | |
| 304 | /* Assembly code assumes that the PL is in the low bits. */ |
| 305 | #if SPR_EX_CONTEXT_1_1__PL_SHIFT != 0 |
| 306 | # error Fix assembly assumptions about PL |
| 307 | #endif |
| 308 | |
| 309 | /* We sometimes use these macros for EX_CONTEXT_0_1 as well. */ |
| 310 | #if SPR_EX_CONTEXT_1_1__PL_SHIFT != SPR_EX_CONTEXT_0_1__PL_SHIFT || \ |
| 311 | SPR_EX_CONTEXT_1_1__PL_RMASK != SPR_EX_CONTEXT_0_1__PL_RMASK || \ |
| 312 | SPR_EX_CONTEXT_1_1__ICS_SHIFT != SPR_EX_CONTEXT_0_1__ICS_SHIFT || \ |
| 313 | SPR_EX_CONTEXT_1_1__ICS_RMASK != SPR_EX_CONTEXT_0_1__ICS_RMASK |
| 314 | # error Fix assumptions that EX1 macros work for both PL0 and PL1 |
| 315 | #endif |
| 316 | |
| 317 | /* Allow pulling apart and recombining the PL and ICS bits in EX_CONTEXT. */ |
| 318 | #define EX1_PL(ex1) \ |
| 319 | (((ex1) >> SPR_EX_CONTEXT_1_1__PL_SHIFT) & SPR_EX_CONTEXT_1_1__PL_RMASK) |
| 320 | #define EX1_ICS(ex1) \ |
| 321 | (((ex1) >> SPR_EX_CONTEXT_1_1__ICS_SHIFT) & SPR_EX_CONTEXT_1_1__ICS_RMASK) |
| 322 | #define PL_ICS_EX1(pl, ics) \ |
| 323 | (((pl) << SPR_EX_CONTEXT_1_1__PL_SHIFT) | \ |
| 324 | ((ics) << SPR_EX_CONTEXT_1_1__ICS_SHIFT)) |
| 325 | |
| 326 | /* |
| 327 | * Provide symbolic constants for PLs. |
| 328 | * Note that assembly code assumes that USER_PL is zero. |
| 329 | */ |
| 330 | #define USER_PL 0 |
| 331 | #define KERNEL_PL 1 |
| 332 | |
| 333 | /* SYSTEM_SAVE_1_0 holds the current cpu number ORed with ksp0. */ |
| 334 | #define CPU_LOG_MASK_VALUE 12 |
| 335 | #define CPU_MASK_VALUE ((1 << CPU_LOG_MASK_VALUE) - 1) |
| 336 | #if CONFIG_NR_CPUS > CPU_MASK_VALUE |
| 337 | # error Too many cpus! |
| 338 | #endif |
| 339 | #define raw_smp_processor_id() \ |
| 340 | ((int)__insn_mfspr(SPR_SYSTEM_SAVE_1_0) & CPU_MASK_VALUE) |
| 341 | #define get_current_ksp0() \ |
| 342 | (__insn_mfspr(SPR_SYSTEM_SAVE_1_0) & ~CPU_MASK_VALUE) |
| 343 | #define next_current_ksp0(task) ({ \ |
| 344 | unsigned long __ksp0 = task_ksp0(task); \ |
| 345 | int __cpu = raw_smp_processor_id(); \ |
| 346 | BUG_ON(__ksp0 & CPU_MASK_VALUE); \ |
| 347 | __ksp0 | __cpu; \ |
| 348 | }) |
| 349 | |
| 350 | #endif /* _ASM_TILE_PROCESSOR_H */ |