2 * Copyright 2010 Tilera Corporation. All Rights Reserved.
4 * This program is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU General Public License
6 * as published by the Free Software Foundation, version 2.
8 * This program is distributed in the hope that it will be useful, but
9 * WITHOUT ANY WARRANTY; without even the implied warranty of
10 * MERCHANTABILITY OR FITNESS FOR A PARTICULAR PURPOSE, GOOD TITLE or
11 * NON INFRINGEMENT. See the GNU General Public License for
15 #ifndef _ASM_TILE_PROCESSOR_H
16 #define _ASM_TILE_PROCESSOR_H
21 * NOTE: we don't include <linux/ptrace.h> or <linux/percpu.h> as one
22 * normally would, due to #include dependencies.
24 #include <asm/ptrace.h>
25 #include <asm/percpu.h>
27 #include <arch/chip.h>
28 #include <arch/spr_def.h>
39 * Default implementation of macro that returns current
40 * instruction pointer ("program counter").
42 void *current_text_addr(void);
44 #if CHIP_HAS_TILE_DMA()
45 /* Capture the state of a suspended DMA. */
46 struct tile_dma_state
{
50 unsigned long strides
;
51 unsigned long chunk_size
;
52 unsigned long src_chunk
;
53 unsigned long dest_chunk
;
59 * A mask of the DMA status register for selecting only the 'running'
62 #define DMA_STATUS_MASK \
63 (SPR_DMA_STATUS__RUNNING_MASK | SPR_DMA_STATUS__DONE_MASK)
67 * Track asynchronous TLB events (faults and access violations)
68 * that occur while we are in kernel mode from DMA or the SN processor.
71 short fault_num
; /* original fault number; 0 if none */
72 char is_fault
; /* was it a fault (vs an access violation) */
73 char is_write
; /* for fault: was it caused by a write? */
74 unsigned long address
; /* what address faulted? */
78 struct thread_struct
{
79 /* kernel stack pointer */
83 /* starting user stack pointer (for page migration) */
85 /* pid of process that created this one */
87 #if CHIP_HAS_TILE_DMA()
88 /* DMA info for suspended threads (byte == 0 means no DMA state) */
89 struct tile_dma_state tile_dma_state
;
91 /* User EX_CONTEXT registers */
92 unsigned long ex_context
[2];
93 /* User SYSTEM_SAVE registers */
94 unsigned long system_save
[4];
95 /* User interrupt mask */
96 unsigned long long interrupt_mask
;
97 /* User interrupt-control 0 state */
98 unsigned long intctrl_0
;
99 #if CHIP_HAS_PROC_STATUS_SPR()
100 /* Any other miscellaneous processor state bits */
101 unsigned long proc_status
;
103 #if CHIP_HAS_TILE_DMA()
104 /* Async DMA TLB fault information */
105 struct async_tlb dma_async_tlb
;
107 #if CHIP_HAS_SN_PROC()
108 /* Was static network processor when we were switched out? */
110 /* Async SNI TLB fault information */
111 struct async_tlb sn_async_tlb
;
115 #endif /* !__ASSEMBLY__ */
118 * Start with "sp" this many bytes below the top of the kernel stack.
119 * This preserves the invariant that a called function may write to *sp.
121 #define STACK_TOP_DELTA 8
124 * When entering the kernel via a fault, start with the top of the
125 * pt_regs structure this many bytes below the top of the page.
126 * This aligns the pt_regs structure optimally for cache-line access.
129 #define KSTK_PTREGS_GAP 48
131 #define KSTK_PTREGS_GAP 56
137 #define TASK_SIZE_MAX (MEM_LOW_END + 1)
139 #define TASK_SIZE_MAX PAGE_OFFSET
142 /* TASK_SIZE and related variables are always checked in "current" context. */
144 #define COMPAT_TASK_SIZE (1UL << 31)
145 #define TASK_SIZE ((current_thread_info()->status & TS_COMPAT) ?\
146 COMPAT_TASK_SIZE : TASK_SIZE_MAX)
148 #define TASK_SIZE TASK_SIZE_MAX
151 /* We provide a minimal "vdso" a la x86; just the sigreturn code for now. */
152 #define VDSO_BASE (TASK_SIZE - PAGE_SIZE)
154 #define STACK_TOP VDSO_BASE
156 /* STACK_TOP_MAX is used temporarily in execve and should not check COMPAT. */
157 #define STACK_TOP_MAX TASK_SIZE_MAX
160 * This decides where the kernel will search for a free chunk of vm
161 * space during mmap's, if it is using bottom-up mapping.
163 #define TASK_UNMAPPED_BASE (PAGE_ALIGN(TASK_SIZE / 3))
165 #define HAVE_ARCH_PICK_MMAP_LAYOUT
167 #define INIT_THREAD { \
168 .ksp = (unsigned long)init_stack + THREAD_SIZE - STACK_TOP_DELTA, \
169 .interrupt_mask = -1ULL \
172 /* Kernel stack top for the task that first boots on this cpu. */
173 DECLARE_PER_CPU(unsigned long, boot_sp
);
175 /* PC to boot from on this cpu. */
176 DECLARE_PER_CPU(unsigned long, boot_pc
);
178 /* Do necessary setup to start up a newly executed thread. */
179 static inline void start_thread(struct pt_regs
*regs
,
180 unsigned long pc
, unsigned long usp
)
186 /* Free all resources held by a thread. */
187 static inline void release_thread(struct task_struct
*dead_task
)
189 /* Nothing for now */
192 /* Prepare to copy thread state - unlazy all lazy status. */
193 #define prepare_to_copy(tsk) do { } while (0)
195 extern int kernel_thread(int (*fn
)(void *), void *arg
, unsigned long flags
);
197 /* Helper routines for setting home cache modes at exec() time. */
201 * Return saved (kernel) PC of a blocked thread.
202 * Only used in a printk() in kernel/sched.c, so don't work too hard.
204 #define thread_saved_pc(t) ((t)->thread.pc)
206 unsigned long get_wchan(struct task_struct
*p
);
208 /* Return initial ksp value for given task. */
209 #define task_ksp0(task) ((unsigned long)(task)->stack + THREAD_SIZE)
211 /* Return some info about the user process TASK. */
212 #define KSTK_TOP(task) (task_ksp0(task) - STACK_TOP_DELTA)
213 #define task_pt_regs(task) \
214 ((struct pt_regs *)(task_ksp0(task) - KSTK_PTREGS_GAP) - 1)
215 #define task_sp(task) (task_pt_regs(task)->sp)
216 #define task_pc(task) (task_pt_regs(task)->pc)
217 /* Aliases for pc and sp (used in fs/proc/array.c) */
218 #define KSTK_EIP(task) task_pc(task)
219 #define KSTK_ESP(task) task_sp(task)
221 /* Standard format for printing registers and other word-size data. */
223 # define REGFMT "0x%016lx"
225 # define REGFMT "0x%08lx"
229 * Do some slow action (e.g. read a slow SPR).
230 * Note that this must also have compiler-barrier semantics since
231 * it may be used in a busy loop reading memory.
233 static inline void cpu_relax(void)
235 __insn_mfspr(SPR_PASS
);
240 extern void arch_coredump_signal(struct siginfo
*, struct pt_regs
*);
241 #define arch_coredump_signal arch_coredump_signal
243 /* Provide information about the chip model. */
244 extern char chip_model
[64];
246 /* Data on which physical memory controller corresponds to which NUMA node. */
247 extern int node_controller
[];
250 /* Do we dump information to the console when a user application crashes? */
251 extern int show_crashinfo
;
253 #if CHIP_HAS_CBOX_HOME_MAP()
254 /* Does the heap allocator return hash-for-home pages by default? */
255 extern int hash_default
;
257 /* Should kernel stack pages be hash-for-home? */
258 extern int kstack_hash
;
260 #define hash_default 0
261 #define kstack_hash 0
264 /* Are we using huge pages in the TLB for kernel data? */
265 extern int kdata_huge
;
268 * Note that with OLOC the prefetch will return an unused read word to
269 * the issuing tile, which will cause some MDN traffic. Benchmarking
270 * should be done to see whether this outweighs prefetching.
272 #define ARCH_HAS_PREFETCH
273 #define ARCH_HAS_PREFETCHW
274 #define ARCH_HAS_SPINLOCK_PREFETCH
276 #define prefetch(ptr) __builtin_prefetch((ptr), 0, 3)
277 #define prefetchw(ptr) __builtin_prefetch((ptr), 1, 3)
280 #define spin_lock_prefetch(ptr) prefetchw(ptr)
282 /* Nothing to prefetch. */
283 #define spin_lock_prefetch(lock) do { } while (0)
286 #else /* __ASSEMBLY__ */
288 /* Do some slow action (e.g. read a slow SPR). */
289 #define CPU_RELAX mfspr zero, SPR_PASS
291 #endif /* !__ASSEMBLY__ */
293 /* Assembly code assumes that the PL is in the low bits. */
294 #if SPR_EX_CONTEXT_1_1__PL_SHIFT != 0
295 # error Fix assembly assumptions about PL
298 /* We sometimes use these macros for EX_CONTEXT_0_1 as well. */
299 #if SPR_EX_CONTEXT_1_1__PL_SHIFT != SPR_EX_CONTEXT_0_1__PL_SHIFT || \
300 SPR_EX_CONTEXT_1_1__PL_RMASK != SPR_EX_CONTEXT_0_1__PL_RMASK || \
301 SPR_EX_CONTEXT_1_1__ICS_SHIFT != SPR_EX_CONTEXT_0_1__ICS_SHIFT || \
302 SPR_EX_CONTEXT_1_1__ICS_RMASK != SPR_EX_CONTEXT_0_1__ICS_RMASK
303 # error Fix assumptions that EX1 macros work for both PL0 and PL1
306 /* Allow pulling apart and recombining the PL and ICS bits in EX_CONTEXT. */
307 #define EX1_PL(ex1) \
308 (((ex1) >> SPR_EX_CONTEXT_1_1__PL_SHIFT) & SPR_EX_CONTEXT_1_1__PL_RMASK)
309 #define EX1_ICS(ex1) \
310 (((ex1) >> SPR_EX_CONTEXT_1_1__ICS_SHIFT) & SPR_EX_CONTEXT_1_1__ICS_RMASK)
311 #define PL_ICS_EX1(pl, ics) \
312 (((pl) << SPR_EX_CONTEXT_1_1__PL_SHIFT) | \
313 ((ics) << SPR_EX_CONTEXT_1_1__ICS_SHIFT))
316 * Provide symbolic constants for PLs.
317 * Note that assembly code assumes that USER_PL is zero.
322 /* SYSTEM_SAVE_1_0 holds the current cpu number ORed with ksp0. */
323 #define CPU_LOG_MASK_VALUE 12
324 #define CPU_MASK_VALUE ((1 << CPU_LOG_MASK_VALUE) - 1)
325 #if CONFIG_NR_CPUS > CPU_MASK_VALUE
326 # error Too many cpus!
328 #define raw_smp_processor_id() \
329 ((int)__insn_mfspr(SPR_SYSTEM_SAVE_1_0) & CPU_MASK_VALUE)
330 #define get_current_ksp0() \
331 (__insn_mfspr(SPR_SYSTEM_SAVE_1_0) & ~CPU_MASK_VALUE)
332 #define next_current_ksp0(task) ({ \
333 unsigned long __ksp0 = task_ksp0(task); \
334 int __cpu = raw_smp_processor_id(); \
335 BUG_ON(__ksp0 & CPU_MASK_VALUE); \
339 #endif /* _ASM_TILE_PROCESSOR_H */