/* cpudata.h: Per-cpu parameters.
 *
 * Copyright (C) 2003, 2005, 2006 David S. Miller (davem@davemloft.net)
 */

#ifndef _SPARC64_CPUDATA_H
#define _SPARC64_CPUDATA_H

9 10
#ifndef __ASSEMBLY__

L
Linus Torvalds 已提交
11
#include <linux/percpu.h>
12
#include <linux/threads.h>
L
Linus Torvalds 已提交
13 14 15

/*
 * Per-cpu parameter block.
 *
 * The members are grouped by D-cache line: the first group holds the
 * frequently used values, the second holds cache geometry that is
 * rarely consulted.  Member order is significant: __softirq_pending
 * has to stay at offset 0 because rtrap.S relies on it.
 */
typedef struct {
	/* Dcache line 1 */
	unsigned int	__softirq_pending; /* must be 1st, see rtrap.S */
	unsigned int	multiplier;
	unsigned int	counter;
	unsigned int	idle_volume;
	unsigned long	clock_tick;	/* %tick's per second */
	unsigned long	udelay_val;

	/* Dcache line 2, rarely used */
	unsigned int	dcache_size;
	unsigned int	dcache_line_size;
	unsigned int	icache_size;
	unsigned int	icache_line_size;
	unsigned int	ecache_size;
	unsigned int	ecache_line_size;
	/* Two pad words round the second group up to eight words. */
	unsigned int	__pad3;
	unsigned int	__pad4;
} cpuinfo_sparc;

/* One cpuinfo_sparc instance per cpu, declared through the per-cpu API. */
DECLARE_PER_CPU(cpuinfo_sparc, __cpu_data);
/* cpu_data(cpu): the __cpu_data instance selected by the given cpu number. */
#define cpu_data(__cpu)		per_cpu(__cpu_data, (__cpu))
/* local_cpu_data(): the __cpu_data instance obtained via __get_cpu_var(). */
#define local_cpu_data()	__get_cpu_var(__cpu_data)

38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62
/* Trap handling code needs to get at a few critical values upon
 * trap entry and to process TSB misses.  These cannot be in the
 * per_cpu() area as we really need to lock them into the TLB and
 * thus make them part of the main kernel image.  As a result we
 * try to make this as small as possible.
 *
 * This is padded out and aligned to 64-bytes to avoid false sharing
 * on SMP.
 */

/* If you modify the size of this structure, please update
 * TRAP_BLOCK_SZ_SHIFT below.
 */
/* Only a pointer to thread_info is stored below, so a forward
 * declaration is sufficient.
 */
struct thread_info;
/* Per-cpu trap state; trap_block[] holds one of these per cpu.
 *
 * The assembler macros address the members through the TRAP_PER_CPU_*
 * byte offsets and step between array elements by shifting the cpuid
 * left by TRAP_BLOCK_SZ_SHIFT, so member order and overall size must
 * stay in sync with those constants.
 */
struct trap_per_cpu {
/* D-cache line 1 */
	struct thread_info	*thread;	/* offset 0x00, read by TRAP_LOAD_THREAD_REG */
	unsigned long		pgd_paddr;	/* offset 0x08, read by TRAP_LOAD_PGD_PHYS */
	unsigned long		__pad1[2];

/* D-cache line 2 */
	unsigned long		__pad2[4];
} __attribute__((aligned(64)));
/* One trap_per_cpu slot per possible cpu; the TRAP_LOAD_* assembler
 * macros index this array by cpuid.
 */
extern struct trap_per_cpu trap_block[NR_CPUS];
/* Defined elsewhere.  NOTE(review): presumably these set up the current
 * cpu's trap_block[] slot and its trap base address -- confirm against
 * the definitions.
 */
extern void init_cur_cpu_trap(void);
extern void setup_tba(void);
64

65 66 67 68 69 70 71 72 73 74
#ifdef CONFIG_SMP
struct cpuid_patch_entry {
	unsigned int	addr;
	unsigned int	cheetah_safari[4];
	unsigned int	cheetah_jbus[4];
	unsigned int	starfire[4];
};
extern struct cpuid_patch_entry __cpuid_patch, __cpuid_patch_end;
#endif

75 76 77 78 79 80 81
#endif /* !(__ASSEMBLY__) */

/* Byte offsets of the struct trap_per_cpu members, usable from assembler. */
#define TRAP_PER_CPU_THREAD	0x00
#define TRAP_PER_CPU_PGD_PADDR	0x08

/* Shift that turns a cpuid into a byte offset into trap_block[]:
 * 1 << 6 == 64, matching the 64-byte aligned struct trap_per_cpu.
 */
#define TRAP_BLOCK_SZ_SHIFT	6

82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108
#ifdef CONFIG_SMP

/* Load the id of the executing cpu into REG.
 *
 * The inline sequence at label 661 is the Spitfire variant: read
 * ASI_UPA_CONFIG, shift right by 17 and mask with 0x1f.  In addition
 * the macro emits one record into the .cpuid_patch section: the
 * address of label 661 followed by three alternative four-instruction
 * sequences (Cheetah Safari, Cheetah JBUS, Starfire), in the layout
 * described by struct cpuid_patch_entry.
 *
 * NOTE(review): presumably boot code overwrites the inline sequence
 * with the alternative matching the running cpu type -- the patching
 * code is not in this header.  Every variant must stay exactly four
 * instructions long for that record layout to hold.
 */
#define __GET_CPUID(REG)				\
	/* Spitfire implementation (default). */	\
661:	ldxa		[%g0] ASI_UPA_CONFIG, REG;	\
	srlx		REG, 17, REG;			\
	 and		REG, 0x1f, REG;			\
	nop;						\
	.section	.cpuid_patch, "ax";		\
	/* Instruction location. */			\
	.word		661b;				\
	/* Cheetah Safari implementation. */		\
	ldxa		[%g0] ASI_SAFARI_CONFIG, REG;	\
	srlx		REG, 17, REG;			\
	and		REG, 0x3ff, REG;		\
	nop;						\
	/* Cheetah JBUS implementation. */		\
	ldxa		[%g0] ASI_JBUS_CONFIG, REG;	\
	srlx		REG, 17, REG;			\
	and		REG, 0x1f, REG;			\
	nop;						\
	/* Starfire implementation. */			\
	sethi		%hi(0x1fff40000d0 >> 9), REG;	\
	sllx		REG, 9, REG;			\
	or		REG, 0xd0, REG;			\
	lduwa		[REG] ASI_PHYS_BYPASS_EC_E, REG;\
	.previous;
109 110 111

/* Clobbers %g1, current address space PGD phys address into %g7.
 *
 * %g1 first receives the cpuid and is then scaled into the byte offset
 * of this cpu's trap_block[] entry; %g7 is built up to the entry's
 * address and finally replaced by its pgd_paddr member.
 */
#define TRAP_LOAD_PGD_PHYS			\
	__GET_CPUID(%g1)			\
	sethi	%hi(trap_block), %g7;		\
	sllx	%g1, TRAP_BLOCK_SZ_SHIFT, %g1;	\
	or	%g7, %lo(trap_block), %g7;	\
	add	%g7, %g1, %g7;			\
	ldx	[%g7 + TRAP_PER_CPU_PGD_PADDR], %g7;

/* Clobbers %g1, loads local processor's IRQ work area into %g6.
 *
 * The result is the address __irq_work + (cpuid << 6), i.e. the areas
 * are laid out at a 64-byte stride.  The shift is a literal here and is
 * independent of TRAP_BLOCK_SZ_SHIFT.
 */
#define TRAP_LOAD_IRQ_WORK			\
	__GET_CPUID(%g1)			\
	sethi	%hi(__irq_work), %g6;		\
	sllx	%g1, 6, %g1;			\
	or	%g6, %lo(__irq_work), %g6;	\
	add	%g6, %g1, %g6;
126 127 128

/* Clobbers %g1, loads %g6 with current thread info pointer.
 *
 * The load reads the first word of this cpu's trap_block[] entry, so
 * it depends on the thread member sitting at offset 0
 * (TRAP_PER_CPU_THREAD == 0x00).
 */
#define TRAP_LOAD_THREAD_REG			\
	__GET_CPUID(%g1)			\
	sethi	%hi(trap_block), %g6;		\
	sllx	%g1, TRAP_BLOCK_SZ_SHIFT, %g1;	\
	or	%g6, %lo(trap_block), %g6;	\
	ldx	[%g6 + %g1], %g6;
134 135

/* Given the current thread info pointer in %g6, load the per-cpu
 * area base of the current processor into %g5.  REG1, REG2, and REG3 are
 * clobbered.
 *
 * The value computed is
 *	%g5 = __per_cpu_base + (cpu << __per_cpu_shift)
 * where cpu is the byte loaded from [%g6 + TI_CPU].
 *
 * You absolutely cannot use %g5 as a temporary in this code.  The
 * reason is that traps can happen during execution, and return from
 * trap will load the fully resolved %g5 per-cpu base.  This can corrupt
 * the calculations done by the macro mid-stream.
 */
#define LOAD_PER_CPU_BASE(REG1, REG2, REG3)		\
	ldub	[%g6 + TI_CPU], REG1;			\
	sethi	%hi(__per_cpu_shift), REG3;		\
	sethi	%hi(__per_cpu_base), REG2;		\
	ldx	[REG3 + %lo(__per_cpu_shift)], REG3;	\
	ldx	[REG2 + %lo(__per_cpu_base)], REG2;	\
	sllx	REG1, REG3, REG3;			\
	add	REG3, REG2, %g5;
152

153
#else
154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169

/* Uniprocessor versions, we know the cpuid is zero.  */

/* Loads the pgd_paddr member of trap_block[0] into %g7.  Only %g7 is
 * written; no cpuid lookup is needed.
 */
#define TRAP_LOAD_PGD_PHYS			\
	sethi	%hi(trap_block), %g7;		\
	or	%g7, %lo(trap_block), %g7;	\
	ldx	[%g7 + TRAP_PER_CPU_PGD_PADDR], %g7;

/* Uniprocessor variant: loads the address of __irq_work itself into
 * %g6.  Only %g6 is written.
 */
#define TRAP_LOAD_IRQ_WORK			\
	sethi	%hi(__irq_work), %g6;		\
	or	%g6, %lo(__irq_work), %g6;

/* Uniprocessor variant: loads the first word of trap_block[0] (the
 * thread member, offset 0) into %g6.  Only %g6 is written.
 */
#define TRAP_LOAD_THREAD_REG			\
	sethi	%hi(trap_block), %g6;		\
	ldx	[%g6 + %lo(trap_block)], %g6;

/* No per-cpu areas on uniprocessor, so no need to load %g5.  The macro
 * expands to nothing and its register arguments are ignored.
 */
#define LOAD_PER_CPU_BASE(REG1, REG2, REG3)
171 172

#endif /* !(CONFIG_SMP) */
173

L
Linus Torvalds 已提交
174
#endif /* _SPARC64_CPUDATA_H */