diff options
author | Glenn Elliott <gelliott@cs.unc.edu> | 2012-03-04 19:47:13 -0500 |
---|---|---|
committer | Glenn Elliott <gelliott@cs.unc.edu> | 2012-03-04 19:47:13 -0500 |
commit | c71c03bda1e86c9d5198c5d83f712e695c4f2a1e (patch) | |
tree | ecb166cb3e2b7e2adb3b5e292245fefd23381ac8 /drivers/net/sfc/io.h | |
parent | ea53c912f8a86a8567697115b6a0d8152beee5c8 (diff) | |
parent | 6a00f206debf8a5c8899055726ad127dbeeed098 (diff) |
Merge branch 'mpi-master' into wip-k-fmlpwip-k-fmlp
Conflicts:
litmus/sched_cedf.c
Diffstat (limited to 'drivers/net/sfc/io.h')
-rw-r--r-- | drivers/net/sfc/io.h | 158 |
1 files changed, 94 insertions, 64 deletions
diff --git a/drivers/net/sfc/io.h b/drivers/net/sfc/io.h index 85a99fe87437..cc978803d484 100644 --- a/drivers/net/sfc/io.h +++ b/drivers/net/sfc/io.h | |||
@@ -1,7 +1,7 @@ | |||
1 | /**************************************************************************** | 1 | /**************************************************************************** |
2 | * Driver for Solarflare Solarstorm network controllers and boards | 2 | * Driver for Solarflare Solarstorm network controllers and boards |
3 | * Copyright 2005-2006 Fen Systems Ltd. | 3 | * Copyright 2005-2006 Fen Systems Ltd. |
4 | * Copyright 2006-2009 Solarflare Communications Inc. | 4 | * Copyright 2006-2010 Solarflare Communications Inc. |
5 | * | 5 | * |
6 | * This program is free software; you can redistribute it and/or modify it | 6 | * This program is free software; you can redistribute it and/or modify it |
7 | * under the terms of the GNU General Public License version 2 as published | 7 | * under the terms of the GNU General Public License version 2 as published |
@@ -22,28 +22,39 @@ | |||
22 | * | 22 | * |
23 | * Notes on locking strategy: | 23 | * Notes on locking strategy: |
24 | * | 24 | * |
25 | * Most NIC registers require 16-byte (or 8-byte, for SRAM) atomic writes | 25 | * Most CSRs are 128-bit (oword) and therefore cannot be read or |
26 | * which necessitates locking. | 26 | * written atomically. Access from the host is buffered by the Bus |
27 | * Under normal operation few writes to NIC registers are made and these | 27 | * Interface Unit (BIU). Whenever the host reads from the lowest |
28 | * registers (EVQ_RPTR_REG, RX_DESC_UPD_REG and TX_DESC_UPD_REG) are special | 28 | * address of such a register, or from the address of a different such |
29 | * cased to allow 4-byte (hence lockless) accesses. | 29 | * register, the BIU latches the register's value. Subsequent reads |
30 | * from higher addresses of the same register will read the latched | ||
31 | * value. Whenever the host writes part of such a register, the BIU | ||
32 | * collects the written value and does not write to the underlying | ||
33 | * register until all 4 dwords have been written. A similar buffering | ||
34 | * scheme applies to host access to the NIC's 64-bit SRAM. | ||
30 | * | 35 | * |
31 | * It *is* safe to write to these 4-byte registers in the middle of an | 36 | * Access to different CSRs and 64-bit SRAM words must be serialised, |
32 | * access to an 8-byte or 16-byte register. We therefore use a | 37 | * since interleaved access can result in lost writes or lost |
33 | * spinlock to protect accesses to the larger registers, but no locks | 38 | * information from read-to-clear fields. We use efx_nic::biu_lock |
34 | * for the 4-byte registers. | 39 | * for this. (We could use separate locks for read and write, but |
40 | * this is not normally a performance bottleneck.) | ||
35 | * | 41 | * |
36 | * A write barrier is needed to ensure that DW3 is written after DW0/1/2 | 42 | * The DMA descriptor pointers (RX_DESC_UPD and TX_DESC_UPD) are |
37 | * due to the way the 16byte registers are "collected" in the BIU. | 43 | * 128-bit but are special-cased in the BIU to avoid the need for |
44 | * locking in the host: | ||
38 | * | 45 | * |
39 | * We also lock when carrying out reads, to ensure consistency of the | 46 | * - They are write-only. |
40 | * data (made possible since the BIU reads all 128 bits into a cache). | 47 | * - The semantics of writing to these registers are such that |
41 | * Reads are very rare, so this isn't a significant performance | 48 | * replacing the low 96 bits with zero does not affect functionality. |
42 | * impact. (Most data transferred from NIC to host is DMAed directly | 49 | * - If the host writes to the last dword address of such a register |
43 | * into host memory). | 50 | * (i.e. the high 32 bits) the underlying register will always be |
44 | * | 51 | * written. If the collector and the current write together do not |
45 | * I/O BAR access uses locks for both reads and writes (but is only provided | 52 | * provide values for all 128 bits of the register, the low 96 bits |
46 | * for testing purposes). | 53 | * will be written as zero. |
54 | * - If the host writes to the address of any other part of such a | ||
55 | * register while the collector already holds values for some other | ||
56 | * register, the write is discarded and the collector maintains its | ||
57 | * current state. | ||
47 | */ | 58 | */ |
48 | 59 | ||
49 | #if BITS_PER_LONG == 64 | 60 | #if BITS_PER_LONG == 64 |
@@ -72,7 +83,7 @@ static inline __le32 _efx_readd(struct efx_nic *efx, unsigned int reg) | |||
72 | return (__force __le32)__raw_readl(efx->membase + reg); | 83 | return (__force __le32)__raw_readl(efx->membase + reg); |
73 | } | 84 | } |
74 | 85 | ||
75 | /* Writes to a normal 16-byte Efx register, locking as appropriate. */ | 86 | /* Write a normal 128-bit CSR, locking as appropriate. */ |
76 | static inline void efx_writeo(struct efx_nic *efx, efx_oword_t *value, | 87 | static inline void efx_writeo(struct efx_nic *efx, efx_oword_t *value, |
77 | unsigned int reg) | 88 | unsigned int reg) |
78 | { | 89 | { |
@@ -85,21 +96,19 @@ static inline void efx_writeo(struct efx_nic *efx, efx_oword_t *value, | |||
85 | spin_lock_irqsave(&efx->biu_lock, flags); | 96 | spin_lock_irqsave(&efx->biu_lock, flags); |
86 | #ifdef EFX_USE_QWORD_IO | 97 | #ifdef EFX_USE_QWORD_IO |
87 | _efx_writeq(efx, value->u64[0], reg + 0); | 98 | _efx_writeq(efx, value->u64[0], reg + 0); |
88 | wmb(); | ||
89 | _efx_writeq(efx, value->u64[1], reg + 8); | 99 | _efx_writeq(efx, value->u64[1], reg + 8); |
90 | #else | 100 | #else |
91 | _efx_writed(efx, value->u32[0], reg + 0); | 101 | _efx_writed(efx, value->u32[0], reg + 0); |
92 | _efx_writed(efx, value->u32[1], reg + 4); | 102 | _efx_writed(efx, value->u32[1], reg + 4); |
93 | _efx_writed(efx, value->u32[2], reg + 8); | 103 | _efx_writed(efx, value->u32[2], reg + 8); |
94 | wmb(); | ||
95 | _efx_writed(efx, value->u32[3], reg + 12); | 104 | _efx_writed(efx, value->u32[3], reg + 12); |
96 | #endif | 105 | #endif |
106 | wmb(); | ||
97 | mmiowb(); | 107 | mmiowb(); |
98 | spin_unlock_irqrestore(&efx->biu_lock, flags); | 108 | spin_unlock_irqrestore(&efx->biu_lock, flags); |
99 | } | 109 | } |
100 | 110 | ||
101 | /* Write an 8-byte NIC SRAM entry through the supplied mapping, | 111 | /* Write 64-bit SRAM through the supplied mapping, locking as appropriate. */ |
102 | * locking as appropriate. */ | ||
103 | static inline void efx_sram_writeq(struct efx_nic *efx, void __iomem *membase, | 112 | static inline void efx_sram_writeq(struct efx_nic *efx, void __iomem *membase, |
104 | efx_qword_t *value, unsigned int index) | 113 | efx_qword_t *value, unsigned int index) |
105 | { | 114 | { |
@@ -115,36 +124,27 @@ static inline void efx_sram_writeq(struct efx_nic *efx, void __iomem *membase, | |||
115 | __raw_writeq((__force u64)value->u64[0], membase + addr); | 124 | __raw_writeq((__force u64)value->u64[0], membase + addr); |
116 | #else | 125 | #else |
117 | __raw_writel((__force u32)value->u32[0], membase + addr); | 126 | __raw_writel((__force u32)value->u32[0], membase + addr); |
118 | wmb(); | ||
119 | __raw_writel((__force u32)value->u32[1], membase + addr + 4); | 127 | __raw_writel((__force u32)value->u32[1], membase + addr + 4); |
120 | #endif | 128 | #endif |
129 | wmb(); | ||
121 | mmiowb(); | 130 | mmiowb(); |
122 | spin_unlock_irqrestore(&efx->biu_lock, flags); | 131 | spin_unlock_irqrestore(&efx->biu_lock, flags); |
123 | } | 132 | } |
124 | 133 | ||
125 | /* Write dword to NIC register that allows partial writes | 134 | /* Write a 32-bit CSR or the last dword of a special 128-bit CSR */ |
126 | * | ||
127 | * Some registers (EVQ_RPTR_REG, RX_DESC_UPD_REG and | ||
128 | * TX_DESC_UPD_REG) can be written to as a single dword. This allows | ||
129 | * for lockless writes. | ||
130 | */ | ||
131 | static inline void efx_writed(struct efx_nic *efx, efx_dword_t *value, | 135 | static inline void efx_writed(struct efx_nic *efx, efx_dword_t *value, |
132 | unsigned int reg) | 136 | unsigned int reg) |
133 | { | 137 | { |
134 | netif_vdbg(efx, hw, efx->net_dev, | 138 | netif_vdbg(efx, hw, efx->net_dev, |
135 | "writing partial register %x with "EFX_DWORD_FMT"\n", | 139 | "writing register %x with "EFX_DWORD_FMT"\n", |
136 | reg, EFX_DWORD_VAL(*value)); | 140 | reg, EFX_DWORD_VAL(*value)); |
137 | 141 | ||
138 | /* No lock required */ | 142 | /* No lock required */ |
139 | _efx_writed(efx, value->u32[0], reg); | 143 | _efx_writed(efx, value->u32[0], reg); |
144 | wmb(); | ||
140 | } | 145 | } |
141 | 146 | ||
142 | /* Read from a NIC register | 147 | /* Read a 128-bit CSR, locking as appropriate. */ |
143 | * | ||
144 | * This reads an entire 16-byte register in one go, locking as | ||
145 | * appropriate. It is essential to read the first dword first, as this | ||
146 | * prompts the NIC to load the current value into the shadow register. | ||
147 | */ | ||
148 | static inline void efx_reado(struct efx_nic *efx, efx_oword_t *value, | 148 | static inline void efx_reado(struct efx_nic *efx, efx_oword_t *value, |
149 | unsigned int reg) | 149 | unsigned int reg) |
150 | { | 150 | { |
@@ -163,8 +163,7 @@ static inline void efx_reado(struct efx_nic *efx, efx_oword_t *value, | |||
163 | EFX_OWORD_VAL(*value)); | 163 | EFX_OWORD_VAL(*value)); |
164 | } | 164 | } |
165 | 165 | ||
166 | /* Read an 8-byte SRAM entry through supplied mapping, | 166 | /* Read 64-bit SRAM through the supplied mapping, locking as appropriate. */ |
167 | * locking as appropriate. */ | ||
168 | static inline void efx_sram_readq(struct efx_nic *efx, void __iomem *membase, | 167 | static inline void efx_sram_readq(struct efx_nic *efx, void __iomem *membase, |
169 | efx_qword_t *value, unsigned int index) | 168 | efx_qword_t *value, unsigned int index) |
170 | { | 169 | { |
@@ -186,7 +185,7 @@ static inline void efx_sram_readq(struct efx_nic *efx, void __iomem *membase, | |||
186 | addr, EFX_QWORD_VAL(*value)); | 185 | addr, EFX_QWORD_VAL(*value)); |
187 | } | 186 | } |
188 | 187 | ||
189 | /* Read dword from register that allows partial writes (sic) */ | 188 | /* Read a 32-bit CSR or SRAM */ |
190 | static inline void efx_readd(struct efx_nic *efx, efx_dword_t *value, | 189 | static inline void efx_readd(struct efx_nic *efx, efx_dword_t *value, |
191 | unsigned int reg) | 190 | unsigned int reg) |
192 | { | 191 | { |
@@ -196,28 +195,28 @@ static inline void efx_readd(struct efx_nic *efx, efx_dword_t *value, | |||
196 | reg, EFX_DWORD_VAL(*value)); | 195 | reg, EFX_DWORD_VAL(*value)); |
197 | } | 196 | } |
198 | 197 | ||
199 | /* Write to a register forming part of a table */ | 198 | /* Write a 128-bit CSR forming part of a table */ |
200 | static inline void efx_writeo_table(struct efx_nic *efx, efx_oword_t *value, | 199 | static inline void efx_writeo_table(struct efx_nic *efx, efx_oword_t *value, |
201 | unsigned int reg, unsigned int index) | 200 | unsigned int reg, unsigned int index) |
202 | { | 201 | { |
203 | efx_writeo(efx, value, reg + index * sizeof(efx_oword_t)); | 202 | efx_writeo(efx, value, reg + index * sizeof(efx_oword_t)); |
204 | } | 203 | } |
205 | 204 | ||
206 | /* Read to a register forming part of a table */ | 205 | /* Read a 128-bit CSR forming part of a table */ |
207 | static inline void efx_reado_table(struct efx_nic *efx, efx_oword_t *value, | 206 | static inline void efx_reado_table(struct efx_nic *efx, efx_oword_t *value, |
208 | unsigned int reg, unsigned int index) | 207 | unsigned int reg, unsigned int index) |
209 | { | 208 | { |
210 | efx_reado(efx, value, reg + index * sizeof(efx_oword_t)); | 209 | efx_reado(efx, value, reg + index * sizeof(efx_oword_t)); |
211 | } | 210 | } |
212 | 211 | ||
213 | /* Write to a dword register forming part of a table */ | 212 | /* Write a 32-bit CSR forming part of a table, or 32-bit SRAM */ |
214 | static inline void efx_writed_table(struct efx_nic *efx, efx_dword_t *value, | 213 | static inline void efx_writed_table(struct efx_nic *efx, efx_dword_t *value, |
215 | unsigned int reg, unsigned int index) | 214 | unsigned int reg, unsigned int index) |
216 | { | 215 | { |
217 | efx_writed(efx, value, reg + index * sizeof(efx_oword_t)); | 216 | efx_writed(efx, value, reg + index * sizeof(efx_oword_t)); |
218 | } | 217 | } |
219 | 218 | ||
220 | /* Read from a dword register forming part of a table */ | 219 | /* Read a 32-bit CSR forming part of a table, or 32-bit SRAM */ |
221 | static inline void efx_readd_table(struct efx_nic *efx, efx_dword_t *value, | 220 | static inline void efx_readd_table(struct efx_nic *efx, efx_dword_t *value, |
222 | unsigned int reg, unsigned int index) | 221 | unsigned int reg, unsigned int index) |
223 | { | 222 | { |
@@ -231,29 +230,56 @@ static inline void efx_readd_table(struct efx_nic *efx, efx_dword_t *value, | |||
231 | #define EFX_PAGED_REG(page, reg) \ | 230 | #define EFX_PAGED_REG(page, reg) \ |
232 | ((page) * EFX_PAGE_BLOCK_SIZE + (reg)) | 231 | ((page) * EFX_PAGE_BLOCK_SIZE + (reg)) |
233 | 232 | ||
234 | /* As for efx_writeo(), but for a page-mapped register. */ | 233 | /* Write the whole of RX_DESC_UPD or TX_DESC_UPD */ |
235 | static inline void efx_writeo_page(struct efx_nic *efx, efx_oword_t *value, | 234 | static inline void _efx_writeo_page(struct efx_nic *efx, efx_oword_t *value, |
236 | unsigned int reg, unsigned int page) | 235 | unsigned int reg, unsigned int page) |
237 | { | 236 | { |
238 | efx_writeo(efx, value, EFX_PAGED_REG(page, reg)); | 237 | reg = EFX_PAGED_REG(page, reg); |
239 | } | 238 | |
239 | netif_vdbg(efx, hw, efx->net_dev, | ||
240 | "writing register %x with " EFX_OWORD_FMT "\n", reg, | ||
241 | EFX_OWORD_VAL(*value)); | ||
240 | 242 | ||
241 | /* As for efx_writed(), but for a page-mapped register. */ | 243 | #ifdef EFX_USE_QWORD_IO |
242 | static inline void efx_writed_page(struct efx_nic *efx, efx_dword_t *value, | 244 | _efx_writeq(efx, value->u64[0], reg + 0); |
243 | unsigned int reg, unsigned int page) | 245 | _efx_writeq(efx, value->u64[1], reg + 8); |
246 | #else | ||
247 | _efx_writed(efx, value->u32[0], reg + 0); | ||
248 | _efx_writed(efx, value->u32[1], reg + 4); | ||
249 | _efx_writed(efx, value->u32[2], reg + 8); | ||
250 | _efx_writed(efx, value->u32[3], reg + 12); | ||
251 | #endif | ||
252 | wmb(); | ||
253 | } | ||
254 | #define efx_writeo_page(efx, value, reg, page) \ | ||
255 | _efx_writeo_page(efx, value, \ | ||
256 | reg + \ | ||
257 | BUILD_BUG_ON_ZERO((reg) != 0x830 && (reg) != 0xa10), \ | ||
258 | page) | ||
259 | |||
260 | /* Write a page-mapped 32-bit CSR (EVQ_RPTR or the high bits of | ||
261 | * RX_DESC_UPD or TX_DESC_UPD) | ||
262 | */ | ||
263 | static inline void _efx_writed_page(struct efx_nic *efx, efx_dword_t *value, | ||
264 | unsigned int reg, unsigned int page) | ||
244 | { | 265 | { |
245 | efx_writed(efx, value, EFX_PAGED_REG(page, reg)); | 266 | efx_writed(efx, value, EFX_PAGED_REG(page, reg)); |
246 | } | 267 | } |
247 | 268 | #define efx_writed_page(efx, value, reg, page) \ | |
248 | /* Write dword to page-mapped register with an extra lock. | 269 | _efx_writed_page(efx, value, \ |
249 | * | 270 | reg + \ |
250 | * As for efx_writed_page(), but for a register that suffers from | 271 | BUILD_BUG_ON_ZERO((reg) != 0x400 && (reg) != 0x83c \ |
251 | * SFC bug 3181. Take out a lock so the BIU collector cannot be | 272 | && (reg) != 0xa1c), \ |
252 | * confused. */ | 273 | page) |
253 | static inline void efx_writed_page_locked(struct efx_nic *efx, | 274 | |
254 | efx_dword_t *value, | 275 | /* Write TIMER_COMMAND. This is a page-mapped 32-bit CSR, but a bug |
255 | unsigned int reg, | 276 | * in the BIU means that writes to TIMER_COMMAND[0] invalidate the |
256 | unsigned int page) | 277 | * collector register. |
278 | */ | ||
279 | static inline void _efx_writed_page_locked(struct efx_nic *efx, | ||
280 | efx_dword_t *value, | ||
281 | unsigned int reg, | ||
282 | unsigned int page) | ||
257 | { | 283 | { |
258 | unsigned long flags __attribute__ ((unused)); | 284 | unsigned long flags __attribute__ ((unused)); |
259 | 285 | ||
@@ -265,5 +291,9 @@ static inline void efx_writed_page_locked(struct efx_nic *efx, | |||
265 | efx_writed(efx, value, EFX_PAGED_REG(page, reg)); | 291 | efx_writed(efx, value, EFX_PAGED_REG(page, reg)); |
266 | } | 292 | } |
267 | } | 293 | } |
294 | #define efx_writed_page_locked(efx, value, reg, page) \ | ||
295 | _efx_writed_page_locked(efx, value, \ | ||
296 | reg + BUILD_BUG_ON_ZERO((reg) != 0x420), \ | ||
297 | page) | ||
268 | 298 | ||
269 | #endif /* EFX_IO_H */ | 299 | #endif /* EFX_IO_H */ |