/*
 * Copyright(c) 2004 - 2006 Intel Corporation. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License as published by the Free
 * Software Foundation; either version 2 of the License, or (at your option)
 * any later version.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc., 59
 * Temple Place - Suite 330, Boston, MA 02111-1307, USA.
 *
 * The full GNU General Public License is included in this distribution in the
 * file called COPYING.
 */

/*
 * This driver supports an Intel I/OAT DMA engine, which does asynchronous
 * copy operations.
 */

#include <linux/init.h>
#include <linux/module.h>
#include <linux/pci.h>
#include <linux/interrupt.h>
#include <linux/dmaengine.h>
#include <linux/delay.h>
#include <linux/dma-mapping.h>
#include "ioatdma.h"
#include "ioatdma_registers.h"
#include "ioatdma_hw.h"

#define to_ioat_chan(chan) container_of(chan, struct ioat_dma_chan, common)
#define to_ioat_device(dev) container_of(dev, struct ioat_device, common)
#define to_ioat_desc(lh) container_of(lh, struct ioat_desc_sw, node)
#define tx_to_ioat_desc(tx) container_of(tx, struct ioat_desc_sw, async_tx)

/* internal functions */
static int __devinit ioat_probe(struct pci_dev *pdev, const struct pci_device_id *ent);
static void ioat_shutdown(struct pci_dev *pdev);
static void __devexit ioat_remove(struct pci_dev *pdev);

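/*
 * enumerate_dma_channels - discover the DMA channels exposed by the device
 *
 * Reads the channel count and transfer-capability registers, then allocates
 * and initializes one ioat_dma_chan per hardware channel.  Each channel's
 * registers sit at a 0x80-byte stride after the device-global registers.
 */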
static int enumerate_dma_channels(struct ioat_device *device)
{
	u8 xfercap_scale;
	u32 xfercap;
	int i;
	struct ioat_dma_chan *ioat_chan;

	device->common.chancnt = readb(device->reg_base + IOAT_CHANCNT_OFFSET);
	xfercap_scale = readb(device->reg_base + IOAT_XFERCAP_OFFSET);
	xfercap = (xfercap_scale == 0 ? -1 : (1UL << xfercap_scale));

	for (i = 0; i < device->common.chancnt; i++) {
		ioat_chan = kzalloc(sizeof(*ioat_chan), GFP_KERNEL);
		if (!ioat_chan) {
			device->common.chancnt = i;
			break;
		}

		ioat_chan->device = device;
		ioat_chan->reg_base = device->reg_base + (0x80 * (i + 1));
		ioat_chan->xfercap = xfercap;
		spin_lock_init(&ioat_chan->cleanup_lock);
		spin_lock_init(&ioat_chan->desc_lock);
		INIT_LIST_HEAD(&ioat_chan->free_desc);
		INIT_LIST_HEAD(&ioat_chan->used_desc);
		/* This should be made common somewhere in dmaengine.c */
		ioat_chan->common.device = &device->common;
		list_add_tail(&ioat_chan->common.device_node,
			      &device->common.channels);
	}
	return device->common.chancnt;
}

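/*
 * ioat_set_src / ioat_set_dest - program the source/destination address
 *
 * A single logical transfer may be split across several hardware descriptors
 * (each limited to xfercap bytes), so these walk the descriptor list and
 * advance the address by xfercap for each link in the chain.
 */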
static void
ioat_set_src(dma_addr_t addr, struct dma_async_tx_descriptor *tx, int index)
{
	struct ioat_desc_sw *iter, *desc = tx_to_ioat_desc(tx);
	struct ioat_dma_chan *ioat_chan = to_ioat_chan(tx->chan);

	pci_unmap_addr_set(desc, src, addr);

	list_for_each_entry(iter, &desc->async_tx.tx_list, node) {
		iter->hw->src_addr = addr;
		addr += ioat_chan->xfercap;
	}

}

static void
ioat_set_dest(dma_addr_t addr, struct dma_async_tx_descriptor *tx, int index)
{
	struct ioat_desc_sw *iter, *desc = tx_to_ioat_desc(tx);
	struct ioat_dma_chan *ioat_chan = to_ioat_chan(tx->chan);

	pci_unmap_addr_set(desc, dst, addr);

	list_for_each_entry(iter, &desc->async_tx.tx_list, node) {
		iter->hw->dst_addr = addr;
		addr += ioat_chan->xfercap;
	}
}

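/*
 * ioat_tx_submit - assign a cookie and hand the descriptor chain to hardware
 *
 * Under desc_lock: assigns the next channel cookie, links the new chain's
 * first descriptor into the NextDescriptor field of the current tail, and
 * splices the chain onto used_desc.  The APPEND command is only issued once
 * at least four descriptors are pending; ioat_dma_memcpy_issue_pending
 * flushes any remainder.
 */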
static dma_cookie_t
ioat_tx_submit(struct dma_async_tx_descriptor *tx)
{
	struct ioat_dma_chan *ioat_chan = to_ioat_chan(tx->chan);
	struct ioat_desc_sw *desc = tx_to_ioat_desc(tx);
	int append = 0;
	dma_cookie_t cookie;
	struct ioat_desc_sw *group_start;

	group_start = list_entry(desc->async_tx.tx_list.next,
				 struct ioat_desc_sw, node);
	spin_lock_bh(&ioat_chan->desc_lock);
	/* cookie incr and addition to used_list must be atomic */
	cookie = ioat_chan->common.cookie;
	cookie++;
	if (cookie < 0)
		cookie = 1;
	ioat_chan->common.cookie = desc->async_tx.cookie = cookie;

	/* write address into NextDescriptor field of last desc in chain */
	to_ioat_desc(ioat_chan->used_desc.prev)->hw->next =
						group_start->async_tx.phys;
	list_splice_init(&desc->async_tx.tx_list, ioat_chan->used_desc.prev);

	ioat_chan->pending += desc->tx_cnt;
	if (ioat_chan->pending >= 4) {
		append = 1;
		ioat_chan->pending = 0;
	}
	spin_unlock_bh(&ioat_chan->desc_lock);

	if (append)
		writeb(IOAT_CHANCMD_APPEND,
		       ioat_chan->reg_base + IOAT_CHANCMD_OFFSET);

	return cookie;
}

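/*
 * ioat_dma_alloc_descriptor - allocate one hardware descriptor and its
 * software wrapper
 *
 * The hardware descriptor comes from the DMA-coherent pci_pool so the engine
 * can read it directly; the ioat_desc_sw wrapper tracks it on the channel
 * lists and carries the dmaengine async_tx state and callbacks.
 */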
static struct ioat_desc_sw *ioat_dma_alloc_descriptor(
	struct ioat_dma_chan *ioat_chan,
	gfp_t flags)
{
	struct ioat_dma_descriptor *desc;
	struct ioat_desc_sw *desc_sw;
	struct ioat_device *ioat_device;
	dma_addr_t phys;

	ioat_device = to_ioat_device(ioat_chan->common.device);
	desc = pci_pool_alloc(ioat_device->dma_pool, flags, &phys);
	if (unlikely(!desc))
		return NULL;

	desc_sw = kzalloc(sizeof(*desc_sw), flags);
	if (unlikely(!desc_sw)) {
		pci_pool_free(ioat_device->dma_pool, desc, phys);
		return NULL;
	}

	memset(desc, 0, sizeof(*desc));
	dma_async_tx_descriptor_init(&desc_sw->async_tx, &ioat_chan->common);
	desc_sw->async_tx.tx_set_src = ioat_set_src;
	desc_sw->async_tx.tx_set_dest = ioat_set_dest;
	desc_sw->async_tx.tx_submit = ioat_tx_submit;
	INIT_LIST_HEAD(&desc_sw->async_tx.tx_list);
	desc_sw->hw = desc;
	desc_sw->async_tx.phys = phys;

	return desc_sw;
}

#define INITIAL_IOAT_DESC_COUNT 128

static void ioat_start_null_desc(struct ioat_dma_chan *ioat_chan);

/* returns the actual number of allocated descriptors */
static int ioat_dma_alloc_chan_resources(struct dma_chan *chan)
{
	struct ioat_dma_chan *ioat_chan = to_ioat_chan(chan);
	struct ioat_desc_sw *desc = NULL;
	u16 chanctrl;
	u32 chanerr;
	int i;
	LIST_HEAD(tmp_list);

	/* have we already been set up? */
	if (!list_empty(&ioat_chan->free_desc))
		return INITIAL_IOAT_DESC_COUNT;

	/* Setup register to interrupt and write completion status on error */
	chanctrl = IOAT_CHANCTRL_ERR_INT_EN |
		IOAT_CHANCTRL_ANY_ERR_ABORT_EN |
		IOAT_CHANCTRL_ERR_COMPLETION_EN;
	writew(chanctrl, ioat_chan->reg_base + IOAT_CHANCTRL_OFFSET);

	chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
	if (chanerr) {
		printk("IOAT: CHANERR = %x, clearing\n", chanerr);
		writel(chanerr, ioat_chan->reg_base + IOAT_CHANERR_OFFSET);
	}

	/* Allocate descriptors */
	for (i = 0; i < INITIAL_IOAT_DESC_COUNT; i++) {
		desc = ioat_dma_alloc_descriptor(ioat_chan, GFP_KERNEL);
		if (!desc) {
			printk(KERN_ERR "IOAT: Only %d initial descriptors\n", i);
			break;
		}
		list_add_tail(&desc->node, &tmp_list);
	}
	spin_lock_bh(&ioat_chan->desc_lock);
	list_splice(&tmp_list, &ioat_chan->free_desc);
	spin_unlock_bh(&ioat_chan->desc_lock);

	/* allocate a completion writeback area */
	/* doing 2 32bit writes to mmio since 1 64b write doesn't work */
	ioat_chan->completion_virt =
		pci_pool_alloc(ioat_chan->device->completion_pool,
			       GFP_KERNEL,
			       &ioat_chan->completion_addr);
	memset(ioat_chan->completion_virt, 0,
	       sizeof(*ioat_chan->completion_virt));
	writel(((u64) ioat_chan->completion_addr) & 0x00000000FFFFFFFF,
	       ioat_chan->reg_base + IOAT_CHANCMP_OFFSET_LOW);
	writel(((u64) ioat_chan->completion_addr) >> 32,
	       ioat_chan->reg_base + IOAT_CHANCMP_OFFSET_HIGH);

	ioat_start_null_desc(ioat_chan);
	return i;
}

static void ioat_dma_memcpy_cleanup(struct ioat_dma_chan *ioat_chan);

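/*
 * ioat_dma_free_chan_resources - undo everything alloc_chan_resources set up
 *
 * Runs a final cleanup pass, resets the channel, then returns every
 * descriptor on the used and free lists (and the completion writeback area)
 * to their pools.  The NULL descriptor left on used_desc by
 * ioat_start_null_desc is expected, hence the "> 1" check below.
 */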
static void ioat_dma_free_chan_resources(struct dma_chan *chan)
{
	struct ioat_dma_chan *ioat_chan = to_ioat_chan(chan);
	struct ioat_device *ioat_device = to_ioat_device(chan->device);
	struct ioat_desc_sw *desc, *_desc;
	u16 chanctrl;
	int in_use_descs = 0;

	ioat_dma_memcpy_cleanup(ioat_chan);

	writeb(IOAT_CHANCMD_RESET, ioat_chan->reg_base + IOAT_CHANCMD_OFFSET);

	spin_lock_bh(&ioat_chan->desc_lock);
	list_for_each_entry_safe(desc, _desc, &ioat_chan->used_desc, node) {
		in_use_descs++;
		list_del(&desc->node);
		pci_pool_free(ioat_device->dma_pool, desc->hw,
			      desc->async_tx.phys);
		kfree(desc);
	}
	list_for_each_entry_safe(desc, _desc, &ioat_chan->free_desc, node) {
		list_del(&desc->node);
		pci_pool_free(ioat_device->dma_pool, desc->hw,
			      desc->async_tx.phys);
		kfree(desc);
	}
	spin_unlock_bh(&ioat_chan->desc_lock);

	pci_pool_free(ioat_device->completion_pool,
		      ioat_chan->completion_virt,
		      ioat_chan->completion_addr);

	/* one is ok since we left it on there on purpose */
	if (in_use_descs > 1)
		printk(KERN_ERR "IOAT: Freeing %d in use descriptors!\n",
		       in_use_descs - 1);

	ioat_chan->last_completion = ioat_chan->completion_addr = 0;
}

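/*
 * ioat_dma_prep_memcpy - build a descriptor chain for a memcpy of 'len' bytes
 *
 * The copy is split into xfercap-sized pieces, one hardware descriptor per
 * piece, pulled from the channel's free list (or allocated atomically when
 * the list is empty).  Only the last descriptor requests a completion status
 * update and carries the cookie; the intermediate ones are pre-acked.
 * Source and destination addresses are filled in later via tx_set_src and
 * tx_set_dest.
 */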
static struct dma_async_tx_descriptor *
ioat_dma_prep_memcpy(struct dma_chan *chan, size_t len, int int_en)
{
	struct ioat_dma_chan *ioat_chan = to_ioat_chan(chan);
	struct ioat_desc_sw *first, *prev, *new;
	LIST_HEAD(new_chain);
	u32 copy;
	size_t orig_len;
	int desc_count = 0;

	if (!len)
		return NULL;

	orig_len = len;

	first = NULL;
	prev = NULL;

	spin_lock_bh(&ioat_chan->desc_lock);
	while (len) {
		if (!list_empty(&ioat_chan->free_desc)) {
			new = to_ioat_desc(ioat_chan->free_desc.next);
			list_del(&new->node);
		} else {
			/* try to get another desc */
			new = ioat_dma_alloc_descriptor(ioat_chan, GFP_ATOMIC);
			/* will this ever happen? */
			/* TODO add upper limit on these */
			BUG_ON(!new);
		}

		copy = min((u32) len, ioat_chan->xfercap);

		new->hw->size = copy;
		new->hw->ctl = 0;
		new->async_tx.cookie = 0;
		new->async_tx.ack = 1;

		/* chain together the physical address list for the HW */
		if (!first)
			first = new;
		else
			prev->hw->next = (u64) new->async_tx.phys;

		prev = new;
		len -= copy;
		list_add_tail(&new->node, &new_chain);
		desc_count++;
	}

	list_splice(&new_chain, &new->async_tx.tx_list);

	new->hw->ctl = IOAT_DMA_DESCRIPTOR_CTL_CP_STS;
	new->hw->next = 0;
	new->tx_cnt = desc_count;
	new->async_tx.ack = 0; /* client is in control of this ack */
	new->async_tx.cookie = -EBUSY;

	pci_unmap_len_set(new, len, orig_len);
	spin_unlock_bh(&ioat_chan->desc_lock);

	return new ? &new->async_tx : NULL;
}

/**
 * ioat_dma_memcpy_issue_pending - push potentially unrecognized appended descriptors to hw
 * @chan: DMA channel handle
 */

static void ioat_dma_memcpy_issue_pending(struct dma_chan *chan)
{
	struct ioat_dma_chan *ioat_chan = to_ioat_chan(chan);

	if (ioat_chan->pending != 0) {
		ioat_chan->pending = 0;
		writeb(IOAT_CHANCMD_APPEND,
		       ioat_chan->reg_base + IOAT_CHANCMD_OFFSET);
	}
}

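/*
 * ioat_dma_memcpy_cleanup - reclaim descriptors the hardware has finished with
 *
 * Reads the completion writeback area to learn the physical address of the
 * last completed descriptor, then walks used_desc up to that point: unmaps
 * the src/dst buffers of each completed transaction (only the final
 * descriptor of a chain carries a cookie and needs unmapping) and recycles
 * descriptors the client has acked onto the free list.  The most recently
 * completed descriptor is left in place so new work can be appended to it.
 */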
static void ioat_dma_memcpy_cleanup(struct ioat_dma_chan *chan)
{
	unsigned long phys_complete;
	struct ioat_desc_sw *desc, *_desc;
	dma_cookie_t cookie = 0;

	prefetch(chan->completion_virt);

	if (!spin_trylock(&chan->cleanup_lock))
		return;

	/* The completion writeback can happen at any time,
	   so reads by the driver need to be atomic operations
	   The descriptor physical addresses are limited to 32-bits
	   when the CPU can only do a 32-bit mov */

#if (BITS_PER_LONG == 64)
	phys_complete =
		chan->completion_virt->full & IOAT_CHANSTS_COMPLETED_DESCRIPTOR_ADDR;
#else
	phys_complete = chan->completion_virt->low & IOAT_LOW_COMPLETION_MASK;
#endif

	if ((chan->completion_virt->full & IOAT_CHANSTS_DMA_TRANSFER_STATUS) ==
		IOAT_CHANSTS_DMA_TRANSFER_STATUS_HALTED) {
		printk("IOAT: Channel halted, chanerr = %x\n",
		       readl(chan->reg_base + IOAT_CHANERR_OFFSET));

		/* TODO do something to salvage the situation */
	}

	if (phys_complete == chan->last_completion) {
		spin_unlock(&chan->cleanup_lock);
		return;
	}

	spin_lock_bh(&chan->desc_lock);
	list_for_each_entry_safe(desc, _desc, &chan->used_desc, node) {

		/*
		 * Incoming DMA requests may use multiple descriptors, due to
		 * exceeding xfercap, perhaps. If so, only the last one will
		 * have a cookie, and require unmapping.
		 */
		if (desc->async_tx.cookie) {
			cookie = desc->async_tx.cookie;

			/* yes we are unmapping both _page and _single alloc'd
			   regions with unmap_page. Is this *really* that bad?
			*/
			pci_unmap_page(chan->device->pdev,
				       pci_unmap_addr(desc, dst),
				       pci_unmap_len(desc, len),
				       PCI_DMA_FROMDEVICE);
			pci_unmap_page(chan->device->pdev,
				       pci_unmap_addr(desc, src),
				       pci_unmap_len(desc, len),
				       PCI_DMA_TODEVICE);
		}

		if (desc->async_tx.phys != phys_complete) {
			/* a completed entry, but not the last, so cleanup
			 * if the client is done with the descriptor
			 */
			if (desc->async_tx.ack) {
				list_del(&desc->node);
				list_add_tail(&desc->node, &chan->free_desc);
			} else
				desc->async_tx.cookie = 0;
		} else {
			/* last used desc. Do not remove, so we can append from
			   it, but don't look at it next time, either */
			desc->async_tx.cookie = 0;

			/* TODO check status bits? */
			break;
		}
	}

	spin_unlock_bh(&chan->desc_lock);

	chan->last_completion = phys_complete;
	if (cookie != 0)
		chan->completed_cookie = cookie;

	spin_unlock(&chan->cleanup_lock);
}

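/*
 * ioat_dma_dependency_added - dmaengine hook called when a dependent
 * operation has been queued behind this channel; if nothing is pending here,
 * take the opportunity to run a cleanup pass.
 */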
static void ioat_dma_dependency_added(struct dma_chan *chan)
{
	struct ioat_dma_chan *ioat_chan = to_ioat_chan(chan);
	spin_lock_bh(&ioat_chan->desc_lock);
	if (ioat_chan->pending == 0) {
		spin_unlock_bh(&ioat_chan->desc_lock);
		ioat_dma_memcpy_cleanup(ioat_chan);
	} else
		spin_unlock_bh(&ioat_chan->desc_lock);
}

/**
 * ioat_dma_is_complete - poll the status of an IOAT DMA transaction
 * @chan: IOAT DMA channel handle
 * @cookie: DMA transaction identifier
 * @done: if not %NULL, updated with last completed transaction
 * @used: if not %NULL, updated with last used transaction
 */

static enum dma_status ioat_dma_is_complete(struct dma_chan *chan,
					    dma_cookie_t cookie,
					    dma_cookie_t *done,
					    dma_cookie_t *used)
{
	struct ioat_dma_chan *ioat_chan = to_ioat_chan(chan);
	dma_cookie_t last_used;
	dma_cookie_t last_complete;
	enum dma_status ret;

	last_used = chan->cookie;
	last_complete = ioat_chan->completed_cookie;

	if (done)
		*done = last_complete;
	if (used)
		*used = last_used;

	ret = dma_async_is_complete(cookie, last_complete, last_used);
	if (ret == DMA_SUCCESS)
		return ret;

	ioat_dma_memcpy_cleanup(ioat_chan);

	last_used = chan->cookie;
	last_complete = ioat_chan->completed_cookie;

	if (done)
		*done = last_complete;
	if (used)
		*used = last_used;

	return dma_async_is_complete(cookie, last_complete, last_used);
}

/* PCI API */

static struct pci_device_id ioat_pci_tbl[] = {
	{ PCI_DEVICE(PCI_VENDOR_ID_INTEL, PCI_DEVICE_ID_INTEL_IOAT) },
	{ PCI_DEVICE(PCI_VENDOR_ID_UNISYS,
		     PCI_DEVICE_ID_UNISYS_DMA_DIRECTOR) },
	{ 0, }
};

static struct pci_driver ioat_pci_driver = {
	.name = "ioatdma",
	.id_table = ioat_pci_tbl,
	.probe = ioat_probe,
	.shutdown = ioat_shutdown,
	.remove = __devexit_p(ioat_remove),
};

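/*
 * ioat_do_interrupt - shared interrupt handler
 *
 * Checks the master interrupt enable and interrupt status bits to decide
 * whether this device raised the IRQ; if so, logs the attention status and
 * writes the control value back to INTRCTRL to acknowledge it.
 */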
static irqreturn_t ioat_do_interrupt(int irq, void *data)
{
	struct ioat_device *instance = data;
	unsigned long attnstatus;
	u8 intrctrl;

	intrctrl = readb(instance->reg_base + IOAT_INTRCTRL_OFFSET);

	if (!(intrctrl & IOAT_INTRCTRL_MASTER_INT_EN))
		return IRQ_NONE;

	if (!(intrctrl & IOAT_INTRCTRL_INT_STATUS)) {
		writeb(intrctrl, instance->reg_base + IOAT_INTRCTRL_OFFSET);
		return IRQ_NONE;
	}

	attnstatus = readl(instance->reg_base + IOAT_ATTNSTATUS_OFFSET);

	printk(KERN_ERR "ioatdma error: interrupt! status %lx\n", attnstatus);

	writeb(intrctrl, instance->reg_base + IOAT_INTRCTRL_OFFSET);
	return IRQ_HANDLED;
}

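/*
 * ioat_start_null_desc - prime the channel's descriptor chain
 *
 * Posts a single NULL descriptor so the hardware has a valid chain head,
 * writes its physical address into the CHAINADDR registers, and issues a
 * START command.  Later submissions append to this descriptor.
 */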
static void ioat_start_null_desc(struct ioat_dma_chan *ioat_chan)
{
	struct ioat_desc_sw *desc;

	spin_lock_bh(&ioat_chan->desc_lock);

	if (!list_empty(&ioat_chan->free_desc)) {
		desc = to_ioat_desc(ioat_chan->free_desc.next);
		list_del(&desc->node);
	} else {
		/* try to get another desc */
		spin_unlock_bh(&ioat_chan->desc_lock);
		desc = ioat_dma_alloc_descriptor(ioat_chan, GFP_KERNEL);
		spin_lock_bh(&ioat_chan->desc_lock);
		/* will this ever happen? */
		BUG_ON(!desc);
	}

	desc->hw->ctl = IOAT_DMA_DESCRIPTOR_NUL;
	desc->hw->next = 0;
	desc->async_tx.ack = 1;

	list_add_tail(&desc->node, &ioat_chan->used_desc);
	spin_unlock_bh(&ioat_chan->desc_lock);

	writel(((u64) desc->async_tx.phys) & 0x00000000FFFFFFFF,
	       ioat_chan->reg_base + IOAT_CHAINADDR_OFFSET_LOW);
	writel(((u64) desc->async_tx.phys) >> 32,
	       ioat_chan->reg_base + IOAT_CHAINADDR_OFFSET_HIGH);

	writeb(IOAT_CHANCMD_START, ioat_chan->reg_base + IOAT_CHANCMD_OFFSET);
}

/*
 * Perform an IOAT transaction to verify the HW works.
 */
#define IOAT_TEST_SIZE 2000

static int ioat_self_test(struct ioat_device *device)
{
	int i;
	u8 *src;
	u8 *dest;
	struct dma_chan *dma_chan;
	struct dma_async_tx_descriptor *tx;
	dma_addr_t addr;
	dma_cookie_t cookie;
	int err = 0;

	src = kzalloc(sizeof(u8) * IOAT_TEST_SIZE, GFP_KERNEL);
	if (!src)
		return -ENOMEM;
	dest = kzalloc(sizeof(u8) * IOAT_TEST_SIZE, GFP_KERNEL);
	if (!dest) {
		kfree(src);
		return -ENOMEM;
	}

	/* Fill in src buffer */
	for (i = 0; i < IOAT_TEST_SIZE; i++)
		src[i] = (u8)i;

	/* Start copy, using first DMA channel */
	dma_chan = container_of(device->common.channels.next,
				struct dma_chan,
				device_node);
	if (ioat_dma_alloc_chan_resources(dma_chan) < 1) {
		err = -ENODEV;
		goto out;
	}

	tx = ioat_dma_prep_memcpy(dma_chan, IOAT_TEST_SIZE, 0);
	async_tx_ack(tx);
	addr = dma_map_single(dma_chan->device->dev, src, IOAT_TEST_SIZE,
			      DMA_TO_DEVICE);
	ioat_set_src(addr, tx, 0);
	addr = dma_map_single(dma_chan->device->dev, dest, IOAT_TEST_SIZE,
			      DMA_FROM_DEVICE);
	ioat_set_dest(addr, tx, 0);
	cookie = ioat_tx_submit(tx);
	ioat_dma_memcpy_issue_pending(dma_chan);
	msleep(1);

	if (ioat_dma_is_complete(dma_chan, cookie, NULL, NULL) != DMA_SUCCESS) {
		printk(KERN_ERR "ioatdma: Self-test copy timed out, disabling\n");
		err = -ENODEV;
		goto free_resources;
	}
	if (memcmp(src, dest, IOAT_TEST_SIZE)) {
		printk(KERN_ERR "ioatdma: Self-test copy failed compare, disabling\n");
		err = -ENODEV;
		goto free_resources;
	}

free_resources:
	ioat_dma_free_chan_resources(dma_chan);
out:
	kfree(src);
	kfree(dest);
	return err;
}

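/*
 * ioat_probe - PCI probe routine
 *
 * Standard bring-up: enable the device, request a 64-bit (falling back to
 * 32-bit) DMA mask, map BAR 0, create the descriptor and completion pools,
 * hook the interrupt (MSI when available), enumerate channels, fill in the
 * dmaengine operations, run the self-test, and register with the dmaengine
 * core.
 */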
static int __devinit ioat_probe(struct pci_dev *pdev,
				const struct pci_device_id *ent)
{
	int err;
	unsigned long mmio_start, mmio_len;
	void __iomem *reg_base;
	struct ioat_device *device;

	err = pci_enable_device(pdev);
	if (err)
		goto err_enable_device;

	err = pci_set_dma_mask(pdev, DMA_64BIT_MASK);
	if (err)
		err = pci_set_dma_mask(pdev, DMA_32BIT_MASK);
	if (err)
		goto err_set_dma_mask;

	err = pci_request_regions(pdev, ioat_pci_driver.name);
	if (err)
		goto err_request_regions;

	mmio_start = pci_resource_start(pdev, 0);
	mmio_len = pci_resource_len(pdev, 0);

	reg_base = ioremap(mmio_start, mmio_len);
	if (!reg_base) {
		err = -ENOMEM;
		goto err_ioremap;
	}

	device = kzalloc(sizeof(*device), GFP_KERNEL);
	if (!device) {
		err = -ENOMEM;
		goto err_kzalloc;
	}

	/* DMA coherent memory pool for DMA descriptor allocations */
	device->dma_pool = pci_pool_create("dma_desc_pool", pdev,
		sizeof(struct ioat_dma_descriptor), 64, 0);
	if (!device->dma_pool) {
		err = -ENOMEM;
		goto err_dma_pool;
	}

	device->completion_pool = pci_pool_create("completion_pool", pdev,
						  sizeof(u64), SMP_CACHE_BYTES,
						  SMP_CACHE_BYTES);
	if (!device->completion_pool) {
		err = -ENOMEM;
		goto err_completion_pool;
	}

	device->pdev = pdev;
	pci_set_drvdata(pdev, device);
#ifdef CONFIG_PCI_MSI
	if (pci_enable_msi(pdev) == 0) {
		device->msi = 1;
	} else {
		device->msi = 0;
	}
#endif
	err = request_irq(pdev->irq, &ioat_do_interrupt, IRQF_SHARED, "ioat",
			  device);
	if (err)
		goto err_irq;

	device->reg_base = reg_base;

	writeb(IOAT_INTRCTRL_MASTER_INT_EN, device->reg_base + IOAT_INTRCTRL_OFFSET);
	pci_set_master(pdev);

	INIT_LIST_HEAD(&device->common.channels);
	enumerate_dma_channels(device);

	dma_cap_set(DMA_MEMCPY, device->common.cap_mask);
	device->common.device_alloc_chan_resources = ioat_dma_alloc_chan_resources;
	device->common.device_free_chan_resources = ioat_dma_free_chan_resources;
	device->common.device_prep_dma_memcpy = ioat_dma_prep_memcpy;
	device->common.device_is_tx_complete = ioat_dma_is_complete;
	device->common.device_issue_pending = ioat_dma_memcpy_issue_pending;
	device->common.device_dependency_added = ioat_dma_dependency_added;
	device->common.dev = &pdev->dev;
	printk(KERN_INFO "Intel(R) I/OAT DMA Engine found, %d channels\n",
	       device->common.chancnt);

	err = ioat_self_test(device);
	if (err)
		goto err_self_test;

	dma_async_device_register(&device->common);

	return 0;

err_self_test:
err_irq:
	pci_pool_destroy(device->completion_pool);
err_completion_pool:
	pci_pool_destroy(device->dma_pool);
err_dma_pool:
	kfree(device);
err_kzalloc:
	iounmap(reg_base);
err_ioremap:
	pci_release_regions(pdev);
err_request_regions:
err_set_dma_mask:
	pci_disable_device(pdev);
err_enable_device:

	printk(KERN_ERR "Intel(R) I/OAT DMA Engine initialization failed\n");

	return err;
}

static void ioat_shutdown(struct pci_dev *pdev)
{
	struct ioat_device *device;
	device = pci_get_drvdata(pdev);

	dma_async_device_unregister(&device->common);
}

static void __devexit ioat_remove(struct pci_dev *pdev)
{
	struct ioat_device *device;
	struct dma_chan *chan, *_chan;
	struct ioat_dma_chan *ioat_chan;

	device = pci_get_drvdata(pdev);
	dma_async_device_unregister(&device->common);

	free_irq(device->pdev->irq, device);
#ifdef CONFIG_PCI_MSI
	if (device->msi)
		pci_disable_msi(device->pdev);
#endif
	pci_pool_destroy(device->dma_pool);
	pci_pool_destroy(device->completion_pool);
	iounmap(device->reg_base);
	pci_release_regions(pdev);
	pci_disable_device(pdev);
	list_for_each_entry_safe(chan, _chan, &device->common.channels, device_node) {
		ioat_chan = to_ioat_chan(chan);
		list_del(&chan->device_node);
		kfree(ioat_chan);
	}
	kfree(device);
}

/* MODULE API */
MODULE_VERSION("1.9");
MODULE_LICENSE("GPL");
MODULE_AUTHOR("Intel Corporation");

static int __init ioat_init_module(void)
{
	/* it's currently unsafe to unload this module */
	/* if forced, worst case is that rmmod hangs */
	__unsafe(THIS_MODULE);

	return pci_register_driver(&ioat_pci_driver);
}

module_init(ioat_init_module);

static void __exit ioat_exit_module(void)
{
	pci_unregister_driver(&ioat_pci_driver);
}

module_exit(ioat_exit_module);