1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3  * offload engine driver for the Intel Xscale series of i/o processors
4  * Copyright © 2006, Intel Corporation.
5  */
6
7 /*
8  * This driver supports the asynchronous DMA copy and RAID engines available
9  * on the Intel Xscale(R) family of I/O Processors (IOP 32x, 33x, 134x)
10  */
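
/*
 * Illustrative sketch (not part of the driver): a dmaengine client would
 * typically drive one of these channels roughly as follows, assuming
 * 'chan' has been obtained from the dmaengine core and dest_dma/src_dma/len
 * describe an already DMA-mapped copy:
 *
 *	struct dma_async_tx_descriptor *tx;
 *	dma_cookie_t cookie;
 *
 *	tx = chan->device->device_prep_dma_memcpy(chan, dest_dma, src_dma,
 *				len, DMA_PREP_INTERRUPT | DMA_CTRL_ACK);
 *	cookie = dmaengine_submit(tx);
 *	dma_async_issue_pending(chan);
 *	dma_sync_wait(chan, cookie);
 *
 * The self-tests near the bottom of this file follow the same pattern,
 * calling the driver's prep/submit routines directly.
 */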
11
12 #include <linux/init.h>
13 #include <linux/module.h>
14 #include <linux/delay.h>
15 #include <linux/dma-mapping.h>
16 #include <linux/spinlock.h>
17 #include <linux/interrupt.h>
18 #include <linux/platform_device.h>
19 #include <linux/prefetch.h>
20 #include <linux/memory.h>
21 #include <linux/ioport.h>
22 #include <linux/raid/pq.h>
23 #include <linux/slab.h>
24
25 #include "iop-adma.h"
26 #include "dmaengine.h"
27
28 #define to_iop_adma_chan(chan) container_of(chan, struct iop_adma_chan, common)
29 #define to_iop_adma_device(dev) \
30         container_of(dev, struct iop_adma_device, common)
31 #define tx_to_iop_adma_slot(tx) \
32         container_of(tx, struct iop_adma_desc_slot, async_tx)
33
34 /**
35  * iop_adma_free_slots - flags descriptor slots for reuse
36  * @slot: Slot to free
37  * Caller must hold &iop_chan->lock while calling this function
38  */
39 static void iop_adma_free_slots(struct iop_adma_desc_slot *slot)
40 {
41         int stride = slot->slots_per_op;
42
43         while (stride--) {
44                 slot->slots_per_op = 0;
45                 slot = list_entry(slot->slot_node.next,
46                                 struct iop_adma_desc_slot,
47                                 slot_node);
48         }
49 }
50
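/*
 * iop_adma_run_tx_complete_actions - run completion actions for one descriptor
 *
 * Invokes the client callback, unmaps the transaction and kicks off any
 * dependent operations, then returns the most recently completed cookie.
 * Called with iop_chan->lock held.
 */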
51 static dma_cookie_t
52 iop_adma_run_tx_complete_actions(struct iop_adma_desc_slot *desc,
53         struct iop_adma_chan *iop_chan, dma_cookie_t cookie)
54 {
55         struct dma_async_tx_descriptor *tx = &desc->async_tx;
56
57         BUG_ON(tx->cookie < 0);
58         if (tx->cookie > 0) {
59                 cookie = tx->cookie;
60                 tx->cookie = 0;
61
62                 /* call the callback (must not sleep or submit new
63                  * operations to this channel)
64                  */
65                 dmaengine_desc_get_callback_invoke(tx, NULL);
66
67                 dma_descriptor_unmap(tx);
68                 if (desc->group_head)
69                         desc->group_head = NULL;
70         }
71
72         /* run dependent operations */
73         dma_run_dependencies(tx);
74
75         return cookie;
76 }
77
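/*
 * iop_adma_clean_slot - try to recycle a completed descriptor
 *
 * Slots are only freed once the client has acked the descriptor, and the
 * last descriptor in the chain is always left in place so new operations
 * can be appended to it.  Returns 1 when the end of the chain is reached,
 * 0 otherwise.  Called with iop_chan->lock held.
 */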
78 static int
79 iop_adma_clean_slot(struct iop_adma_desc_slot *desc,
80         struct iop_adma_chan *iop_chan)
81 {
82         /* the client is allowed to attach dependent operations
83          * until 'ack' is set
84          */
85         if (!async_tx_test_ack(&desc->async_tx))
86                 return 0;
87
88         /* leave the last descriptor in the chain
89          * so we can append to it
90          */
91         if (desc->chain_node.next == &iop_chan->chain)
92                 return 1;
93
94         dev_dbg(iop_chan->device->common.dev,
95                 "\tfree slot: %d slots_per_op: %d\n",
96                 desc->idx, desc->slots_per_op);
97
98         list_del(&desc->chain_node);
99         iop_adma_free_slots(desc);
100
101         return 0;
102 }
103
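/*
 * __iop_adma_slot_cleanup - reap completed descriptors from the chain
 *
 * Walks the chain from the oldest descriptor up to (but not past) the
 * descriptor currently loaded in the hardware, completing single
 * descriptors and whole descriptor groups, and records the last completed
 * cookie.  Caller must hold iop_chan->lock.
 */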
104 static void __iop_adma_slot_cleanup(struct iop_adma_chan *iop_chan)
105 {
106         struct iop_adma_desc_slot *iter, *_iter, *grp_start = NULL;
107         dma_cookie_t cookie = 0;
108         u32 current_desc = iop_chan_get_current_descriptor(iop_chan);
109         int busy = iop_chan_is_busy(iop_chan);
110         int seen_current = 0, slot_cnt = 0, slots_per_op = 0;
111
112         dev_dbg(iop_chan->device->common.dev, "%s\n", __func__);
113         /* free completed slots from the chain starting with
114          * the oldest descriptor
115          */
116         list_for_each_entry_safe(iter, _iter, &iop_chan->chain,
117                                         chain_node) {
118                 pr_debug("\tcookie: %d slot: %d busy: %d "
119                         "this_desc: %pad next_desc: %#llx ack: %d\n",
120                         iter->async_tx.cookie, iter->idx, busy,
121                         &iter->async_tx.phys, (u64)iop_desc_get_next_desc(iter),
122                         async_tx_test_ack(&iter->async_tx));
123                 prefetch(_iter);
124                 prefetch(&_iter->async_tx);
125
126                 /* do not advance past the current descriptor loaded into the
127                  * hardware channel; subsequent descriptors are either in
128                  * process or have not been submitted
129                  */
130                 if (seen_current)
131                         break;
132
133                 /* stop the search if we reach the current descriptor and the
134                  * channel is busy, or if it appears that the current descriptor
135                  * needs to be re-read (i.e. has been appended to)
136                  */
137                 if (iter->async_tx.phys == current_desc) {
138                         BUG_ON(seen_current++);
139                         if (busy || iop_desc_get_next_desc(iter))
140                                 break;
141                 }
142
143                 /* detect the start of a group transaction */
144                 if (!slot_cnt && !slots_per_op) {
145                         slot_cnt = iter->slot_cnt;
146                         slots_per_op = iter->slots_per_op;
147                         if (slot_cnt <= slots_per_op) {
148                                 slot_cnt = 0;
149                                 slots_per_op = 0;
150                         }
151                 }
152
153                 if (slot_cnt) {
154                         pr_debug("\tgroup++\n");
155                         if (!grp_start)
156                                 grp_start = iter;
157                         slot_cnt -= slots_per_op;
158                 }
159
160                 /* all the members of a group are complete */
161                 if (slots_per_op != 0 && slot_cnt == 0) {
162                         struct iop_adma_desc_slot *grp_iter, *_grp_iter;
163                         int end_of_chain = 0;
164                         pr_debug("\tgroup end\n");
165
166                         /* collect the total results */
167                         if (grp_start->xor_check_result) {
168                                 u32 zero_sum_result = 0;
169                                 slot_cnt = grp_start->slot_cnt;
170                                 grp_iter = grp_start;
171
172                                 list_for_each_entry_from(grp_iter,
173                                         &iop_chan->chain, chain_node) {
174                                         zero_sum_result |=
175                                             iop_desc_get_zero_result(grp_iter);
176                                         pr_debug("\titer%d result: %d\n",
177                                             grp_iter->idx, zero_sum_result);
178                                         slot_cnt -= slots_per_op;
179                                         if (slot_cnt == 0)
180                                                 break;
181                                 }
182                                 pr_debug("\tgrp_start->xor_check_result: %p\n",
183                                         grp_start->xor_check_result);
184                                 *grp_start->xor_check_result = zero_sum_result;
185                         }
186
187                         /* clean up the group */
188                         slot_cnt = grp_start->slot_cnt;
189                         grp_iter = grp_start;
190                         list_for_each_entry_safe_from(grp_iter, _grp_iter,
191                                 &iop_chan->chain, chain_node) {
192                                 cookie = iop_adma_run_tx_complete_actions(
193                                         grp_iter, iop_chan, cookie);
194
195                                 slot_cnt -= slots_per_op;
196                                 end_of_chain = iop_adma_clean_slot(grp_iter,
197                                         iop_chan);
198
199                                 if (slot_cnt == 0 || end_of_chain)
200                                         break;
201                         }
202
203                         /* the group should be complete at this point */
204                         BUG_ON(slot_cnt);
205
206                         slots_per_op = 0;
207                         grp_start = NULL;
208                         if (end_of_chain)
209                                 break;
210                         else
211                                 continue;
212                 } else if (slots_per_op) /* wait for group completion */
213                         continue;
214
215                 /* write back zero sum results (single descriptor case) */
216                 if (iter->xor_check_result && iter->async_tx.cookie)
217                         *iter->xor_check_result =
218                                 iop_desc_get_zero_result(iter);
219
220                 cookie = iop_adma_run_tx_complete_actions(
221                                         iter, iop_chan, cookie);
222
223                 if (iop_adma_clean_slot(iter, iop_chan))
224                         break;
225         }
226
227         if (cookie > 0) {
228                 iop_chan->common.completed_cookie = cookie;
229                 pr_debug("\tcompleted cookie %d\n", cookie);
230         }
231 }
232
233 static void
234 iop_adma_slot_cleanup(struct iop_adma_chan *iop_chan)
235 {
236         spin_lock_bh(&iop_chan->lock);
237         __iop_adma_slot_cleanup(iop_chan);
238         spin_unlock_bh(&iop_chan->lock);
239 }
240
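/* bottom half: reclaim completed descriptors outside of hard-irq context */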
241 static void iop_adma_tasklet(unsigned long data)
242 {
243         struct iop_adma_chan *iop_chan = (struct iop_adma_chan *) data;
244
245         /* lockdep will flag dependency submissions as potentially
246          * recursive locking; this is not the case, as a dependency
247          * submission will never recurse into a channel's submit routine.
248          * There are checks in async_tx.c to prevent this.
249          */
250         spin_lock_nested(&iop_chan->lock, SINGLE_DEPTH_NESTING);
251         __iop_adma_slot_cleanup(iop_chan);
252         spin_unlock(&iop_chan->lock);
253 }
254
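/*
 * iop_adma_alloc_slots - carve a contiguous group of descriptor slots
 *
 * Searches the slot ring (starting from the last allocation) for
 * 'num_slots' free, correctly aligned slots, pre-acks all but the last
 * descriptor and returns the group tail, or NULL (after triggering a
 * direct reclaim pass) if no contiguous run of free slots is available.
 * Called with iop_chan->lock held.
 */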
255 static struct iop_adma_desc_slot *
256 iop_adma_alloc_slots(struct iop_adma_chan *iop_chan, int num_slots,
257                         int slots_per_op)
258 {
259         struct iop_adma_desc_slot *iter, *_iter, *alloc_start = NULL;
260         LIST_HEAD(chain);
261         int slots_found, retry = 0;
262
263         /* start the search from the last allocated descriptor;
264          * if a contiguous allocation cannot be found, start searching
265          * from the beginning of the list
266          */
267 retry:
268         slots_found = 0;
269         if (retry == 0)
270                 iter = iop_chan->last_used;
271         else
272                 iter = list_entry(&iop_chan->all_slots,
273                         struct iop_adma_desc_slot,
274                         slot_node);
275
276         list_for_each_entry_safe_continue(
277                 iter, _iter, &iop_chan->all_slots, slot_node) {
278                 prefetch(_iter);
279                 prefetch(&_iter->async_tx);
280                 if (iter->slots_per_op) {
281                         /* give up after finding the first busy slot
282                          * on the second pass through the list
283                          */
284                         if (retry)
285                                 break;
286
287                         slots_found = 0;
288                         continue;
289                 }
290
291                 /* start the allocation if the slot is correctly aligned */
292                 if (!slots_found++) {
293                         if (iop_desc_is_aligned(iter, slots_per_op))
294                                 alloc_start = iter;
295                         else {
296                                 slots_found = 0;
297                                 continue;
298                         }
299                 }
300
301                 if (slots_found == num_slots) {
302                         struct iop_adma_desc_slot *alloc_tail = NULL;
303                         struct iop_adma_desc_slot *last_used = NULL;
304                         iter = alloc_start;
305                         while (num_slots) {
306                                 int i;
307                                 dev_dbg(iop_chan->device->common.dev,
308                                         "allocated slot: %d "
309                                         "(desc %p phys: %#llx) slots_per_op %d\n",
310                                         iter->idx, iter->hw_desc,
311                                         (u64)iter->async_tx.phys, slots_per_op);
312
313                                 /* pre-ack all but the last descriptor */
314                                 if (num_slots != slots_per_op)
315                                         async_tx_ack(&iter->async_tx);
316
317                                 list_add_tail(&iter->chain_node, &chain);
318                                 alloc_tail = iter;
319                                 iter->async_tx.cookie = 0;
320                                 iter->slot_cnt = num_slots;
321                                 iter->xor_check_result = NULL;
322                                 for (i = 0; i < slots_per_op; i++) {
323                                         iter->slots_per_op = slots_per_op - i;
324                                         last_used = iter;
325                                         iter = list_entry(iter->slot_node.next,
326                                                 struct iop_adma_desc_slot,
327                                                 slot_node);
328                                 }
329                                 num_slots -= slots_per_op;
330                         }
331                         alloc_tail->group_head = alloc_start;
332                         alloc_tail->async_tx.cookie = -EBUSY;
333                         list_splice(&chain, &alloc_tail->tx_list);
334                         iop_chan->last_used = last_used;
335                         iop_desc_clear_next_desc(alloc_start);
336                         iop_desc_clear_next_desc(alloc_tail);
337                         return alloc_tail;
338                 }
339         }
340         if (!retry++)
341                 goto retry;
342
343         /* perform direct reclaim if the allocation fails */
344         __iop_adma_slot_cleanup(iop_chan);
345
346         return NULL;
347 }
348
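/* flush pending descriptors to hardware once enough have accumulated */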
349 static void iop_adma_check_threshold(struct iop_adma_chan *iop_chan)
350 {
351         dev_dbg(iop_chan->device->common.dev, "pending: %d\n",
352                 iop_chan->pending);
353
354         if (iop_chan->pending >= IOP_ADMA_THRESHOLD) {
355                 iop_chan->pending = 0;
356                 iop_chan_append(iop_chan);
357         }
358 }
359
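/*
 * iop_adma_tx_submit - splice a prepared group onto the channel chain
 *
 * Assigns a cookie, appends the software descriptor list to the channel
 * chain, links the group into the hardware descriptor chain and, once
 * enough work is pending, kicks the engine via iop_adma_check_threshold().
 */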
360 static dma_cookie_t
361 iop_adma_tx_submit(struct dma_async_tx_descriptor *tx)
362 {
363         struct iop_adma_desc_slot *sw_desc = tx_to_iop_adma_slot(tx);
364         struct iop_adma_chan *iop_chan = to_iop_adma_chan(tx->chan);
365         struct iop_adma_desc_slot *grp_start, *old_chain_tail;
366         int slot_cnt;
367         dma_cookie_t cookie;
368         dma_addr_t next_dma;
369
370         grp_start = sw_desc->group_head;
371         slot_cnt = grp_start->slot_cnt;
372
373         spin_lock_bh(&iop_chan->lock);
374         cookie = dma_cookie_assign(tx);
375
376         old_chain_tail = list_entry(iop_chan->chain.prev,
377                 struct iop_adma_desc_slot, chain_node);
378         list_splice_init(&sw_desc->tx_list,
379                          &old_chain_tail->chain_node);
380
381         /* fix up the hardware chain */
382         next_dma = grp_start->async_tx.phys;
383         iop_desc_set_next_desc(old_chain_tail, next_dma);
384         BUG_ON(iop_desc_get_next_desc(old_chain_tail) != next_dma); /* flush */
385
386         /* check for pre-chained descriptors */
387         iop_paranoia(iop_desc_get_next_desc(sw_desc));
388
389         /* increment the pending count by the number of slots;
390          * memcpy operations have a 1:1 (slot:operation) relation,
391          * other operations are heavier and will trip the threshold
392          * more often.
393          */
394         iop_chan->pending += slot_cnt;
395         iop_adma_check_threshold(iop_chan);
396         spin_unlock_bh(&iop_chan->lock);
397
398         dev_dbg(iop_chan->device->common.dev, "%s cookie: %d slot: %d\n",
399                 __func__, sw_desc->async_tx.cookie, sw_desc->idx);
400
401         return cookie;
402 }
403
404 static void iop_chan_start_null_memcpy(struct iop_adma_chan *iop_chan);
405 static void iop_chan_start_null_xor(struct iop_adma_chan *iop_chan);
406
407 /**
408  * iop_adma_alloc_chan_resources - returns the number of allocated descriptors
409  * @chan: allocate descriptor resources for this channel
410  *
411  * Note: We keep the slots for 1 operation on iop_chan->chain at all times.  To
412  * avoid deadlock, via async_xor, num_descs_in_pool must at a minimum be
413  * greater than 2x the number of slots needed to satisfy a device->max_xor
414  * request.
415  */
416 static int iop_adma_alloc_chan_resources(struct dma_chan *chan)
417 {
418         char *hw_desc;
419         int idx;
420         struct iop_adma_chan *iop_chan = to_iop_adma_chan(chan);
421         struct iop_adma_desc_slot *slot = NULL;
422         int init = iop_chan->slots_allocated ? 0 : 1;
423         struct iop_adma_platform_data *plat_data =
424                 dev_get_platdata(&iop_chan->device->pdev->dev);
425         int num_descs_in_pool = plat_data->pool_size/IOP_ADMA_SLOT_SIZE;
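        /* e.g. assuming a 4 KiB pool and 32-byte slots this works out to
         * 128 descriptor slots; the actual values come from platform data
         */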
426
427         /* Allocate descriptor slots */
428         do {
429                 idx = iop_chan->slots_allocated;
430                 if (idx == num_descs_in_pool)
431                         break;
432
433                 slot = kzalloc(sizeof(*slot), GFP_KERNEL);
434                 if (!slot) {
435                         printk(KERN_INFO "IOP ADMA Channel only initialized"
436                                 " %d descriptor slots\n", idx);
437                         break;
438                 }
439                 hw_desc = (char *) iop_chan->device->dma_desc_pool_virt;
440                 slot->hw_desc = (void *) &hw_desc[idx * IOP_ADMA_SLOT_SIZE];
441
442                 dma_async_tx_descriptor_init(&slot->async_tx, chan);
443                 slot->async_tx.tx_submit = iop_adma_tx_submit;
444                 INIT_LIST_HEAD(&slot->tx_list);
445                 INIT_LIST_HEAD(&slot->chain_node);
446                 INIT_LIST_HEAD(&slot->slot_node);
447                 hw_desc = (char *) iop_chan->device->dma_desc_pool;
448                 slot->async_tx.phys =
449                         (dma_addr_t) &hw_desc[idx * IOP_ADMA_SLOT_SIZE];
450                 slot->idx = idx;
451
452                 spin_lock_bh(&iop_chan->lock);
453                 iop_chan->slots_allocated++;
454                 list_add_tail(&slot->slot_node, &iop_chan->all_slots);
455                 spin_unlock_bh(&iop_chan->lock);
456         } while (iop_chan->slots_allocated < num_descs_in_pool);
457
458         if (idx && !iop_chan->last_used)
459                 iop_chan->last_used = list_entry(iop_chan->all_slots.next,
460                                         struct iop_adma_desc_slot,
461                                         slot_node);
462
463         dev_dbg(iop_chan->device->common.dev,
464                 "allocated %d descriptor slots last_used: %p\n",
465                 iop_chan->slots_allocated, iop_chan->last_used);
466
467         /* initialize the channel and the chain with a null operation */
468         if (init) {
469                 if (dma_has_cap(DMA_MEMCPY,
470                         iop_chan->device->common.cap_mask))
471                         iop_chan_start_null_memcpy(iop_chan);
472                 else if (dma_has_cap(DMA_XOR,
473                         iop_chan->device->common.cap_mask))
474                         iop_chan_start_null_xor(iop_chan);
475                 else
476                         BUG();
477         }
478
479         return (idx > 0) ? idx : -ENOMEM;
480 }
481
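/*
 * The prep_dma_* routines below all follow the same pattern: take the
 * channel lock, compute how many descriptor slots the request needs,
 * allocate a slot group, program the group head descriptor with the
 * operation parameters, and return the group tail's async_tx (or NULL if
 * no slots were available).
 */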
482 static struct dma_async_tx_descriptor *
483 iop_adma_prep_dma_interrupt(struct dma_chan *chan, unsigned long flags)
484 {
485         struct iop_adma_chan *iop_chan = to_iop_adma_chan(chan);
486         struct iop_adma_desc_slot *sw_desc, *grp_start;
487         int slot_cnt, slots_per_op;
488
489         dev_dbg(iop_chan->device->common.dev, "%s\n", __func__);
490
491         spin_lock_bh(&iop_chan->lock);
492         slot_cnt = iop_chan_interrupt_slot_count(&slots_per_op, iop_chan);
493         sw_desc = iop_adma_alloc_slots(iop_chan, slot_cnt, slots_per_op);
494         if (sw_desc) {
495                 grp_start = sw_desc->group_head;
496                 iop_desc_init_interrupt(grp_start, iop_chan);
497                 sw_desc->async_tx.flags = flags;
498         }
499         spin_unlock_bh(&iop_chan->lock);
500
501         return sw_desc ? &sw_desc->async_tx : NULL;
502 }
503
504 static struct dma_async_tx_descriptor *
505 iop_adma_prep_dma_memcpy(struct dma_chan *chan, dma_addr_t dma_dest,
506                          dma_addr_t dma_src, size_t len, unsigned long flags)
507 {
508         struct iop_adma_chan *iop_chan = to_iop_adma_chan(chan);
509         struct iop_adma_desc_slot *sw_desc, *grp_start;
510         int slot_cnt, slots_per_op;
511
512         if (unlikely(!len))
513                 return NULL;
514         BUG_ON(len > IOP_ADMA_MAX_BYTE_COUNT);
515
516         dev_dbg(iop_chan->device->common.dev, "%s len: %zu\n",
517                 __func__, len);
518
519         spin_lock_bh(&iop_chan->lock);
520         slot_cnt = iop_chan_memcpy_slot_count(len, &slots_per_op);
521         sw_desc = iop_adma_alloc_slots(iop_chan, slot_cnt, slots_per_op);
522         if (sw_desc) {
523                 grp_start = sw_desc->group_head;
524                 iop_desc_init_memcpy(grp_start, flags);
525                 iop_desc_set_byte_count(grp_start, iop_chan, len);
526                 iop_desc_set_dest_addr(grp_start, iop_chan, dma_dest);
527                 iop_desc_set_memcpy_src_addr(grp_start, dma_src);
528                 sw_desc->async_tx.flags = flags;
529         }
530         spin_unlock_bh(&iop_chan->lock);
531
532         return sw_desc ? &sw_desc->async_tx : NULL;
533 }
534
535 static struct dma_async_tx_descriptor *
536 iop_adma_prep_dma_xor(struct dma_chan *chan, dma_addr_t dma_dest,
537                       dma_addr_t *dma_src, unsigned int src_cnt, size_t len,
538                       unsigned long flags)
539 {
540         struct iop_adma_chan *iop_chan = to_iop_adma_chan(chan);
541         struct iop_adma_desc_slot *sw_desc, *grp_start;
542         int slot_cnt, slots_per_op;
543
544         if (unlikely(!len))
545                 return NULL;
546         BUG_ON(len > IOP_ADMA_XOR_MAX_BYTE_COUNT);
547
548         dev_dbg(iop_chan->device->common.dev,
549                 "%s src_cnt: %d len: %zu flags: %lx\n",
550                 __func__, src_cnt, len, flags);
551
552         spin_lock_bh(&iop_chan->lock);
553         slot_cnt = iop_chan_xor_slot_count(len, src_cnt, &slots_per_op);
554         sw_desc = iop_adma_alloc_slots(iop_chan, slot_cnt, slots_per_op);
555         if (sw_desc) {
556                 grp_start = sw_desc->group_head;
557                 iop_desc_init_xor(grp_start, src_cnt, flags);
558                 iop_desc_set_byte_count(grp_start, iop_chan, len);
559                 iop_desc_set_dest_addr(grp_start, iop_chan, dma_dest);
560                 sw_desc->async_tx.flags = flags;
561                 while (src_cnt--)
562                         iop_desc_set_xor_src_addr(grp_start, src_cnt,
563                                                   dma_src[src_cnt]);
564         }
565         spin_unlock_bh(&iop_chan->lock);
566
567         return sw_desc ? &sw_desc->async_tx : NULL;
568 }
569
570 static struct dma_async_tx_descriptor *
571 iop_adma_prep_dma_xor_val(struct dma_chan *chan, dma_addr_t *dma_src,
572                           unsigned int src_cnt, size_t len, u32 *result,
573                           unsigned long flags)
574 {
575         struct iop_adma_chan *iop_chan = to_iop_adma_chan(chan);
576         struct iop_adma_desc_slot *sw_desc, *grp_start;
577         int slot_cnt, slots_per_op;
578
579         if (unlikely(!len))
580                 return NULL;
581
582         dev_dbg(iop_chan->device->common.dev, "%s src_cnt: %d len: %zu\n",
583                 __func__, src_cnt, len);
584
585         spin_lock_bh(&iop_chan->lock);
586         slot_cnt = iop_chan_zero_sum_slot_count(len, src_cnt, &slots_per_op);
587         sw_desc = iop_adma_alloc_slots(iop_chan, slot_cnt, slots_per_op);
588         if (sw_desc) {
589                 grp_start = sw_desc->group_head;
590                 iop_desc_init_zero_sum(grp_start, src_cnt, flags);
591                 iop_desc_set_zero_sum_byte_count(grp_start, len);
592                 grp_start->xor_check_result = result;
593                 pr_debug("\t%s: grp_start->xor_check_result: %p\n",
594                         __func__, grp_start->xor_check_result);
595                 sw_desc->async_tx.flags = flags;
596                 while (src_cnt--)
597                         iop_desc_set_zero_sum_src_addr(grp_start, src_cnt,
598                                                        dma_src[src_cnt]);
599         }
600         spin_unlock_bh(&iop_chan->lock);
601
602         return sw_desc ? &sw_desc->async_tx : NULL;
603 }
604
605 static struct dma_async_tx_descriptor *
606 iop_adma_prep_dma_pq(struct dma_chan *chan, dma_addr_t *dst, dma_addr_t *src,
607                      unsigned int src_cnt, const unsigned char *scf, size_t len,
608                      unsigned long flags)
609 {
610         struct iop_adma_chan *iop_chan = to_iop_adma_chan(chan);
611         struct iop_adma_desc_slot *sw_desc, *g;
612         int slot_cnt, slots_per_op;
613         int continue_srcs;
614
615         if (unlikely(!len))
616                 return NULL;
617         BUG_ON(len > IOP_ADMA_XOR_MAX_BYTE_COUNT);
618
619         dev_dbg(iop_chan->device->common.dev,
620                 "%s src_cnt: %d len: %zu flags: %lx\n",
621                 __func__, src_cnt, len, flags);
622
623         if (dmaf_p_disabled_continue(flags))
624                 continue_srcs = 1+src_cnt;
625         else if (dmaf_continue(flags))
626                 continue_srcs = 3+src_cnt;
627         else
628                 continue_srcs = 0+src_cnt;
629
630         spin_lock_bh(&iop_chan->lock);
631         slot_cnt = iop_chan_pq_slot_count(len, continue_srcs, &slots_per_op);
632         sw_desc = iop_adma_alloc_slots(iop_chan, slot_cnt, slots_per_op);
633         if (sw_desc) {
634                 int i;
635
636                 g = sw_desc->group_head;
637                 iop_desc_set_byte_count(g, iop_chan, len);
638
639                 /* even if P is disabled its destination address (bits
640                  * [3:0]) must match Q.  It is ok if P points to an
641                  * invalid address, it won't be written.
642                  */
643                 if (flags & DMA_PREP_PQ_DISABLE_P)
644                         dst[0] = dst[1] & 0x7;
645
646                 iop_desc_set_pq_addr(g, dst);
647                 sw_desc->async_tx.flags = flags;
648                 for (i = 0; i < src_cnt; i++)
649                         iop_desc_set_pq_src_addr(g, i, src[i], scf[i]);
650
651                 /* if we are continuing a previous operation factor in
652                  * the old p and q values, see the comment for dma_maxpq
653                  * in include/linux/dmaengine.h
654                  */
655                 if (dmaf_p_disabled_continue(flags))
656                         iop_desc_set_pq_src_addr(g, i++, dst[1], 1);
657                 else if (dmaf_continue(flags)) {
658                         iop_desc_set_pq_src_addr(g, i++, dst[0], 0);
659                         iop_desc_set_pq_src_addr(g, i++, dst[1], 1);
660                         iop_desc_set_pq_src_addr(g, i++, dst[1], 0);
661                 }
662                 iop_desc_init_pq(g, i, flags);
663         }
664         spin_unlock_bh(&iop_chan->lock);
665
666         return sw_desc ? &sw_desc->async_tx : NULL;
667 }
668
669 static struct dma_async_tx_descriptor *
670 iop_adma_prep_dma_pq_val(struct dma_chan *chan, dma_addr_t *pq, dma_addr_t *src,
671                          unsigned int src_cnt, const unsigned char *scf,
672                          size_t len, enum sum_check_flags *pqres,
673                          unsigned long flags)
674 {
675         struct iop_adma_chan *iop_chan = to_iop_adma_chan(chan);
676         struct iop_adma_desc_slot *sw_desc, *g;
677         int slot_cnt, slots_per_op;
678
679         if (unlikely(!len))
680                 return NULL;
681         BUG_ON(len > IOP_ADMA_XOR_MAX_BYTE_COUNT);
682
683         dev_dbg(iop_chan->device->common.dev, "%s src_cnt: %d len: %zu\n",
684                 __func__, src_cnt, len);
685
686         spin_lock_bh(&iop_chan->lock);
687         slot_cnt = iop_chan_pq_zero_sum_slot_count(len, src_cnt + 2, &slots_per_op);
688         sw_desc = iop_adma_alloc_slots(iop_chan, slot_cnt, slots_per_op);
689         if (sw_desc) {
690                 /* for validate operations p and q are tagged onto the
691                  * end of the source list
692                  */
693                 int pq_idx = src_cnt;
694
695                 g = sw_desc->group_head;
696                 iop_desc_init_pq_zero_sum(g, src_cnt+2, flags);
697                 iop_desc_set_pq_zero_sum_byte_count(g, len);
698                 g->pq_check_result = pqres;
699                 pr_debug("\t%s: g->pq_check_result: %p\n",
700                         __func__, g->pq_check_result);
701                 sw_desc->async_tx.flags = flags;
702                 while (src_cnt--)
703                         iop_desc_set_pq_zero_sum_src_addr(g, src_cnt,
704                                                           src[src_cnt],
705                                                           scf[src_cnt]);
706                 iop_desc_set_pq_zero_sum_addr(g, pq_idx, src);
707         }
708         spin_unlock_bh(&iop_chan->lock);
709
710         return sw_desc ? &sw_desc->async_tx : NULL;
711 }
712
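/* release every descriptor slot back to the allocator; completed work is
 * reaped first and an error is logged if descriptors were still in use
 */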
713 static void iop_adma_free_chan_resources(struct dma_chan *chan)
714 {
715         struct iop_adma_chan *iop_chan = to_iop_adma_chan(chan);
716         struct iop_adma_desc_slot *iter, *_iter;
717         int in_use_descs = 0;
718
719         iop_adma_slot_cleanup(iop_chan);
720
721         spin_lock_bh(&iop_chan->lock);
722         list_for_each_entry_safe(iter, _iter, &iop_chan->chain,
723                                         chain_node) {
724                 in_use_descs++;
725                 list_del(&iter->chain_node);
726         }
727         list_for_each_entry_safe_reverse(
728                 iter, _iter, &iop_chan->all_slots, slot_node) {
729                 list_del(&iter->slot_node);
730                 kfree(iter);
731                 iop_chan->slots_allocated--;
732         }
733         iop_chan->last_used = NULL;
734
735         dev_dbg(iop_chan->device->common.dev, "%s slots_allocated %d\n",
736                 __func__, iop_chan->slots_allocated);
737         spin_unlock_bh(&iop_chan->lock);
738
739         /* one is ok since we left it there on purpose */
740         if (in_use_descs > 1)
741                 printk(KERN_ERR "IOP: Freeing %d in use descriptors!\n",
742                         in_use_descs - 1);
743 }
744
745 /**
746  * iop_adma_status - poll the status of an ADMA transaction
747  * @chan: ADMA channel handle
748  * @cookie: ADMA transaction identifier
749  * @txstate: a holder for the current state of the channel or NULL
750  */
751 static enum dma_status iop_adma_status(struct dma_chan *chan,
752                                         dma_cookie_t cookie,
753                                         struct dma_tx_state *txstate)
754 {
755         struct iop_adma_chan *iop_chan = to_iop_adma_chan(chan);
756         int ret;
757
758         ret = dma_cookie_status(chan, cookie, txstate);
759         if (ret == DMA_COMPLETE)
760                 return ret;
761
762         iop_adma_slot_cleanup(iop_chan);
763
764         return dma_cookie_status(chan, cookie, txstate);
765 }
766
767 static irqreturn_t iop_adma_eot_handler(int irq, void *data)
768 {
769         struct iop_adma_chan *chan = data;
770
771         dev_dbg(chan->device->common.dev, "%s\n", __func__);
772
773         tasklet_schedule(&chan->irq_tasklet);
774
775         iop_adma_device_clear_eot_status(chan);
776
777         return IRQ_HANDLED;
778 }
779
780 static irqreturn_t iop_adma_eoc_handler(int irq, void *data)
781 {
782         struct iop_adma_chan *chan = data;
783
784         dev_dbg(chan->device->common.dev, "%s\n", __func__);
785
786         tasklet_schedule(&chan->irq_tasklet);
787
788         iop_adma_device_clear_eoc_status(chan);
789
790         return IRQ_HANDLED;
791 }
792
793 static irqreturn_t iop_adma_err_handler(int irq, void *data)
794 {
795         struct iop_adma_chan *chan = data;
796         unsigned long status = iop_chan_get_status(chan);
797
798         dev_err(chan->device->common.dev,
799                 "error ( %s%s%s%s%s%s%s)\n",
800                 iop_is_err_int_parity(status, chan) ? "int_parity " : "",
801                 iop_is_err_mcu_abort(status, chan) ? "mcu_abort " : "",
802                 iop_is_err_int_tabort(status, chan) ? "int_tabort " : "",
803                 iop_is_err_int_mabort(status, chan) ? "int_mabort " : "",
804                 iop_is_err_pci_tabort(status, chan) ? "pci_tabort " : "",
805                 iop_is_err_pci_mabort(status, chan) ? "pci_mabort " : "",
806                 iop_is_err_split_tx(status, chan) ? "split_tx " : "");
807
808         iop_adma_device_clear_err_status(chan);
809
810         BUG();
811
812         return IRQ_HANDLED;
813 }
814
815 static void iop_adma_issue_pending(struct dma_chan *chan)
816 {
817         struct iop_adma_chan *iop_chan = to_iop_adma_chan(chan);
818
819         if (iop_chan->pending) {
820                 iop_chan->pending = 0;
821                 iop_chan_append(iop_chan);
822         }
823 }
824
825 /*
826  * Perform a transaction to verify the HW works.
827  */
828 #define IOP_ADMA_TEST_SIZE 2000
829
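/*
 * The self-tests below are run from iop_adma_probe() before the device is
 * registered with the dmaengine core; any failure aborts the probe.
 */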
830 static int iop_adma_memcpy_self_test(struct iop_adma_device *device)
831 {
832         int i;
833         void *src, *dest;
834         dma_addr_t src_dma, dest_dma;
835         struct dma_chan *dma_chan;
836         dma_cookie_t cookie;
837         struct dma_async_tx_descriptor *tx;
838         int err = 0;
839         struct iop_adma_chan *iop_chan;
840
841         dev_dbg(device->common.dev, "%s\n", __func__);
842
843         src = kmalloc(IOP_ADMA_TEST_SIZE, GFP_KERNEL);
844         if (!src)
845                 return -ENOMEM;
846         dest = kzalloc(IOP_ADMA_TEST_SIZE, GFP_KERNEL);
847         if (!dest) {
848                 kfree(src);
849                 return -ENOMEM;
850         }
851
852         /* Fill in src buffer */
853         for (i = 0; i < IOP_ADMA_TEST_SIZE; i++)
854                 ((u8 *) src)[i] = (u8)i;
855
856         /* Start copy, using first DMA channel */
857         dma_chan = container_of(device->common.channels.next,
858                                 struct dma_chan,
859                                 device_node);
860         if (iop_adma_alloc_chan_resources(dma_chan) < 1) {
861                 err = -ENODEV;
862                 goto out;
863         }
864
865         dest_dma = dma_map_single(dma_chan->device->dev, dest,
866                                 IOP_ADMA_TEST_SIZE, DMA_FROM_DEVICE);
867         src_dma = dma_map_single(dma_chan->device->dev, src,
868                                 IOP_ADMA_TEST_SIZE, DMA_TO_DEVICE);
869         tx = iop_adma_prep_dma_memcpy(dma_chan, dest_dma, src_dma,
870                                       IOP_ADMA_TEST_SIZE,
871                                       DMA_PREP_INTERRUPT | DMA_CTRL_ACK);
872
873         cookie = iop_adma_tx_submit(tx);
874         iop_adma_issue_pending(dma_chan);
875         msleep(1);
876
877         if (iop_adma_status(dma_chan, cookie, NULL) !=
878                         DMA_COMPLETE) {
879                 dev_err(dma_chan->device->dev,
880                         "Self-test copy timed out, disabling\n");
881                 err = -ENODEV;
882                 goto free_resources;
883         }
884
885         iop_chan = to_iop_adma_chan(dma_chan);
886         dma_sync_single_for_cpu(&iop_chan->device->pdev->dev, dest_dma,
887                 IOP_ADMA_TEST_SIZE, DMA_FROM_DEVICE);
888         if (memcmp(src, dest, IOP_ADMA_TEST_SIZE)) {
889                 dev_err(dma_chan->device->dev,
890                         "Self-test copy failed compare, disabling\n");
891                 err = -ENODEV;
892                 goto free_resources;
893         }
894
895 free_resources:
896         iop_adma_free_chan_resources(dma_chan);
897 out:
898         kfree(src);
899         kfree(dest);
900         return err;
901 }
902
903 #define IOP_ADMA_NUM_SRC_TEST 4 /* must be <= 15 */
904 static int
905 iop_adma_xor_val_self_test(struct iop_adma_device *device)
906 {
907         int i, src_idx;
908         struct page *dest;
909         struct page *xor_srcs[IOP_ADMA_NUM_SRC_TEST];
910         struct page *zero_sum_srcs[IOP_ADMA_NUM_SRC_TEST + 1];
911         dma_addr_t dma_srcs[IOP_ADMA_NUM_SRC_TEST + 1];
912         dma_addr_t dest_dma;
913         struct dma_async_tx_descriptor *tx;
914         struct dma_chan *dma_chan;
915         dma_cookie_t cookie;
916         u8 cmp_byte = 0;
917         u32 cmp_word;
918         u32 zero_sum_result;
919         int err = 0;
920         struct iop_adma_chan *iop_chan;
921
922         dev_dbg(device->common.dev, "%s\n", __func__);
923
924         for (src_idx = 0; src_idx < IOP_ADMA_NUM_SRC_TEST; src_idx++) {
925                 xor_srcs[src_idx] = alloc_page(GFP_KERNEL);
926                 if (!xor_srcs[src_idx]) {
927                         while (src_idx--)
928                                 __free_page(xor_srcs[src_idx]);
929                         return -ENOMEM;
930                 }
931         }
932
933         dest = alloc_page(GFP_KERNEL);
934         if (!dest) {
935                 while (src_idx--)
936                         __free_page(xor_srcs[src_idx]);
937                 return -ENOMEM;
938         }
939
940         /* Fill in src buffers */
941         for (src_idx = 0; src_idx < IOP_ADMA_NUM_SRC_TEST; src_idx++) {
942                 u8 *ptr = page_address(xor_srcs[src_idx]);
943                 for (i = 0; i < PAGE_SIZE; i++)
944                         ptr[i] = (1 << src_idx);
945         }
946
947         for (src_idx = 0; src_idx < IOP_ADMA_NUM_SRC_TEST; src_idx++)
948                 cmp_byte ^= (u8) (1 << src_idx);
949
950         cmp_word = (cmp_byte << 24) | (cmp_byte << 16) |
951                         (cmp_byte << 8) | cmp_byte;
952
953         memset(page_address(dest), 0, PAGE_SIZE);
954
955         dma_chan = container_of(device->common.channels.next,
956                                 struct dma_chan,
957                                 device_node);
958         if (iop_adma_alloc_chan_resources(dma_chan) < 1) {
959                 err = -ENODEV;
960                 goto out;
961         }
962
963         /* test xor */
964         dest_dma = dma_map_page(dma_chan->device->dev, dest, 0,
965                                 PAGE_SIZE, DMA_FROM_DEVICE);
966         for (i = 0; i < IOP_ADMA_NUM_SRC_TEST; i++)
967                 dma_srcs[i] = dma_map_page(dma_chan->device->dev, xor_srcs[i],
968                                            0, PAGE_SIZE, DMA_TO_DEVICE);
969         tx = iop_adma_prep_dma_xor(dma_chan, dest_dma, dma_srcs,
970                                    IOP_ADMA_NUM_SRC_TEST, PAGE_SIZE,
971                                    DMA_PREP_INTERRUPT | DMA_CTRL_ACK);
972
973         cookie = iop_adma_tx_submit(tx);
974         iop_adma_issue_pending(dma_chan);
975         msleep(8);
976
977         if (iop_adma_status(dma_chan, cookie, NULL) !=
978                 DMA_COMPLETE) {
979                 dev_err(dma_chan->device->dev,
980                         "Self-test xor timed out, disabling\n");
981                 err = -ENODEV;
982                 goto free_resources;
983         }
984
985         iop_chan = to_iop_adma_chan(dma_chan);
986         dma_sync_single_for_cpu(&iop_chan->device->pdev->dev, dest_dma,
987                 PAGE_SIZE, DMA_FROM_DEVICE);
988         for (i = 0; i < (PAGE_SIZE / sizeof(u32)); i++) {
989                 u32 *ptr = page_address(dest);
990                 if (ptr[i] != cmp_word) {
991                         dev_err(dma_chan->device->dev,
992                                 "Self-test xor failed compare, disabling\n");
993                         err = -ENODEV;
994                         goto free_resources;
995                 }
996         }
997         dma_sync_single_for_device(&iop_chan->device->pdev->dev, dest_dma,
998                 PAGE_SIZE, DMA_TO_DEVICE);
999
1000         /* skip zero sum if the capability is not present */
1001         if (!dma_has_cap(DMA_XOR_VAL, dma_chan->device->cap_mask))
1002                 goto free_resources;
1003
1004         /* zero sum the sources with the destination page */
1005         for (i = 0; i < IOP_ADMA_NUM_SRC_TEST; i++)
1006                 zero_sum_srcs[i] = xor_srcs[i];
1007         zero_sum_srcs[i] = dest;
1008
1009         zero_sum_result = 1;
1010
1011         for (i = 0; i < IOP_ADMA_NUM_SRC_TEST + 1; i++)
1012                 dma_srcs[i] = dma_map_page(dma_chan->device->dev,
1013                                            zero_sum_srcs[i], 0, PAGE_SIZE,
1014                                            DMA_TO_DEVICE);
1015         tx = iop_adma_prep_dma_xor_val(dma_chan, dma_srcs,
1016                                        IOP_ADMA_NUM_SRC_TEST + 1, PAGE_SIZE,
1017                                        &zero_sum_result,
1018                                        DMA_PREP_INTERRUPT | DMA_CTRL_ACK);
1019
1020         cookie = iop_adma_tx_submit(tx);
1021         iop_adma_issue_pending(dma_chan);
1022         msleep(8);
1023
1024         if (iop_adma_status(dma_chan, cookie, NULL) != DMA_COMPLETE) {
1025                 dev_err(dma_chan->device->dev,
1026                         "Self-test zero sum timed out, disabling\n");
1027                 err = -ENODEV;
1028                 goto free_resources;
1029         }
1030
1031         if (zero_sum_result != 0) {
1032                 dev_err(dma_chan->device->dev,
1033                         "Self-test zero sum failed compare, disabling\n");
1034                 err = -ENODEV;
1035                 goto free_resources;
1036         }
1037
1038         /* test for non-zero parity sum */
1039         zero_sum_result = 0;
1040         for (i = 0; i < IOP_ADMA_NUM_SRC_TEST + 1; i++)
1041                 dma_srcs[i] = dma_map_page(dma_chan->device->dev,
1042                                            zero_sum_srcs[i], 0, PAGE_SIZE,
1043                                            DMA_TO_DEVICE);
1044         tx = iop_adma_prep_dma_xor_val(dma_chan, dma_srcs,
1045                                        IOP_ADMA_NUM_SRC_TEST + 1, PAGE_SIZE,
1046                                        &zero_sum_result,
1047                                        DMA_PREP_INTERRUPT | DMA_CTRL_ACK);
1048
1049         cookie = iop_adma_tx_submit(tx);
1050         iop_adma_issue_pending(dma_chan);
1051         msleep(8);
1052
1053         if (iop_adma_status(dma_chan, cookie, NULL) != DMA_COMPLETE) {
1054                 dev_err(dma_chan->device->dev,
1055                         "Self-test non-zero sum timed out, disabling\n");
1056                 err = -ENODEV;
1057                 goto free_resources;
1058         }
1059
1060         if (zero_sum_result != 1) {
1061                 dev_err(dma_chan->device->dev,
1062                         "Self-test non-zero sum failed compare, disabling\n");
1063                 err = -ENODEV;
1064                 goto free_resources;
1065         }
1066
1067 free_resources:
1068         iop_adma_free_chan_resources(dma_chan);
1069 out:
1070         src_idx = IOP_ADMA_NUM_SRC_TEST;
1071         while (src_idx--)
1072                 __free_page(xor_srcs[src_idx]);
1073         __free_page(dest);
1074         return err;
1075 }
1076
1077 #ifdef CONFIG_RAID6_PQ
1078 static int
1079 iop_adma_pq_zero_sum_self_test(struct iop_adma_device *device)
1080 {
1081         /* combined sources, software pq results, and extra hw pq results */
1082         struct page *pq[IOP_ADMA_NUM_SRC_TEST+2+2];
1083         /* ptr to the extra hw pq buffers defined above */
1084         struct page **pq_hw = &pq[IOP_ADMA_NUM_SRC_TEST+2];
1085         /* address conversion buffers (dma_map / page_address) */
1086         void *pq_sw[IOP_ADMA_NUM_SRC_TEST+2];
1087         dma_addr_t pq_src[IOP_ADMA_NUM_SRC_TEST+2];
1088         dma_addr_t *pq_dest = &pq_src[IOP_ADMA_NUM_SRC_TEST];
1089
1090         int i;
1091         struct dma_async_tx_descriptor *tx;
1092         struct dma_chan *dma_chan;
1093         dma_cookie_t cookie;
1094         u32 zero_sum_result;
1095         int err = 0;
1096         struct device *dev;
1097
1098         dev_dbg(device->common.dev, "%s\n", __func__);
1099
1100         for (i = 0; i < ARRAY_SIZE(pq); i++) {
1101                 pq[i] = alloc_page(GFP_KERNEL);
1102                 if (!pq[i]) {
1103                         while (i--)
1104                                 __free_page(pq[i]);
1105                         return -ENOMEM;
1106                 }
1107         }
1108
1109         /* Fill in src buffers */
1110         for (i = 0; i < IOP_ADMA_NUM_SRC_TEST; i++) {
1111                 pq_sw[i] = page_address(pq[i]);
1112                 memset(pq_sw[i], 0x11111111 * (1<<i), PAGE_SIZE);
1113         }
1114         pq_sw[i] = page_address(pq[i]);
1115         pq_sw[i+1] = page_address(pq[i+1]);
1116
1117         dma_chan = container_of(device->common.channels.next,
1118                                 struct dma_chan,
1119                                 device_node);
1120         if (iop_adma_alloc_chan_resources(dma_chan) < 1) {
1121                 err = -ENODEV;
1122                 goto out;
1123         }
1124
1125         dev = dma_chan->device->dev;
1126
1127         /* initialize the dests */
1128         memset(page_address(pq_hw[0]), 0, PAGE_SIZE);
1129         memset(page_address(pq_hw[1]), 0, PAGE_SIZE);
1130
1131         /* test pq */
1132         pq_dest[0] = dma_map_page(dev, pq_hw[0], 0, PAGE_SIZE, DMA_FROM_DEVICE);
1133         pq_dest[1] = dma_map_page(dev, pq_hw[1], 0, PAGE_SIZE, DMA_FROM_DEVICE);
1134         for (i = 0; i < IOP_ADMA_NUM_SRC_TEST; i++)
1135                 pq_src[i] = dma_map_page(dev, pq[i], 0, PAGE_SIZE,
1136                                          DMA_TO_DEVICE);
1137
1138         tx = iop_adma_prep_dma_pq(dma_chan, pq_dest, pq_src,
1139                                   IOP_ADMA_NUM_SRC_TEST, (u8 *)raid6_gfexp,
1140                                   PAGE_SIZE,
1141                                   DMA_PREP_INTERRUPT |
1142                                   DMA_CTRL_ACK);
1143
1144         cookie = iop_adma_tx_submit(tx);
1145         iop_adma_issue_pending(dma_chan);
1146         msleep(8);
1147
1148         if (iop_adma_status(dma_chan, cookie, NULL) !=
1149                 DMA_COMPLETE) {
1150                 dev_err(dev, "Self-test pq timed out, disabling\n");
1151                 err = -ENODEV;
1152                 goto free_resources;
1153         }
1154
1155         raid6_call.gen_syndrome(IOP_ADMA_NUM_SRC_TEST+2, PAGE_SIZE, pq_sw);
1156
1157         if (memcmp(pq_sw[IOP_ADMA_NUM_SRC_TEST],
1158                    page_address(pq_hw[0]), PAGE_SIZE) != 0) {
1159                 dev_err(dev, "Self-test p failed compare, disabling\n");
1160                 err = -ENODEV;
1161                 goto free_resources;
1162         }
1163         if (memcmp(pq_sw[IOP_ADMA_NUM_SRC_TEST+1],
1164                    page_address(pq_hw[1]), PAGE_SIZE) != 0) {
1165                 dev_err(dev, "Self-test q failed compare, disabling\n");
1166                 err = -ENODEV;
1167                 goto free_resources;
1168         }
1169
1170         /* test correct zero sum using the software generated pq values */
1171         for (i = 0; i < IOP_ADMA_NUM_SRC_TEST + 2; i++)
1172                 pq_src[i] = dma_map_page(dev, pq[i], 0, PAGE_SIZE,
1173                                          DMA_TO_DEVICE);
1174
1175         zero_sum_result = ~0;
1176         tx = iop_adma_prep_dma_pq_val(dma_chan, &pq_src[IOP_ADMA_NUM_SRC_TEST],
1177                                       pq_src, IOP_ADMA_NUM_SRC_TEST,
1178                                       raid6_gfexp, PAGE_SIZE, &zero_sum_result,
1179                                       DMA_PREP_INTERRUPT|DMA_CTRL_ACK);
1180
1181         cookie = iop_adma_tx_submit(tx);
1182         iop_adma_issue_pending(dma_chan);
1183         msleep(8);
1184
1185         if (iop_adma_status(dma_chan, cookie, NULL) !=
1186                 DMA_COMPLETE) {
1187                 dev_err(dev, "Self-test pq-zero-sum timed out, disabling\n");
1188                 err = -ENODEV;
1189                 goto free_resources;
1190         }
1191
1192         if (zero_sum_result != 0) {
1193                 dev_err(dev, "Self-test pq-zero-sum failed to validate: %x\n",
1194                         zero_sum_result);
1195                 err = -ENODEV;
1196                 goto free_resources;
1197         }
1198
1199         /* test incorrect zero sum */
1200         i = IOP_ADMA_NUM_SRC_TEST;
1201         memset(pq_sw[i] + 100, 0, 100);
1202         memset(pq_sw[i+1] + 200, 0, 200);
1203         for (i = 0; i < IOP_ADMA_NUM_SRC_TEST + 2; i++)
1204                 pq_src[i] = dma_map_page(dev, pq[i], 0, PAGE_SIZE,
1205                                          DMA_TO_DEVICE);
1206
1207         zero_sum_result = 0;
1208         tx = iop_adma_prep_dma_pq_val(dma_chan, &pq_src[IOP_ADMA_NUM_SRC_TEST],
1209                                       pq_src, IOP_ADMA_NUM_SRC_TEST,
1210                                       raid6_gfexp, PAGE_SIZE, &zero_sum_result,
1211                                       DMA_PREP_INTERRUPT|DMA_CTRL_ACK);
1212
1213         cookie = iop_adma_tx_submit(tx);
1214         iop_adma_issue_pending(dma_chan);
1215         msleep(8);
1216
1217         if (iop_adma_status(dma_chan, cookie, NULL) !=
1218                 DMA_COMPLETE) {
1219                 dev_err(dev, "Self-test !pq-zero-sum timed out, disabling\n");
1220                 err = -ENODEV;
1221                 goto free_resources;
1222         }
1223
1224         if (zero_sum_result != (SUM_CHECK_P_RESULT | SUM_CHECK_Q_RESULT)) {
1225                 dev_err(dev, "Self-test !pq-zero-sum failed to validate: %x\n",
1226                         zero_sum_result);
1227                 err = -ENODEV;
1228                 goto free_resources;
1229         }
1230
1231 free_resources:
1232         iop_adma_free_chan_resources(dma_chan);
1233 out:
1234         i = ARRAY_SIZE(pq);
1235         while (i--)
1236                 __free_page(pq[i]);
1237         return err;
1238 }
1239 #endif
1240
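/* tear down: unregister the dmaengine device, free the descriptor pool and
 * release the per-channel state
 */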
1241 static int iop_adma_remove(struct platform_device *dev)
1242 {
1243         struct iop_adma_device *device = platform_get_drvdata(dev);
1244         struct dma_chan *chan, *_chan;
1245         struct iop_adma_chan *iop_chan;
1246         struct iop_adma_platform_data *plat_data = dev_get_platdata(&dev->dev);
1247
1248         dma_async_device_unregister(&device->common);
1249
1250         dma_free_coherent(&dev->dev, plat_data->pool_size,
1251                         device->dma_desc_pool_virt, device->dma_desc_pool);
1252
1253         list_for_each_entry_safe(chan, _chan, &device->common.channels,
1254                                 device_node) {
1255                 iop_chan = to_iop_adma_chan(chan);
1256                 list_del(&chan->device_node);
1257                 kfree(iop_chan);
1258         }
1259         kfree(device);
1260
1261         return 0;
1262 }
1263
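/*
 * iop_adma_probe - set up one ADMA channel
 *
 * Maps the engine's MMIO region, allocates a coherent descriptor pool,
 * wires up the prep routines advertised by the platform data, requests the
 * EOT, EOC and error interrupts, runs the self-tests for the advertised
 * capabilities and finally registers the channel with the dmaengine core.
 */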
1264 static int iop_adma_probe(struct platform_device *pdev)
1265 {
1266         struct resource *res;
1267         int ret = 0, i;
1268         struct iop_adma_device *adev;
1269         struct iop_adma_chan *iop_chan;
1270         struct dma_device *dma_dev;
1271         struct iop_adma_platform_data *plat_data = dev_get_platdata(&pdev->dev);
1272
1273         res = platform_get_resource(pdev, IORESOURCE_MEM, 0);
1274         if (!res)
1275                 return -ENODEV;
1276
1277         if (!devm_request_mem_region(&pdev->dev, res->start,
1278                                 resource_size(res), pdev->name))
1279                 return -EBUSY;
1280
1281         adev = kzalloc(sizeof(*adev), GFP_KERNEL);
1282         if (!adev)
1283                 return -ENOMEM;
1284         dma_dev = &adev->common;
1285
1286         /* allocate coherent memory for hardware descriptors
1287          * note: writecombine gives slightly better performance, but
1288          * requires that we explicitly flush the writes
1289          */
1290         adev->dma_desc_pool_virt = dma_alloc_wc(&pdev->dev,
1291                                                 plat_data->pool_size,
1292                                                 &adev->dma_desc_pool,
1293                                                 GFP_KERNEL);
1294         if (!adev->dma_desc_pool_virt) {
1295                 ret = -ENOMEM;
1296                 goto err_free_adev;
1297         }
1298
1299         dev_dbg(&pdev->dev, "%s: allocated descriptor pool virt %p phys %p\n",
1300                 __func__, adev->dma_desc_pool_virt,
1301                 (void *) adev->dma_desc_pool);
1302
1303         adev->id = plat_data->hw_id;
1304
1305         /* discover transaction capabilities from the platform data */
1306         dma_dev->cap_mask = plat_data->cap_mask;
1307
1308         adev->pdev = pdev;
1309         platform_set_drvdata(pdev, adev);
1310
1311         INIT_LIST_HEAD(&dma_dev->channels);
1312
1313         /* set base routines */
1314         dma_dev->device_alloc_chan_resources = iop_adma_alloc_chan_resources;
1315         dma_dev->device_free_chan_resources = iop_adma_free_chan_resources;
1316         dma_dev->device_tx_status = iop_adma_status;
1317         dma_dev->device_issue_pending = iop_adma_issue_pending;
1318         dma_dev->dev = &pdev->dev;
1319
1320         /* set prep routines based on capability */
1321         if (dma_has_cap(DMA_MEMCPY, dma_dev->cap_mask))
1322                 dma_dev->device_prep_dma_memcpy = iop_adma_prep_dma_memcpy;
1323         if (dma_has_cap(DMA_XOR, dma_dev->cap_mask)) {
1324                 dma_dev->max_xor = iop_adma_get_max_xor();
1325                 dma_dev->device_prep_dma_xor = iop_adma_prep_dma_xor;
1326         }
1327         if (dma_has_cap(DMA_XOR_VAL, dma_dev->cap_mask))
1328                 dma_dev->device_prep_dma_xor_val =
1329                         iop_adma_prep_dma_xor_val;
1330         if (dma_has_cap(DMA_PQ, dma_dev->cap_mask)) {
1331                 dma_set_maxpq(dma_dev, iop_adma_get_max_pq(), 0);
1332                 dma_dev->device_prep_dma_pq = iop_adma_prep_dma_pq;
1333         }
1334         if (dma_has_cap(DMA_PQ_VAL, dma_dev->cap_mask))
1335                 dma_dev->device_prep_dma_pq_val =
1336                         iop_adma_prep_dma_pq_val;
1337         if (dma_has_cap(DMA_INTERRUPT, dma_dev->cap_mask))
1338                 dma_dev->device_prep_dma_interrupt =
1339                         iop_adma_prep_dma_interrupt;
1340
1341         iop_chan = kzalloc(sizeof(*iop_chan), GFP_KERNEL);
1342         if (!iop_chan) {
1343                 ret = -ENOMEM;
1344                 goto err_free_dma;
1345         }
1346         iop_chan->device = adev;
1347
1348         iop_chan->mmr_base = devm_ioremap(&pdev->dev, res->start,
1349                                         resource_size(res));
1350         if (!iop_chan->mmr_base) {
1351                 ret = -ENOMEM;
1352                 goto err_free_iop_chan;
1353         }
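        /*
         * Descriptor cleanup runs from this tasklet in softirq context;
         * it is scheduled by the end-of-transfer/end-of-chain interrupt
         * handlers requested below.
         */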
1354         tasklet_init(&iop_chan->irq_tasklet, iop_adma_tasklet,
1355                      (unsigned long)iop_chan);
1356
1357         /* clear errors before enabling interrupts */
1358         iop_adma_device_clear_err_status(iop_chan);
1359
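        /*
         * Three IRQs are expected from the platform device, in the same
         * order as the handler[] table: end-of-transfer, end-of-chain
         * and error.
         */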
1360         for (i = 0; i < 3; i++) {
1361                 static const irq_handler_t handler[] = {
1362                         iop_adma_eot_handler,
1363                         iop_adma_eoc_handler,
1364                         iop_adma_err_handler
1365                 };
1366                 int irq = platform_get_irq(pdev, i);
1367                 if (irq < 0) {
1368                         ret = -ENXIO;
1369                         goto err_free_iop_chan;
1370                 } else {
1371                         ret = devm_request_irq(&pdev->dev, irq,
1372                                         handler[i], 0, pdev->name, iop_chan);
1373                         if (ret)
1374                                 goto err_free_iop_chan;
1375                 }
1376         }
1377
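        /* set up the channel's software state and add it to the device's channel list */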
1378         spin_lock_init(&iop_chan->lock);
1379         INIT_LIST_HEAD(&iop_chan->chain);
1380         INIT_LIST_HEAD(&iop_chan->all_slots);
1381         iop_chan->common.device = dma_dev;
1382         dma_cookie_init(&iop_chan->common);
1383         list_add_tail(&iop_chan->common.device_node, &dma_dev->channels);
1384
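        /*
         * Sanity-check the major capabilities (memcpy, xor, pq) with quick
         * self tests before registering the device; any failure aborts the
         * probe.
         */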
1385         if (dma_has_cap(DMA_MEMCPY, dma_dev->cap_mask)) {
1386                 ret = iop_adma_memcpy_self_test(adev);
1387                 dev_dbg(&pdev->dev, "memcpy self test returned %d\n", ret);
1388                 if (ret)
1389                         goto err_free_iop_chan;
1390         }
1391
1392         if (dma_has_cap(DMA_XOR, dma_dev->cap_mask)) {
1393                 ret = iop_adma_xor_val_self_test(adev);
1394                 dev_dbg(&pdev->dev, "xor self test returned %d\n", ret);
1395                 if (ret)
1396                         goto err_free_iop_chan;
1397         }
1398
1399         if (dma_has_cap(DMA_PQ, dma_dev->cap_mask) &&
1400             dma_has_cap(DMA_PQ_VAL, dma_dev->cap_mask)) {
1401                 #ifdef CONFIG_RAID6_PQ
1402                 ret = iop_adma_pq_zero_sum_self_test(adev);
1403                 dev_dbg(&pdev->dev, "pq self test returned %d\n", ret);
1404                 #else
1405                 /* cannot test raid6, so do not publish capability */
1406                 dma_cap_clear(DMA_PQ, dma_dev->cap_mask);
1407                 dma_cap_clear(DMA_PQ_VAL, dma_dev->cap_mask);
1408                 ret = 0;
1409                 #endif
1410                 if (ret)
1411                         goto err_free_iop_chan;
1412         }
1413
1414         dev_info(&pdev->dev, "Intel(R) IOP: ( %s%s%s%s%s%s)\n",
1415                  dma_has_cap(DMA_PQ, dma_dev->cap_mask) ? "pq " : "",
1416                  dma_has_cap(DMA_PQ_VAL, dma_dev->cap_mask) ? "pq_val " : "",
1417                  dma_has_cap(DMA_XOR, dma_dev->cap_mask) ? "xor " : "",
1418                  dma_has_cap(DMA_XOR_VAL, dma_dev->cap_mask) ? "xor_val " : "",
1419                  dma_has_cap(DMA_MEMCPY, dma_dev->cap_mask) ? "cpy " : "",
1420                  dma_has_cap(DMA_INTERRUPT, dma_dev->cap_mask) ? "intr " : "");
1421
1422         ret = dma_async_device_register(dma_dev);
1423         if (ret)
                goto err_free_iop_chan;
        goto out;
1424
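        /*
         * Error unwind in reverse order of allocation.  The MMIO region,
         * mapping and IRQs are devm-managed and released by the driver
         * core, so only the explicit allocations are freed here.
         */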
1425  err_free_iop_chan:
1426         kfree(iop_chan);
1427  err_free_dma:
1428         dma_free_coherent(&adev->pdev->dev, plat_data->pool_size,
1429                         adev->dma_desc_pool_virt, adev->dma_desc_pool);
1430  err_free_adev:
1431         kfree(adev);
1432  out:
1433         return ret;
1434 }
1435
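/**
 * iop_chan_start_null_memcpy - prime the channel with a no-op copy
 * @iop_chan: channel to initialize
 *
 * Appends a pre-acked, zero-length memcpy descriptor to the chain and
 * points the hardware at it, giving later operations a valid descriptor
 * to chain from.  Takes &iop_chan->lock internally, so the caller must
 * not hold it.
 */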
1436 static void iop_chan_start_null_memcpy(struct iop_adma_chan *iop_chan)
1437 {
1438         struct iop_adma_desc_slot *sw_desc, *grp_start;
1439         dma_cookie_t cookie;
1440         int slot_cnt, slots_per_op;
1441
1442         dev_dbg(iop_chan->device->common.dev, "%s\n", __func__);
1443
1444         spin_lock_bh(&iop_chan->lock);
1445         slot_cnt = iop_chan_memcpy_slot_count(0, &slots_per_op);
1446         sw_desc = iop_adma_alloc_slots(iop_chan, slot_cnt, slots_per_op);
1447         if (sw_desc) {
1448                 grp_start = sw_desc->group_head;
1449
1450                 list_splice_init(&sw_desc->tx_list, &iop_chan->chain);
1451                 async_tx_ack(&sw_desc->async_tx);
1452                 iop_desc_init_memcpy(grp_start, 0);
1453                 iop_desc_set_byte_count(grp_start, iop_chan, 0);
1454                 iop_desc_set_dest_addr(grp_start, iop_chan, 0);
1455                 iop_desc_set_memcpy_src_addr(grp_start, 0);
1456
1457                 cookie = dma_cookie_assign(&sw_desc->async_tx);
1458
1459                 /* initialize the completed cookie to be less than
1460                  * the most recently used cookie
1461                  */
1462                 iop_chan->common.completed_cookie = cookie - 1;
1463
1464                 /* channel should not be busy */
1465                 BUG_ON(iop_chan_is_busy(iop_chan));
1466
1467                 /* clear any prior error-status bits */
1468                 iop_adma_device_clear_err_status(iop_chan);
1469
1470                 /* disable operation */
1471                 iop_chan_disable(iop_chan);
1472
1473                 /* set the descriptor address */
1474                 iop_chan_set_next_descriptor(iop_chan, sw_desc->async_tx.phys);
1475
1476                 /* 1/ don't add pre-chained descriptors
1477                  * 2/ dummy read to flush next_desc write
1478                  */
1479                 BUG_ON(iop_desc_get_next_desc(sw_desc));
1480
1481                 /* run the descriptor */
1482                 iop_chan_enable(iop_chan);
1483         } else
1484                 dev_err(iop_chan->device->common.dev,
1485                         "failed to allocate null descriptor\n");
1486         spin_unlock_bh(&iop_chan->lock);
1487 }
1488
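/**
 * iop_chan_start_null_xor - prime the channel with a no-op XOR
 * @iop_chan: channel to initialize
 *
 * Same as iop_chan_start_null_memcpy(), but uses a two-source,
 * zero-length XOR descriptor for channels that advertise XOR rather
 * than memcpy capability.  Takes &iop_chan->lock internally.
 */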
1489 static void iop_chan_start_null_xor(struct iop_adma_chan *iop_chan)
1490 {
1491         struct iop_adma_desc_slot *sw_desc, *grp_start;
1492         dma_cookie_t cookie;
1493         int slot_cnt, slots_per_op;
1494
1495         dev_dbg(iop_chan->device->common.dev, "%s\n", __func__);
1496
1497         spin_lock_bh(&iop_chan->lock);
1498         slot_cnt = iop_chan_xor_slot_count(0, 2, &slots_per_op);
1499         sw_desc = iop_adma_alloc_slots(iop_chan, slot_cnt, slots_per_op);
1500         if (sw_desc) {
1501                 grp_start = sw_desc->group_head;
1502                 list_splice_init(&sw_desc->tx_list, &iop_chan->chain);
1503                 async_tx_ack(&sw_desc->async_tx);
1504                 iop_desc_init_null_xor(grp_start, 2, 0);
1505                 iop_desc_set_byte_count(grp_start, iop_chan, 0);
1506                 iop_desc_set_dest_addr(grp_start, iop_chan, 0);
1507                 iop_desc_set_xor_src_addr(grp_start, 0, 0);
1508                 iop_desc_set_xor_src_addr(grp_start, 1, 0);
1509
1510                 cookie = dma_cookie_assign(&sw_desc->async_tx);
1511
1512                 /* initialize the completed cookie to be less than
1513                  * the most recently used cookie
1514                  */
1515                 iop_chan->common.completed_cookie = cookie - 1;
1516
1517                 /* channel should not be busy */
1518                 BUG_ON(iop_chan_is_busy(iop_chan));
1519
1520                 /* clear any prior error-status bits */
1521                 iop_adma_device_clear_err_status(iop_chan);
1522
1523                 /* disable operation */
1524                 iop_chan_disable(iop_chan);
1525
1526                 /* set the descriptor address */
1527                 iop_chan_set_next_descriptor(iop_chan, sw_desc->async_tx.phys);
1528
1529                 /* 1/ don't add pre-chained descriptors
1530                  * 2/ dummy read to flush next_desc write
1531                  */
1532                 BUG_ON(iop_desc_get_next_desc(sw_desc));
1533
1534                 /* run the descriptor */
1535                 iop_chan_enable(iop_chan);
1536         } else
1537                 dev_err(iop_chan->device->common.dev,
1538                         "failed to allocate null descriptor\n");
1539         spin_unlock_bh(&iop_chan->lock);
1540 }
1541
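/*
 * Binding sketch (illustrative only, not defined by this driver): the
 * matching platform device carries one MMIO resource, the three IRQs
 * consumed in iop_adma_probe() and a struct iop_adma_platform_data
 * providing hw_id, pool_size and the capability mask, roughly:
 *
 *	static struct iop_adma_platform_data iop3xx_aau_data = {
 *		.hw_id		= AAU_ID,
 *		.pool_size	= 3 * PAGE_SIZE,
 *	};
 *
 *	dma_cap_set(DMA_XOR, iop3xx_aau_data.cap_mask);
 *	dma_cap_set(DMA_XOR_VAL, iop3xx_aau_data.cap_mask);
 *	platform_device_register(&iop3xx_aau_channel);
 *
 * The real device and resource definitions live in the IOP32x/IOP33x
 * platform code; the names above are examples, not guaranteed symbols.
 */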
1542 static struct platform_driver iop_adma_driver = {
1543         .probe          = iop_adma_probe,
1544         .remove         = iop_adma_remove,
1545         .driver         = {
1546                 .name   = "iop-adma",
1547         },
1548 };
1549
1550 module_platform_driver(iop_adma_driver);
1551
1552 MODULE_AUTHOR("Intel Corporation");
1553 MODULE_DESCRIPTION("IOP ADMA Engine Driver");
1554 MODULE_LICENSE("GPL");
1555 MODULE_ALIAS("platform:iop-adma");