/*
 * Copyright (C) 2017 Broadcom
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 */

/*
 * Broadcom SBA RAID Driver
 *
 * The Broadcom stream buffer accelerator (SBA) provides offloading
 * capabilities for RAID operations. The SBA offload engine is accessible
 * via the Broadcom SoC-specific ring manager. Two or more offload engines
 * can share the same ring manager, which is why the ring manager driver
 * is implemented as a mailbox controller and the offload engine drivers
 * are implemented as mailbox clients.
 *
 * Typically, a Broadcom SoC-specific ring manager implements a large
 * number of hardware rings spread over one or more SBA hardware devices.
 * By design, the internal buffer size of an SBA hardware device is
 * limited, but every offload operation supported by SBA can be broken
 * down into multiple small-sized requests and executed in parallel on
 * multiple SBA hardware devices to achieve high throughput.
 *
 * The Broadcom SBA RAID driver does not require any register programming
 * except submitting requests to the SBA hardware devices via mailbox
 * channels. This driver implements a DMA device with one DMA channel
 * using a set of mailbox channels provided by the Broadcom SoC-specific
 * ring manager driver. To exploit parallelism (as described above), all
 * DMA requests coming to the SBA RAID DMA channel are broken down into
 * smaller requests and submitted to multiple mailbox channels in
 * round-robin fashion. To get more SBA DMA channels, we can create more
 * SBA device nodes in the Broadcom SoC-specific DTS based on the number
 * of hardware rings supported by the Broadcom SoC ring manager.
 */
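
/*
 * Illustrative device tree sketch (an assumption for documentation only,
 * not taken from any particular SoC DTS): one SBA node per desired DMA
 * channel, each referencing a set of ring manager mailbox channels. The
 * node label "raid_mbox" is hypothetical and the exact mbox specifier
 * cells depend on the ring manager's #mbox-cells binding; only the
 * compatible string and the "mboxes" property reflect what this driver
 * actually parses.
 *
 *	sba0: raid-dma0 {
 *		compatible = "brcm,iproc-sba-v2";
 *		mboxes = <&raid_mbox 0>, <&raid_mbox 1>;
 *	};
 */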

#include <linux/bitops.h>
#include <linux/dma-mapping.h>
#include <linux/dmaengine.h>
#include <linux/list.h>
#include <linux/mailbox_client.h>
#include <linux/mailbox/brcm-message.h>
#include <linux/module.h>
#include <linux/of_device.h>
#include <linux/slab.h>
#include <linux/raid/pq.h>

#include "dmaengine.h"

/* SBA command related defines */
#define SBA_TYPE_SHIFT			48
#define SBA_TYPE_MASK			GENMASK(1, 0)
#define SBA_TYPE_A			0x0
#define SBA_TYPE_B			0x2
#define SBA_TYPE_C			0x3
#define SBA_USER_DEF_SHIFT		32
#define SBA_USER_DEF_MASK		GENMASK(15, 0)
#define SBA_R_MDATA_SHIFT		24
#define SBA_R_MDATA_MASK		GENMASK(7, 0)
#define SBA_C_MDATA_MS_SHIFT		18
#define SBA_C_MDATA_MS_MASK		GENMASK(1, 0)
#define SBA_INT_SHIFT			17
#define SBA_INT_MASK			BIT(0)
#define SBA_RESP_SHIFT			16
#define SBA_RESP_MASK			BIT(0)
#define SBA_C_MDATA_SHIFT		8
#define SBA_C_MDATA_MASK		GENMASK(7, 0)
#define SBA_C_MDATA_BNUMx_SHIFT(__bnum)	(2 * (__bnum))
#define SBA_C_MDATA_BNUMx_MASK		GENMASK(1, 0)
#define SBA_C_MDATA_DNUM_SHIFT		5
#define SBA_C_MDATA_DNUM_MASK		GENMASK(4, 0)
#define SBA_C_MDATA_LS(__v)		((__v) & 0xff)
#define SBA_C_MDATA_MS(__v)		(((__v) >> 8) & 0x3)
#define SBA_CMD_SHIFT			0
#define SBA_CMD_MASK			GENMASK(3, 0)
#define SBA_CMD_ZERO_BUFFER		0x4
#define SBA_CMD_ZERO_ALL_BUFFERS	0x8
#define SBA_CMD_LOAD_BUFFER		0x9
#define SBA_CMD_XOR			0xa
#define SBA_CMD_GALOIS_XOR		0xb
#define SBA_CMD_WRITE_BUFFER		0xc
#define SBA_CMD_GALOIS			0xe

/* Driver helper macros */
#define to_sba_request(tx)	\
	container_of(tx, struct sba_request, tx)
#define to_sba_device(dchan)	\
	container_of(dchan, struct sba_device, dma_chan)

enum sba_request_state {
	SBA_REQUEST_STATE_FREE = 1,
	SBA_REQUEST_STATE_ALLOCED = 2,
	SBA_REQUEST_STATE_PENDING = 3,
	SBA_REQUEST_STATE_ACTIVE = 4,
	SBA_REQUEST_STATE_RECEIVED = 5,
	SBA_REQUEST_STATE_COMPLETED = 6,
	SBA_REQUEST_STATE_ABORTED = 7,
};
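
/*
 * Request lifecycle (summarized from the state-transition helpers below;
 * each state also corresponds to a per-device list in struct sba_device):
 *
 *   FREE -> ALLOCED (sba_alloc_request)
 *        -> PENDING (sba_tx_submit)
 *        -> ACTIVE  (sba_issue_pending)
 *        -> RECEIVED (sba_receive_message)
 *        -> COMPLETED or back to FREE (sba_dma_tx_actions)
 *   ACTIVE requests left behind at cleanup time are moved to ABORTED
 *   and freed once their mailbox replies arrive.
 */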

struct sba_request {
	/* Global state */
	struct list_head node;
	struct sba_device *sba;
	enum sba_request_state state;
	bool fence;
	/* Chained requests management */
	struct sba_request *first;
	struct list_head next;
	unsigned int next_count;
	atomic_t next_pending_count;
	/* BRCM message data */
	void *resp;
	dma_addr_t resp_dma;
	struct brcm_sba_command *cmds;
	struct brcm_message msg;
	struct dma_async_tx_descriptor tx;
};

enum sba_version {
	SBA_VER_1 = 0,
	SBA_VER_2
};

struct sba_device {
	/* Underlying device */
	struct device *dev;
	/* DT configuration parameters */
	enum sba_version ver;
	/* Derived configuration parameters */
	u32 max_req;
	u32 hw_buf_size;
	u32 hw_resp_size;
	u32 max_pq_coefs;
	u32 max_pq_srcs;
	u32 max_cmd_per_req;
	u32 max_xor_srcs;
	u32 max_resp_pool_size;
	u32 max_cmds_pool_size;
	/* Mailbox client and Mailbox channels */
	struct mbox_client client;
	int mchans_count;
	atomic_t mchans_current;
	struct mbox_chan **mchans;
	struct device *mbox_dev;
	/* DMA device and DMA channel */
	struct dma_device dma_dev;
	struct dma_chan dma_chan;
	/* DMA channel resources */
	void *resp_base;
	dma_addr_t resp_dma_base;
	void *cmds_base;
	dma_addr_t cmds_dma_base;
	spinlock_t reqs_lock;
	struct sba_request *reqs;
	bool reqs_fence;
	struct list_head reqs_alloc_list;
	struct list_head reqs_pending_list;
	struct list_head reqs_active_list;
	struct list_head reqs_received_list;
	struct list_head reqs_completed_list;
	struct list_head reqs_aborted_list;
	struct list_head reqs_free_list;
	int reqs_free_count;
};

/* ====== SBA command helper routines ===== */

static inline u64 __pure sba_cmd_enc(u64 cmd, u32 val, u32 shift, u32 mask)
{
	cmd &= ~((u64)mask << shift);
	cmd |= ((u64)(val & mask) << shift);
	return cmd;
}

static inline u32 __pure sba_cmd_load_c_mdata(u32 b0)
{
	return b0 & SBA_C_MDATA_BNUMx_MASK;
}

static inline u32 __pure sba_cmd_write_c_mdata(u32 b0)
{
	return b0 & SBA_C_MDATA_BNUMx_MASK;
}

static inline u32 __pure sba_cmd_xor_c_mdata(u32 b1, u32 b0)
{
	return (b0 & SBA_C_MDATA_BNUMx_MASK) |
	       ((b1 & SBA_C_MDATA_BNUMx_MASK) << SBA_C_MDATA_BNUMx_SHIFT(1));
}

static inline u32 __pure sba_cmd_pq_c_mdata(u32 d, u32 b1, u32 b0)
{
	return (b0 & SBA_C_MDATA_BNUMx_MASK) |
	       ((b1 & SBA_C_MDATA_BNUMx_MASK) << SBA_C_MDATA_BNUMx_SHIFT(1)) |
	       ((d & SBA_C_MDATA_DNUM_MASK) << SBA_C_MDATA_DNUM_SHIFT);
}
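
/*
 * Worked example (an illustration based on the SHIFT/MASK defines above,
 * not an authoritative hardware description) of how the fillup routines
 * below compose a 64-bit command word:
 *
 *	cmd = sba_cmd_enc(0x0, SBA_TYPE_B, SBA_TYPE_SHIFT, SBA_TYPE_MASK);
 *	cmd = sba_cmd_enc(cmd, len, SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
 *	cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(sba_cmd_load_c_mdata(0)),
 *			  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
 *	cmd = sba_cmd_enc(cmd, SBA_CMD_LOAD_BUFFER,
 *			  SBA_CMD_SHIFT, SBA_CMD_MASK);
 *
 * yields a Type-B "load buffer 0" command: bits [49:48] hold the type,
 * [47:32] the transfer length, [15:8] the C_MDATA buffer number and
 * [3:0] the opcode.
 */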

/* ====== Channel resource management routines ===== */

static struct sba_request *sba_alloc_request(struct sba_device *sba)
{
	unsigned long flags;
	struct sba_request *req = NULL;

	spin_lock_irqsave(&sba->reqs_lock, flags);

	req = list_first_entry_or_null(&sba->reqs_free_list,
				       struct sba_request, node);
	if (req) {
		list_move_tail(&req->node, &sba->reqs_alloc_list);
		req->state = SBA_REQUEST_STATE_ALLOCED;
		req->fence = false;
		req->first = req;
		INIT_LIST_HEAD(&req->next);
		req->next_count = 1;
		atomic_set(&req->next_pending_count, 1);

		sba->reqs_free_count--;

		dma_async_tx_descriptor_init(&req->tx, &sba->dma_chan);
	}

	spin_unlock_irqrestore(&sba->reqs_lock, flags);

	return req;
}

/* Note: Must be called with sba->reqs_lock held */
static void _sba_pending_request(struct sba_device *sba,
				 struct sba_request *req)
{
	lockdep_assert_held(&sba->reqs_lock);
	req->state = SBA_REQUEST_STATE_PENDING;
	list_move_tail(&req->node, &sba->reqs_pending_list);
	if (list_empty(&sba->reqs_active_list))
		sba->reqs_fence = false;
}

/* Note: Must be called with sba->reqs_lock held */
static bool _sba_active_request(struct sba_device *sba,
				struct sba_request *req)
{
	lockdep_assert_held(&sba->reqs_lock);
	if (list_empty(&sba->reqs_active_list))
		sba->reqs_fence = false;
	if (sba->reqs_fence)
		return false;
	req->state = SBA_REQUEST_STATE_ACTIVE;
	list_move_tail(&req->node, &sba->reqs_active_list);
	if (req->fence)
		sba->reqs_fence = true;
	return true;
}

/* Note: Must be called with sba->reqs_lock held */
static void _sba_abort_request(struct sba_device *sba,
			       struct sba_request *req)
{
	lockdep_assert_held(&sba->reqs_lock);
	req->state = SBA_REQUEST_STATE_ABORTED;
	list_move_tail(&req->node, &sba->reqs_aborted_list);
	if (list_empty(&sba->reqs_active_list))
		sba->reqs_fence = false;
}

/* Note: Must be called with sba->reqs_lock held */
static void _sba_free_request(struct sba_device *sba,
			      struct sba_request *req)
{
	lockdep_assert_held(&sba->reqs_lock);
	req->state = SBA_REQUEST_STATE_FREE;
	list_move_tail(&req->node, &sba->reqs_free_list);
	if (list_empty(&sba->reqs_active_list))
		sba->reqs_fence = false;
	sba->reqs_free_count++;
}

static void sba_received_request(struct sba_request *req)
{
	unsigned long flags;
	struct sba_device *sba = req->sba;

	spin_lock_irqsave(&sba->reqs_lock, flags);
	req->state = SBA_REQUEST_STATE_RECEIVED;
	list_move_tail(&req->node, &sba->reqs_received_list);
	spin_unlock_irqrestore(&sba->reqs_lock, flags);
}

static void sba_complete_chained_requests(struct sba_request *req)
{
	unsigned long flags;
	struct sba_request *nreq;
	struct sba_device *sba = req->sba;

	spin_lock_irqsave(&sba->reqs_lock, flags);

	req->state = SBA_REQUEST_STATE_COMPLETED;
	list_move_tail(&req->node, &sba->reqs_completed_list);
	list_for_each_entry(nreq, &req->next, next) {
		nreq->state = SBA_REQUEST_STATE_COMPLETED;
		list_move_tail(&nreq->node, &sba->reqs_completed_list);
	}
	if (list_empty(&sba->reqs_active_list))
		sba->reqs_fence = false;

	spin_unlock_irqrestore(&sba->reqs_lock, flags);
}

static void sba_free_chained_requests(struct sba_request *req)
{
	unsigned long flags;
	struct sba_request *nreq;
	struct sba_device *sba = req->sba;

	spin_lock_irqsave(&sba->reqs_lock, flags);

	_sba_free_request(sba, req);
	list_for_each_entry(nreq, &req->next, next)
		_sba_free_request(sba, nreq);

	spin_unlock_irqrestore(&sba->reqs_lock, flags);
}

static void sba_chain_request(struct sba_request *first,
			      struct sba_request *req)
{
	unsigned long flags;
	struct sba_device *sba = req->sba;

	spin_lock_irqsave(&sba->reqs_lock, flags);

	list_add_tail(&req->next, &first->next);
	req->first = first;
	first->next_count++;
	atomic_set(&first->next_pending_count, first->next_count);

	spin_unlock_irqrestore(&sba->reqs_lock, flags);
}

static void sba_cleanup_nonpending_requests(struct sba_device *sba)
{
	unsigned long flags;
	struct sba_request *req, *req1;

	spin_lock_irqsave(&sba->reqs_lock, flags);

	/* Free up all allocated requests */
	list_for_each_entry_safe(req, req1, &sba->reqs_alloc_list, node)
		_sba_free_request(sba, req);

	/* Free up all received requests */
	list_for_each_entry_safe(req, req1, &sba->reqs_received_list, node)
		_sba_free_request(sba, req);

	/* Free up all completed requests */
	list_for_each_entry_safe(req, req1, &sba->reqs_completed_list, node)
		_sba_free_request(sba, req);

	/* Set all active requests as aborted */
	list_for_each_entry_safe(req, req1, &sba->reqs_active_list, node)
		_sba_abort_request(sba, req);

	/*
	 * Note: We expect that aborted requests will be eventually
	 * freed by sba_receive_message()
	 */

	spin_unlock_irqrestore(&sba->reqs_lock, flags);
}

static void sba_cleanup_pending_requests(struct sba_device *sba)
{
	unsigned long flags;
	struct sba_request *req, *req1;

	spin_lock_irqsave(&sba->reqs_lock, flags);

	/* Free up all pending requests */
	list_for_each_entry_safe(req, req1, &sba->reqs_pending_list, node)
		_sba_free_request(sba, req);

	spin_unlock_irqrestore(&sba->reqs_lock, flags);
}

/* ====== DMAENGINE callbacks ===== */

static void sba_free_chan_resources(struct dma_chan *dchan)
{
	/*
	 * Channel resources are pre-alloced so we just free-up
	 * whatever we can so that we can re-use pre-alloced
	 * channel resources next time.
	 */
	sba_cleanup_nonpending_requests(to_sba_device(dchan));
}

static int sba_device_terminate_all(struct dma_chan *dchan)
{
	/* Cleanup all pending requests */
	sba_cleanup_pending_requests(to_sba_device(dchan));

	return 0;
}

static int sba_send_mbox_request(struct sba_device *sba,
				 struct sba_request *req)
{
	int mchans_idx, ret = 0;

	/* Select mailbox channel in round-robin fashion */
	mchans_idx = atomic_inc_return(&sba->mchans_current);
	mchans_idx = mchans_idx % sba->mchans_count;

	/* Send message for the request */
	req->msg.error = 0;
	ret = mbox_send_message(sba->mchans[mchans_idx], &req->msg);
	if (ret < 0) {
		dev_err(sba->dev, "send message failed with error %d", ret);
		return ret;
	}
	ret = req->msg.error;
	if (ret < 0) {
		dev_err(sba->dev, "message error %d", ret);
		return ret;
	}

	return 0;
}

static void sba_issue_pending(struct dma_chan *dchan)
{
	int ret;
	unsigned long flags;
	struct sba_request *req, *req1;
	struct sba_device *sba = to_sba_device(dchan);

	spin_lock_irqsave(&sba->reqs_lock, flags);

	/* Process all pending requests */
	list_for_each_entry_safe(req, req1, &sba->reqs_pending_list, node) {
		/* Try to make request active */
		if (!_sba_active_request(sba, req))
			break;

		/* Send request to mailbox channel */
		spin_unlock_irqrestore(&sba->reqs_lock, flags);
		ret = sba_send_mbox_request(sba, req);
		spin_lock_irqsave(&sba->reqs_lock, flags);

		/* If something went wrong then keep request pending */
		if (ret < 0) {
			_sba_pending_request(sba, req);
			break;
		}
	}

	spin_unlock_irqrestore(&sba->reqs_lock, flags);
}

static dma_cookie_t sba_tx_submit(struct dma_async_tx_descriptor *tx)
{
	unsigned long flags;
	dma_cookie_t cookie;
	struct sba_device *sba;
	struct sba_request *req, *nreq;

	if (unlikely(!tx))
		return -EINVAL;

	sba = to_sba_device(tx->chan);
	req = to_sba_request(tx);

	/* Assign cookie and mark all chained requests pending */
	spin_lock_irqsave(&sba->reqs_lock, flags);
	cookie = dma_cookie_assign(tx);
	_sba_pending_request(sba, req);
	list_for_each_entry(nreq, &req->next, next)
		_sba_pending_request(sba, nreq);
	spin_unlock_irqrestore(&sba->reqs_lock, flags);

	return cookie;
}

static enum dma_status sba_tx_status(struct dma_chan *dchan,
				     dma_cookie_t cookie,
				     struct dma_tx_state *txstate)
{
	int mchan_idx;
	enum dma_status ret;
	struct sba_device *sba = to_sba_device(dchan);

	for (mchan_idx = 0; mchan_idx < sba->mchans_count; mchan_idx++)
		mbox_client_peek_data(sba->mchans[mchan_idx]);

	ret = dma_cookie_status(dchan, cookie, txstate);
	if (ret == DMA_COMPLETE)
		return ret;

	return dma_cookie_status(dchan, cookie, txstate);
}
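
/*
 * Minimal usage sketch for a dmaengine client driving this channel
 * (illustrative only; RAID stacks normally reach these hooks indirectly
 * through the async_tx API, e.g. async_memcpy()/async_xor()/
 * async_gen_syndrome()):
 *
 *	struct dma_async_tx_descriptor *tx;
 *
 *	tx = dchan->device->device_prep_dma_memcpy(dchan, dst, src, len, 0);
 *	if (!tx)
 *		return -ENOMEM;
 *	dmaengine_submit(tx);		// ends up in sba_tx_submit()
 *	dma_async_issue_pending(dchan);	// ends up in sba_issue_pending()
 *	// completion is reported from sba_receive_message() via the
 *	// descriptor callback and dma_cookie_complete()
 */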

static void sba_fillup_interrupt_msg(struct sba_request *req,
				     struct brcm_sba_command *cmds,
				     struct brcm_message *msg)
{
	u64 cmd;
	u32 c_mdata;
	struct brcm_sba_command *cmdsp = cmds;

	/* Type-B command to load dummy data into buf0 */
	cmd = sba_cmd_enc(0x0, SBA_TYPE_B,
			  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
	cmd = sba_cmd_enc(cmd, req->sba->hw_resp_size,
			  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
	c_mdata = sba_cmd_load_c_mdata(0);
	cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
			  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
	cmd = sba_cmd_enc(cmd, SBA_CMD_LOAD_BUFFER,
			  SBA_CMD_SHIFT, SBA_CMD_MASK);
	cmdsp->cmd = cmd;
	*cmdsp->cmd_dma = cpu_to_le64(cmd);
	cmdsp->flags = BRCM_SBA_CMD_TYPE_B;
	cmdsp->data = req->resp_dma;
	cmdsp->data_len = req->sba->hw_resp_size;
	cmdsp++;

	/* Type-A command to write buf0 to dummy location */
	cmd = sba_cmd_enc(0x0, SBA_TYPE_A,
			  SBA_TYPE_SHIFT, SBA_TYPE_MASK);
	cmd = sba_cmd_enc(cmd, req->sba->hw_resp_size,
			  SBA_USER_DEF_SHIFT, SBA_USER_DEF_MASK);
	cmd = sba_cmd_enc(cmd, 0x1,
			  SBA_RESP_SHIFT, SBA_RESP_MASK);
	c_mdata = sba_cmd_write_c_mdata(0);
	cmd = sba_cmd_enc(cmd, SBA_C_MDATA_LS(c_mdata),
			  SBA_C_MDATA_SHIFT, SBA_C_MDATA_MASK);
	cmd = sba_cmd_enc(cmd, SBA_CMD_WRITE_BUFFER,
			  SBA_CMD_SHIFT, SBA_CMD_MASK);
	cmdsp->cmd = cmd;
	*cmdsp->cmd_dma = cpu_to_le64(cmd);
	cmdsp->flags = BRCM_SBA_CMD_TYPE_A;
	if (req->sba->hw_resp_size) {
		cmdsp->flags |= BRCM_SBA_CMD_HAS_RESP;
		cmdsp->resp = req->resp_dma;
		cmdsp->resp_len = req->sba->hw_resp_size;
	}
	cmdsp->flags |= BRCM_SBA_CMD_HAS_OUTPUT;
	cmdsp->data = req->resp_dma;
	cmdsp->data_len = req->sba->hw_resp_size;
	cmdsp++;

	/* Fillup brcm_message */
	msg->type = BRCM_MESSAGE_SBA;
	msg->sba.cmds = cmds;
	msg->sba.cmds_count = cmdsp - cmds;
	msg->ctx = req;
	msg->error = 0;
}

static struct dma_async_tx_descriptor *
sba_prep_dma_interrupt(struct dma_chan *dchan, unsigned long flags)
{
	struct sba_request *req = NULL;
	struct sba_device *sba = to_sba_device(dchan);

	/* Alloc new request */
	req = sba_alloc_request(sba);
	if (!req)
		return NULL;

	/*
	 * Force fence so that no requests are submitted
	 * until DMA callback for this request is invoked.
	 */
	req->fence = true;

	/* Fillup request message */
	sba_fillup_interrupt_msg(req, req->cmds, &req->msg);

	/* Init async_tx descriptor */
	req->tx.flags = flags;
	req->tx.cookie = -EBUSY;

	return &req->tx;
}
588 static void sba_fillup_memcpy_msg(struct sba_request
*req
,
589 struct brcm_sba_command
*cmds
,
590 struct brcm_message
*msg
,
591 dma_addr_t msg_offset
, size_t msg_len
,
592 dma_addr_t dst
, dma_addr_t src
)
596 struct brcm_sba_command
*cmdsp
= cmds
;
598 /* Type-B command to load data into buf0 */
599 cmd
= sba_cmd_enc(0x0, SBA_TYPE_B
,
600 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
601 cmd
= sba_cmd_enc(cmd
, msg_len
,
602 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
603 c_mdata
= sba_cmd_load_c_mdata(0);
604 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
605 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
606 cmd
= sba_cmd_enc(cmd
, SBA_CMD_LOAD_BUFFER
,
607 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
609 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
610 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_B
;
611 cmdsp
->data
= src
+ msg_offset
;
612 cmdsp
->data_len
= msg_len
;
615 /* Type-A command to write buf0 */
616 cmd
= sba_cmd_enc(0x0, SBA_TYPE_A
,
617 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
618 cmd
= sba_cmd_enc(cmd
, msg_len
,
619 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
620 cmd
= sba_cmd_enc(cmd
, 0x1,
621 SBA_RESP_SHIFT
, SBA_RESP_MASK
);
622 c_mdata
= sba_cmd_write_c_mdata(0);
623 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
624 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
625 cmd
= sba_cmd_enc(cmd
, SBA_CMD_WRITE_BUFFER
,
626 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
628 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
629 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_A
;
630 if (req
->sba
->hw_resp_size
) {
631 cmdsp
->flags
|= BRCM_SBA_CMD_HAS_RESP
;
632 cmdsp
->resp
= req
->resp_dma
;
633 cmdsp
->resp_len
= req
->sba
->hw_resp_size
;
635 cmdsp
->flags
|= BRCM_SBA_CMD_HAS_OUTPUT
;
636 cmdsp
->data
= dst
+ msg_offset
;
637 cmdsp
->data_len
= msg_len
;
640 /* Fillup brcm_message */
641 msg
->type
= BRCM_MESSAGE_SBA
;
642 msg
->sba
.cmds
= cmds
;
643 msg
->sba
.cmds_count
= cmdsp
- cmds
;

static struct sba_request *
sba_prep_dma_memcpy_req(struct sba_device *sba,
			dma_addr_t off, dma_addr_t dst, dma_addr_t src,
			size_t len, unsigned long flags)
{
	struct sba_request *req = NULL;

	/* Alloc new request */
	req = sba_alloc_request(sba);
	if (!req)
		return NULL;
	req->fence = (flags & DMA_PREP_FENCE) ? true : false;

	/* Fillup request message */
	sba_fillup_memcpy_msg(req, req->cmds, &req->msg,
			      off, len, dst, src);

	/* Init async_tx descriptor */
	req->tx.flags = flags;
	req->tx.cookie = -EBUSY;

	return req;
}

static struct dma_async_tx_descriptor *
sba_prep_dma_memcpy(struct dma_chan *dchan, dma_addr_t dst, dma_addr_t src,
		    size_t len, unsigned long flags)
{
	size_t req_len;
	dma_addr_t off = 0;
	struct sba_device *sba = to_sba_device(dchan);
	struct sba_request *first = NULL, *req;

	/* Create chained requests where each request is up to hw_buf_size */
	while (len) {
		req_len = (len < sba->hw_buf_size) ? len : sba->hw_buf_size;

		req = sba_prep_dma_memcpy_req(sba, off, dst, src,
					      req_len, flags);
		if (!req) {
			if (first)
				sba_free_chained_requests(first);
			return NULL;
		}

		if (first)
			sba_chain_request(first, req);
		else
			first = req;

		off += req_len;
		len -= req_len;
	}

	return (first) ? &first->tx : NULL;
}
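
/*
 * Worked example of the chaining above (illustrative, assuming the default
 * hw_buf_size of 4096): a 10000-byte memcpy is prepared as three chained
 * sba_request instances covering 4096 + 4096 + 1808 bytes. Only the first
 * request's descriptor is returned to the client; sba_tx_submit() marks
 * the whole chain pending and sba_issue_pending() then spreads the chained
 * requests across the mailbox channels in round-robin order.
 */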
705 static void sba_fillup_xor_msg(struct sba_request
*req
,
706 struct brcm_sba_command
*cmds
,
707 struct brcm_message
*msg
,
708 dma_addr_t msg_offset
, size_t msg_len
,
709 dma_addr_t dst
, dma_addr_t
*src
, u32 src_cnt
)
714 struct brcm_sba_command
*cmdsp
= cmds
;
716 /* Type-B command to load data into buf0 */
717 cmd
= sba_cmd_enc(0x0, SBA_TYPE_B
,
718 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
719 cmd
= sba_cmd_enc(cmd
, msg_len
,
720 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
721 c_mdata
= sba_cmd_load_c_mdata(0);
722 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
723 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
724 cmd
= sba_cmd_enc(cmd
, SBA_CMD_LOAD_BUFFER
,
725 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
727 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
728 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_B
;
729 cmdsp
->data
= src
[0] + msg_offset
;
730 cmdsp
->data_len
= msg_len
;
733 /* Type-B commands to xor data with buf0 and put it back in buf0 */
734 for (i
= 1; i
< src_cnt
; i
++) {
735 cmd
= sba_cmd_enc(0x0, SBA_TYPE_B
,
736 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
737 cmd
= sba_cmd_enc(cmd
, msg_len
,
738 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
739 c_mdata
= sba_cmd_xor_c_mdata(0, 0);
740 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
741 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
742 cmd
= sba_cmd_enc(cmd
, SBA_CMD_XOR
,
743 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
745 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
746 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_B
;
747 cmdsp
->data
= src
[i
] + msg_offset
;
748 cmdsp
->data_len
= msg_len
;
752 /* Type-A command to write buf0 */
753 cmd
= sba_cmd_enc(0x0, SBA_TYPE_A
,
754 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
755 cmd
= sba_cmd_enc(cmd
, msg_len
,
756 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
757 cmd
= sba_cmd_enc(cmd
, 0x1,
758 SBA_RESP_SHIFT
, SBA_RESP_MASK
);
759 c_mdata
= sba_cmd_write_c_mdata(0);
760 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
761 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
762 cmd
= sba_cmd_enc(cmd
, SBA_CMD_WRITE_BUFFER
,
763 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
765 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
766 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_A
;
767 if (req
->sba
->hw_resp_size
) {
768 cmdsp
->flags
|= BRCM_SBA_CMD_HAS_RESP
;
769 cmdsp
->resp
= req
->resp_dma
;
770 cmdsp
->resp_len
= req
->sba
->hw_resp_size
;
772 cmdsp
->flags
|= BRCM_SBA_CMD_HAS_OUTPUT
;
773 cmdsp
->data
= dst
+ msg_offset
;
774 cmdsp
->data_len
= msg_len
;
777 /* Fillup brcm_message */
778 msg
->type
= BRCM_MESSAGE_SBA
;
779 msg
->sba
.cmds
= cmds
;
780 msg
->sba
.cmds_count
= cmdsp
- cmds
;

static struct sba_request *
sba_prep_dma_xor_req(struct sba_device *sba,
		     dma_addr_t off, dma_addr_t dst, dma_addr_t *src,
		     u32 src_cnt, size_t len, unsigned long flags)
{
	struct sba_request *req = NULL;

	/* Alloc new request */
	req = sba_alloc_request(sba);
	if (!req)
		return NULL;
	req->fence = (flags & DMA_PREP_FENCE) ? true : false;

	/* Fillup request message */
	sba_fillup_xor_msg(req, req->cmds, &req->msg,
			   off, len, dst, src, src_cnt);

	/* Init async_tx descriptor */
	req->tx.flags = flags;
	req->tx.cookie = -EBUSY;

	return req;
}

static struct dma_async_tx_descriptor *
sba_prep_dma_xor(struct dma_chan *dchan, dma_addr_t dst, dma_addr_t *src,
		 u32 src_cnt, size_t len, unsigned long flags)
{
	size_t req_len;
	dma_addr_t off = 0;
	struct sba_device *sba = to_sba_device(dchan);
	struct sba_request *first = NULL, *req;

	/* Sanity checks */
	if (unlikely(src_cnt > sba->max_xor_srcs))
		return NULL;

	/* Create chained requests where each request is up to hw_buf_size */
	while (len) {
		req_len = (len < sba->hw_buf_size) ? len : sba->hw_buf_size;

		req = sba_prep_dma_xor_req(sba, off, dst, src, src_cnt,
					   req_len, flags);
		if (!req) {
			if (first)
				sba_free_chained_requests(first);
			return NULL;
		}

		if (first)
			sba_chain_request(first, req);
		else
			first = req;

		off += req_len;
		len -= req_len;
	}

	return (first) ? &first->tx : NULL;
}
846 static void sba_fillup_pq_msg(struct sba_request
*req
,
848 struct brcm_sba_command
*cmds
,
849 struct brcm_message
*msg
,
850 dma_addr_t msg_offset
, size_t msg_len
,
851 dma_addr_t
*dst_p
, dma_addr_t
*dst_q
,
852 const u8
*scf
, dma_addr_t
*src
, u32 src_cnt
)
857 struct brcm_sba_command
*cmdsp
= cmds
;
860 /* Type-B command to load old P into buf0 */
862 cmd
= sba_cmd_enc(0x0, SBA_TYPE_B
,
863 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
864 cmd
= sba_cmd_enc(cmd
, msg_len
,
865 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
866 c_mdata
= sba_cmd_load_c_mdata(0);
867 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
868 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
869 cmd
= sba_cmd_enc(cmd
, SBA_CMD_LOAD_BUFFER
,
870 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
872 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
873 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_B
;
874 cmdsp
->data
= *dst_p
+ msg_offset
;
875 cmdsp
->data_len
= msg_len
;
879 /* Type-B command to load old Q into buf1 */
881 cmd
= sba_cmd_enc(0x0, SBA_TYPE_B
,
882 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
883 cmd
= sba_cmd_enc(cmd
, msg_len
,
884 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
885 c_mdata
= sba_cmd_load_c_mdata(1);
886 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
887 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
888 cmd
= sba_cmd_enc(cmd
, SBA_CMD_LOAD_BUFFER
,
889 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
891 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
892 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_B
;
893 cmdsp
->data
= *dst_q
+ msg_offset
;
894 cmdsp
->data_len
= msg_len
;
898 /* Type-A command to zero all buffers */
899 cmd
= sba_cmd_enc(0x0, SBA_TYPE_A
,
900 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
901 cmd
= sba_cmd_enc(cmd
, msg_len
,
902 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
903 cmd
= sba_cmd_enc(cmd
, SBA_CMD_ZERO_ALL_BUFFERS
,
904 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
906 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
907 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_A
;
911 /* Type-B commands for generate P onto buf0 and Q onto buf1 */
912 for (i
= 0; i
< src_cnt
; i
++) {
913 cmd
= sba_cmd_enc(0x0, SBA_TYPE_B
,
914 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
915 cmd
= sba_cmd_enc(cmd
, msg_len
,
916 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
917 c_mdata
= sba_cmd_pq_c_mdata(raid6_gflog
[scf
[i
]], 1, 0);
918 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
919 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
920 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_MS(c_mdata
),
921 SBA_C_MDATA_MS_SHIFT
, SBA_C_MDATA_MS_MASK
);
922 cmd
= sba_cmd_enc(cmd
, SBA_CMD_GALOIS_XOR
,
923 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
925 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
926 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_B
;
927 cmdsp
->data
= src
[i
] + msg_offset
;
928 cmdsp
->data_len
= msg_len
;
932 /* Type-A command to write buf0 */
934 cmd
= sba_cmd_enc(0x0, SBA_TYPE_A
,
935 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
936 cmd
= sba_cmd_enc(cmd
, msg_len
,
937 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
938 cmd
= sba_cmd_enc(cmd
, 0x1,
939 SBA_RESP_SHIFT
, SBA_RESP_MASK
);
940 c_mdata
= sba_cmd_write_c_mdata(0);
941 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
942 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
943 cmd
= sba_cmd_enc(cmd
, SBA_CMD_WRITE_BUFFER
,
944 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
946 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
947 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_A
;
948 if (req
->sba
->hw_resp_size
) {
949 cmdsp
->flags
|= BRCM_SBA_CMD_HAS_RESP
;
950 cmdsp
->resp
= req
->resp_dma
;
951 cmdsp
->resp_len
= req
->sba
->hw_resp_size
;
953 cmdsp
->flags
|= BRCM_SBA_CMD_HAS_OUTPUT
;
954 cmdsp
->data
= *dst_p
+ msg_offset
;
955 cmdsp
->data_len
= msg_len
;
959 /* Type-A command to write buf1 */
961 cmd
= sba_cmd_enc(0x0, SBA_TYPE_A
,
962 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
963 cmd
= sba_cmd_enc(cmd
, msg_len
,
964 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
965 cmd
= sba_cmd_enc(cmd
, 0x1,
966 SBA_RESP_SHIFT
, SBA_RESP_MASK
);
967 c_mdata
= sba_cmd_write_c_mdata(1);
968 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
969 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
970 cmd
= sba_cmd_enc(cmd
, SBA_CMD_WRITE_BUFFER
,
971 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
973 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
974 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_A
;
975 if (req
->sba
->hw_resp_size
) {
976 cmdsp
->flags
|= BRCM_SBA_CMD_HAS_RESP
;
977 cmdsp
->resp
= req
->resp_dma
;
978 cmdsp
->resp_len
= req
->sba
->hw_resp_size
;
980 cmdsp
->flags
|= BRCM_SBA_CMD_HAS_OUTPUT
;
981 cmdsp
->data
= *dst_q
+ msg_offset
;
982 cmdsp
->data_len
= msg_len
;
986 /* Fillup brcm_message */
987 msg
->type
= BRCM_MESSAGE_SBA
;
988 msg
->sba
.cmds
= cmds
;
989 msg
->sba
.cmds_count
= cmdsp
- cmds
;

static struct sba_request *
sba_prep_dma_pq_req(struct sba_device *sba, dma_addr_t off,
		    dma_addr_t *dst_p, dma_addr_t *dst_q, dma_addr_t *src,
		    u32 src_cnt, const u8 *scf, size_t len,
		    unsigned long flags)
{
	struct sba_request *req = NULL;

	/* Alloc new request */
	req = sba_alloc_request(sba);
	if (!req)
		return NULL;
	req->fence = (flags & DMA_PREP_FENCE) ? true : false;

	/* Fillup request messages */
	sba_fillup_pq_msg(req, dmaf_continue(flags),
			  req->cmds, &req->msg,
			  off, len, dst_p, dst_q, scf, src, src_cnt);

	/* Init async_tx descriptor */
	req->tx.flags = flags;
	req->tx.cookie = -EBUSY;

	return req;
}
1019 static void sba_fillup_pq_single_msg(struct sba_request
*req
,
1021 struct brcm_sba_command
*cmds
,
1022 struct brcm_message
*msg
,
1023 dma_addr_t msg_offset
, size_t msg_len
,
1024 dma_addr_t
*dst_p
, dma_addr_t
*dst_q
,
1025 dma_addr_t src
, u8 scf
)
1029 u8 pos
, dpos
= raid6_gflog
[scf
];
1030 struct brcm_sba_command
*cmdsp
= cmds
;
1036 /* Type-B command to load old P into buf0 */
1037 cmd
= sba_cmd_enc(0x0, SBA_TYPE_B
,
1038 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
1039 cmd
= sba_cmd_enc(cmd
, msg_len
,
1040 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
1041 c_mdata
= sba_cmd_load_c_mdata(0);
1042 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
1043 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
1044 cmd
= sba_cmd_enc(cmd
, SBA_CMD_LOAD_BUFFER
,
1045 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
1047 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
1048 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_B
;
1049 cmdsp
->data
= *dst_p
+ msg_offset
;
1050 cmdsp
->data_len
= msg_len
;
1054 * Type-B commands to xor data with buf0 and put it
1057 cmd
= sba_cmd_enc(0x0, SBA_TYPE_B
,
1058 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
1059 cmd
= sba_cmd_enc(cmd
, msg_len
,
1060 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
1061 c_mdata
= sba_cmd_xor_c_mdata(0, 0);
1062 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
1063 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
1064 cmd
= sba_cmd_enc(cmd
, SBA_CMD_XOR
,
1065 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
1067 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
1068 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_B
;
1069 cmdsp
->data
= src
+ msg_offset
;
1070 cmdsp
->data_len
= msg_len
;
1073 /* Type-B command to load old P into buf0 */
1074 cmd
= sba_cmd_enc(0x0, SBA_TYPE_B
,
1075 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
1076 cmd
= sba_cmd_enc(cmd
, msg_len
,
1077 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
1078 c_mdata
= sba_cmd_load_c_mdata(0);
1079 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
1080 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
1081 cmd
= sba_cmd_enc(cmd
, SBA_CMD_LOAD_BUFFER
,
1082 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
1084 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
1085 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_B
;
1086 cmdsp
->data
= src
+ msg_offset
;
1087 cmdsp
->data_len
= msg_len
;
1091 /* Type-A command to write buf0 */
1092 cmd
= sba_cmd_enc(0x0, SBA_TYPE_A
,
1093 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
1094 cmd
= sba_cmd_enc(cmd
, msg_len
,
1095 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
1096 cmd
= sba_cmd_enc(cmd
, 0x1,
1097 SBA_RESP_SHIFT
, SBA_RESP_MASK
);
1098 c_mdata
= sba_cmd_write_c_mdata(0);
1099 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
1100 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
1101 cmd
= sba_cmd_enc(cmd
, SBA_CMD_WRITE_BUFFER
,
1102 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
1104 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
1105 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_A
;
1106 if (req
->sba
->hw_resp_size
) {
1107 cmdsp
->flags
|= BRCM_SBA_CMD_HAS_RESP
;
1108 cmdsp
->resp
= req
->resp_dma
;
1109 cmdsp
->resp_len
= req
->sba
->hw_resp_size
;
1111 cmdsp
->flags
|= BRCM_SBA_CMD_HAS_OUTPUT
;
1112 cmdsp
->data
= *dst_p
+ msg_offset
;
1113 cmdsp
->data_len
= msg_len
;
1120 /* Type-A command to zero all buffers */
1121 cmd
= sba_cmd_enc(0x0, SBA_TYPE_A
,
1122 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
1123 cmd
= sba_cmd_enc(cmd
, msg_len
,
1124 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
1125 cmd
= sba_cmd_enc(cmd
, SBA_CMD_ZERO_ALL_BUFFERS
,
1126 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
1128 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
1129 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_A
;
1133 goto skip_q_computation
;
1134 pos
= (dpos
< req
->sba
->max_pq_coefs
) ?
1135 dpos
: (req
->sba
->max_pq_coefs
- 1);
1138 * Type-B command to generate initial Q from data
1139 * and store output into buf0
1141 cmd
= sba_cmd_enc(0x0, SBA_TYPE_B
,
1142 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
1143 cmd
= sba_cmd_enc(cmd
, msg_len
,
1144 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
1145 c_mdata
= sba_cmd_pq_c_mdata(pos
, 0, 0);
1146 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
1147 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
1148 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_MS(c_mdata
),
1149 SBA_C_MDATA_MS_SHIFT
, SBA_C_MDATA_MS_MASK
);
1150 cmd
= sba_cmd_enc(cmd
, SBA_CMD_GALOIS
,
1151 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
1153 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
1154 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_B
;
1155 cmdsp
->data
= src
+ msg_offset
;
1156 cmdsp
->data_len
= msg_len
;
1161 /* Multiple Type-A command to generate final Q */
1163 pos
= (dpos
< req
->sba
->max_pq_coefs
) ?
1164 dpos
: (req
->sba
->max_pq_coefs
- 1);
1167 * Type-A command to generate Q with buf0 and
1168 * buf1 store result in buf0
1170 cmd
= sba_cmd_enc(0x0, SBA_TYPE_A
,
1171 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
1172 cmd
= sba_cmd_enc(cmd
, msg_len
,
1173 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
1174 c_mdata
= sba_cmd_pq_c_mdata(pos
, 0, 1);
1175 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
1176 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
1177 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_MS(c_mdata
),
1178 SBA_C_MDATA_MS_SHIFT
, SBA_C_MDATA_MS_MASK
);
1179 cmd
= sba_cmd_enc(cmd
, SBA_CMD_GALOIS
,
1180 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
1182 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
1183 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_A
;
1192 * Type-B command to XOR previous output with
1193 * buf0 and write it into buf0
1195 cmd
= sba_cmd_enc(0x0, SBA_TYPE_B
,
1196 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
1197 cmd
= sba_cmd_enc(cmd
, msg_len
,
1198 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
1199 c_mdata
= sba_cmd_xor_c_mdata(0, 0);
1200 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
1201 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
1202 cmd
= sba_cmd_enc(cmd
, SBA_CMD_XOR
,
1203 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
1205 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
1206 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_B
;
1207 cmdsp
->data
= *dst_q
+ msg_offset
;
1208 cmdsp
->data_len
= msg_len
;
1212 /* Type-A command to write buf0 */
1213 cmd
= sba_cmd_enc(0x0, SBA_TYPE_A
,
1214 SBA_TYPE_SHIFT
, SBA_TYPE_MASK
);
1215 cmd
= sba_cmd_enc(cmd
, msg_len
,
1216 SBA_USER_DEF_SHIFT
, SBA_USER_DEF_MASK
);
1217 cmd
= sba_cmd_enc(cmd
, 0x1,
1218 SBA_RESP_SHIFT
, SBA_RESP_MASK
);
1219 c_mdata
= sba_cmd_write_c_mdata(0);
1220 cmd
= sba_cmd_enc(cmd
, SBA_C_MDATA_LS(c_mdata
),
1221 SBA_C_MDATA_SHIFT
, SBA_C_MDATA_MASK
);
1222 cmd
= sba_cmd_enc(cmd
, SBA_CMD_WRITE_BUFFER
,
1223 SBA_CMD_SHIFT
, SBA_CMD_MASK
);
1225 *cmdsp
->cmd_dma
= cpu_to_le64(cmd
);
1226 cmdsp
->flags
= BRCM_SBA_CMD_TYPE_A
;
1227 if (req
->sba
->hw_resp_size
) {
1228 cmdsp
->flags
|= BRCM_SBA_CMD_HAS_RESP
;
1229 cmdsp
->resp
= req
->resp_dma
;
1230 cmdsp
->resp_len
= req
->sba
->hw_resp_size
;
1232 cmdsp
->flags
|= BRCM_SBA_CMD_HAS_OUTPUT
;
1233 cmdsp
->data
= *dst_q
+ msg_offset
;
1234 cmdsp
->data_len
= msg_len
;
1238 /* Fillup brcm_message */
1239 msg
->type
= BRCM_MESSAGE_SBA
;
1240 msg
->sba
.cmds
= cmds
;
1241 msg
->sba
.cmds_count
= cmdsp
- cmds
;

static struct sba_request *
sba_prep_dma_pq_single_req(struct sba_device *sba, dma_addr_t off,
			   dma_addr_t *dst_p, dma_addr_t *dst_q,
			   dma_addr_t src, u8 scf, size_t len,
			   unsigned long flags)
{
	struct sba_request *req = NULL;

	/* Alloc new request */
	req = sba_alloc_request(sba);
	if (!req)
		return NULL;
	req->fence = (flags & DMA_PREP_FENCE) ? true : false;

	/* Fillup request messages */
	sba_fillup_pq_single_msg(req, dmaf_continue(flags),
				 req->cmds, &req->msg, off, len,
				 dst_p, dst_q, src, scf);

	/* Init async_tx descriptor */
	req->tx.flags = flags;
	req->tx.cookie = -EBUSY;

	return req;
}

static struct dma_async_tx_descriptor *
sba_prep_dma_pq(struct dma_chan *dchan, dma_addr_t *dst, dma_addr_t *src,
		u32 src_cnt, const u8 *scf, size_t len, unsigned long flags)
{
	u32 i, dst_q_index;
	size_t req_len;
	bool slow = false;
	dma_addr_t off = 0;
	dma_addr_t *dst_p = NULL, *dst_q = NULL;
	struct sba_device *sba = to_sba_device(dchan);
	struct sba_request *first = NULL, *req;

	/* Sanity checks */
	if (unlikely(src_cnt > sba->max_pq_srcs))
		return NULL;
	for (i = 0; i < src_cnt; i++)
		if (sba->max_pq_coefs <= raid6_gflog[scf[i]])
			slow = true;

	/* Figure-out P and Q destination addresses */
	if (!(flags & DMA_PREP_PQ_DISABLE_P))
		dst_p = &dst[0];
	if (!(flags & DMA_PREP_PQ_DISABLE_Q))
		dst_q = &dst[1];

	/* Create chained requests where each request is up to hw_buf_size */
	while (len) {
		req_len = (len < sba->hw_buf_size) ? len : sba->hw_buf_size;

		if (slow) {
			dst_q_index = src_cnt;

			if (dst_q) {
				for (i = 0; i < src_cnt; i++) {
					if (*dst_q == src[i]) {
						dst_q_index = i;
						break;
					}
				}
			}

			if (dst_q_index < src_cnt) {
				i = dst_q_index;
				req = sba_prep_dma_pq_single_req(sba,
					off, dst_p, dst_q, src[i], scf[i],
					req_len, flags | DMA_PREP_FENCE);
				if (!req)
					goto fail;

				if (first)
					sba_chain_request(first, req);
				else
					first = req;

				flags |= DMA_PREP_CONTINUE;
			}

			for (i = 0; i < src_cnt; i++) {
				if (dst_q_index == i)
					continue;

				req = sba_prep_dma_pq_single_req(sba,
					off, dst_p, dst_q, src[i], scf[i],
					req_len, flags | DMA_PREP_FENCE);
				if (!req)
					goto fail;

				if (first)
					sba_chain_request(first, req);
				else
					first = req;

				flags |= DMA_PREP_CONTINUE;
			}
		} else {
			req = sba_prep_dma_pq_req(sba, off,
						  dst_p, dst_q, src, src_cnt,
						  scf, req_len, flags);
			if (!req)
				goto fail;

			if (first)
				sba_chain_request(first, req);
			else
				first = req;
		}

		off += req_len;
		len -= req_len;
	}

	return (first) ? &first->tx : NULL;

fail:
	if (first)
		sba_free_chained_requests(first);
	return NULL;
}
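
/*
 * Note on the PQ "slow" path above (informational): the GALOIS commands
 * take the discrete log of a RAID6 coefficient (raid6_gflog[]), and that
 * log must stay below max_pq_coefs (6 for SBA_VER_1, 30 for SBA_VER_2).
 * For example raid6_gflog[4] = 2 fits either version, while a coefficient
 * whose log is 29 fits only SBA_VER_2. Any source whose coefficient log
 * is out of range forces the per-source sba_prep_dma_pq_single_req()
 * chain instead of a single combined sba_prep_dma_pq_req().
 */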

/* ====== Mailbox callbacks ===== */

static void sba_dma_tx_actions(struct sba_request *req)
{
	struct dma_async_tx_descriptor *tx = &req->tx;

	WARN_ON(tx->cookie < 0);

	if (tx->cookie > 0) {
		dma_cookie_complete(tx);

		/*
		 * Call the callback (must not sleep or submit new
		 * operations to this channel)
		 */
		if (tx->callback)
			tx->callback(tx->callback_param);

		dma_descriptor_unmap(tx);
	}

	/* Run dependent operations */
	dma_run_dependencies(tx);

	/* If waiting for 'ack' then move to completed list */
	if (!async_tx_test_ack(&req->tx))
		sba_complete_chained_requests(req);
	else
		sba_free_chained_requests(req);
}

static void sba_receive_message(struct mbox_client *cl, void *msg)
{
	unsigned long flags;
	struct brcm_message *m = msg;
	struct sba_request *req = m->ctx, *req1;
	struct sba_device *sba = req->sba;

	/* Report error if the received message carries one */
	if (m->error < 0)
		dev_err(sba->dev, "%s got message with error %d",
			dma_chan_name(&sba->dma_chan), m->error);

	/* Mark request as received */
	sba_received_request(req);

	/* Wait for all chained requests to be completed */
	if (atomic_dec_return(&req->first->next_pending_count))
		goto done;

	/* Point to first request */
	req = req->first;

	/* Update request */
	if (req->state == SBA_REQUEST_STATE_RECEIVED)
		sba_dma_tx_actions(req);
	else
		sba_free_chained_requests(req);

	spin_lock_irqsave(&sba->reqs_lock, flags);

	/* Re-check all completed requests waiting for 'ack' */
	list_for_each_entry_safe(req, req1, &sba->reqs_completed_list, node) {
		spin_unlock_irqrestore(&sba->reqs_lock, flags);
		sba_dma_tx_actions(req);
		spin_lock_irqsave(&sba->reqs_lock, flags);
	}

	spin_unlock_irqrestore(&sba->reqs_lock, flags);

done:
	/* Try to submit pending requests */
	sba_issue_pending(&sba->dma_chan);
}
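
/*
 * Completion flow summary (descriptive, matching the code above): every
 * per-mailbox-channel reply decrements next_pending_count of the first
 * request in the chain. Only when the whole chain has been received does
 * sba_dma_tx_actions() complete the cookie, run the client callback and
 * dependent operations, and either park the chain on the completed list
 * (waiting for 'ack') or return it to the free list. Finally the pending
 * list is re-scanned so that newly submitted requests get issued.
 */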

/* ====== Platform driver routines ===== */

static int sba_prealloc_channel_resources(struct sba_device *sba)
{
	int i, j, p, ret = 0;
	struct sba_request *req = NULL;

	sba->resp_base = dma_alloc_coherent(sba->dma_dev.dev,
					    sba->max_resp_pool_size,
					    &sba->resp_dma_base, GFP_KERNEL);
	if (!sba->resp_base)
		return -ENOMEM;

	sba->cmds_base = dma_alloc_coherent(sba->dma_dev.dev,
					    sba->max_cmds_pool_size,
					    &sba->cmds_dma_base, GFP_KERNEL);
	if (!sba->cmds_base) {
		ret = -ENOMEM;
		goto fail_free_resp_pool;
	}

	spin_lock_init(&sba->reqs_lock);
	sba->reqs_fence = false;
	INIT_LIST_HEAD(&sba->reqs_alloc_list);
	INIT_LIST_HEAD(&sba->reqs_pending_list);
	INIT_LIST_HEAD(&sba->reqs_active_list);
	INIT_LIST_HEAD(&sba->reqs_received_list);
	INIT_LIST_HEAD(&sba->reqs_completed_list);
	INIT_LIST_HEAD(&sba->reqs_aborted_list);
	INIT_LIST_HEAD(&sba->reqs_free_list);

	sba->reqs = devm_kcalloc(sba->dev, sba->max_req,
				 sizeof(*req), GFP_KERNEL);
	if (!sba->reqs) {
		ret = -ENOMEM;
		goto fail_free_cmds_pool;
	}

	for (i = 0, p = 0; i < sba->max_req; i++) {
		req = &sba->reqs[i];
		INIT_LIST_HEAD(&req->node);
		req->sba = sba;
		req->state = SBA_REQUEST_STATE_FREE;
		INIT_LIST_HEAD(&req->next);
		req->next_count = 1;
		atomic_set(&req->next_pending_count, 0);
		req->fence = false;
		req->resp = sba->resp_base + p;
		req->resp_dma = sba->resp_dma_base + p;
		p += sba->hw_resp_size;
		req->cmds = devm_kcalloc(sba->dev, sba->max_cmd_per_req,
					 sizeof(*req->cmds), GFP_KERNEL);
		if (!req->cmds) {
			ret = -ENOMEM;
			goto fail_free_cmds_pool;
		}
		for (j = 0; j < sba->max_cmd_per_req; j++) {
			req->cmds[j].cmd = 0;
			req->cmds[j].cmd_dma = sba->cmds_base +
				(i * sba->max_cmd_per_req + j) * sizeof(u64);
			req->cmds[j].cmd_dma_addr = sba->cmds_dma_base +
				(i * sba->max_cmd_per_req + j) * sizeof(u64);
			req->cmds[j].flags = 0;
		}
		memset(&req->msg, 0, sizeof(req->msg));
		dma_async_tx_descriptor_init(&req->tx, &sba->dma_chan);
		req->tx.tx_submit = sba_tx_submit;
		req->tx.phys = req->resp_dma;
		list_add_tail(&req->node, &sba->reqs_free_list);
	}

	sba->reqs_free_count = sba->max_req;

	return 0;

fail_free_cmds_pool:
	dma_free_coherent(sba->dma_dev.dev,
			  sba->max_cmds_pool_size,
			  sba->cmds_base, sba->cmds_dma_base);
fail_free_resp_pool:
	dma_free_coherent(sba->dma_dev.dev,
			  sba->max_resp_pool_size,
			  sba->resp_base, sba->resp_dma_base);
	return ret;
}

static void sba_freeup_channel_resources(struct sba_device *sba)
{
	dmaengine_terminate_all(&sba->dma_chan);
	dma_free_coherent(sba->dma_dev.dev, sba->max_cmds_pool_size,
			  sba->cmds_base, sba->cmds_dma_base);
	dma_free_coherent(sba->dma_dev.dev, sba->max_resp_pool_size,
			  sba->resp_base, sba->resp_dma_base);
	sba->resp_base = NULL;
	sba->resp_dma_base = 0;
}

static int sba_async_register(struct sba_device *sba)
{
	int ret;
	struct dma_device *dma_dev = &sba->dma_dev;

	/* Initialize DMA channel cookie */
	sba->dma_chan.device = dma_dev;
	dma_cookie_init(&sba->dma_chan);

	/* Initialize DMA device capability mask */
	dma_cap_zero(dma_dev->cap_mask);
	dma_cap_set(DMA_INTERRUPT, dma_dev->cap_mask);
	dma_cap_set(DMA_MEMCPY, dma_dev->cap_mask);
	dma_cap_set(DMA_XOR, dma_dev->cap_mask);
	dma_cap_set(DMA_PQ, dma_dev->cap_mask);

	/*
	 * Set mailbox channel device as the base device of
	 * our dma_device because the actual memory accesses
	 * will be done by mailbox controller
	 */
	dma_dev->dev = sba->mbox_dev;

	/* Set base prep routines */
	dma_dev->device_free_chan_resources = sba_free_chan_resources;
	dma_dev->device_terminate_all = sba_device_terminate_all;
	dma_dev->device_issue_pending = sba_issue_pending;
	dma_dev->device_tx_status = sba_tx_status;

	/* Set interrupt routine */
	if (dma_has_cap(DMA_INTERRUPT, dma_dev->cap_mask))
		dma_dev->device_prep_dma_interrupt = sba_prep_dma_interrupt;

	/* Set memcpy routine */
	if (dma_has_cap(DMA_MEMCPY, dma_dev->cap_mask))
		dma_dev->device_prep_dma_memcpy = sba_prep_dma_memcpy;

	/* Set xor routine and capability */
	if (dma_has_cap(DMA_XOR, dma_dev->cap_mask)) {
		dma_dev->device_prep_dma_xor = sba_prep_dma_xor;
		dma_dev->max_xor = sba->max_xor_srcs;
	}

	/* Set pq routine and capability */
	if (dma_has_cap(DMA_PQ, dma_dev->cap_mask)) {
		dma_dev->device_prep_dma_pq = sba_prep_dma_pq;
		dma_set_maxpq(dma_dev, sba->max_pq_srcs, 0);
	}

	/* Initialize DMA device channel list */
	INIT_LIST_HEAD(&dma_dev->channels);
	list_add_tail(&sba->dma_chan.device_node, &dma_dev->channels);

	/* Register with Linux async DMA framework */
	ret = dma_async_device_register(dma_dev);
	if (ret) {
		dev_err(sba->dev, "async device register error %d", ret);
		return ret;
	}

	dev_info(sba->dev, "%s capabilities: %s%s%s%s\n",
		 dma_chan_name(&sba->dma_chan),
		 dma_has_cap(DMA_INTERRUPT, dma_dev->cap_mask) ? "interrupt " : "",
		 dma_has_cap(DMA_MEMCPY, dma_dev->cap_mask) ? "memcpy " : "",
		 dma_has_cap(DMA_XOR, dma_dev->cap_mask) ? "xor " : "",
		 dma_has_cap(DMA_PQ, dma_dev->cap_mask) ? "pq " : "");

	return 0;
}

static int sba_probe(struct platform_device *pdev)
{
	int i, ret = 0, mchans_count;
	struct sba_device *sba;
	struct platform_device *mbox_pdev;
	struct of_phandle_args args;

	/* Allocate main SBA struct */
	sba = devm_kzalloc(&pdev->dev, sizeof(*sba), GFP_KERNEL);
	if (!sba)
		return -ENOMEM;

	sba->dev = &pdev->dev;
	platform_set_drvdata(pdev, sba);

	/* Determine SBA version from DT compatible string */
	if (of_device_is_compatible(sba->dev->of_node, "brcm,iproc-sba"))
		sba->ver = SBA_VER_1;
	else if (of_device_is_compatible(sba->dev->of_node,
					 "brcm,iproc-sba-v2"))
		sba->ver = SBA_VER_2;
	else
		return -ENODEV;

	/* Derived configuration parameters */
	switch (sba->ver) {
	case SBA_VER_1:
		sba->max_req = 1024;
		sba->hw_buf_size = 4096;
		sba->hw_resp_size = 8;
		sba->max_pq_coefs = 6;
		sba->max_pq_srcs = 6;
		break;
	case SBA_VER_2:
		sba->max_req = 1024;
		sba->hw_buf_size = 4096;
		sba->hw_resp_size = 8;
		sba->max_pq_coefs = 30;
		/*
		 * We can support max_pq_srcs == max_pq_coefs because
		 * we are limited by number of SBA commands that we can
		 * fit in one message for underlying ring manager HW.
		 */
		sba->max_pq_srcs = 12;
		break;
	default:
		return -EINVAL;
	}
	sba->max_cmd_per_req = sba->max_pq_srcs + 3;
	sba->max_xor_srcs = sba->max_cmd_per_req - 1;
	sba->max_resp_pool_size = sba->max_req * sba->hw_resp_size;
	sba->max_cmds_pool_size = sba->max_req *
				  sba->max_cmd_per_req * sizeof(u64);

	/* Setup mailbox client */
	sba->client.dev			= &pdev->dev;
	sba->client.rx_callback		= sba_receive_message;
	sba->client.tx_block		= false;
	sba->client.knows_txdone	= false;
	sba->client.tx_tout		= 0;

	/* Number of channels equals number of mailbox channels */
	ret = of_count_phandle_with_args(pdev->dev.of_node,
					 "mboxes", "#mbox-cells");
	if (ret <= 0)
		return -ENODEV;
	mchans_count = ret;
	sba->mchans_count = 0;
	atomic_set(&sba->mchans_current, 0);

	/* Allocate mailbox channel array */
	sba->mchans = devm_kcalloc(&pdev->dev, mchans_count,
				   sizeof(*sba->mchans), GFP_KERNEL);
	if (!sba->mchans)
		return -ENOMEM;

	/* Request mailbox channels */
	for (i = 0; i < mchans_count; i++) {
		sba->mchans[i] = mbox_request_channel(&sba->client, i);
		if (IS_ERR(sba->mchans[i])) {
			ret = PTR_ERR(sba->mchans[i]);
			goto fail_free_mchans;
		}
		sba->mchans_count++;
	}

	/* Find-out underlying mailbox device */
	ret = of_parse_phandle_with_args(pdev->dev.of_node,
					 "mboxes", "#mbox-cells", 0, &args);
	if (ret)
		goto fail_free_mchans;
	mbox_pdev = of_find_device_by_node(args.np);
	of_node_put(args.np);
	if (!mbox_pdev) {
		ret = -ENODEV;
		goto fail_free_mchans;
	}
	sba->mbox_dev = &mbox_pdev->dev;

	/* All mailbox channels should be of same ring manager device */
	for (i = 1; i < mchans_count; i++) {
		ret = of_parse_phandle_with_args(pdev->dev.of_node,
						 "mboxes", "#mbox-cells",
						 i, &args);
		if (ret)
			goto fail_free_mchans;
		mbox_pdev = of_find_device_by_node(args.np);
		of_node_put(args.np);
		if (sba->mbox_dev != &mbox_pdev->dev) {
			ret = -EINVAL;
			goto fail_free_mchans;
		}
	}

	/* Register DMA device with linux async framework */
	ret = sba_async_register(sba);
	if (ret)
		goto fail_free_mchans;

	/* Prealloc channel resource */
	ret = sba_prealloc_channel_resources(sba);
	if (ret)
		goto fail_async_dev_unreg;

	/* Print device info */
	dev_info(sba->dev, "%s using SBAv%d and %d mailbox channels",
		 dma_chan_name(&sba->dma_chan), sba->ver + 1,
		 sba->mchans_count);

	return 0;

fail_async_dev_unreg:
	dma_async_device_unregister(&sba->dma_dev);
fail_free_mchans:
	for (i = 0; i < sba->mchans_count; i++)
		mbox_free_channel(sba->mchans[i]);
	return ret;
}

static int sba_remove(struct platform_device *pdev)
{
	int i;
	struct sba_device *sba = platform_get_drvdata(pdev);

	sba_freeup_channel_resources(sba);

	dma_async_device_unregister(&sba->dma_dev);

	for (i = 0; i < sba->mchans_count; i++)
		mbox_free_channel(sba->mchans[i]);

	return 0;
}

static const struct of_device_id sba_of_match[] = {
	{ .compatible = "brcm,iproc-sba", },
	{ .compatible = "brcm,iproc-sba-v2", },
	{ /* sentinel */ },
};
MODULE_DEVICE_TABLE(of, sba_of_match);

static struct platform_driver sba_driver = {
	.probe = sba_probe,
	.remove = sba_remove,
	.driver = {
		.name = "bcm-sba-raid",
		.of_match_table = sba_of_match,
	},
};
module_platform_driver(sba_driver);

MODULE_DESCRIPTION("Broadcom SBA RAID driver");
MODULE_AUTHOR("Anup Patel <anup.patel@broadcom.com>");
MODULE_LICENSE("GPL v2");