/*
 * Copyright (C) Ericsson AB 2007-2008
 * Copyright (C) ST-Ericsson SA 2008-2010
 * Author: Per Forlin <per.forlin@stericsson.com> for ST-Ericsson
 * Author: Jonas Aaberg <jonas.aberg@stericsson.com> for ST-Ericsson
 * License terms: GNU General Public License (GPL) version 2
 */
#include <linux/kernel.h>
#include <linux/slab.h>
#include <linux/dmaengine.h>
#include <linux/platform_device.h>
#include <linux/clk.h>
#include <linux/delay.h>
#include <linux/err.h>

#include <plat/ste_dma40.h>

#include "ste_dma40_ll.h"
#define D40_NAME "dma40"

#define D40_PHY_CHAN -1

/* For masking out/in 2 bit channel positions */
#define D40_CHAN_POS(chan)	(2 * (chan / 2))
#define D40_CHAN_POS_MASK(chan)	(0x3 << D40_CHAN_POS(chan))
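
/*
 * Worked example (illustrative, not part of the original code): two
 * adjacent channels share one configuration register, so channel 5 gets
 * D40_CHAN_POS(5) = 2 * (5 / 2) = 4 and
 * D40_CHAN_POS_MASK(5) = 0x3 << 4 = 0x30, i.e. its 2-bit command/status
 * field occupies bits [5:4] of the shared register.
 */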
/* Maximum iterations taken before giving up suspending a channel */
#define D40_SUSPEND_MAX_IT 500

/* Hardware requirement on LCLA alignment */
#define LCLA_ALIGNMENT 0x40000

/* Max number of links per event group */
#define D40_LCLA_LINK_PER_EVENT_GRP 128
#define D40_LCLA_END D40_LCLA_LINK_PER_EVENT_GRP
/* Attempts before giving up on getting pages that are aligned */
#define MAX_LCLA_ALLOC_ATTEMPTS 256
/* Bit markings for allocation map */
#define D40_ALLOC_FREE		(1 << 31)
#define D40_ALLOC_PHY		(1 << 30)
#define D40_ALLOC_LOG_FREE	0
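
/*
 * Illustrative encoding (an assumption drawn from how d40_alloc_mask_set()
 * below uses these defines): a half channel carrying logical event lines
 * 3 and 7 holds (1 << 3) | (1 << 7) in its allocated_src or allocated_dst
 * field, a completely free half holds D40_ALLOC_FREE, and a physically
 * allocated half holds D40_ALLOC_PHY.
 */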
/* Hardware designer of the block */
#define D40_HW_DESIGNER 0x8
/*
 * enum d40_command - The different commands and/or statuses.
 *
 * @D40_DMA_STOP: DMA channel command STOP or status STOPPED,
 * @D40_DMA_RUN: The DMA channel is RUNNING or the command RUN.
 * @D40_DMA_SUSPEND_REQ: Request the DMA to SUSPEND as soon as possible.
 * @D40_DMA_SUSPENDED: The DMA channel is SUSPENDED.
 */
enum d40_command {
	D40_DMA_STOP		= 0,
	D40_DMA_RUN		= 1,
	D40_DMA_SUSPEND_REQ	= 2,
	D40_DMA_SUSPENDED	= 3
};
/*
 * struct d40_lli_pool - Structure for keeping LLIs in memory
 *
 * @base: Pointer to memory area when the pre_alloc_lli's are not large
 * enough, i.e. bigger than the most common case, 1 dst and 1 src. NULL if
 * pre_alloc_lli is used.
 * @size: The size in bytes of the memory at base or the size of pre_alloc_lli.
 * @pre_alloc_lli: Pre allocated area for the most common case of transfers,
 * one buffer to one buffer.
 */
struct d40_lli_pool {
	void	*base;
	int	 size;
	/* Space for dst and src, plus an extra for padding */
	u8	 pre_alloc_lli[3 * sizeof(struct d40_phy_lli)];
};
/*
 * struct d40_desc - A descriptor is one DMA job.
 *
 * @lli_phy: LLI settings for physical channel. Both src and dst
 * point into the lli_pool, to base if lli_len > 1 or to pre_alloc_lli if
 * lli_len equals one.
 * @lli_log: Same as above but for logical channels.
 * @lli_pool: The pool with two entries pre-allocated.
 * @lli_len: Number of llis of current descriptor.
 * @lli_current: Number of transferred llis.
 * @lcla_alloc: Number of LCLA entries allocated.
 * @txd: DMA engine struct. Used, among other things, for communication
 * during a transfer.
 * @node: List entry.
 * @is_in_client_list: true if the client owns this descriptor.
 *
 * This descriptor is used for both logical and physical transfers.
 */
struct d40_desc {
	struct d40_phy_lli_bidir	 lli_phy;
	struct d40_log_lli_bidir	 lli_log;

	struct d40_lli_pool		 lli_pool;
	int				 lli_len;
	int				 lli_current;
	int				 lcla_alloc;

	struct dma_async_tx_descriptor	 txd;
	struct list_head		 node;

	bool				 is_in_client_list;
};
/*
 * struct d40_lcla_pool - LCLA pool settings and data.
 *
 * @base: The virtual address of LCLA. 18 bit aligned.
 * @base_unaligned: The original kmalloc pointer, if kmalloc is used.
 * This pointer is only there for clean-up on error.
 * @pages: The number of pages needed for all physical channels.
 * Only used later for clean-up on error.
 * @lock: Lock to protect the content in this struct.
 * @alloc_map: map of which LCLA entry is owned by which job.
 */
struct d40_lcla_pool {
	void		 *base;
	void		 *base_unaligned;
	int		  pages;
	spinlock_t	  lock;
	struct d40_desc	**alloc_map;
};
/*
 * struct d40_phy_res - struct for handling eventlines mapped to physical
 * channels
 *
 * @lock: A lock protecting this entity.
 * @num: The physical channel number of this entity.
 * @allocated_src: Bit mapped to show which src event lines are mapped to
 * this physical channel. Can also be free or physically allocated.
 * @allocated_dst: Same as for src but is dst.
 * allocated_dst and allocated_src use the D40_ALLOC* defines as well as
 * event line number.
 */
struct d40_phy_res {
	spinlock_t lock;
	int	   num;
	u32	   allocated_src;
	u32	   allocated_dst;
};
/*
 * struct d40_chan - Struct that describes a channel.
 *
 * @lock: A spinlock to protect this struct.
 * @log_num: The logical number, if any of this channel.
 * @completed: Starts with 1, after first interrupt it is set to dma engine's
 * current cookie.
 * @pending_tx: The number of pending transfers. Used between interrupt handler
 * and tasklet.
 * @busy: Set to true when transfer is ongoing on this channel.
 * @phy_chan: Pointer to physical channel which this instance runs on. If this
 * pointer is NULL, then the channel is not allocated.
 * @chan: DMA engine handle.
 * @tasklet: Tasklet that gets scheduled from interrupt context to complete a
 * transfer and call client callback.
 * @client: Client owned descriptor list.
 * @active: Active descriptor.
 * @queue: Queued jobs.
 * @dma_cfg: The client configuration of this dma channel.
 * @configured: whether the dma_cfg configuration is valid
 * @base: Pointer to the device instance struct.
 * @src_def_cfg: Default cfg register setting for src.
 * @dst_def_cfg: Default cfg register setting for dst.
 * @log_def: Default logical channel settings.
 * @lcla: Space for one dst src pair for logical channel transfers.
 * @lcpa: Pointer to dst and src lcpa settings.
 *
 * This struct can either "be" a logical or a physical channel.
 */
struct d40_chan {
	spinlock_t			 lock;
	int				 log_num;
	/* ID of the most recent completed transfer */
	int				 completed;
	int				 pending_tx;
	bool				 busy;
	struct d40_phy_res		*phy_chan;
	struct dma_chan			 chan;
	struct tasklet_struct		 tasklet;
	struct list_head		 client;
	struct list_head		 active;
	struct list_head		 queue;
	struct stedma40_chan_cfg	 dma_cfg;
	bool				 configured;
	struct d40_base			*base;
	/* Default register configurations */
	u32				 src_def_cfg;
	u32				 dst_def_cfg;
	struct d40_def_lcsp		 log_def;
	struct d40_log_lli_full		*lcpa;
	/* Runtime reconfiguration */
	dma_addr_t			runtime_addr;
	enum dma_data_direction		runtime_direction;
};
/*
 * struct d40_base - The big global struct, one for each probe'd instance.
 *
 * @interrupt_lock: Lock used to make sure one interrupt is handled at a time.
 * @execmd_lock: Lock for execute command usage since several channels share
 * the same physical register.
 * @dev: The device structure.
 * @virtbase: The virtual base address of the DMA's register.
 * @rev: silicon revision detected.
 * @clk: Pointer to the DMA clock structure.
 * @phy_start: Physical memory start of the DMA registers.
 * @phy_size: Size of the DMA register map.
 * @irq: The IRQ number.
 * @num_phy_chans: The number of physical channels. Read from HW. This
 * is the number of available channels for this driver, not counting "Secure
 * mode" allocated physical channels.
 * @num_log_chans: The number of logical channels. Calculated from
 * num_phy_chans.
 * @dma_both: dma_device channels that can do both memcpy and slave transfers.
 * @dma_slave: dma_device channels that can only do slave transfers.
 * @dma_memcpy: dma_device channels that can only do memcpy transfers.
 * @log_chans: Room for all possible logical channels in system.
 * @lookup_log_chans: Used to map interrupt number to logical channel. Points
 * to log_chans entries.
 * @lookup_phy_chans: Used to map interrupt number to physical channel. Points
 * to phy_chans entries.
 * @plat_data: Pointer to provided platform_data which is the driver
 * configuration.
 * @phy_res: Vector containing all physical channels.
 * @lcla_pool: lcla pool settings and data.
 * @lcpa_base: The virtual mapped address of LCPA.
 * @phy_lcpa: The physical address of the LCPA.
 * @lcpa_size: The size of the LCPA area.
 * @desc_slab: cache for descriptors.
 */
struct d40_base {
	spinlock_t			  interrupt_lock;
	spinlock_t			  execmd_lock;
	struct device			 *dev;
	void __iomem			 *virtbase;
	u8				  rev;
	struct clk			 *clk;
	phys_addr_t			  phy_start;
	resource_size_t			  phy_size;
	int				  irq;
	int				  num_phy_chans;
	int				  num_log_chans;
	struct dma_device		  dma_both;
	struct dma_device		  dma_slave;
	struct dma_device		  dma_memcpy;
	struct d40_chan			 *phy_chans;
	struct d40_chan			 *log_chans;
	struct d40_chan			**lookup_log_chans;
	struct d40_chan			**lookup_phy_chans;
	struct stedma40_platform_data	 *plat_data;
	/* Physical half channels */
	struct d40_phy_res		 *phy_res;
	struct d40_lcla_pool		  lcla_pool;
	void				 *lcpa_base;
	dma_addr_t			  phy_lcpa;
	resource_size_t			  lcpa_size;
	struct kmem_cache		 *desc_slab;
};
/*
 * struct d40_interrupt_lookup - lookup table for interrupt handler
 *
 * @src: Interrupt mask register.
 * @clr: Interrupt clear register.
 * @is_error: true if this is an error interrupt.
 * @offset: start delta in the lookup_log_chans in d40_base. If equals to
 * D40_PHY_CHAN, the lookup_phy_chans shall be used instead.
 */
struct d40_interrupt_lookup {
	u32 src;
	u32 clr;
	bool is_error;
	int offset;
};

/*
 * struct d40_reg_val - simple lookup struct
 *
 * @reg: The register.
 * @val: The value that belongs to the register in reg.
 */
struct d40_reg_val {
	unsigned int reg;
	unsigned int val;
};
static struct device *chan2dev(struct d40_chan *d40c)
{
	return &d40c->chan.dev->device;
}
static bool chan_is_physical(struct d40_chan *chan)
{
	return chan->log_num == D40_PHY_CHAN;
}

static bool chan_is_logical(struct d40_chan *chan)
{
	return !chan_is_physical(chan);
}
static void __iomem *chan_base(struct d40_chan *chan)
{
	return chan->base->virtbase + D40_DREG_PCBASE +
	       chan->phy_chan->num * D40_DREG_PCDELTA;
}
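
/*
 * Example (illustrative): each physical channel owns a register window of
 * D40_DREG_PCDELTA bytes starting at D40_DREG_PCBASE, so reading a
 * per-channel register reduces to
 *
 *	u32 cfg = readl(chan_base(chan) + D40_CHAN_REG_SSCFG);
 *
 * for whatever physical channel number the d40_chan is bound to.
 */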
static int d40_pool_lli_alloc(struct d40_desc *d40d,
			      int lli_len, bool is_log)
{
	u32 align;
	void *base;

	if (is_log)
		align = sizeof(struct d40_log_lli);
	else
		align = sizeof(struct d40_phy_lli);

	if (lli_len == 1) {
		base = d40d->lli_pool.pre_alloc_lli;
		d40d->lli_pool.size = sizeof(d40d->lli_pool.pre_alloc_lli);
		d40d->lli_pool.base = NULL;
	} else {
		d40d->lli_pool.size = ALIGN(lli_len * 2 * align, align);

		base = kmalloc(d40d->lli_pool.size + align, GFP_NOWAIT);
		d40d->lli_pool.base = base;

		if (d40d->lli_pool.base == NULL)
			return -ENOMEM;
	}

	if (is_log) {
		d40d->lli_log.src = PTR_ALIGN((struct d40_log_lli *) base,
					      align);
		d40d->lli_log.dst = PTR_ALIGN(d40d->lli_log.src + lli_len,
					      align);
	} else {
		d40d->lli_phy.src = PTR_ALIGN((struct d40_phy_lli *)base,
					      align);
		d40d->lli_phy.dst = PTR_ALIGN(d40d->lli_phy.src + lli_len,
					      align);
	}

	return 0;
}
static void d40_pool_lli_free(struct d40_desc *d40d)
{
	kfree(d40d->lli_pool.base);
	d40d->lli_pool.base = NULL;
	d40d->lli_pool.size = 0;
	d40d->lli_log.src = NULL;
	d40d->lli_log.dst = NULL;
	d40d->lli_phy.src = NULL;
	d40d->lli_phy.dst = NULL;
}
static int d40_lcla_alloc_one(struct d40_chan *d40c,
			      struct d40_desc *d40d)
{
	unsigned long flags;
	int i;
	int ret = -EINVAL;
	int p;

	spin_lock_irqsave(&d40c->base->lcla_pool.lock, flags);

	p = d40c->phy_chan->num * D40_LCLA_LINK_PER_EVENT_GRP;

	/*
	 * Allocate both src and dst at the same time; therefore the loop
	 * starts at 1, since 0 can't be used (zero is the end marker).
	 */
	for (i = 1 ; i < D40_LCLA_LINK_PER_EVENT_GRP / 2; i++) {
		if (!d40c->base->lcla_pool.alloc_map[p + i]) {
			d40c->base->lcla_pool.alloc_map[p + i] = d40d;
			d40d->lcla_alloc++;
			ret = i;
			break;
		}
	}

	spin_unlock_irqrestore(&d40c->base->lcla_pool.lock, flags);

	return ret;
}
static int d40_lcla_free_all(struct d40_chan *d40c,
			     struct d40_desc *d40d)
{
	unsigned long flags;
	int i;
	int ret = -EINVAL;

	if (chan_is_physical(d40c))
		return 0;

	spin_lock_irqsave(&d40c->base->lcla_pool.lock, flags);

	for (i = 1 ; i < D40_LCLA_LINK_PER_EVENT_GRP / 2; i++) {
		if (d40c->base->lcla_pool.alloc_map[d40c->phy_chan->num *
				D40_LCLA_LINK_PER_EVENT_GRP + i] == d40d) {
			d40c->base->lcla_pool.alloc_map[d40c->phy_chan->num *
				D40_LCLA_LINK_PER_EVENT_GRP + i] = NULL;
			d40d->lcla_alloc--;
			if (d40d->lcla_alloc == 0) {
				ret = 0;
				break;
			}
		}
	}

	spin_unlock_irqrestore(&d40c->base->lcla_pool.lock, flags);

	return ret;
}
static void d40_desc_remove(struct d40_desc *d40d)
{
	list_del(&d40d->node);
}
static struct d40_desc *d40_desc_get(struct d40_chan *d40c)
{
	struct d40_desc *desc = NULL;

	if (!list_empty(&d40c->client)) {
		struct d40_desc *d;
		struct d40_desc *_d;

		list_for_each_entry_safe(d, _d, &d40c->client, node)
			if (async_tx_test_ack(&d->txd)) {
				d40_pool_lli_free(d);
				d40_desc_remove(d);
				desc = d;
				memset(desc, 0, sizeof(*desc));
				break;
			}
	}

	if (!desc)
		desc = kmem_cache_zalloc(d40c->base->desc_slab, GFP_NOWAIT);

	if (desc)
		INIT_LIST_HEAD(&desc->node);

	return desc;
}
static void d40_desc_free(struct d40_chan *d40c, struct d40_desc *d40d)
{
	d40_lcla_free_all(d40c, d40d);
	kmem_cache_free(d40c->base->desc_slab, d40d);
}

static void d40_desc_submit(struct d40_chan *d40c, struct d40_desc *desc)
{
	list_add_tail(&desc->node, &d40c->active);
}
static void d40_desc_load(struct d40_chan *d40c, struct d40_desc *d40d)
{
	int curr_lcla = -EINVAL, next_lcla;

	if (chan_is_physical(d40c)) {
		d40_phy_lli_write(d40c->base->virtbase,
				  d40c->phy_chan->num,
				  d40d->lli_phy.dst,
				  d40d->lli_phy.src);
		d40d->lli_current = d40d->lli_len;
	} else {
		if ((d40d->lli_len - d40d->lli_current) > 1)
			curr_lcla = d40_lcla_alloc_one(d40c, d40d);

		d40_log_lli_lcpa_write(d40c->lcpa,
				       &d40d->lli_log.dst[d40d->lli_current],
				       &d40d->lli_log.src[d40d->lli_current],
				       curr_lcla);

		d40d->lli_current++;
		for (; d40d->lli_current < d40d->lli_len; d40d->lli_current++) {
			struct d40_log_lli *lcla;

			if (d40d->lli_current + 1 < d40d->lli_len)
				next_lcla = d40_lcla_alloc_one(d40c, d40d);
			else
				next_lcla = -EINVAL;

			lcla = d40c->base->lcla_pool.base +
				d40c->phy_chan->num * 1024 +
				8 * curr_lcla * 2;

			d40_log_lli_lcla_write(lcla,
					       &d40d->lli_log.dst[d40d->lli_current],
					       &d40d->lli_log.src[d40d->lli_current],
					       next_lcla);

			(void) dma_map_single(d40c->base->dev, lcla,
					      2 * sizeof(struct d40_log_lli),
					      DMA_TO_DEVICE);

			curr_lcla = next_lcla;

			if (curr_lcla == -EINVAL) {
				d40d->lli_current++;
				break;
			}
		}
	}
}
static struct d40_desc *d40_first_active_get(struct d40_chan *d40c)
{
	struct d40_desc *d;

	if (list_empty(&d40c->active))
		return NULL;

	d = list_first_entry(&d40c->active,
			     struct d40_desc,
			     node);
	return d;
}

static void d40_desc_queue(struct d40_chan *d40c, struct d40_desc *desc)
{
	list_add_tail(&desc->node, &d40c->queue);
}

static struct d40_desc *d40_first_queued(struct d40_chan *d40c)
{
	struct d40_desc *d;

	if (list_empty(&d40c->queue))
		return NULL;

	d = list_first_entry(&d40c->queue,
			     struct d40_desc,
			     node);
	return d;
}
static int d40_psize_2_burst_size(bool is_log, int psize)
{
	int burst;

	if (is_log) {
		if (psize == STEDMA40_PSIZE_LOG_1)
			burst = 1;
		else
			burst = 2 << psize;
	} else {
		if (psize == STEDMA40_PSIZE_PHY_1)
			burst = 1;
		else
			burst = 2 << psize;
	}

	return burst;
}
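
/*
 * Illustrative note: both the logical and the physical encodings are
 * power-of-two bursts, so e.g. a logical psize of STEDMA40_PSIZE_LOG_4
 * corresponds to a 4-element burst. d40_validate_conf() below relies on
 * this to require that src (burst x width) equals dst (burst x width).
 */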
/*
 * The dma only supports transmitting packages up to
 * STEDMA40_MAX_SEG_SIZE << data_width. Calculate the total number of
 * dma elements required to send the entire sg list.
 */
static int d40_size_2_dmalen(int size, u32 data_width1, u32 data_width2)
{
	int dmalen;
	u32 max_w = max(data_width1, data_width2);
	u32 min_w = min(data_width1, data_width2);
	u32 seg_max = ALIGN(STEDMA40_MAX_SEG_SIZE << min_w, 1 << max_w);

	if (seg_max > STEDMA40_MAX_SEG_SIZE)
		seg_max -= (1 << max_w);

	if (!IS_ALIGNED(size, 1 << max_w))
		return -EINVAL;

	if (size <= seg_max)
		dmalen = 1;
	else {
		dmalen = size / seg_max;
		if (dmalen * seg_max < size)
			dmalen++;
	}
	return dmalen;
}
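
/*
 * Worked example (illustrative, figures are assumptions): with src and
 * dst both at 4-byte data width, seg_max is on the order of
 * STEDMA40_MAX_SEG_SIZE * 4 bytes. A 1 MiB buffer therefore needs
 * roughly 0x100000 / seg_max LLIs, rounded up, and any size that is not
 * aligned to the widest data width is rejected with -EINVAL.
 */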
static int d40_sg_2_dmalen(struct scatterlist *sgl, int sg_len,
			   u32 data_width1, u32 data_width2)
{
	struct scatterlist *sg;
	int i;
	int len = 0;
	int ret;

	for_each_sg(sgl, sg, sg_len, i) {
		ret = d40_size_2_dmalen(sg_dma_len(sg),
					data_width1, data_width2);
		if (ret < 0)
			return ret;
		len += ret;
	}
	return len;
}
/* Support functions for logical channels */

static int d40_channel_execute_command(struct d40_chan *d40c,
				       enum d40_command command)
{
	u32 status;
	int i;
	void __iomem *active_reg;
	int ret = 0;
	unsigned long flags;
	u32 wmask;

	spin_lock_irqsave(&d40c->base->execmd_lock, flags);

	if (d40c->phy_chan->num % 2 == 0)
		active_reg = d40c->base->virtbase + D40_DREG_ACTIVE;
	else
		active_reg = d40c->base->virtbase + D40_DREG_ACTIVO;

	if (command == D40_DMA_SUSPEND_REQ) {
		status = (readl(active_reg) &
			  D40_CHAN_POS_MASK(d40c->phy_chan->num)) >>
			D40_CHAN_POS(d40c->phy_chan->num);

		if (status == D40_DMA_SUSPENDED || status == D40_DMA_STOP)
			goto done;
	}

	wmask = 0xffffffff & ~(D40_CHAN_POS_MASK(d40c->phy_chan->num));
	writel(wmask | (command << D40_CHAN_POS(d40c->phy_chan->num)),
	       active_reg);

	if (command == D40_DMA_SUSPEND_REQ) {

		for (i = 0 ; i < D40_SUSPEND_MAX_IT; i++) {
			status = (readl(active_reg) &
				  D40_CHAN_POS_MASK(d40c->phy_chan->num)) >>
				D40_CHAN_POS(d40c->phy_chan->num);

			cpu_relax();
			/*
			 * Reduce the number of bus accesses while
			 * waiting for the DMA to suspend.
			 */
			udelay(3);

			if (status == D40_DMA_STOP ||
			    status == D40_DMA_SUSPENDED)
				break;
		}

		if (i == D40_SUSPEND_MAX_IT) {
			dev_err(&d40c->chan.dev->device,
				"[%s]: unable to suspend the chl %d (log: %d) status %x\n",
				__func__, d40c->phy_chan->num, d40c->log_num,
				status);
			ret = -EBUSY;
		}

	}
done:
	spin_unlock_irqrestore(&d40c->base->execmd_lock, flags);
	return ret;
}
static void d40_term_all(struct d40_chan *d40c)
{
	struct d40_desc *d40d;

	/* Release active descriptors */
	while ((d40d = d40_first_active_get(d40c))) {
		d40_desc_remove(d40d);
		d40_desc_free(d40c, d40d);
	}

	/* Release queued descriptors waiting for transfer */
	while ((d40d = d40_first_queued(d40c))) {
		d40_desc_remove(d40d);
		d40_desc_free(d40c, d40d);
	}

	d40c->pending_tx = 0;
	d40c->busy = false;
}
static void __d40_config_set_event(struct d40_chan *d40c, bool enable,
				   u32 event, int reg)
{
	void __iomem *addr = chan_base(d40c) + reg;
	int tries;

	if (!enable) {
		writel((D40_DEACTIVATE_EVENTLINE << D40_EVENTLINE_POS(event))
		       | ~D40_EVENTLINE_MASK(event), addr);
		return;
	}

	/*
	 * The hardware sometimes doesn't register the enable when src and dst
	 * event lines are active on the same logical channel. Retry to ensure
	 * it does. Usually only one retry is sufficient.
	 */
	tries = 100;
	while (--tries) {
		writel((D40_ACTIVATE_EVENTLINE << D40_EVENTLINE_POS(event))
		       | ~D40_EVENTLINE_MASK(event), addr);

		if (readl(addr) & D40_EVENTLINE_MASK(event))
			break;
	}

	if (tries != 99)
		dev_dbg(chan2dev(d40c),
			"[%s] workaround enable S%cLNK (%d tries)\n",
			__func__, reg == D40_CHAN_REG_SSLNK ? 'S' : 'D',
			100 - tries);

	WARN_ON(!tries);
}
static void d40_config_set_event(struct d40_chan *d40c, bool do_enable)
{
	unsigned long flags;

	spin_lock_irqsave(&d40c->phy_chan->lock, flags);

	/* Enable event line connected to device (or memcpy) */
	if ((d40c->dma_cfg.dir == STEDMA40_PERIPH_TO_MEM) ||
	    (d40c->dma_cfg.dir == STEDMA40_PERIPH_TO_PERIPH)) {
		u32 event = D40_TYPE_TO_EVENT(d40c->dma_cfg.src_dev_type);

		__d40_config_set_event(d40c, do_enable, event,
				       D40_CHAN_REG_SSLNK);
	}

	if (d40c->dma_cfg.dir != STEDMA40_PERIPH_TO_MEM) {
		u32 event = D40_TYPE_TO_EVENT(d40c->dma_cfg.dst_dev_type);

		__d40_config_set_event(d40c, do_enable, event,
				       D40_CHAN_REG_SDLNK);
	}

	spin_unlock_irqrestore(&d40c->phy_chan->lock, flags);
}
static u32 d40_chan_has_events(struct d40_chan *d40c)
{
	void __iomem *chanbase = chan_base(d40c);
	u32 val;

	val = readl(chanbase + D40_CHAN_REG_SSLNK);
	val |= readl(chanbase + D40_CHAN_REG_SDLNK);

	return val;
}
static u32 d40_get_prmo(struct d40_chan *d40c)
{
	static const unsigned int phy_map[] = {
		[STEDMA40_PCHAN_BASIC_MODE]
			= D40_DREG_PRMO_PCHAN_BASIC,
		[STEDMA40_PCHAN_MODULO_MODE]
			= D40_DREG_PRMO_PCHAN_MODULO,
		[STEDMA40_PCHAN_DOUBLE_DST_MODE]
			= D40_DREG_PRMO_PCHAN_DOUBLE_DST,
	};
	static const unsigned int log_map[] = {
		[STEDMA40_LCHAN_SRC_PHY_DST_LOG]
			= D40_DREG_PRMO_LCHAN_SRC_PHY_DST_LOG,
		[STEDMA40_LCHAN_SRC_LOG_DST_PHY]
			= D40_DREG_PRMO_LCHAN_SRC_LOG_DST_PHY,
		[STEDMA40_LCHAN_SRC_LOG_DST_LOG]
			= D40_DREG_PRMO_LCHAN_SRC_LOG_DST_LOG,
	};

	if (chan_is_physical(d40c))
		return phy_map[d40c->dma_cfg.mode_opt];
	else
		return log_map[d40c->dma_cfg.mode_opt];
}
static void d40_config_write(struct d40_chan *d40c)
{
	u32 addr_base;
	u32 var;

	/* Odd addresses are even addresses + 4 */
	addr_base = (d40c->phy_chan->num % 2) * 4;
	/* Setup channel mode to logical or physical */
	var = ((u32)(chan_is_logical(d40c)) + 1) <<
		D40_CHAN_POS(d40c->phy_chan->num);
	writel(var, d40c->base->virtbase + D40_DREG_PRMSE + addr_base);

	/* Setup operational mode option register */
	var = d40_get_prmo(d40c) << D40_CHAN_POS(d40c->phy_chan->num);

	writel(var, d40c->base->virtbase + D40_DREG_PRMOE + addr_base);

	if (chan_is_logical(d40c)) {
		int lidx = (d40c->phy_chan->num << D40_SREG_ELEM_LOG_LIDX_POS)
			   & D40_SREG_ELEM_LOG_LIDX_MASK;
		void __iomem *chanbase = chan_base(d40c);

		/* Set default config for CFG reg */
		writel(d40c->src_def_cfg, chanbase + D40_CHAN_REG_SSCFG);
		writel(d40c->dst_def_cfg, chanbase + D40_CHAN_REG_SDCFG);

		/* Set LIDX for lcla */
		writel(lidx, chanbase + D40_CHAN_REG_SSELT);
		writel(lidx, chanbase + D40_CHAN_REG_SDELT);
	}
}
static u32 d40_residue(struct d40_chan *d40c)
{
	u32 num_elt;

	if (chan_is_logical(d40c))
		num_elt = (readl(&d40c->lcpa->lcsp2) & D40_MEM_LCSP2_ECNT_MASK)
			>> D40_MEM_LCSP2_ECNT_POS;
	else {
		u32 val = readl(chan_base(d40c) + D40_CHAN_REG_SDELT);
		num_elt = (val & D40_SREG_ELEM_PHY_ECNT_MASK)
			  >> D40_SREG_ELEM_PHY_ECNT_POS;
	}

	return num_elt * (1 << d40c->dma_cfg.dst_info.data_width);
}
static bool d40_tx_is_linked(struct d40_chan *d40c)
{
	bool is_link;

	if (chan_is_logical(d40c))
		is_link = readl(&d40c->lcpa->lcsp3) & D40_MEM_LCSP3_DLOS_MASK;
	else
		is_link = readl(chan_base(d40c) + D40_CHAN_REG_SDLNK)
			  & D40_SREG_LNK_PHYS_LNK_MASK;

	return is_link;
}
static int d40_pause(struct dma_chan *chan)
{
	struct d40_chan *d40c =
		container_of(chan, struct d40_chan, chan);
	int res;
	unsigned long flags;

	spin_lock_irqsave(&d40c->lock, flags);

	res = d40_channel_execute_command(d40c, D40_DMA_SUSPEND_REQ);

	if (chan_is_logical(d40c)) {
		d40_config_set_event(d40c, false);
		/* Resume the other logical channels if any */
		if (d40_chan_has_events(d40c))
			res = d40_channel_execute_command(d40c,
							  D40_DMA_RUN);
	}

	spin_unlock_irqrestore(&d40c->lock, flags);
	return res;
}
static int d40_resume(struct dma_chan *chan)
{
	struct d40_chan *d40c =
		container_of(chan, struct d40_chan, chan);
	int res = 0;
	unsigned long flags;

	spin_lock_irqsave(&d40c->lock, flags);

	if (d40c->base->rev == 0)
		if (chan_is_logical(d40c)) {
			res = d40_channel_execute_command(d40c,
							  D40_DMA_SUSPEND_REQ);
			goto no_suspend;
		}

	/* If bytes left to transfer or linked tx resume job */
	if (d40_residue(d40c) || d40_tx_is_linked(d40c)) {

		if (chan_is_logical(d40c))
			d40_config_set_event(d40c, true);

		res = d40_channel_execute_command(d40c, D40_DMA_RUN);
	}

no_suspend:
	spin_unlock_irqrestore(&d40c->lock, flags);
	return res;
}
static dma_cookie_t d40_tx_submit(struct dma_async_tx_descriptor *tx)
{
	struct d40_chan *d40c = container_of(tx->chan,
					     struct d40_chan,
					     chan);
	struct d40_desc *d40d = container_of(tx, struct d40_desc, txd);
	unsigned long flags;

	spin_lock_irqsave(&d40c->lock, flags);

	d40c->chan.cookie++;

	if (d40c->chan.cookie < 0)
		d40c->chan.cookie = 1;

	d40d->txd.cookie = d40c->chan.cookie;

	d40_desc_queue(d40c, d40d);

	spin_unlock_irqrestore(&d40c->lock, flags);

	return tx->cookie;
}
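
/*
 * Client-side flow (illustrative sketch, assuming the generic dmaengine
 * helpers): a descriptor returned by one of the prep calls below reaches
 * d40_tx_submit() and d40_issue_pending() like this:
 *
 *	cookie = dmaengine_submit(txd);
 *	dma_async_issue_pending(chan);
 */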
static int d40_start(struct d40_chan *d40c)
{
	if (d40c->base->rev == 0) {
		int err;

		if (chan_is_logical(d40c)) {
			err = d40_channel_execute_command(d40c,
							  D40_DMA_SUSPEND_REQ);
			if (err)
				return err;
		}
	}

	if (chan_is_logical(d40c))
		d40_config_set_event(d40c, true);

	return d40_channel_execute_command(d40c, D40_DMA_RUN);
}
static struct d40_desc *d40_queue_start(struct d40_chan *d40c)
{
	struct d40_desc *d40d;
	int err;

	/* Start queued jobs, if any */
	d40d = d40_first_queued(d40c);

	if (d40d != NULL) {
		d40c->busy = true;

		/* Remove from queue */
		d40_desc_remove(d40d);

		/* Add to active queue */
		d40_desc_submit(d40c, d40d);

		/* Initiate DMA job */
		d40_desc_load(d40c, d40d);

		/* Start dma job */
		err = d40_start(d40c);

		if (err)
			return NULL;
	}

	return d40d;
}
/* called from interrupt context */
static void dma_tc_handle(struct d40_chan *d40c)
{
	struct d40_desc *d40d;

	/* Get first active entry from list */
	d40d = d40_first_active_get(d40c);

	if (d40d == NULL)
		return;

	d40_lcla_free_all(d40c, d40d);

	if (d40d->lli_current < d40d->lli_len) {
		d40_desc_load(d40c, d40d);
		/* Start dma job */
		(void) d40_start(d40c);
		return;
	}

	if (d40_queue_start(d40c) == NULL)
		d40c->busy = false;

	d40c->pending_tx++;
	tasklet_schedule(&d40c->tasklet);
}
static void dma_tasklet(unsigned long data)
{
	struct d40_chan *d40c = (struct d40_chan *) data;
	struct d40_desc *d40d;
	unsigned long flags;
	dma_async_tx_callback callback;
	void *callback_param;

	spin_lock_irqsave(&d40c->lock, flags);

	/* Get first active entry from list */
	d40d = d40_first_active_get(d40c);

	if (d40d == NULL)
		goto err;

	d40c->completed = d40d->txd.cookie;

	/*
	 * If terminating a channel, pending_tx is set to zero.
	 * This prevents any finished active jobs from returning
	 * to the client.
	 */
	if (d40c->pending_tx == 0) {
		spin_unlock_irqrestore(&d40c->lock, flags);
		return;
	}

	/* Callback to client */
	callback = d40d->txd.callback;
	callback_param = d40d->txd.callback_param;

	if (async_tx_test_ack(&d40d->txd)) {
		d40_pool_lli_free(d40d);
		d40_desc_remove(d40d);
		d40_desc_free(d40c, d40d);
	} else {
		if (!d40d->is_in_client_list) {
			d40_desc_remove(d40d);
			d40_lcla_free_all(d40c, d40d);
			list_add_tail(&d40d->node, &d40c->client);
			d40d->is_in_client_list = true;
		}
	}

	d40c->pending_tx--;

	if (d40c->pending_tx)
		tasklet_schedule(&d40c->tasklet);

	spin_unlock_irqrestore(&d40c->lock, flags);

	if (callback && (d40d->txd.flags & DMA_PREP_INTERRUPT))
		callback(callback_param);

	return;

err:
	/* Rescue manoeuvre if receiving double interrupts */
	if (d40c->pending_tx > 0)
		d40c->pending_tx--;
	spin_unlock_irqrestore(&d40c->lock, flags);
}
static irqreturn_t d40_handle_interrupt(int irq, void *data)
{
	static const struct d40_interrupt_lookup il[] = {
		{D40_DREG_LCTIS0, D40_DREG_LCICR0, false,  0},
		{D40_DREG_LCTIS1, D40_DREG_LCICR1, false, 32},
		{D40_DREG_LCTIS2, D40_DREG_LCICR2, false, 64},
		{D40_DREG_LCTIS3, D40_DREG_LCICR3, false, 96},
		{D40_DREG_LCEIS0, D40_DREG_LCICR0, true,   0},
		{D40_DREG_LCEIS1, D40_DREG_LCICR1, true,  32},
		{D40_DREG_LCEIS2, D40_DREG_LCICR2, true,  64},
		{D40_DREG_LCEIS3, D40_DREG_LCICR3, true,  96},
		{D40_DREG_PCTIS,  D40_DREG_PCICR,  false, D40_PHY_CHAN},
		{D40_DREG_PCEIS,  D40_DREG_PCICR,  true,  D40_PHY_CHAN},
	};

	int i;
	u32 regs[ARRAY_SIZE(il)];
	u32 idx;
	u32 row;
	long chan = -1;
	struct d40_chan *d40c;
	unsigned long flags;
	struct d40_base *base = data;

	spin_lock_irqsave(&base->interrupt_lock, flags);

	/* Read interrupt status of both logical and physical channels */
	for (i = 0; i < ARRAY_SIZE(il); i++)
		regs[i] = readl(base->virtbase + il[i].src);

	for (;;) {

		chan = find_next_bit((unsigned long *)regs,
				     BITS_PER_LONG * ARRAY_SIZE(il), chan + 1);

		/* No more set bits found? */
		if (chan == BITS_PER_LONG * ARRAY_SIZE(il))
			break;

		row = chan / BITS_PER_LONG;
		idx = chan & (BITS_PER_LONG - 1);

		/* ACK interrupt */
		writel(1 << idx, base->virtbase + il[row].clr);

		if (il[row].offset == D40_PHY_CHAN)
			d40c = base->lookup_phy_chans[idx];
		else
			d40c = base->lookup_log_chans[il[row].offset + idx];
		spin_lock(&d40c->lock);

		if (!il[row].is_error)
			dma_tc_handle(d40c);
		else
			dev_err(base->dev,
				"[%s] IRQ chan: %ld offset %d idx %d\n",
				__func__, chan, il[row].offset, idx);

		spin_unlock(&d40c->lock);
	}

	spin_unlock_irqrestore(&base->interrupt_lock, flags);

	return IRQ_HANDLED;
}
static int d40_validate_conf(struct d40_chan *d40c,
			     struct stedma40_chan_cfg *conf)
{
	int res = 0;
	u32 dst_event_group = D40_TYPE_TO_GROUP(conf->dst_dev_type);
	u32 src_event_group = D40_TYPE_TO_GROUP(conf->src_dev_type);
	bool is_log = conf->mode == STEDMA40_MODE_LOGICAL;

	if (!conf->dir) {
		dev_err(&d40c->chan.dev->device, "[%s] Invalid direction.\n",
			__func__);
		res = -EINVAL;
	}

	if (conf->dst_dev_type != STEDMA40_DEV_DST_MEMORY &&
	    d40c->base->plat_data->dev_tx[conf->dst_dev_type] == 0 &&
	    d40c->runtime_addr == 0) {

		dev_err(&d40c->chan.dev->device,
			"[%s] Invalid TX channel address (%d)\n",
			__func__, conf->dst_dev_type);
		res = -EINVAL;
	}

	if (conf->src_dev_type != STEDMA40_DEV_SRC_MEMORY &&
	    d40c->base->plat_data->dev_rx[conf->src_dev_type] == 0 &&
	    d40c->runtime_addr == 0) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Invalid RX channel address (%d)\n",
			__func__, conf->src_dev_type);
		res = -EINVAL;
	}

	if (conf->dir == STEDMA40_MEM_TO_PERIPH &&
	    dst_event_group == STEDMA40_DEV_DST_MEMORY) {
		dev_err(&d40c->chan.dev->device, "[%s] Invalid dst\n",
			__func__);
		res = -EINVAL;
	}

	if (conf->dir == STEDMA40_PERIPH_TO_MEM &&
	    src_event_group == STEDMA40_DEV_SRC_MEMORY) {
		dev_err(&d40c->chan.dev->device, "[%s] Invalid src\n",
			__func__);
		res = -EINVAL;
	}

	if (src_event_group == STEDMA40_DEV_SRC_MEMORY &&
	    dst_event_group == STEDMA40_DEV_DST_MEMORY && is_log) {
		dev_err(&d40c->chan.dev->device,
			"[%s] No event line\n", __func__);
		res = -EINVAL;
	}

	if (conf->dir == STEDMA40_PERIPH_TO_PERIPH &&
	    (src_event_group != dst_event_group)) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Invalid event group\n", __func__);
		res = -EINVAL;
	}

	if (conf->dir == STEDMA40_PERIPH_TO_PERIPH) {
		/*
		 * DMAC HW supports it. Will be added to this driver,
		 * in case any dma client requires it.
		 */
		dev_err(&d40c->chan.dev->device,
			"[%s] periph to periph not supported\n",
			__func__);
		res = -EINVAL;
	}

	if (d40_psize_2_burst_size(is_log, conf->src_info.psize) *
	    (1 << conf->src_info.data_width) !=
	    d40_psize_2_burst_size(is_log, conf->dst_info.psize) *
	    (1 << conf->dst_info.data_width)) {
		/*
		 * The DMAC hardware only supports
		 * src (burst x width) == dst (burst x width)
		 */
		dev_err(&d40c->chan.dev->device,
			"[%s] src (burst x width) != dst (burst x width)\n",
			__func__);
		res = -EINVAL;
	}

	return res;
}
static bool d40_alloc_mask_set(struct d40_phy_res *phy, bool is_src,
			       int log_event_line, bool is_log)
{
	unsigned long flags;
	spin_lock_irqsave(&phy->lock, flags);
	if (!is_log) {
		/* Physical interrupts are masked per physical full channel */
		if (phy->allocated_src == D40_ALLOC_FREE &&
		    phy->allocated_dst == D40_ALLOC_FREE) {
			phy->allocated_dst = D40_ALLOC_PHY;
			phy->allocated_src = D40_ALLOC_PHY;
			goto found;
		} else
			goto not_found;
	}

	/* Logical channel */
	if (is_src) {
		if (phy->allocated_src == D40_ALLOC_PHY)
			goto not_found;

		if (phy->allocated_src == D40_ALLOC_FREE)
			phy->allocated_src = D40_ALLOC_LOG_FREE;

		if (!(phy->allocated_src & (1 << log_event_line))) {
			phy->allocated_src |= 1 << log_event_line;
			goto found;
		} else
			goto not_found;
	} else {
		if (phy->allocated_dst == D40_ALLOC_PHY)
			goto not_found;

		if (phy->allocated_dst == D40_ALLOC_FREE)
			phy->allocated_dst = D40_ALLOC_LOG_FREE;

		if (!(phy->allocated_dst & (1 << log_event_line))) {
			phy->allocated_dst |= 1 << log_event_line;
			goto found;
		} else
			goto not_found;
	}

found:
	spin_unlock_irqrestore(&phy->lock, flags);
	return true;
not_found:
	spin_unlock_irqrestore(&phy->lock, flags);
	return false;
}
static bool d40_alloc_mask_free(struct d40_phy_res *phy, bool is_src,
				int log_event_line)
{
	unsigned long flags;
	bool is_free = false;

	spin_lock_irqsave(&phy->lock, flags);
	if (!log_event_line) {
		phy->allocated_dst = D40_ALLOC_FREE;
		phy->allocated_src = D40_ALLOC_FREE;
		is_free = true;
		goto out;
	}

	/* Logical channel */
	if (is_src) {
		phy->allocated_src &= ~(1 << log_event_line);
		if (phy->allocated_src == D40_ALLOC_LOG_FREE)
			phy->allocated_src = D40_ALLOC_FREE;
	} else {
		phy->allocated_dst &= ~(1 << log_event_line);
		if (phy->allocated_dst == D40_ALLOC_LOG_FREE)
			phy->allocated_dst = D40_ALLOC_FREE;
	}

	is_free = ((phy->allocated_src | phy->allocated_dst) ==
		   D40_ALLOC_FREE);

out:
	spin_unlock_irqrestore(&phy->lock, flags);

	return is_free;
}
static int d40_allocate_channel(struct d40_chan *d40c)
{
	int dev_type;
	int event_group;
	int event_line;
	struct d40_phy_res *phys;
	int i;
	int j;
	int log_num;
	bool is_src;
	bool is_log = d40c->dma_cfg.mode == STEDMA40_MODE_LOGICAL;

	phys = d40c->base->phy_res;

	if (d40c->dma_cfg.dir == STEDMA40_PERIPH_TO_MEM) {
		dev_type = d40c->dma_cfg.src_dev_type;
		log_num = 2 * dev_type;
		is_src = true;
	} else if (d40c->dma_cfg.dir == STEDMA40_MEM_TO_PERIPH ||
		   d40c->dma_cfg.dir == STEDMA40_MEM_TO_MEM) {
		/* dst event lines are used for logical memcpy */
		dev_type = d40c->dma_cfg.dst_dev_type;
		log_num = 2 * dev_type + 1;
		is_src = false;
	} else
		return -EINVAL;

	event_group = D40_TYPE_TO_GROUP(dev_type);
	event_line = D40_TYPE_TO_EVENT(dev_type);

	if (!is_log) {
		if (d40c->dma_cfg.dir == STEDMA40_MEM_TO_MEM) {
			/* Find physical half channel */
			for (i = 0; i < d40c->base->num_phy_chans; i++) {

				if (d40_alloc_mask_set(&phys[i], is_src,
						       0, is_log))
					goto found_phy;
			}
		} else
			for (j = 0; j < d40c->base->num_phy_chans; j += 8) {
				int phy_num = j + event_group * 2;
				for (i = phy_num; i < phy_num + 2; i++) {
					if (d40_alloc_mask_set(&phys[i],
							       is_src,
							       0,
							       is_log))
						goto found_phy;
				}
			}
		return -EINVAL;
found_phy:
		d40c->phy_chan = &phys[i];
		d40c->log_num = D40_PHY_CHAN;
		goto out;
	}

	/* Find logical channel */
	for (j = 0; j < d40c->base->num_phy_chans; j += 8) {
		int phy_num = j + event_group * 2;
		/*
		 * Spread logical channels across all available physical rather
		 * than pack every logical channel at the first available phy
		 * channels.
		 */
		if (is_src) {
			for (i = phy_num; i < phy_num + 2; i++) {
				if (d40_alloc_mask_set(&phys[i], is_src,
						       event_line, is_log))
					goto found_log;
			}
		} else {
			for (i = phy_num + 1; i >= phy_num; i--) {
				if (d40_alloc_mask_set(&phys[i], is_src,
						       event_line, is_log))
					goto found_log;
			}
		}
	}
	return -EINVAL;

found_log:
	d40c->phy_chan = &phys[i];
	d40c->log_num = log_num;
out:

	if (is_log)
		d40c->base->lookup_log_chans[d40c->log_num] = d40c;
	else
		d40c->base->lookup_phy_chans[d40c->phy_chan->num] = d40c;

	return 0;
}
static int d40_config_memcpy(struct d40_chan *d40c)
{
	dma_cap_mask_t cap = d40c->chan.device->cap_mask;

	if (dma_has_cap(DMA_MEMCPY, cap) && !dma_has_cap(DMA_SLAVE, cap)) {
		d40c->dma_cfg = *d40c->base->plat_data->memcpy_conf_log;
		d40c->dma_cfg.src_dev_type = STEDMA40_DEV_SRC_MEMORY;
		d40c->dma_cfg.dst_dev_type = d40c->base->plat_data->
			memcpy[d40c->chan.chan_id];

	} else if (dma_has_cap(DMA_MEMCPY, cap) &&
		   dma_has_cap(DMA_SLAVE, cap)) {
		d40c->dma_cfg = *d40c->base->plat_data->memcpy_conf_phy;
	} else {
		dev_err(&d40c->chan.dev->device, "[%s] No memcpy\n",
			__func__);
		return -EINVAL;
	}

	return 0;
}
*d40c
)
1458 struct d40_phy_res
*phy
= d40c
->phy_chan
;
1461 struct d40_desc
*_d
;
1464 /* Terminate all queued and active transfers */
1467 /* Release client owned descriptors */
1468 if (!list_empty(&d40c
->client
))
1469 list_for_each_entry_safe(d
, _d
, &d40c
->client
, node
) {
1470 d40_pool_lli_free(d
);
1472 d40_desc_free(d40c
, d
);
1476 dev_err(&d40c
->chan
.dev
->device
, "[%s] phy == null\n",
1481 if (phy
->allocated_src
== D40_ALLOC_FREE
&&
1482 phy
->allocated_dst
== D40_ALLOC_FREE
) {
1483 dev_err(&d40c
->chan
.dev
->device
, "[%s] channel already free\n",
1488 if (d40c
->dma_cfg
.dir
== STEDMA40_MEM_TO_PERIPH
||
1489 d40c
->dma_cfg
.dir
== STEDMA40_MEM_TO_MEM
) {
1490 event
= D40_TYPE_TO_EVENT(d40c
->dma_cfg
.dst_dev_type
);
1492 } else if (d40c
->dma_cfg
.dir
== STEDMA40_PERIPH_TO_MEM
) {
1493 event
= D40_TYPE_TO_EVENT(d40c
->dma_cfg
.src_dev_type
);
1496 dev_err(&d40c
->chan
.dev
->device
,
1497 "[%s] Unknown direction\n", __func__
);
1501 res
= d40_channel_execute_command(d40c
, D40_DMA_SUSPEND_REQ
);
1503 dev_err(&d40c
->chan
.dev
->device
, "[%s] suspend failed\n",
1508 if (chan_is_logical(d40c
)) {
1509 /* Release logical channel, deactivate the event line */
1511 d40_config_set_event(d40c
, false);
1512 d40c
->base
->lookup_log_chans
[d40c
->log_num
] = NULL
;
1515 * Check if there are more logical allocation
1516 * on this phy channel.
1518 if (!d40_alloc_mask_free(phy
, is_src
, event
)) {
1519 /* Resume the other logical channels if any */
1520 if (d40_chan_has_events(d40c
)) {
1521 res
= d40_channel_execute_command(d40c
,
1524 dev_err(&d40c
->chan
.dev
->device
,
1525 "[%s] Executing RUN command\n",
1533 (void) d40_alloc_mask_free(phy
, is_src
, 0);
1536 /* Release physical channel */
1537 res
= d40_channel_execute_command(d40c
, D40_DMA_STOP
);
1539 dev_err(&d40c
->chan
.dev
->device
,
1540 "[%s] Failed to stop channel\n", __func__
);
1543 d40c
->phy_chan
= NULL
;
1544 d40c
->configured
= false;
1545 d40c
->base
->lookup_phy_chans
[phy
->num
] = NULL
;
static bool d40_is_paused(struct d40_chan *d40c)
{
	void __iomem *chanbase = chan_base(d40c);
	bool is_paused = false;
	unsigned long flags;
	void __iomem *active_reg;
	u32 status;
	u32 event;

	spin_lock_irqsave(&d40c->lock, flags);

	if (chan_is_physical(d40c)) {
		if (d40c->phy_chan->num % 2 == 0)
			active_reg = d40c->base->virtbase + D40_DREG_ACTIVE;
		else
			active_reg = d40c->base->virtbase + D40_DREG_ACTIVO;

		status = (readl(active_reg) &
			  D40_CHAN_POS_MASK(d40c->phy_chan->num)) >>
			D40_CHAN_POS(d40c->phy_chan->num);
		if (status == D40_DMA_SUSPENDED || status == D40_DMA_STOP)
			is_paused = true;

		goto _exit;
	}

	if (d40c->dma_cfg.dir == STEDMA40_MEM_TO_PERIPH ||
	    d40c->dma_cfg.dir == STEDMA40_MEM_TO_MEM) {
		event = D40_TYPE_TO_EVENT(d40c->dma_cfg.dst_dev_type);
		status = readl(chanbase + D40_CHAN_REG_SDLNK);
	} else if (d40c->dma_cfg.dir == STEDMA40_PERIPH_TO_MEM) {
		event = D40_TYPE_TO_EVENT(d40c->dma_cfg.src_dev_type);
		status = readl(chanbase + D40_CHAN_REG_SSLNK);
	} else {
		dev_err(&d40c->chan.dev->device,
			"[%s] Unknown direction\n", __func__);
		goto _exit;
	}

	status = (status & D40_EVENTLINE_MASK(event)) >>
		D40_EVENTLINE_POS(event);

	if (status != D40_DMA_RUN)
		is_paused = true;
_exit:
	spin_unlock_irqrestore(&d40c->lock, flags);
	return is_paused;

}
static u32 stedma40_residue(struct dma_chan *chan)
{
	struct d40_chan *d40c =
		container_of(chan, struct d40_chan, chan);
	u32 bytes_left;
	unsigned long flags;

	spin_lock_irqsave(&d40c->lock, flags);
	bytes_left = d40_residue(d40c);
	spin_unlock_irqrestore(&d40c->lock, flags);

	return bytes_left;
}
struct dma_async_tx_descriptor *stedma40_memcpy_sg(struct dma_chan *chan,
						   struct scatterlist *sgl_dst,
						   struct scatterlist *sgl_src,
						   unsigned int sgl_len,
						   unsigned long dma_flags)
{
	int res;
	struct d40_desc *d40d;
	struct d40_chan *d40c = container_of(chan, struct d40_chan,
					     chan);
	unsigned long flags;

	if (d40c->phy_chan == NULL) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Unallocated channel.\n", __func__);
		return ERR_PTR(-EINVAL);
	}

	spin_lock_irqsave(&d40c->lock, flags);
	d40d = d40_desc_get(d40c);

	if (d40d == NULL)
		goto err;

	d40d->lli_len = d40_sg_2_dmalen(sgl_dst, sgl_len,
					d40c->dma_cfg.src_info.data_width,
					d40c->dma_cfg.dst_info.data_width);
	if (d40d->lli_len < 0) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Unaligned size\n", __func__);
		goto err;
	}

	d40d->lli_current = 0;
	d40d->txd.flags = dma_flags;

	if (chan_is_logical(d40c)) {

		if (d40_pool_lli_alloc(d40d, d40d->lli_len, true) < 0) {
			dev_err(&d40c->chan.dev->device,
				"[%s] Out of memory\n", __func__);
			goto err;
		}

		(void) d40_log_sg_to_lli(sgl_src,
					 sgl_len,
					 d40d->lli_log.src,
					 d40c->log_def.lcsp1,
					 d40c->dma_cfg.src_info.data_width,
					 d40c->dma_cfg.dst_info.data_width);

		(void) d40_log_sg_to_lli(sgl_dst,
					 sgl_len,
					 d40d->lli_log.dst,
					 d40c->log_def.lcsp3,
					 d40c->dma_cfg.dst_info.data_width,
					 d40c->dma_cfg.src_info.data_width);
	} else {
		if (d40_pool_lli_alloc(d40d, d40d->lli_len, false) < 0) {
			dev_err(&d40c->chan.dev->device,
				"[%s] Out of memory\n", __func__);
			goto err;
		}

		res = d40_phy_sg_to_lli(sgl_src,
					sgl_len,
					0,
					d40d->lli_phy.src,
					virt_to_phys(d40d->lli_phy.src),
					d40c->src_def_cfg,
					d40c->dma_cfg.src_info.data_width,
					d40c->dma_cfg.dst_info.data_width,
					d40c->dma_cfg.src_info.psize);

		if (res < 0)
			goto err;

		res = d40_phy_sg_to_lli(sgl_dst,
					sgl_len,
					0,
					d40d->lli_phy.dst,
					virt_to_phys(d40d->lli_phy.dst),
					d40c->dst_def_cfg,
					d40c->dma_cfg.dst_info.data_width,
					d40c->dma_cfg.src_info.data_width,
					d40c->dma_cfg.dst_info.psize);

		if (res < 0)
			goto err;

		(void) dma_map_single(d40c->base->dev, d40d->lli_phy.src,
				      d40d->lli_pool.size, DMA_TO_DEVICE);
	}

	dma_async_tx_descriptor_init(&d40d->txd, chan);

	d40d->txd.tx_submit = d40_tx_submit;

	spin_unlock_irqrestore(&d40c->lock, flags);

	return &d40d->txd;
err:
	if (d40d)
		d40_desc_free(d40c, d40d);
	spin_unlock_irqrestore(&d40c->lock, flags);
	return NULL;
}
EXPORT_SYMBOL(stedma40_memcpy_sg);
bool stedma40_filter(struct dma_chan *chan, void *data)
{
	struct stedma40_chan_cfg *info = data;
	struct d40_chan *d40c =
		container_of(chan, struct d40_chan, chan);
	int err;

	if (data) {
		err = d40_validate_conf(d40c, info);
		if (!err)
			d40c->dma_cfg = *info;
	} else
		err = d40_config_memcpy(d40c);

	if (!err)
		d40c->configured = true;

	return err == 0;
}
EXPORT_SYMBOL(stedma40_filter);
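
/*
 * Usage sketch (illustrative, not part of this driver; the device type
 * below is a placeholder): a client passes stedma40_filter() and a
 * channel configuration to dma_request_channel():
 *
 *	dma_cap_mask_t mask;
 *	struct stedma40_chan_cfg cfg = {
 *		.dir = STEDMA40_PERIPH_TO_MEM,
 *		.src_dev_type = <platform specific device type>,
 *		.dst_dev_type = STEDMA40_DEV_DST_MEMORY,
 *		.mode = STEDMA40_MODE_LOGICAL,
 *	};
 *	struct dma_chan *chan;
 *
 *	dma_cap_zero(mask);
 *	dma_cap_set(DMA_SLAVE, mask);
 *	chan = dma_request_channel(mask, stedma40_filter, &cfg);
 */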
/* DMA ENGINE functions */
static int d40_alloc_chan_resources(struct dma_chan *chan)
{
	int err;
	unsigned long flags;
	struct d40_chan *d40c =
		container_of(chan, struct d40_chan, chan);
	bool is_free_phy;
	spin_lock_irqsave(&d40c->lock, flags);

	d40c->completed = chan->cookie = 1;

	/* If no dma configuration is set use default configuration (memcpy) */
	if (!d40c->configured) {
		err = d40_config_memcpy(d40c);
		if (err) {
			dev_err(&d40c->chan.dev->device,
				"[%s] Failed to configure memcpy channel\n",
				__func__);
			goto fail;
		}
	}
	is_free_phy = (d40c->phy_chan == NULL);

	err = d40_allocate_channel(d40c);
	if (err) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Failed to allocate channel\n", __func__);
		goto fail;
	}

	/* Fill in basic CFG register values */
	d40_phy_cfg(&d40c->dma_cfg, &d40c->src_def_cfg,
		    &d40c->dst_def_cfg, chan_is_logical(d40c));

	if (chan_is_logical(d40c)) {
		d40_log_cfg(&d40c->dma_cfg,
			    &d40c->log_def.lcsp1, &d40c->log_def.lcsp3);

		if (d40c->dma_cfg.dir == STEDMA40_PERIPH_TO_MEM)
			d40c->lcpa = d40c->base->lcpa_base +
			  d40c->dma_cfg.src_dev_type * D40_LCPA_CHAN_SIZE;
		else
			d40c->lcpa = d40c->base->lcpa_base +
			  d40c->dma_cfg.dst_dev_type *
			  D40_LCPA_CHAN_SIZE + D40_LCPA_CHAN_DST_DELTA;
	}

	/*
	 * Only write channel configuration to the DMA if the physical
	 * resource is free. In case of multiple logical channels
	 * on the same physical resource, only the first write is necessary.
	 */
	if (is_free_phy)
		d40_config_write(d40c);
fail:
	spin_unlock_irqrestore(&d40c->lock, flags);
	return err;
}
static void d40_free_chan_resources(struct dma_chan *chan)
{
	struct d40_chan *d40c =
		container_of(chan, struct d40_chan, chan);
	int err;
	unsigned long flags;

	if (d40c->phy_chan == NULL) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Cannot free unallocated channel\n", __func__);
		return;
	}

	spin_lock_irqsave(&d40c->lock, flags);

	err = d40_free_dma(d40c);

	if (err)
		dev_err(&d40c->chan.dev->device,
			"[%s] Failed to free channel\n", __func__);
	spin_unlock_irqrestore(&d40c->lock, flags);
}
static struct dma_async_tx_descriptor *d40_prep_memcpy(struct dma_chan *chan,
						       dma_addr_t dst,
						       dma_addr_t src,
						       size_t size,
						       unsigned long dma_flags)
{
	struct d40_desc *d40d;
	struct d40_chan *d40c = container_of(chan, struct d40_chan,
					     chan);
	unsigned long flags;

	if (d40c->phy_chan == NULL) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Channel is not allocated.\n", __func__);
		return ERR_PTR(-EINVAL);
	}

	spin_lock_irqsave(&d40c->lock, flags);
	d40d = d40_desc_get(d40c);

	if (d40d == NULL) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Descriptor is NULL\n", __func__);
		goto err;
	}

	d40d->txd.flags = dma_flags;
	d40d->lli_len = d40_size_2_dmalen(size,
					  d40c->dma_cfg.src_info.data_width,
					  d40c->dma_cfg.dst_info.data_width);
	if (d40d->lli_len < 0) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Unaligned size\n", __func__);
		goto err;
	}

	dma_async_tx_descriptor_init(&d40d->txd, chan);

	d40d->txd.tx_submit = d40_tx_submit;

	if (chan_is_logical(d40c)) {

		if (d40_pool_lli_alloc(d40d, d40d->lli_len, true) < 0) {
			dev_err(&d40c->chan.dev->device,
				"[%s] Out of memory\n", __func__);
			goto err;
		}
		d40d->lli_current = 0;

		if (d40_log_buf_to_lli(d40d->lli_log.src,
				       src,
				       size,
				       d40c->log_def.lcsp1,
				       d40c->dma_cfg.src_info.data_width,
				       d40c->dma_cfg.dst_info.data_width,
				       true) == NULL)
			goto err;

		if (d40_log_buf_to_lli(d40d->lli_log.dst,
				       dst,
				       size,
				       d40c->log_def.lcsp3,
				       d40c->dma_cfg.dst_info.data_width,
				       d40c->dma_cfg.src_info.data_width,
				       true) == NULL)
			goto err;

	} else {

		if (d40_pool_lli_alloc(d40d, d40d->lli_len, false) < 0) {
			dev_err(&d40c->chan.dev->device,
				"[%s] Out of memory\n", __func__);
			goto err;
		}

		if (d40_phy_buf_to_lli(d40d->lli_phy.src,
				       src,
				       size,
				       d40c->dma_cfg.src_info.psize,
				       0,
				       d40c->src_def_cfg,
				       true,
				       d40c->dma_cfg.src_info.data_width,
				       d40c->dma_cfg.dst_info.data_width,
				       false) == NULL)
			goto err;

		if (d40_phy_buf_to_lli(d40d->lli_phy.dst,
				       dst,
				       size,
				       d40c->dma_cfg.dst_info.psize,
				       0,
				       d40c->dst_def_cfg,
				       true,
				       d40c->dma_cfg.dst_info.data_width,
				       d40c->dma_cfg.src_info.data_width,
				       false) == NULL)
			goto err;

		(void) dma_map_single(d40c->base->dev, d40d->lli_phy.src,
				      d40d->lli_pool.size, DMA_TO_DEVICE);
	}

	spin_unlock_irqrestore(&d40c->lock, flags);
	return &d40d->txd;

err:
	if (d40d)
		d40_desc_free(d40c, d40d);
	spin_unlock_irqrestore(&d40c->lock, flags);
	return NULL;
}
static struct dma_async_tx_descriptor *
d40_prep_sg(struct dma_chan *chan,
	    struct scatterlist *dst_sg, unsigned int dst_nents,
	    struct scatterlist *src_sg, unsigned int src_nents,
	    unsigned long dma_flags)
{
	if (dst_nents != src_nents)
		return NULL;

	return stedma40_memcpy_sg(chan, dst_sg, src_sg, dst_nents, dma_flags);
}
static int d40_prep_slave_sg_log(struct d40_desc *d40d,
				 struct d40_chan *d40c,
				 struct scatterlist *sgl,
				 unsigned int sg_len,
				 enum dma_data_direction direction,
				 unsigned long dma_flags)
{
	dma_addr_t dev_addr = 0;
	int total_size;

	d40d->lli_len = d40_sg_2_dmalen(sgl, sg_len,
					d40c->dma_cfg.src_info.data_width,
					d40c->dma_cfg.dst_info.data_width);
	if (d40d->lli_len < 0) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Unaligned size\n", __func__);
		return -EINVAL;
	}

	if (d40_pool_lli_alloc(d40d, d40d->lli_len, true) < 0) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Out of memory\n", __func__);
		return -ENOMEM;
	}

	d40d->lli_current = 0;

	if (direction == DMA_FROM_DEVICE)
		if (d40c->runtime_addr)
			dev_addr = d40c->runtime_addr;
		else
			dev_addr = d40c->base->plat_data->dev_rx[d40c->dma_cfg.src_dev_type];
	else if (direction == DMA_TO_DEVICE)
		if (d40c->runtime_addr)
			dev_addr = d40c->runtime_addr;
		else
			dev_addr = d40c->base->plat_data->dev_tx[d40c->dma_cfg.dst_dev_type];
	else
		return -EINVAL;

	total_size = d40_log_sg_to_dev(sgl, sg_len,
				       &d40d->lli_log,
				       &d40c->log_def,
				       d40c->dma_cfg.src_info.data_width,
				       d40c->dma_cfg.dst_info.data_width,
				       direction,
				       dev_addr);

	if (total_size < 0)
		return -EINVAL;

	return 0;
}
static int d40_prep_slave_sg_phy(struct d40_desc *d40d,
				 struct d40_chan *d40c,
				 struct scatterlist *sgl,
				 unsigned int sgl_len,
				 enum dma_data_direction direction,
				 unsigned long dma_flags)
{
	dma_addr_t src_dev_addr;
	dma_addr_t dst_dev_addr;
	int res;

	d40d->lli_len = d40_sg_2_dmalen(sgl, sgl_len,
					d40c->dma_cfg.src_info.data_width,
					d40c->dma_cfg.dst_info.data_width);
	if (d40d->lli_len < 0) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Unaligned size\n", __func__);
		return -EINVAL;
	}

	if (d40_pool_lli_alloc(d40d, d40d->lli_len, false) < 0) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Out of memory\n", __func__);
		return -ENOMEM;
	}

	d40d->lli_current = 0;

	if (direction == DMA_FROM_DEVICE) {
		dst_dev_addr = 0;
		if (d40c->runtime_addr)
			src_dev_addr = d40c->runtime_addr;
		else
			src_dev_addr = d40c->base->plat_data->dev_rx[d40c->dma_cfg.src_dev_type];
	} else if (direction == DMA_TO_DEVICE) {
		src_dev_addr = 0;
		if (d40c->runtime_addr)
			dst_dev_addr = d40c->runtime_addr;
		else
			dst_dev_addr = d40c->base->plat_data->dev_tx[d40c->dma_cfg.dst_dev_type];
	} else
		return -EINVAL;

	res = d40_phy_sg_to_lli(sgl,
				sgl_len,
				src_dev_addr,
				d40d->lli_phy.src,
				virt_to_phys(d40d->lli_phy.src),
				d40c->src_def_cfg,
				d40c->dma_cfg.src_info.data_width,
				d40c->dma_cfg.dst_info.data_width,
				d40c->dma_cfg.src_info.psize);
	if (res < 0)
		return res;

	res = d40_phy_sg_to_lli(sgl,
				sgl_len,
				dst_dev_addr,
				d40d->lli_phy.dst,
				virt_to_phys(d40d->lli_phy.dst),
				d40c->dst_def_cfg,
				d40c->dma_cfg.dst_info.data_width,
				d40c->dma_cfg.src_info.data_width,
				d40c->dma_cfg.dst_info.psize);
	if (res < 0)
		return res;

	(void) dma_map_single(d40c->base->dev, d40d->lli_phy.src,
			      d40d->lli_pool.size, DMA_TO_DEVICE);
	return 0;
}
static struct dma_async_tx_descriptor *d40_prep_slave_sg(struct dma_chan *chan,
							  struct scatterlist *sgl,
							  unsigned int sg_len,
							  enum dma_data_direction direction,
							  unsigned long dma_flags)
{
	struct d40_desc *d40d;
	struct d40_chan *d40c = container_of(chan, struct d40_chan,
					     chan);
	unsigned long flags;
	int err;

	if (d40c->phy_chan == NULL) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Cannot prepare unallocated channel\n", __func__);
		return ERR_PTR(-EINVAL);
	}

	spin_lock_irqsave(&d40c->lock, flags);
	d40d = d40_desc_get(d40c);

	if (d40d == NULL)
		goto err;

	if (chan_is_logical(d40c))
		err = d40_prep_slave_sg_log(d40d, d40c, sgl, sg_len,
					    direction, dma_flags);
	else
		err = d40_prep_slave_sg_phy(d40d, d40c, sgl, sg_len,
					    direction, dma_flags);
	if (err) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Failed to prepare %s slave sg job: %d\n",
			__func__,
			chan_is_logical(d40c) ? "log" : "phy", err);
		goto err;
	}

	d40d->txd.flags = dma_flags;

	dma_async_tx_descriptor_init(&d40d->txd, chan);

	d40d->txd.tx_submit = d40_tx_submit;

	spin_unlock_irqrestore(&d40c->lock, flags);
	return &d40d->txd;

err:
	if (d40d)
		d40_desc_free(d40c, d40d);
	spin_unlock_irqrestore(&d40c->lock, flags);
	return NULL;
}
static enum dma_status d40_tx_status(struct dma_chan *chan,
				     dma_cookie_t cookie,
				     struct dma_tx_state *txstate)
{
	struct d40_chan *d40c = container_of(chan, struct d40_chan, chan);
	dma_cookie_t last_used;
	dma_cookie_t last_complete;
	int ret;

	if (d40c->phy_chan == NULL) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Cannot read status of unallocated channel\n",
			__func__);
		return -EINVAL;
	}

	last_complete = d40c->completed;
	last_used = chan->cookie;

	if (d40_is_paused(d40c))
		ret = DMA_PAUSED;
	else
		ret = dma_async_is_complete(cookie, last_complete, last_used);

	dma_set_tx_state(txstate, last_complete, last_used,
			 stedma40_residue(chan));

	return ret;
}
static void d40_issue_pending(struct dma_chan *chan)
{
	struct d40_chan *d40c = container_of(chan, struct d40_chan, chan);
	unsigned long flags;

	if (d40c->phy_chan == NULL) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Channel is not allocated!\n", __func__);
		return;
	}

	spin_lock_irqsave(&d40c->lock, flags);

	/* Busy means that pending jobs are already being processed */
	if (!d40c->busy)
		(void) d40_queue_start(d40c);

	spin_unlock_irqrestore(&d40c->lock, flags);
}
/* Runtime reconfiguration extension */
static void d40_set_runtime_config(struct dma_chan *chan,
				   struct dma_slave_config *config)
{
	struct d40_chan *d40c = container_of(chan, struct d40_chan, chan);
	struct stedma40_chan_cfg *cfg = &d40c->dma_cfg;
	enum dma_slave_buswidth config_addr_width;
	dma_addr_t config_addr;
	u32 config_maxburst;
	enum stedma40_periph_data_width addr_width;
	int psize;

	if (config->direction == DMA_FROM_DEVICE) {
		dma_addr_t dev_addr_rx =
			d40c->base->plat_data->dev_rx[cfg->src_dev_type];

		config_addr = config->src_addr;
		if (dev_addr_rx)
			dev_dbg(d40c->base->dev,
				"channel has a pre-wired RX address %08x "
				"overriding with %08x\n",
				dev_addr_rx, config_addr);
		if (cfg->dir != STEDMA40_PERIPH_TO_MEM)
			dev_dbg(d40c->base->dev,
				"channel was not configured for peripheral "
				"to memory transfer (%d) overriding\n",
				cfg->dir);
		cfg->dir = STEDMA40_PERIPH_TO_MEM;

		config_addr_width = config->src_addr_width;
		config_maxburst = config->src_maxburst;

	} else if (config->direction == DMA_TO_DEVICE) {
		dma_addr_t dev_addr_tx =
			d40c->base->plat_data->dev_tx[cfg->dst_dev_type];

		config_addr = config->dst_addr;
		if (dev_addr_tx)
			dev_dbg(d40c->base->dev,
				"channel has a pre-wired TX address %08x "
				"overriding with %08x\n",
				dev_addr_tx, config_addr);
		if (cfg->dir != STEDMA40_MEM_TO_PERIPH)
			dev_dbg(d40c->base->dev,
				"channel was not configured for memory "
				"to peripheral transfer (%d) overriding\n",
				cfg->dir);
		cfg->dir = STEDMA40_MEM_TO_PERIPH;

		config_addr_width = config->dst_addr_width;
		config_maxburst = config->dst_maxburst;

	} else {
		dev_err(d40c->base->dev,
			"unrecognized channel direction %d\n",
			config->direction);
		return;
	}

	switch (config_addr_width) {
	case DMA_SLAVE_BUSWIDTH_1_BYTE:
		addr_width = STEDMA40_BYTE_WIDTH;
		break;
	case DMA_SLAVE_BUSWIDTH_2_BYTES:
		addr_width = STEDMA40_HALFWORD_WIDTH;
		break;
	case DMA_SLAVE_BUSWIDTH_4_BYTES:
		addr_width = STEDMA40_WORD_WIDTH;
		break;
	case DMA_SLAVE_BUSWIDTH_8_BYTES:
		addr_width = STEDMA40_DOUBLEWORD_WIDTH;
		break;
	default:
		dev_err(d40c->base->dev,
			"illegal peripheral address width "
			"requested (%d)\n",
			config->src_addr_width);
		return;
	}

	if (chan_is_logical(d40c)) {
		if (config_maxburst >= 16)
			psize = STEDMA40_PSIZE_LOG_16;
		else if (config_maxburst >= 8)
			psize = STEDMA40_PSIZE_LOG_8;
		else if (config_maxburst >= 4)
			psize = STEDMA40_PSIZE_LOG_4;
		else
			psize = STEDMA40_PSIZE_LOG_1;
	} else {
		if (config_maxburst >= 16)
			psize = STEDMA40_PSIZE_PHY_16;
		else if (config_maxburst >= 8)
			psize = STEDMA40_PSIZE_PHY_8;
		else if (config_maxburst >= 4)
			psize = STEDMA40_PSIZE_PHY_4;
		else if (config_maxburst >= 2)
			psize = STEDMA40_PSIZE_PHY_2;
		else
			psize = STEDMA40_PSIZE_PHY_1;
	}

	/* Set up all the endpoint configs */
	cfg->src_info.data_width = addr_width;
	cfg->src_info.psize = psize;
	cfg->src_info.big_endian = false;
	cfg->src_info.flow_ctrl = STEDMA40_NO_FLOW_CTRL;
	cfg->dst_info.data_width = addr_width;
	cfg->dst_info.psize = psize;
	cfg->dst_info.big_endian = false;
	cfg->dst_info.flow_ctrl = STEDMA40_NO_FLOW_CTRL;

	/* Fill in register values */
	if (chan_is_logical(d40c))
		d40_log_cfg(cfg, &d40c->log_def.lcsp1, &d40c->log_def.lcsp3);
	else
		d40_phy_cfg(cfg, &d40c->src_def_cfg,
			    &d40c->dst_def_cfg, false);

	/* These settings will take precedence later */
	d40c->runtime_addr = config_addr;
	d40c->runtime_direction = config->direction;
	dev_dbg(d40c->base->dev,
		"configured channel %s for %s, data width %d, "
		"maxburst %d bytes, LE, no flow control\n",
		dma_chan_name(chan),
		(config->direction == DMA_FROM_DEVICE) ? "RX" : "TX",
		config_addr_width,
		config_maxburst);
}
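
/*
 * Usage sketch (illustrative; the FIFO address below is a placeholder):
 * a client reaches d40_set_runtime_config() through the standard
 * DMA_SLAVE_CONFIG control operation, e.g. via the generic helper:
 *
 *	struct dma_slave_config conf = {
 *		.direction = DMA_TO_DEVICE,
 *		.dst_addr = <peripheral FIFO address>,
 *		.dst_addr_width = DMA_SLAVE_BUSWIDTH_4_BYTES,
 *		.dst_maxburst = 8,
 *	};
 *
 *	dmaengine_slave_config(chan, &conf);
 */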
static int d40_control(struct dma_chan *chan, enum dma_ctrl_cmd cmd,
		       unsigned long arg)
{
	unsigned long flags;
	struct d40_chan *d40c = container_of(chan, struct d40_chan, chan);

	if (d40c->phy_chan == NULL) {
		dev_err(&d40c->chan.dev->device,
			"[%s] Channel is not allocated!\n", __func__);
		return -EINVAL;
	}

	switch (cmd) {
	case DMA_TERMINATE_ALL:
		spin_lock_irqsave(&d40c->lock, flags);
		d40_term_all(d40c);
		spin_unlock_irqrestore(&d40c->lock, flags);
		return 0;
	case DMA_PAUSE:
		return d40_pause(chan);
	case DMA_RESUME:
		return d40_resume(chan);
	case DMA_SLAVE_CONFIG:
		d40_set_runtime_config(chan,
			(struct dma_slave_config *) arg);
		return 0;
	default:
		break;
	}

	/* Other commands are unimplemented */
	return -ENXIO;
}
/* Initialization functions */

static void __init d40_chan_init(struct d40_base *base, struct dma_device *dma,
				 struct d40_chan *chans, int offset,
				 int num_chans)
{
	int i;
	struct d40_chan *d40c;

	INIT_LIST_HEAD(&dma->channels);

	for (i = offset; i < offset + num_chans; i++) {
		d40c = &chans[i];
		d40c->base = base;
		d40c->chan.device = dma;

		spin_lock_init(&d40c->lock);

		d40c->log_num = D40_PHY_CHAN;

		INIT_LIST_HEAD(&d40c->active);
		INIT_LIST_HEAD(&d40c->queue);
		INIT_LIST_HEAD(&d40c->client);

		tasklet_init(&d40c->tasklet, dma_tasklet,
			     (unsigned long) d40c);

		list_add_tail(&d40c->chan.device_node,
			      &dma->channels);
	}
}
static int __init d40_dmaengine_init(struct d40_base *base,
				     int num_reserved_chans)
{
	int err;

	d40_chan_init(base, &base->dma_slave, base->log_chans,
		      0, base->num_log_chans);

	dma_cap_zero(base->dma_slave.cap_mask);
	dma_cap_set(DMA_SLAVE, base->dma_slave.cap_mask);

	base->dma_slave.device_alloc_chan_resources = d40_alloc_chan_resources;
	base->dma_slave.device_free_chan_resources = d40_free_chan_resources;
	base->dma_slave.device_prep_dma_memcpy = d40_prep_memcpy;
	base->dma_slave.device_prep_dma_sg = d40_prep_sg;
	base->dma_slave.device_prep_slave_sg = d40_prep_slave_sg;
	base->dma_slave.device_tx_status = d40_tx_status;
	base->dma_slave.device_issue_pending = d40_issue_pending;
	base->dma_slave.device_control = d40_control;
	base->dma_slave.dev = base->dev;

	err = dma_async_device_register(&base->dma_slave);
	if (err) {
		dev_err(base->dev,
			"[%s] Failed to register slave channels\n",
			__func__);
		goto failure1;
	}

	d40_chan_init(base, &base->dma_memcpy, base->log_chans,
		      base->num_log_chans, base->plat_data->memcpy_len);

	dma_cap_zero(base->dma_memcpy.cap_mask);
	dma_cap_set(DMA_MEMCPY, base->dma_memcpy.cap_mask);
	dma_cap_set(DMA_SG, base->dma_memcpy.cap_mask);

	base->dma_memcpy.device_alloc_chan_resources = d40_alloc_chan_resources;
	base->dma_memcpy.device_free_chan_resources = d40_free_chan_resources;
	base->dma_memcpy.device_prep_dma_memcpy = d40_prep_memcpy;
	base->dma_memcpy.device_prep_dma_sg = d40_prep_sg;
	base->dma_memcpy.device_prep_slave_sg = d40_prep_slave_sg;
	base->dma_memcpy.device_tx_status = d40_tx_status;
	base->dma_memcpy.device_issue_pending = d40_issue_pending;
	base->dma_memcpy.device_control = d40_control;
	base->dma_memcpy.dev = base->dev;
	/*
	 * This controller can only access addresses at even
	 * 32 bit boundaries, i.e. 2^2 byte alignment.
	 */
	base->dma_memcpy.copy_align = 2;

	err = dma_async_device_register(&base->dma_memcpy);
	if (err) {
		dev_err(base->dev,
			"[%s] Failed to register memcpy only channels\n",
			__func__);
		goto failure2;
	}

	d40_chan_init(base, &base->dma_both, base->phy_chans,
		      0, num_reserved_chans);

	dma_cap_zero(base->dma_both.cap_mask);
	dma_cap_set(DMA_SLAVE, base->dma_both.cap_mask);
	dma_cap_set(DMA_MEMCPY, base->dma_both.cap_mask);
	dma_cap_set(DMA_SG, base->dma_both.cap_mask);

	base->dma_both.device_alloc_chan_resources = d40_alloc_chan_resources;
	base->dma_both.device_free_chan_resources = d40_free_chan_resources;
	base->dma_both.device_prep_dma_memcpy = d40_prep_memcpy;
	base->dma_both.device_prep_dma_sg = d40_prep_sg;
	base->dma_both.device_prep_slave_sg = d40_prep_slave_sg;
	base->dma_both.device_tx_status = d40_tx_status;
	base->dma_both.device_issue_pending = d40_issue_pending;
	base->dma_both.device_control = d40_control;
	base->dma_both.dev = base->dev;
	base->dma_both.copy_align = 2;

	err = dma_async_device_register(&base->dma_both);
	if (err) {
		dev_err(base->dev,
			"[%s] Failed to register logical and physical capable channels\n",
			__func__);
		goto failure3;
	}
	return 0;
failure3:
	dma_async_device_unregister(&base->dma_memcpy);
failure2:
	dma_async_device_unregister(&base->dma_slave);
failure1:
	return err;
}
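/*
 * Illustrative sketch, not part of the driver: with the three dma_device
 * instances registered above, a client selects a channel class through the
 * capability mask. A slave channel request could look like the lines below;
 * the stedma40_chan_cfg passed to the filter is board specific and purely
 * hypothetical here.
 *
 *	dma_cap_mask_t mask;
 *
 *	dma_cap_zero(mask);
 *	dma_cap_set(DMA_SLAVE, mask);
 *	chan = dma_request_channel(mask, stedma40_filter, &hypothetical_cfg);
 */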
/* Initialization functions. */

static int __init d40_phy_res_init(struct d40_base *base)
{
	int i;
	int num_phy_chans_avail = 0;
	u32 val[2];
	int odd_even_bit = -2;

	val[0] = readl(base->virtbase + D40_DREG_PRSME);
	val[1] = readl(base->virtbase + D40_DREG_PRSMO);

	for (i = 0; i < base->num_phy_chans; i++) {
		base->phy_res[i].num = i;
		odd_even_bit += 2 * ((i % 2) == 0);
		if (((val[i % 2] >> odd_even_bit) & 3) == 1) {
			/* Mark security only channels as occupied */
			base->phy_res[i].allocated_src = D40_ALLOC_PHY;
			base->phy_res[i].allocated_dst = D40_ALLOC_PHY;
		} else {
			base->phy_res[i].allocated_src = D40_ALLOC_FREE;
			base->phy_res[i].allocated_dst = D40_ALLOC_FREE;
			num_phy_chans_avail++;
		}
		spin_lock_init(&base->phy_res[i].lock);
	}

	/* Mark disabled channels as occupied */
	for (i = 0; base->plat_data->disabled_channels[i] != -1; i++) {
		int chan = base->plat_data->disabled_channels[i];

		base->phy_res[chan].allocated_src = D40_ALLOC_PHY;
		base->phy_res[chan].allocated_dst = D40_ALLOC_PHY;
		num_phy_chans_avail--;
	}

	dev_info(base->dev, "%d of %d physical DMA channels available\n",
		 num_phy_chans_avail, base->num_phy_chans);

	/* Verify settings extended vs standard */
	val[0] = readl(base->virtbase + D40_DREG_PRTYP);

	for (i = 0; i < base->num_phy_chans; i++) {
		if (base->phy_res[i].allocated_src == D40_ALLOC_FREE &&
		    (val[0] & 0x3) != 1)
			dev_info(base->dev,
				 "[%s] INFO: channel %d is misconfigured (%d)\n",
				 __func__, i, val[0] & 0x3);

		val[0] = val[0] >> 2;
	}

	return num_phy_chans_avail;
}
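/*
 * Decode note, added commentary on the loop above: PRSME holds the 2-bit
 * security/mode field for the even numbered physical channels and PRSMO for
 * the odd ones, so channel i is described by the bit pair at position
 * 2 * (i / 2) of val[i % 2]. As a worked example, channel 5 reads
 * (PRSMO >> 4) & 3; a value of 1 means "secure use only", which is why such
 * channels are marked permanently occupied.
 */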
static struct d40_base * __init d40_hw_detect_init(struct platform_device *pdev)
{
	static const struct d40_reg_val dma_id_regs[] = {
		/* Peripheral Id */
		{ .reg = D40_DREG_PERIPHID0, .val = 0x0040},
		{ .reg = D40_DREG_PERIPHID1, .val = 0x0000},
		/*
		 * D40_DREG_PERIPHID2 depends on HW revision:
		 * MOP500/HREF ED has 0x0008,
		 * HREF V1 has 0x0028
		 */
		{ .reg = D40_DREG_PERIPHID3, .val = 0x0000},
		/* PCell Id */
		{ .reg = D40_DREG_CELLID0, .val = 0x000d},
		{ .reg = D40_DREG_CELLID1, .val = 0x00f0},
		{ .reg = D40_DREG_CELLID2, .val = 0x0005},
		{ .reg = D40_DREG_CELLID3, .val = 0x00b1}
	};
	struct stedma40_platform_data *plat_data;
	struct clk *clk = NULL;
	void __iomem *virtbase = NULL;
	struct resource *res = NULL;
	struct d40_base *base = NULL;
	int num_log_chans = 0;
	int num_phy_chans;
	int i;
	u32 val;
	u32 rev;

	clk = clk_get(&pdev->dev, NULL);
	if (IS_ERR(clk)) {
		dev_err(&pdev->dev, "[%s] No matching clock found\n",
			__func__);
		goto failure;
	}

	clk_enable(clk);

	/* Get IO for DMAC base address */
	res = platform_get_resource_byname(pdev, IORESOURCE_MEM, "base");
	if (!res)
		goto failure;

	if (request_mem_region(res->start, resource_size(res),
			       D40_NAME " I/O base") == NULL)
		goto failure;

	virtbase = ioremap(res->start, resource_size(res));
	if (!virtbase)
		goto failure;

	/* HW version check */
	for (i = 0; i < ARRAY_SIZE(dma_id_regs); i++) {
		if (dma_id_regs[i].val !=
		    readl(virtbase + dma_id_regs[i].reg)) {
			dev_err(&pdev->dev,
				"[%s] Unknown hardware! Expected 0x%x at 0x%x but got 0x%x\n",
				__func__,
				dma_id_regs[i].val,
				dma_id_regs[i].reg,
				readl(virtbase + dma_id_regs[i].reg));
			goto failure;
		}
	}

	/* Get silicon revision and designer */
	val = readl(virtbase + D40_DREG_PERIPHID2);

	if ((val & D40_DREG_PERIPHID2_DESIGNER_MASK) !=
	    D40_HW_DESIGNER) {
		dev_err(&pdev->dev,
			"[%s] Unknown designer! Got %x wanted %x\n",
			__func__, val & D40_DREG_PERIPHID2_DESIGNER_MASK,
			D40_HW_DESIGNER);
		goto failure;
	}

	rev = (val & D40_DREG_PERIPHID2_REV_MASK) >>
		D40_DREG_PERIPHID2_REV_POS;

	/* The number of physical channels on this HW */
	num_phy_chans = 4 * (readl(virtbase + D40_DREG_ICFG) & 0x7) + 4;

	dev_info(&pdev->dev, "hardware revision: %d @ 0x%x\n",
		 rev, res->start);

	plat_data = pdev->dev.platform_data;

	/* Count the number of logical channels in use */
	for (i = 0; i < plat_data->dev_len; i++)
		if (plat_data->dev_rx[i] != 0)
			num_log_chans++;

	for (i = 0; i < plat_data->dev_len; i++)
		if (plat_data->dev_tx[i] != 0)
			num_log_chans++;

	base = kzalloc(ALIGN(sizeof(struct d40_base), 4) +
		       (num_phy_chans + num_log_chans + plat_data->memcpy_len) *
		       sizeof(struct d40_chan), GFP_KERNEL);
	if (base == NULL) {
		dev_err(&pdev->dev, "[%s] Out of memory\n", __func__);
		goto failure;
	}

	base->clk = clk;
	base->num_phy_chans = num_phy_chans;
	base->num_log_chans = num_log_chans;
	base->phy_start = res->start;
	base->phy_size = resource_size(res);
	base->virtbase = virtbase;
	base->plat_data = plat_data;
	base->dev = &pdev->dev;
	base->phy_chans = ((void *)base) + ALIGN(sizeof(struct d40_base), 4);
	base->log_chans = &base->phy_chans[num_phy_chans];

	base->phy_res = kzalloc(num_phy_chans * sizeof(struct d40_phy_res),
				GFP_KERNEL);
	if (!base->phy_res)
		goto failure;

	base->lookup_phy_chans = kzalloc(num_phy_chans *
					 sizeof(struct d40_chan *),
					 GFP_KERNEL);
	if (!base->lookup_phy_chans)
		goto failure;

	if (num_log_chans + plat_data->memcpy_len) {
		/*
		 * The max number of logical channels are event lines for all
		 * src devices and dst devices
		 */
		base->lookup_log_chans = kzalloc(plat_data->dev_len * 2 *
						 sizeof(struct d40_chan *),
						 GFP_KERNEL);
		if (!base->lookup_log_chans)
			goto failure;
	}

	base->lcla_pool.alloc_map = kzalloc(num_phy_chans *
					    sizeof(struct d40_desc *) *
					    D40_LCLA_LINK_PER_EVENT_GRP,
					    GFP_KERNEL);
	if (!base->lcla_pool.alloc_map)
		goto failure;

	base->desc_slab = kmem_cache_create(D40_NAME, sizeof(struct d40_desc),
					    0, SLAB_HWCACHE_ALIGN,
					    NULL);
	if (base->desc_slab == NULL)
		goto failure;

	return base;

failure:
	if (!IS_ERR(clk)) {
		clk_disable(clk);
		clk_put(clk);
	}
	if (virtbase)
		iounmap(virtbase);
	if (res)
		release_mem_region(res->start,
				   resource_size(res));

	if (base) {
		kfree(base->lcla_pool.alloc_map);
		kfree(base->lookup_log_chans);
		kfree(base->lookup_phy_chans);
		kfree(base->phy_res);
		kfree(base);
	}

	return NULL;
}
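/*
 * Layout note, added commentary: the single kzalloc in d40_hw_detect_init()
 * carves one allocation into the base structure followed by the channel
 * array:
 *
 *	[ struct d40_base | phy_chans[num_phy_chans] | log_chans + memcpy ]
 *
 * base->phy_chans and base->log_chans are just offsets into this block,
 * which is why the failure paths only ever kfree(base) and never the
 * channel pointers themselves.
 */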
static void __init d40_hw_init(struct d40_base *base)
{
	static const struct d40_reg_val dma_init_reg[] = {
		/* Clock every part of the DMA block from start */
		{ .reg = D40_DREG_GCC, .val = 0x0000ff01},

		/* Interrupts on all logical channels */
		{ .reg = D40_DREG_LCMIS0, .val = 0xFFFFFFFF},
		{ .reg = D40_DREG_LCMIS1, .val = 0xFFFFFFFF},
		{ .reg = D40_DREG_LCMIS2, .val = 0xFFFFFFFF},
		{ .reg = D40_DREG_LCMIS3, .val = 0xFFFFFFFF},
		{ .reg = D40_DREG_LCICR0, .val = 0xFFFFFFFF},
		{ .reg = D40_DREG_LCICR1, .val = 0xFFFFFFFF},
		{ .reg = D40_DREG_LCICR2, .val = 0xFFFFFFFF},
		{ .reg = D40_DREG_LCICR3, .val = 0xFFFFFFFF},
		{ .reg = D40_DREG_LCTIS0, .val = 0xFFFFFFFF},
		{ .reg = D40_DREG_LCTIS1, .val = 0xFFFFFFFF},
		{ .reg = D40_DREG_LCTIS2, .val = 0xFFFFFFFF},
		{ .reg = D40_DREG_LCTIS3, .val = 0xFFFFFFFF}
	};
	int i;
	u32 prmseo[2] = {0, 0};
	u32 activeo[2] = {0xFFFFFFFF, 0xFFFFFFFF};
	u32 pcmis = 0;
	u32 pcicr = 0;

	for (i = 0; i < ARRAY_SIZE(dma_init_reg); i++)
		writel(dma_init_reg[i].val,
		       base->virtbase + dma_init_reg[i].reg);

	/* Configure all our dma channels to default settings */
	for (i = 0; i < base->num_phy_chans; i++) {

		activeo[i % 2] = activeo[i % 2] << 2;

		if (base->phy_res[base->num_phy_chans - i - 1].allocated_src
		    == D40_ALLOC_PHY) {
			activeo[i % 2] |= 3;
			continue;
		}

		/* Enable interrupt # */
		pcmis = (pcmis << 1) | 1;

		/* Clear interrupt # */
		pcicr = (pcicr << 1) | 1;

		/* Set channel to physical mode */
		prmseo[i % 2] = prmseo[i % 2] << 2;
		prmseo[i % 2] |= 1;
	}

	writel(prmseo[1], base->virtbase + D40_DREG_PRMSE);
	writel(prmseo[0], base->virtbase + D40_DREG_PRMSO);
	writel(activeo[1], base->virtbase + D40_DREG_ACTIVE);
	writel(activeo[0], base->virtbase + D40_DREG_ACTIVO);

	/* Write which interrupt to enable */
	writel(pcmis, base->virtbase + D40_DREG_PCMIS);

	/* Write which interrupt to clear */
	writel(pcicr, base->virtbase + D40_DREG_PCICR);
}
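/*
 * Packing note, added commentary on d40_hw_init(): the loop walks physical
 * channels from the highest number down while shifting each accumulator
 * left two bits, so the lowest numbered channel of each parity ends up in
 * the least significant bit pair. prmseo[0]/activeo[0] gather the odd
 * numbered channels (written to PRMSO/ACTIVO) and prmseo[1]/activeo[1] the
 * even ones (PRMSE/ACTIVE), mirroring the two-bits-per-channel layout that
 * d40_phy_res_init() reads back.
 */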
static int __init d40_lcla_allocate(struct d40_base *base)
{
	unsigned long *page_list;
	int i, j;
	int ret = 0;

	/*
	 * This is somewhat ugly. We need 8192 bytes that are 18 bit (256 KiB)
	 * aligned. To fulfill this hardware requirement without wasting
	 * 256 kb, we allocate pages until we get an aligned one.
	 */
	page_list = kmalloc(sizeof(unsigned long) * MAX_LCLA_ALLOC_ATTEMPTS,
			    GFP_KERNEL);
	if (!page_list) {
		ret = -ENOMEM;
		goto failure;
	}

	/* Calculating how many pages that are required */
	base->lcla_pool.pages = SZ_1K * base->num_phy_chans / PAGE_SIZE;

	for (i = 0; i < MAX_LCLA_ALLOC_ATTEMPTS; i++) {
		page_list[i] = __get_free_pages(GFP_KERNEL,
						base->lcla_pool.pages);
		if (!page_list[i]) {
			dev_err(base->dev,
				"[%s] Failed to allocate %d pages.\n",
				__func__, base->lcla_pool.pages);

			for (j = 0; j < i; j++)
				free_pages(page_list[j], base->lcla_pool.pages);
			goto failure;
		}

		if ((virt_to_phys((void *)page_list[i]) &
		     (LCLA_ALIGNMENT - 1)) == 0)
			break;
	}

	for (j = 0; j < i; j++)
		free_pages(page_list[j], base->lcla_pool.pages);

	if (i < MAX_LCLA_ALLOC_ATTEMPTS) {
		base->lcla_pool.base = (void *)page_list[i];
	} else {
		/*
		 * After many attempts and no success with finding the correct
		 * alignment, try with allocating a big buffer.
		 */
		dev_warn(base->dev,
			 "[%s] Failed to get %d pages @ 18 bit align.\n",
			 __func__, base->lcla_pool.pages);
		base->lcla_pool.base_unaligned = kmalloc(SZ_1K *
							 base->num_phy_chans +
							 LCLA_ALIGNMENT,
							 GFP_KERNEL);
		if (!base->lcla_pool.base_unaligned) {
			ret = -ENOMEM;
			goto failure;
		}

		base->lcla_pool.base = PTR_ALIGN(base->lcla_pool.base_unaligned,
						 LCLA_ALIGNMENT);
	}

	writel(virt_to_phys(base->lcla_pool.base),
	       base->virtbase + D40_DREG_LCLA);
failure:
	kfree(page_list);
	return ret;
}
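/*
 * Worked example for the alignment test above, added commentary:
 * LCLA_ALIGNMENT is 0x40000, i.e. 256 KiB or 2^18, so
 *
 *	(virt_to_phys(addr) & (LCLA_ALIGNMENT - 1)) == 0
 *
 * masks the low 18 address bits and is zero exactly when the physical
 * address sits on a 256 KiB boundary. With 4 KiB pages an order-0
 * allocation has roughly a 1 in 64 chance per attempt of landing on such a
 * boundary, which is why up to MAX_LCLA_ALLOC_ATTEMPTS page blocks are
 * tried before falling back to the oversized kmalloc.
 */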
static int __init d40_probe(struct platform_device *pdev)
{
	int err;
	int ret = -ENOENT;
	struct d40_base *base;
	struct resource *res = NULL;
	int num_reserved_chans;
	u32 val;

	base = d40_hw_detect_init(pdev);
	if (!base)
		goto failure;

	num_reserved_chans = d40_phy_res_init(base);

	platform_set_drvdata(pdev, base);

	spin_lock_init(&base->interrupt_lock);
	spin_lock_init(&base->execmd_lock);

	/* Get IO for logical channel parameter address */
	res = platform_get_resource_byname(pdev, IORESOURCE_MEM, "lcpa");
	if (!res) {
		ret = -ENOENT;
		dev_err(&pdev->dev,
			"[%s] No \"lcpa\" memory resource\n",
			__func__);
		goto failure;
	}
	base->lcpa_size = resource_size(res);
	base->phy_lcpa = res->start;

	if (request_mem_region(res->start, resource_size(res),
			       D40_NAME " I/O lcpa") == NULL) {
		ret = -EBUSY;
		dev_err(&pdev->dev,
			"[%s] Failed to request LCPA region 0x%x-0x%x\n",
			__func__, res->start, res->end);
		goto failure;
	}

	/* We make use of ESRAM memory for this. */
	val = readl(base->virtbase + D40_DREG_LCPA);
	if (res->start != val && val != 0) {
		dev_warn(&pdev->dev,
			 "[%s] Mismatch LCPA dma 0x%x, def 0x%x\n",
			 __func__, val, res->start);
	} else
		writel(res->start, base->virtbase + D40_DREG_LCPA);

	base->lcpa_base = ioremap(res->start, resource_size(res));
	if (!base->lcpa_base) {
		ret = -ENOMEM;
		dev_err(&pdev->dev,
			"[%s] Failed to ioremap LCPA region\n",
			__func__);
		goto failure;
	}

	ret = d40_lcla_allocate(base);
	if (ret) {
		dev_err(&pdev->dev, "[%s] Failed to allocate LCLA area\n",
			__func__);
		goto failure;
	}

	spin_lock_init(&base->lcla_pool.lock);

	base->irq = platform_get_irq(pdev, 0);

	ret = request_irq(base->irq, d40_handle_interrupt, 0, D40_NAME, base);
	if (ret) {
		dev_err(&pdev->dev, "[%s] No IRQ defined\n", __func__);
		goto failure;
	}

	err = d40_dmaengine_init(base, num_reserved_chans);
	if (err)
		goto failure;

	d40_hw_init(base);

	dev_info(base->dev, "initialized\n");
	return 0;

failure:
	if (base) {
		if (base->desc_slab)
			kmem_cache_destroy(base->desc_slab);
		if (base->virtbase)
			iounmap(base->virtbase);
		if (!base->lcla_pool.base_unaligned && base->lcla_pool.base)
			free_pages((unsigned long)base->lcla_pool.base,
				   base->lcla_pool.pages);

		kfree(base->lcla_pool.base_unaligned);

		if (base->phy_lcpa)
			release_mem_region(base->phy_lcpa,
					   base->lcpa_size);
		if (base->phy_start)
			release_mem_region(base->phy_start,
					   base->phy_size);
		if (base->clk) {
			clk_disable(base->clk);
			clk_put(base->clk);
		}

		kfree(base->lcla_pool.alloc_map);
		kfree(base->lookup_log_chans);
		kfree(base->lookup_phy_chans);
		kfree(base->phy_res);
		kfree(base);
	}

	dev_err(&pdev->dev, "[%s] probe failed\n", __func__);
	return ret;
}
static struct platform_driver d40_driver = {
	.driver = {
		.owner = THIS_MODULE,
		.name  = D40_NAME,
	},
};

static int __init stedma40_init(void)
{
	return platform_driver_probe(&d40_driver, d40_probe);
}
arch_initcall(stedma40_init);