1// SPDX-License-Identifier: GPL-2.0-only
2/*
3 * Copyright (c) 2013 - 2015 Linaro Ltd.
4 * Copyright (c) 2013 HiSilicon Limited.
5 */
6#include <linux/sched.h>
7#include <linux/device.h>
8#include <linux/dma-mapping.h>
9#include <linux/dmapool.h>
10#include <linux/dmaengine.h>
11#include <linux/init.h>
12#include <linux/interrupt.h>
13#include <linux/kernel.h>
14#include <linux/module.h>
15#include <linux/platform_device.h>
16#include <linux/slab.h>
17#include <linux/spinlock.h>
18#include <linux/of.h>
19#include <linux/clk.h>
20#include <linux/of_dma.h>
21
22#include "virt-dma.h"
23
24#define DRIVER_NAME		"k3-dma"
25#define DMA_MAX_SIZE		0x1ffc
26#define DMA_CYCLIC_MAX_PERIOD	0x1000
27#define LLI_BLOCK_SIZE		(4 * PAGE_SIZE)
28
29#define INT_STAT		0x00
30#define INT_TC1			0x04
31#define INT_TC2			0x08
32#define INT_ERR1		0x0c
33#define INT_ERR2		0x10
34#define INT_TC1_MASK		0x18
35#define INT_TC2_MASK		0x1c
36#define INT_ERR1_MASK		0x20
37#define INT_ERR2_MASK		0x24
38#define INT_TC1_RAW		0x600
39#define INT_TC2_RAW		0x608
40#define INT_ERR1_RAW		0x610
41#define INT_ERR2_RAW		0x618
42#define CH_PRI			0x688
43#define CH_STAT			0x690
44#define CX_CUR_CNT		0x704
45#define CX_LLI			0x800
46#define CX_CNT1			0x80c
47#define CX_CNT0			0x810
48#define CX_SRC			0x814
49#define CX_DST			0x818
50#define CX_CFG			0x81c
51
52#define CX_LLI_CHAIN_EN		0x2
53#define CX_CFG_EN		0x1
54#define CX_CFG_NODEIRQ		BIT(1)
55#define CX_CFG_MEM2PER		(0x1 << 2)
56#define CX_CFG_PER2MEM		(0x2 << 2)
57#define CX_CFG_SRCINCR		(0x1 << 31)
58#define CX_CFG_DSTINCR		(0x1 << 30)
59
60struct k3_desc_hw {
61	u32 lli;
62	u32 reserved[3];
63	u32 count;
64	u32 saddr;
65	u32 daddr;
66	u32 config;
67} __aligned(32);
68
69struct k3_dma_desc_sw {
70	struct virt_dma_desc	vd;
71	dma_addr_t		desc_hw_lli;
72	size_t			desc_num;
73	size_t			size;
74	struct k3_desc_hw	*desc_hw;
75};
76
77struct k3_dma_phy;
78
79struct k3_dma_chan {
80	u32			ccfg;
81	struct virt_dma_chan	vc;
82	struct k3_dma_phy	*phy;
83	struct list_head	node;
84	dma_addr_t		dev_addr;
85	enum dma_status		status;
86	bool			cyclic;
87	struct dma_slave_config	slave_config;
88};
89
90struct k3_dma_phy {
91	u32			idx;
92	void __iomem		*base;
93	struct k3_dma_chan	*vchan;
94	struct k3_dma_desc_sw	*ds_run;
95	struct k3_dma_desc_sw	*ds_done;
96};
97
98struct k3_dma_dev {
99	struct dma_device	slave;
100	void __iomem		*base;
101	struct tasklet_struct	task;
102	spinlock_t		lock;
103	struct list_head	chan_pending;
104	struct k3_dma_phy	*phy;
105	struct k3_dma_chan	*chans;
106	struct clk		*clk;
107	struct dma_pool		*pool;
108	u32			dma_channels;
109	u32			dma_requests;
110	u32			dma_channel_mask;
111	unsigned int		irq;
112};
113
114
115#define K3_FLAG_NOCLK	BIT(1)
116
117struct k3dma_soc_data {
118	unsigned long flags;
119};
120
121
122#define to_k3_dma(dmadev) container_of(dmadev, struct k3_dma_dev, slave)
123
124static int k3_dma_config_write(struct dma_chan *chan,
125			       enum dma_transfer_direction dir,
126			       struct dma_slave_config *cfg);
127
128static struct k3_dma_chan *to_k3_chan(struct dma_chan *chan)
129{
130	return container_of(chan, struct k3_dma_chan, vc.chan);
131}
132
133static void k3_dma_pause_dma(struct k3_dma_phy *phy, bool on)
134{
135	u32 val = 0;
136
137	if (on) {
138		val = readl_relaxed(phy->base + CX_CFG);
139		val |= CX_CFG_EN;
140		writel_relaxed(val, phy->base + CX_CFG);
141	} else {
142		val = readl_relaxed(phy->base + CX_CFG);
143		val &= ~CX_CFG_EN;
144		writel_relaxed(val, phy->base + CX_CFG);
145	}
146}
147
148static void k3_dma_terminate_chan(struct k3_dma_phy *phy, struct k3_dma_dev *d)
149{
150	u32 val = 0;
151
152	k3_dma_pause_dma(phy, false);
153
154	val = 0x1 << phy->idx;
155	writel_relaxed(val, d->base + INT_TC1_RAW);
156	writel_relaxed(val, d->base + INT_TC2_RAW);
157	writel_relaxed(val, d->base + INT_ERR1_RAW);
158	writel_relaxed(val, d->base + INT_ERR2_RAW);
159}
160
161static void k3_dma_set_desc(struct k3_dma_phy *phy, struct k3_desc_hw *hw)
162{
163	writel_relaxed(hw->lli, phy->base + CX_LLI);
164	writel_relaxed(hw->count, phy->base + CX_CNT0);
165	writel_relaxed(hw->saddr, phy->base + CX_SRC);
166	writel_relaxed(hw->daddr, phy->base + CX_DST);
167	writel_relaxed(hw->config, phy->base + CX_CFG);
168}
169
170static u32 k3_dma_get_curr_cnt(struct k3_dma_dev *d, struct k3_dma_phy *phy)
171{
172	u32 cnt = 0;
173
174	cnt = readl_relaxed(d->base + CX_CUR_CNT + phy->idx * 0x10);
175	cnt &= 0xffff;
176	return cnt;
177}
178
179static u32 k3_dma_get_curr_lli(struct k3_dma_phy *phy)
180{
181	return readl_relaxed(phy->base + CX_LLI);
182}
183
184static u32 k3_dma_get_chan_stat(struct k3_dma_dev *d)
185{
186	return readl_relaxed(d->base + CH_STAT);
187}
188
189static void k3_dma_enable_dma(struct k3_dma_dev *d, bool on)
190{
191	if (on) {
192		/* set same priority */
193		writel_relaxed(0x0, d->base + CH_PRI);
194
195		/* unmask irq */
196		writel_relaxed(0xffff, d->base + INT_TC1_MASK);
197		writel_relaxed(0xffff, d->base + INT_TC2_MASK);
198		writel_relaxed(0xffff, d->base + INT_ERR1_MASK);
199		writel_relaxed(0xffff, d->base + INT_ERR2_MASK);
200	} else {
201		/* mask irq */
202		writel_relaxed(0x0, d->base + INT_TC1_MASK);
203		writel_relaxed(0x0, d->base + INT_TC2_MASK);
204		writel_relaxed(0x0, d->base + INT_ERR1_MASK);
205		writel_relaxed(0x0, d->base + INT_ERR2_MASK);
206	}
207}
208
209static irqreturn_t k3_dma_int_handler(int irq, void *dev_id)
210{
211	struct k3_dma_dev *d = (struct k3_dma_dev *)dev_id;
212	struct k3_dma_phy *p;
213	struct k3_dma_chan *c;
214	u32 stat = readl_relaxed(d->base + INT_STAT);
215	u32 tc1  = readl_relaxed(d->base + INT_TC1);
216	u32 tc2  = readl_relaxed(d->base + INT_TC2);
217	u32 err1 = readl_relaxed(d->base + INT_ERR1);
218	u32 err2 = readl_relaxed(d->base + INT_ERR2);
219	u32 i, irq_chan = 0;
220
221	while (stat) {
222		i = __ffs(stat);
223		stat &= ~BIT(i);
224		if (likely(tc1 & BIT(i)) || (tc2 & BIT(i))) {
225
226			p = &d->phy[i];
227			c = p->vchan;
228			if (c && (tc1 & BIT(i))) {
229				spin_lock(&c->vc.lock);
230				if (p->ds_run != NULL) {
231					vchan_cookie_complete(&p->ds_run->vd);
232					p->ds_done = p->ds_run;
233					p->ds_run = NULL;
234				}
235				spin_unlock(&c->vc.lock);
236			}
237			if (c && (tc2 & BIT(i))) {
238				spin_lock(&c->vc.lock);
239				if (p->ds_run != NULL)
240					vchan_cyclic_callback(&p->ds_run->vd);
241				spin_unlock(&c->vc.lock);
242			}
243			irq_chan |= BIT(i);
244		}
245		if (unlikely((err1 & BIT(i)) || (err2 & BIT(i))))
246			dev_warn(d->slave.dev, "DMA ERR\n");
247	}
248
249	writel_relaxed(irq_chan, d->base + INT_TC1_RAW);
250	writel_relaxed(irq_chan, d->base + INT_TC2_RAW);
251	writel_relaxed(err1, d->base + INT_ERR1_RAW);
252	writel_relaxed(err2, d->base + INT_ERR2_RAW);
253
254	if (irq_chan)
255		tasklet_schedule(&d->task);
256
257	if (irq_chan || err1 || err2)
258		return IRQ_HANDLED;
259
260	return IRQ_NONE;
261}
262
263static int k3_dma_start_txd(struct k3_dma_chan *c)
264{
265	struct k3_dma_dev *d = to_k3_dma(c->vc.chan.device);
266	struct virt_dma_desc *vd = vchan_next_desc(&c->vc);
267
268	if (!c->phy)
269		return -EAGAIN;
270
271	if (BIT(c->phy->idx) & k3_dma_get_chan_stat(d))
272		return -EAGAIN;
273
274	/* Avoid losing track of  ds_run if a transaction is in flight */
275	if (c->phy->ds_run)
276		return -EAGAIN;
277
278	if (vd) {
279		struct k3_dma_desc_sw *ds =
280			container_of(vd, struct k3_dma_desc_sw, vd);
281		/*
282		 * fetch and remove request from vc->desc_issued
283		 * so vc->desc_issued only contains desc pending
284		 */
285		list_del(&ds->vd.node);
286
287		c->phy->ds_run = ds;
288		c->phy->ds_done = NULL;
289		/* start dma */
290		k3_dma_set_desc(c->phy, &ds->desc_hw[0]);
291		return 0;
292	}
293	c->phy->ds_run = NULL;
294	c->phy->ds_done = NULL;
295	return -EAGAIN;
296}
297
298static void k3_dma_tasklet(struct tasklet_struct *t)
299{
300	struct k3_dma_dev *d = from_tasklet(d, t, task);
301	struct k3_dma_phy *p;
302	struct k3_dma_chan *c, *cn;
303	unsigned pch, pch_alloc = 0;
304
305	/* check new dma request of running channel in vc->desc_issued */
306	list_for_each_entry_safe(c, cn, &d->slave.channels, vc.chan.device_node) {
307		spin_lock_irq(&c->vc.lock);
308		p = c->phy;
309		if (p && p->ds_done) {
310			if (k3_dma_start_txd(c)) {
311				/* No current txd associated with this channel */
312				dev_dbg(d->slave.dev, "pchan %u: free\n", p->idx);
313				/* Mark this channel free */
314				c->phy = NULL;
315				p->vchan = NULL;
316			}
317		}
318		spin_unlock_irq(&c->vc.lock);
319	}
320
321	/* check new channel request in d->chan_pending */
322	spin_lock_irq(&d->lock);
323	for (pch = 0; pch < d->dma_channels; pch++) {
324		if (!(d->dma_channel_mask & (1 << pch)))
325			continue;
326
327		p = &d->phy[pch];
328
329		if (p->vchan == NULL && !list_empty(&d->chan_pending)) {
330			c = list_first_entry(&d->chan_pending,
331				struct k3_dma_chan, node);
332			/* remove from d->chan_pending */
333			list_del_init(&c->node);
334			pch_alloc |= 1 << pch;
335			/* Mark this channel allocated */
336			p->vchan = c;
337			c->phy = p;
338			dev_dbg(d->slave.dev, "pchan %u: alloc vchan %p\n", pch, &c->vc);
339		}
340	}
341	spin_unlock_irq(&d->lock);
342
343	for (pch = 0; pch < d->dma_channels; pch++) {
344		if (!(d->dma_channel_mask & (1 << pch)))
345			continue;
346
347		if (pch_alloc & (1 << pch)) {
348			p = &d->phy[pch];
349			c = p->vchan;
350			if (c) {
351				spin_lock_irq(&c->vc.lock);
352				k3_dma_start_txd(c);
353				spin_unlock_irq(&c->vc.lock);
354			}
355		}
356	}
357}
358
359static void k3_dma_free_chan_resources(struct dma_chan *chan)
360{
361	struct k3_dma_chan *c = to_k3_chan(chan);
362	struct k3_dma_dev *d = to_k3_dma(chan->device);
363	unsigned long flags;
364
365	spin_lock_irqsave(&d->lock, flags);
366	list_del_init(&c->node);
367	spin_unlock_irqrestore(&d->lock, flags);
368
369	vchan_free_chan_resources(&c->vc);
370	c->ccfg = 0;
371}
372
373static enum dma_status k3_dma_tx_status(struct dma_chan *chan,
374	dma_cookie_t cookie, struct dma_tx_state *state)
375{
376	struct k3_dma_chan *c = to_k3_chan(chan);
377	struct k3_dma_dev *d = to_k3_dma(chan->device);
378	struct k3_dma_phy *p;
379	struct virt_dma_desc *vd;
380	unsigned long flags;
381	enum dma_status ret;
382	size_t bytes = 0;
383
384	ret = dma_cookie_status(&c->vc.chan, cookie, state);
385	if (ret == DMA_COMPLETE)
386		return ret;
387
388	spin_lock_irqsave(&c->vc.lock, flags);
389	p = c->phy;
390	ret = c->status;
391
392	/*
393	 * If the cookie is on our issue queue, then the residue is
394	 * its total size.
395	 */
396	vd = vchan_find_desc(&c->vc, cookie);
397	if (vd && !c->cyclic) {
398		bytes = container_of(vd, struct k3_dma_desc_sw, vd)->size;
399	} else if ((!p) || (!p->ds_run)) {
400		bytes = 0;
401	} else {
402		struct k3_dma_desc_sw *ds = p->ds_run;
403		u32 clli = 0, index = 0;
404
405		bytes = k3_dma_get_curr_cnt(d, p);
406		clli = k3_dma_get_curr_lli(p);
407		index = ((clli - ds->desc_hw_lli) /
408				sizeof(struct k3_desc_hw)) + 1;
409		for (; index < ds->desc_num; index++) {
410			bytes += ds->desc_hw[index].count;
411			/* end of lli */
412			if (!ds->desc_hw[index].lli)
413				break;
414		}
415	}
416	spin_unlock_irqrestore(&c->vc.lock, flags);
417	dma_set_residue(state, bytes);
418	return ret;
419}
420
421static void k3_dma_issue_pending(struct dma_chan *chan)
422{
423	struct k3_dma_chan *c = to_k3_chan(chan);
424	struct k3_dma_dev *d = to_k3_dma(chan->device);
425	unsigned long flags;
426
427	spin_lock_irqsave(&c->vc.lock, flags);
428	/* add request to vc->desc_issued */
429	if (vchan_issue_pending(&c->vc)) {
430		spin_lock(&d->lock);
431		if (!c->phy) {
432			if (list_empty(&c->node)) {
433				/* if new channel, add chan_pending */
434				list_add_tail(&c->node, &d->chan_pending);
435				/* check in tasklet */
436				tasklet_schedule(&d->task);
437				dev_dbg(d->slave.dev, "vchan %p: issued\n", &c->vc);
438			}
439		}
440		spin_unlock(&d->lock);
441	} else
442		dev_dbg(d->slave.dev, "vchan %p: nothing to issue\n", &c->vc);
443	spin_unlock_irqrestore(&c->vc.lock, flags);
444}
445
446static void k3_dma_fill_desc(struct k3_dma_desc_sw *ds, dma_addr_t dst,
447			dma_addr_t src, size_t len, u32 num, u32 ccfg)
448{
449	if (num != ds->desc_num - 1)
450		ds->desc_hw[num].lli = ds->desc_hw_lli + (num + 1) *
451			sizeof(struct k3_desc_hw);
452
453	ds->desc_hw[num].lli |= CX_LLI_CHAIN_EN;
454	ds->desc_hw[num].count = len;
455	ds->desc_hw[num].saddr = src;
456	ds->desc_hw[num].daddr = dst;
457	ds->desc_hw[num].config = ccfg;
458}
459
460static struct k3_dma_desc_sw *k3_dma_alloc_desc_resource(int num,
461							struct dma_chan *chan)
462{
463	struct k3_dma_chan *c = to_k3_chan(chan);
464	struct k3_dma_desc_sw *ds;
465	struct k3_dma_dev *d = to_k3_dma(chan->device);
466	int lli_limit = LLI_BLOCK_SIZE / sizeof(struct k3_desc_hw);
467
468	if (num > lli_limit) {
469		dev_dbg(chan->device->dev, "vch %p: sg num %d exceed max %d\n",
470			&c->vc, num, lli_limit);
471		return NULL;
472	}
473
474	ds = kzalloc(sizeof(*ds), GFP_NOWAIT);
475	if (!ds)
476		return NULL;
477
478	ds->desc_hw = dma_pool_zalloc(d->pool, GFP_NOWAIT, &ds->desc_hw_lli);
479	if (!ds->desc_hw) {
480		dev_dbg(chan->device->dev, "vch %p: dma alloc fail\n", &c->vc);
481		kfree(ds);
482		return NULL;
483	}
484	ds->desc_num = num;
485	return ds;
486}
487
488static struct dma_async_tx_descriptor *k3_dma_prep_memcpy(
489	struct dma_chan *chan,	dma_addr_t dst, dma_addr_t src,
490	size_t len, unsigned long flags)
491{
492	struct k3_dma_chan *c = to_k3_chan(chan);
493	struct k3_dma_desc_sw *ds;
494	size_t copy = 0;
495	int num = 0;
496
497	if (!len)
498		return NULL;
499
500	num = DIV_ROUND_UP(len, DMA_MAX_SIZE);
501
502	ds = k3_dma_alloc_desc_resource(num, chan);
503	if (!ds)
504		return NULL;
505
506	c->cyclic = 0;
507	ds->size = len;
508	num = 0;
509
510	if (!c->ccfg) {
511		/* default is memtomem, without calling device_config */
512		c->ccfg = CX_CFG_SRCINCR | CX_CFG_DSTINCR | CX_CFG_EN;
513		c->ccfg |= (0xf << 20) | (0xf << 24);	/* burst = 16 */
514		c->ccfg |= (0x3 << 12) | (0x3 << 16);	/* width = 64 bit */
515	}
516
517	do {
518		copy = min_t(size_t, len, DMA_MAX_SIZE);
519		k3_dma_fill_desc(ds, dst, src, copy, num++, c->ccfg);
520
521		src += copy;
522		dst += copy;
523		len -= copy;
524	} while (len);
525
526	ds->desc_hw[num-1].lli = 0;	/* end of link */
527	return vchan_tx_prep(&c->vc, &ds->vd, flags);
528}
529
530static struct dma_async_tx_descriptor *k3_dma_prep_slave_sg(
531	struct dma_chan *chan, struct scatterlist *sgl, unsigned int sglen,
532	enum dma_transfer_direction dir, unsigned long flags, void *context)
533{
534	struct k3_dma_chan *c = to_k3_chan(chan);
535	struct k3_dma_desc_sw *ds;
536	size_t len, avail, total = 0;
537	struct scatterlist *sg;
538	dma_addr_t addr, src = 0, dst = 0;
539	int num = sglen, i;
540
541	if (sgl == NULL)
542		return NULL;
543
544	c->cyclic = 0;
545
546	for_each_sg(sgl, sg, sglen, i) {
547		avail = sg_dma_len(sg);
548		if (avail > DMA_MAX_SIZE)
549			num += DIV_ROUND_UP(avail, DMA_MAX_SIZE) - 1;
550	}
551
552	ds = k3_dma_alloc_desc_resource(num, chan);
553	if (!ds)
554		return NULL;
555	num = 0;
556	k3_dma_config_write(chan, dir, &c->slave_config);
557
558	for_each_sg(sgl, sg, sglen, i) {
559		addr = sg_dma_address(sg);
560		avail = sg_dma_len(sg);
561		total += avail;
562
563		do {
564			len = min_t(size_t, avail, DMA_MAX_SIZE);
565
566			if (dir == DMA_MEM_TO_DEV) {
567				src = addr;
568				dst = c->dev_addr;
569			} else if (dir == DMA_DEV_TO_MEM) {
570				src = c->dev_addr;
571				dst = addr;
572			}
573
574			k3_dma_fill_desc(ds, dst, src, len, num++, c->ccfg);
575
576			addr += len;
577			avail -= len;
578		} while (avail);
579	}
580
581	ds->desc_hw[num-1].lli = 0;	/* end of link */
582	ds->size = total;
583	return vchan_tx_prep(&c->vc, &ds->vd, flags);
584}
585
586static struct dma_async_tx_descriptor *
587k3_dma_prep_dma_cyclic(struct dma_chan *chan, dma_addr_t buf_addr,
588		       size_t buf_len, size_t period_len,
589		       enum dma_transfer_direction dir,
590		       unsigned long flags)
591{
592	struct k3_dma_chan *c = to_k3_chan(chan);
593	struct k3_dma_desc_sw *ds;
594	size_t len, avail, total = 0;
595	dma_addr_t addr, src = 0, dst = 0;
596	int num = 1, since = 0;
597	size_t modulo = DMA_CYCLIC_MAX_PERIOD;
598	u32 en_tc2 = 0;
599
600	dev_dbg(chan->device->dev, "%s: buf %pad, dst %pad, buf len %zu, period_len = %zu, dir %d\n",
601	       __func__, &buf_addr, &to_k3_chan(chan)->dev_addr,
602	       buf_len, period_len, (int)dir);
603
604	avail = buf_len;
605	if (avail > modulo)
606		num += DIV_ROUND_UP(avail, modulo) - 1;
607
608	ds = k3_dma_alloc_desc_resource(num, chan);
609	if (!ds)
610		return NULL;
611
612	c->cyclic = 1;
613	addr = buf_addr;
614	avail = buf_len;
615	total = avail;
616	num = 0;
617	k3_dma_config_write(chan, dir, &c->slave_config);
618
619	if (period_len < modulo)
620		modulo = period_len;
621
622	do {
623		len = min_t(size_t, avail, modulo);
624
625		if (dir == DMA_MEM_TO_DEV) {
626			src = addr;
627			dst = c->dev_addr;
628		} else if (dir == DMA_DEV_TO_MEM) {
629			src = c->dev_addr;
630			dst = addr;
631		}
632		since += len;
633		if (since >= period_len) {
634			/* descriptor asks for TC2 interrupt on completion */
635			en_tc2 = CX_CFG_NODEIRQ;
636			since -= period_len;
637		} else
638			en_tc2 = 0;
639
640		k3_dma_fill_desc(ds, dst, src, len, num++, c->ccfg | en_tc2);
641
642		addr += len;
643		avail -= len;
644	} while (avail);
645
646	/* "Cyclic" == end of link points back to start of link */
647	ds->desc_hw[num - 1].lli |= ds->desc_hw_lli;
648
649	ds->size = total;
650
651	return vchan_tx_prep(&c->vc, &ds->vd, flags);
652}
653
654static int k3_dma_config(struct dma_chan *chan,
655			 struct dma_slave_config *cfg)
656{
657	struct k3_dma_chan *c = to_k3_chan(chan);
658
659	memcpy(&c->slave_config, cfg, sizeof(*cfg));
660
661	return 0;
662}
663
664static int k3_dma_config_write(struct dma_chan *chan,
665			       enum dma_transfer_direction dir,
666			       struct dma_slave_config *cfg)
667{
668	struct k3_dma_chan *c = to_k3_chan(chan);
669	u32 maxburst = 0, val = 0;
670	enum dma_slave_buswidth width = DMA_SLAVE_BUSWIDTH_UNDEFINED;
671
672	if (dir == DMA_DEV_TO_MEM) {
673		c->ccfg = CX_CFG_DSTINCR;
674		c->dev_addr = cfg->src_addr;
675		maxburst = cfg->src_maxburst;
676		width = cfg->src_addr_width;
677	} else if (dir == DMA_MEM_TO_DEV) {
678		c->ccfg = CX_CFG_SRCINCR;
679		c->dev_addr = cfg->dst_addr;
680		maxburst = cfg->dst_maxburst;
681		width = cfg->dst_addr_width;
682	}
683	switch (width) {
684	case DMA_SLAVE_BUSWIDTH_1_BYTE:
685	case DMA_SLAVE_BUSWIDTH_2_BYTES:
686	case DMA_SLAVE_BUSWIDTH_4_BYTES:
687	case DMA_SLAVE_BUSWIDTH_8_BYTES:
688		val =  __ffs(width);
689		break;
690	default:
691		val = 3;
692		break;
693	}
694	c->ccfg |= (val << 12) | (val << 16);
695
696	if ((maxburst == 0) || (maxburst > 16))
697		val = 15;
698	else
699		val = maxburst - 1;
700	c->ccfg |= (val << 20) | (val << 24);
701	c->ccfg |= CX_CFG_MEM2PER | CX_CFG_EN;
702
703	/* specific request line */
704	c->ccfg |= c->vc.chan.chan_id << 4;
705
706	return 0;
707}
708
709static void k3_dma_free_desc(struct virt_dma_desc *vd)
710{
711	struct k3_dma_desc_sw *ds =
712		container_of(vd, struct k3_dma_desc_sw, vd);
713	struct k3_dma_dev *d = to_k3_dma(vd->tx.chan->device);
714
715	dma_pool_free(d->pool, ds->desc_hw, ds->desc_hw_lli);
716	kfree(ds);
717}
718
719static int k3_dma_terminate_all(struct dma_chan *chan)
720{
721	struct k3_dma_chan *c = to_k3_chan(chan);
722	struct k3_dma_dev *d = to_k3_dma(chan->device);
723	struct k3_dma_phy *p = c->phy;
724	unsigned long flags;
725	LIST_HEAD(head);
726
727	dev_dbg(d->slave.dev, "vchan %p: terminate all\n", &c->vc);
728
729	/* Prevent this channel being scheduled */
730	spin_lock(&d->lock);
731	list_del_init(&c->node);
732	spin_unlock(&d->lock);
733
734	/* Clear the tx descriptor lists */
735	spin_lock_irqsave(&c->vc.lock, flags);
736	vchan_get_all_descriptors(&c->vc, &head);
737	if (p) {
738		/* vchan is assigned to a pchan - stop the channel */
739		k3_dma_terminate_chan(p, d);
740		c->phy = NULL;
741		p->vchan = NULL;
742		if (p->ds_run) {
743			vchan_terminate_vdesc(&p->ds_run->vd);
744			p->ds_run = NULL;
745		}
746		p->ds_done = NULL;
747	}
748	spin_unlock_irqrestore(&c->vc.lock, flags);
749	vchan_dma_desc_free_list(&c->vc, &head);
750
751	return 0;
752}
753
754static void k3_dma_synchronize(struct dma_chan *chan)
755{
756	struct k3_dma_chan *c = to_k3_chan(chan);
757
758	vchan_synchronize(&c->vc);
759}
760
761static int k3_dma_transfer_pause(struct dma_chan *chan)
762{
763	struct k3_dma_chan *c = to_k3_chan(chan);
764	struct k3_dma_dev *d = to_k3_dma(chan->device);
765	struct k3_dma_phy *p = c->phy;
766
767	dev_dbg(d->slave.dev, "vchan %p: pause\n", &c->vc);
768	if (c->status == DMA_IN_PROGRESS) {
769		c->status = DMA_PAUSED;
770		if (p) {
771			k3_dma_pause_dma(p, false);
772		} else {
773			spin_lock(&d->lock);
774			list_del_init(&c->node);
775			spin_unlock(&d->lock);
776		}
777	}
778
779	return 0;
780}
781
782static int k3_dma_transfer_resume(struct dma_chan *chan)
783{
784	struct k3_dma_chan *c = to_k3_chan(chan);
785	struct k3_dma_dev *d = to_k3_dma(chan->device);
786	struct k3_dma_phy *p = c->phy;
787	unsigned long flags;
788
789	dev_dbg(d->slave.dev, "vchan %p: resume\n", &c->vc);
790	spin_lock_irqsave(&c->vc.lock, flags);
791	if (c->status == DMA_PAUSED) {
792		c->status = DMA_IN_PROGRESS;
793		if (p) {
794			k3_dma_pause_dma(p, true);
795		} else if (!list_empty(&c->vc.desc_issued)) {
796			spin_lock(&d->lock);
797			list_add_tail(&c->node, &d->chan_pending);
798			spin_unlock(&d->lock);
799		}
800	}
801	spin_unlock_irqrestore(&c->vc.lock, flags);
802
803	return 0;
804}
805
806static const struct k3dma_soc_data k3_v1_dma_data = {
807	.flags = 0,
808};
809
810static const struct k3dma_soc_data asp_v1_dma_data = {
811	.flags = K3_FLAG_NOCLK,
812};
813
814static const struct of_device_id k3_pdma_dt_ids[] = {
815	{ .compatible = "hisilicon,k3-dma-1.0",
816	  .data = &k3_v1_dma_data
817	},
818	{ .compatible = "hisilicon,hisi-pcm-asp-dma-1.0",
819	  .data = &asp_v1_dma_data
820	},
821	{}
822};
823MODULE_DEVICE_TABLE(of, k3_pdma_dt_ids);
824
825static struct dma_chan *k3_of_dma_simple_xlate(struct of_phandle_args *dma_spec,
826						struct of_dma *ofdma)
827{
828	struct k3_dma_dev *d = ofdma->of_dma_data;
829	unsigned int request = dma_spec->args[0];
830
831	if (request >= d->dma_requests)
832		return NULL;
833
834	return dma_get_slave_channel(&(d->chans[request].vc.chan));
835}
836
837static int k3_dma_probe(struct platform_device *op)
838{
839	const struct k3dma_soc_data *soc_data;
840	struct k3_dma_dev *d;
841	int i, ret, irq = 0;
842
843	d = devm_kzalloc(&op->dev, sizeof(*d), GFP_KERNEL);
844	if (!d)
845		return -ENOMEM;
846
847	soc_data = device_get_match_data(&op->dev);
848	if (!soc_data)
849		return -EINVAL;
850
851	d->base = devm_platform_ioremap_resource(op, 0);
852	if (IS_ERR(d->base))
853		return PTR_ERR(d->base);
854
855	of_property_read_u32((&op->dev)->of_node,
856			"dma-channels", &d->dma_channels);
857	of_property_read_u32((&op->dev)->of_node,
858			"dma-requests", &d->dma_requests);
859	ret = of_property_read_u32((&op->dev)->of_node,
860			"dma-channel-mask", &d->dma_channel_mask);
861	if (ret) {
862		dev_warn(&op->dev,
863			 "dma-channel-mask doesn't exist, considering all as available.\n");
864		d->dma_channel_mask = (u32)~0UL;
865	}
866
867	if (!(soc_data->flags & K3_FLAG_NOCLK)) {
868		d->clk = devm_clk_get(&op->dev, NULL);
869		if (IS_ERR(d->clk)) {
870			dev_err(&op->dev, "no dma clk\n");
871			return PTR_ERR(d->clk);
872		}
873	}
874
875	irq = platform_get_irq(op, 0);
876	ret = devm_request_irq(&op->dev, irq,
877			k3_dma_int_handler, 0, DRIVER_NAME, d);
878	if (ret)
879		return ret;
880
881	d->irq = irq;
882
883	/* A DMA memory pool for LLIs, align on 32-byte boundary */
884	d->pool = dmam_pool_create(DRIVER_NAME, &op->dev,
885					LLI_BLOCK_SIZE, 32, 0);
886	if (!d->pool)
887		return -ENOMEM;
888
889	/* init phy channel */
890	d->phy = devm_kcalloc(&op->dev,
891		d->dma_channels, sizeof(struct k3_dma_phy), GFP_KERNEL);
892	if (d->phy == NULL)
893		return -ENOMEM;
894
895	for (i = 0; i < d->dma_channels; i++) {
896		struct k3_dma_phy *p;
897
898		if (!(d->dma_channel_mask & BIT(i)))
899			continue;
900
901		p = &d->phy[i];
902		p->idx = i;
903		p->base = d->base + i * 0x40;
904	}
905
906	INIT_LIST_HEAD(&d->slave.channels);
907	dma_cap_set(DMA_SLAVE, d->slave.cap_mask);
908	dma_cap_set(DMA_MEMCPY, d->slave.cap_mask);
909	dma_cap_set(DMA_CYCLIC, d->slave.cap_mask);
910	d->slave.dev = &op->dev;
911	d->slave.device_free_chan_resources = k3_dma_free_chan_resources;
912	d->slave.device_tx_status = k3_dma_tx_status;
913	d->slave.device_prep_dma_memcpy = k3_dma_prep_memcpy;
914	d->slave.device_prep_slave_sg = k3_dma_prep_slave_sg;
915	d->slave.device_prep_dma_cyclic = k3_dma_prep_dma_cyclic;
916	d->slave.device_issue_pending = k3_dma_issue_pending;
917	d->slave.device_config = k3_dma_config;
918	d->slave.device_pause = k3_dma_transfer_pause;
919	d->slave.device_resume = k3_dma_transfer_resume;
920	d->slave.device_terminate_all = k3_dma_terminate_all;
921	d->slave.device_synchronize = k3_dma_synchronize;
922	d->slave.copy_align = DMAENGINE_ALIGN_8_BYTES;
923
924	/* init virtual channel */
925	d->chans = devm_kcalloc(&op->dev,
926		d->dma_requests, sizeof(struct k3_dma_chan), GFP_KERNEL);
927	if (d->chans == NULL)
928		return -ENOMEM;
929
930	for (i = 0; i < d->dma_requests; i++) {
931		struct k3_dma_chan *c = &d->chans[i];
932
933		c->status = DMA_IN_PROGRESS;
934		INIT_LIST_HEAD(&c->node);
935		c->vc.desc_free = k3_dma_free_desc;
936		vchan_init(&c->vc, &d->slave);
937	}
938
939	/* Enable clock before accessing registers */
940	ret = clk_prepare_enable(d->clk);
941	if (ret < 0) {
942		dev_err(&op->dev, "clk_prepare_enable failed: %d\n", ret);
943		return ret;
944	}
945
946	k3_dma_enable_dma(d, true);
947
948	ret = dma_async_device_register(&d->slave);
949	if (ret)
950		goto dma_async_register_fail;
951
952	ret = of_dma_controller_register((&op->dev)->of_node,
953					k3_of_dma_simple_xlate, d);
954	if (ret)
955		goto of_dma_register_fail;
956
957	spin_lock_init(&d->lock);
958	INIT_LIST_HEAD(&d->chan_pending);
959	tasklet_setup(&d->task, k3_dma_tasklet);
960	platform_set_drvdata(op, d);
961	dev_info(&op->dev, "initialized\n");
962
963	return 0;
964
965of_dma_register_fail:
966	dma_async_device_unregister(&d->slave);
967dma_async_register_fail:
968	clk_disable_unprepare(d->clk);
969	return ret;
970}
971
972static void k3_dma_remove(struct platform_device *op)
973{
974	struct k3_dma_chan *c, *cn;
975	struct k3_dma_dev *d = platform_get_drvdata(op);
976
977	dma_async_device_unregister(&d->slave);
978	of_dma_controller_free((&op->dev)->of_node);
979
980	devm_free_irq(&op->dev, d->irq, d);
981
982	list_for_each_entry_safe(c, cn, &d->slave.channels, vc.chan.device_node) {
983		list_del(&c->vc.chan.device_node);
984		tasklet_kill(&c->vc.task);
985	}
986	tasklet_kill(&d->task);
987	clk_disable_unprepare(d->clk);
988}
989
990#ifdef CONFIG_PM_SLEEP
991static int k3_dma_suspend_dev(struct device *dev)
992{
993	struct k3_dma_dev *d = dev_get_drvdata(dev);
994	u32 stat = 0;
995
996	stat = k3_dma_get_chan_stat(d);
997	if (stat) {
998		dev_warn(d->slave.dev,
999			"chan %d is running fail to suspend\n", stat);
1000		return -1;
1001	}
1002	k3_dma_enable_dma(d, false);
1003	clk_disable_unprepare(d->clk);
1004	return 0;
1005}
1006
1007static int k3_dma_resume_dev(struct device *dev)
1008{
1009	struct k3_dma_dev *d = dev_get_drvdata(dev);
1010	int ret = 0;
1011
1012	ret = clk_prepare_enable(d->clk);
1013	if (ret < 0) {
1014		dev_err(d->slave.dev, "clk_prepare_enable failed: %d\n", ret);
1015		return ret;
1016	}
1017	k3_dma_enable_dma(d, true);
1018	return 0;
1019}
1020#endif
1021
1022static SIMPLE_DEV_PM_OPS(k3_dma_pmops, k3_dma_suspend_dev, k3_dma_resume_dev);
1023
1024static struct platform_driver k3_pdma_driver = {
1025	.driver		= {
1026		.name	= DRIVER_NAME,
1027		.pm	= &k3_dma_pmops,
1028		.of_match_table = k3_pdma_dt_ids,
1029	},
1030	.probe		= k3_dma_probe,
1031	.remove_new	= k3_dma_remove,
1032};
1033
1034module_platform_driver(k3_pdma_driver);
1035
1036MODULE_DESCRIPTION("HiSilicon k3 DMA Driver");
1037MODULE_ALIAS("platform:k3dma");
1038MODULE_LICENSE("GPL v2");
1039