xref: /openbmc/linux/drivers/gpu/host1x/cdma.c (revision c24973ed)
19952f691SThomas Gleixner // SPDX-License-Identifier: GPL-2.0-only
26579324aSTerje Bergstrom /*
36579324aSTerje Bergstrom  * Tegra host1x Command DMA
46579324aSTerje Bergstrom  *
56579324aSTerje Bergstrom  * Copyright (c) 2010-2013, NVIDIA Corporation.
66579324aSTerje Bergstrom  */
76579324aSTerje Bergstrom 
86579324aSTerje Bergstrom 
96579324aSTerje Bergstrom #include <asm/cacheflush.h>
106579324aSTerje Bergstrom #include <linux/device.h>
116579324aSTerje Bergstrom #include <linux/dma-mapping.h>
1235d747a8SThierry Reding #include <linux/host1x.h>
136579324aSTerje Bergstrom #include <linux/interrupt.h>
146579324aSTerje Bergstrom #include <linux/kernel.h>
156579324aSTerje Bergstrom #include <linux/kfifo.h>
166579324aSTerje Bergstrom #include <linux/slab.h>
176579324aSTerje Bergstrom #include <trace/events/host1x.h>
186579324aSTerje Bergstrom 
196579324aSTerje Bergstrom #include "cdma.h"
206579324aSTerje Bergstrom #include "channel.h"
216579324aSTerje Bergstrom #include "dev.h"
226579324aSTerje Bergstrom #include "debug.h"
236579324aSTerje Bergstrom #include "job.h"
246579324aSTerje Bergstrom 
256579324aSTerje Bergstrom /*
266579324aSTerje Bergstrom  * push_buffer
276579324aSTerje Bergstrom  *
286579324aSTerje Bergstrom  * The push buffer is a circular array of words to be fetched by command DMA.
296579324aSTerje Bergstrom  * Note that it works slightly differently to the sync queue; fence == pos
306579324aSTerje Bergstrom  * means that the push buffer is full, not empty.
316579324aSTerje Bergstrom  */
326579324aSTerje Bergstrom 
/*
 * Typically the commands written into the push buffer are a pair of words. We
 * use slots to represent each of these pairs and to simplify things. Note the
 * strange number of slots allocated here. 512 slots would fit exactly within a
 * single memory page. However, we also need one additional word at the end of
 * the push buffer for the RESTART opcode that will instruct the CDMA to jump
 * back to the beginning of the push buffer. With 512 slots, this would mean
 * that we'd use 2 memory pages and waste 4092 bytes of the second page that
 * would never be used. Using 511 slots instead leaves room for the RESTART
 * word without spilling into a second page.
 */
43e1f338c0SThierry Reding #define HOST1X_PUSHBUFFER_SLOTS	511
446579324aSTerje Bergstrom 
456579324aSTerje Bergstrom /*
466579324aSTerje Bergstrom  * Clean up push buffer resources
476579324aSTerje Bergstrom  */
host1x_pushbuffer_destroy(struct push_buffer * pb)486579324aSTerje Bergstrom static void host1x_pushbuffer_destroy(struct push_buffer *pb)
496579324aSTerje Bergstrom {
506579324aSTerje Bergstrom 	struct host1x_cdma *cdma = pb_to_cdma(pb);
516579324aSTerje Bergstrom 	struct host1x *host1x = cdma_to_host1x(cdma);
526579324aSTerje Bergstrom 
532f8a6da8SEmil Goode 	if (!pb->mapped)
54404bfb78SMikko Perttunen 		return;
55404bfb78SMikko Perttunen 
56404bfb78SMikko Perttunen 	if (host1x->domain) {
57404bfb78SMikko Perttunen 		iommu_unmap(host1x->domain, pb->dma, pb->alloc_size);
58404bfb78SMikko Perttunen 		free_iova(&host1x->iova, iova_pfn(&host1x->iova, pb->dma));
59404bfb78SMikko Perttunen 	}
60404bfb78SMikko Perttunen 
61404bfb78SMikko Perttunen 	dma_free_wc(host1x->dev, pb->alloc_size, pb->mapped, pb->phys);
626579324aSTerje Bergstrom 
636579324aSTerje Bergstrom 	pb->mapped = NULL;
646579324aSTerje Bergstrom 	pb->phys = 0;
656579324aSTerje Bergstrom }
666579324aSTerje Bergstrom 
676579324aSTerje Bergstrom /*
686579324aSTerje Bergstrom  * Init push buffer resources
696579324aSTerje Bergstrom  */
host1x_pushbuffer_init(struct push_buffer * pb)706579324aSTerje Bergstrom static int host1x_pushbuffer_init(struct push_buffer *pb)
716579324aSTerje Bergstrom {
726579324aSTerje Bergstrom 	struct host1x_cdma *cdma = pb_to_cdma(pb);
736579324aSTerje Bergstrom 	struct host1x *host1x = cdma_to_host1x(cdma);
74404bfb78SMikko Perttunen 	struct iova *alloc;
75404bfb78SMikko Perttunen 	u32 size;
76404bfb78SMikko Perttunen 	int err;
776579324aSTerje Bergstrom 
786579324aSTerje Bergstrom 	pb->mapped = NULL;
796579324aSTerje Bergstrom 	pb->phys = 0;
80404bfb78SMikko Perttunen 	pb->size = HOST1X_PUSHBUFFER_SLOTS * 8;
81404bfb78SMikko Perttunen 
82404bfb78SMikko Perttunen 	size = pb->size + 4;
836579324aSTerje Bergstrom 
846579324aSTerje Bergstrom 	/* initialize buffer pointers */
85404bfb78SMikko Perttunen 	pb->fence = pb->size - 8;
866579324aSTerje Bergstrom 	pb->pos = 0;
876579324aSTerje Bergstrom 
88404bfb78SMikko Perttunen 	if (host1x->domain) {
89404bfb78SMikko Perttunen 		unsigned long shift;
90404bfb78SMikko Perttunen 
91404bfb78SMikko Perttunen 		size = iova_align(&host1x->iova, size);
92404bfb78SMikko Perttunen 
93404bfb78SMikko Perttunen 		pb->mapped = dma_alloc_wc(host1x->dev, size, &pb->phys,
94f6e45661SLuis R. Rodriguez 					  GFP_KERNEL);
956579324aSTerje Bergstrom 		if (!pb->mapped)
96404bfb78SMikko Perttunen 			return -ENOMEM;
97404bfb78SMikko Perttunen 
98404bfb78SMikko Perttunen 		shift = iova_shift(&host1x->iova);
99404bfb78SMikko Perttunen 		alloc = alloc_iova(&host1x->iova, size >> shift,
100404bfb78SMikko Perttunen 				   host1x->iova_end >> shift, true);
101404bfb78SMikko Perttunen 		if (!alloc) {
102404bfb78SMikko Perttunen 			err = -ENOMEM;
103404bfb78SMikko Perttunen 			goto iommu_free_mem;
104404bfb78SMikko Perttunen 		}
105404bfb78SMikko Perttunen 
106404bfb78SMikko Perttunen 		pb->dma = iova_dma_addr(&host1x->iova, alloc);
107404bfb78SMikko Perttunen 		err = iommu_map(host1x->domain, pb->dma, pb->phys, size,
108404bfb78SMikko Perttunen 				IOMMU_READ, GFP_KERNEL);
109404bfb78SMikko Perttunen 		if (err)
110404bfb78SMikko Perttunen 			goto iommu_free_iova;
111404bfb78SMikko Perttunen 	} else {
112404bfb78SMikko Perttunen 		pb->mapped = dma_alloc_wc(host1x->dev, size, &pb->phys,
113404bfb78SMikko Perttunen 					  GFP_KERNEL);
114404bfb78SMikko Perttunen 		if (!pb->mapped)
115404bfb78SMikko Perttunen 			return -ENOMEM;
116404bfb78SMikko Perttunen 
117404bfb78SMikko Perttunen 		pb->dma = pb->phys;
118404bfb78SMikko Perttunen 	}
119404bfb78SMikko Perttunen 
120404bfb78SMikko Perttunen 	pb->alloc_size = size;
1216579324aSTerje Bergstrom 
1226579324aSTerje Bergstrom 	host1x_hw_pushbuffer_init(host1x, pb);
1236579324aSTerje Bergstrom 
1246579324aSTerje Bergstrom 	return 0;
1256579324aSTerje Bergstrom 
126404bfb78SMikko Perttunen iommu_free_iova:
127404bfb78SMikko Perttunen 	__free_iova(&host1x->iova, alloc);
128404bfb78SMikko Perttunen iommu_free_mem:
12927db6a00SDmitry Osipenko 	dma_free_wc(host1x->dev, size, pb->mapped, pb->phys);
130404bfb78SMikko Perttunen 
131404bfb78SMikko Perttunen 	return err;
1326579324aSTerje Bergstrom }
1336579324aSTerje Bergstrom 
1346579324aSTerje Bergstrom /*
1356579324aSTerje Bergstrom  * Push two words to the push buffer
1366579324aSTerje Bergstrom  * Caller must ensure push buffer is not full
1376579324aSTerje Bergstrom  */
host1x_pushbuffer_push(struct push_buffer * pb,u32 op1,u32 op2)1386579324aSTerje Bergstrom static void host1x_pushbuffer_push(struct push_buffer *pb, u32 op1, u32 op2)
1396579324aSTerje Bergstrom {
140ebb2475cSThierry Reding 	u32 *p = (u32 *)((void *)pb->mapped + pb->pos);
141ebb2475cSThierry Reding 
142ebb2475cSThierry Reding 	WARN_ON(pb->pos == pb->fence);
1436579324aSTerje Bergstrom 	*(p++) = op1;
1446579324aSTerje Bergstrom 	*(p++) = op2;
145e1f338c0SThierry Reding 	pb->pos += 8;
146e1f338c0SThierry Reding 
147e1f338c0SThierry Reding 	if (pb->pos >= pb->size)
148e1f338c0SThierry Reding 		pb->pos -= pb->size;
1496579324aSTerje Bergstrom }
1506579324aSTerje Bergstrom 
1516579324aSTerje Bergstrom /*
1526579324aSTerje Bergstrom  * Pop a number of two word slots from the push buffer
1536579324aSTerje Bergstrom  * Caller must ensure push buffer is not empty
1546579324aSTerje Bergstrom  */
host1x_pushbuffer_pop(struct push_buffer * pb,unsigned int slots)1556579324aSTerje Bergstrom static void host1x_pushbuffer_pop(struct push_buffer *pb, unsigned int slots)
1566579324aSTerje Bergstrom {
1576579324aSTerje Bergstrom 	/* Advance the next write position */
158e1f338c0SThierry Reding 	pb->fence += slots * 8;
159e1f338c0SThierry Reding 
160e1f338c0SThierry Reding 	if (pb->fence >= pb->size)
161e1f338c0SThierry Reding 		pb->fence -= pb->size;
1626579324aSTerje Bergstrom }
1636579324aSTerje Bergstrom 
1646579324aSTerje Bergstrom /*
1656579324aSTerje Bergstrom  * Return the number of two word slots free in the push buffer
1666579324aSTerje Bergstrom  */
host1x_pushbuffer_space(struct push_buffer * pb)1676579324aSTerje Bergstrom static u32 host1x_pushbuffer_space(struct push_buffer *pb)
1686579324aSTerje Bergstrom {
169e1f338c0SThierry Reding 	unsigned int fence = pb->fence;
170e1f338c0SThierry Reding 
171e1f338c0SThierry Reding 	if (pb->fence < pb->pos)
172e1f338c0SThierry Reding 		fence += pb->size;
173e1f338c0SThierry Reding 
174e1f338c0SThierry Reding 	return (fence - pb->pos) / 8;
1756579324aSTerje Bergstrom }
1766579324aSTerje Bergstrom 
1776579324aSTerje Bergstrom /*
1786579324aSTerje Bergstrom  * Sleep (if necessary) until the requested event happens
1796579324aSTerje Bergstrom  *   - CDMA_EVENT_SYNC_QUEUE_EMPTY : sync queue is completely empty.
1806579324aSTerje Bergstrom  *     - Returns 1
1816579324aSTerje Bergstrom  *   - CDMA_EVENT_PUSH_BUFFER_SPACE : there is space in the push buffer
1826579324aSTerje Bergstrom  *     - Return the amount of space (> 0)
1836579324aSTerje Bergstrom  * Must be called with the cdma lock held.
1846579324aSTerje Bergstrom  */
host1x_cdma_wait_locked(struct host1x_cdma * cdma,enum cdma_event event)1856579324aSTerje Bergstrom unsigned int host1x_cdma_wait_locked(struct host1x_cdma *cdma,
1866579324aSTerje Bergstrom 				     enum cdma_event event)
1876579324aSTerje Bergstrom {
1886579324aSTerje Bergstrom 	for (;;) {
1890b8070d1SThierry Reding 		struct push_buffer *pb = &cdma->push_buffer;
1906579324aSTerje Bergstrom 		unsigned int space;
1916579324aSTerje Bergstrom 
1920b8070d1SThierry Reding 		switch (event) {
1930b8070d1SThierry Reding 		case CDMA_EVENT_SYNC_QUEUE_EMPTY:
1946579324aSTerje Bergstrom 			space = list_empty(&cdma->sync_queue) ? 1 : 0;
1950b8070d1SThierry Reding 			break;
1960b8070d1SThierry Reding 
1970b8070d1SThierry Reding 		case CDMA_EVENT_PUSH_BUFFER_SPACE:
1986579324aSTerje Bergstrom 			space = host1x_pushbuffer_space(pb);
1990b8070d1SThierry Reding 			break;
2000b8070d1SThierry Reding 
2010b8070d1SThierry Reding 		default:
2026579324aSTerje Bergstrom 			WARN_ON(1);
2036579324aSTerje Bergstrom 			return -EINVAL;
2046579324aSTerje Bergstrom 		}
2056579324aSTerje Bergstrom 
2066579324aSTerje Bergstrom 		if (space)
2076579324aSTerje Bergstrom 			return space;
2086579324aSTerje Bergstrom 
2096579324aSTerje Bergstrom 		trace_host1x_wait_cdma(dev_name(cdma_to_channel(cdma)->dev),
2106579324aSTerje Bergstrom 				       event);
2116579324aSTerje Bergstrom 
2126579324aSTerje Bergstrom 		/* If somebody has managed to already start waiting, yield */
2136579324aSTerje Bergstrom 		if (cdma->event != CDMA_EVENT_NONE) {
2146579324aSTerje Bergstrom 			mutex_unlock(&cdma->lock);
2156579324aSTerje Bergstrom 			schedule();
2166579324aSTerje Bergstrom 			mutex_lock(&cdma->lock);
2176579324aSTerje Bergstrom 			continue;
2186579324aSTerje Bergstrom 		}
2190b8070d1SThierry Reding 
2206579324aSTerje Bergstrom 		cdma->event = event;
2216579324aSTerje Bergstrom 
2226579324aSTerje Bergstrom 		mutex_unlock(&cdma->lock);
2230747a672SArnd Bergmann 		wait_for_completion(&cdma->complete);
2246579324aSTerje Bergstrom 		mutex_lock(&cdma->lock);
2256579324aSTerje Bergstrom 	}
2260b8070d1SThierry Reding 
2276579324aSTerje Bergstrom 	return 0;
2286579324aSTerje Bergstrom }
2296579324aSTerje Bergstrom 
2306579324aSTerje Bergstrom /*
2315a5fccbdSThierry Reding  * Sleep (if necessary) until the push buffer has enough free space.
2325a5fccbdSThierry Reding  *
2335a5fccbdSThierry Reding  * Must be called with the cdma lock held.
2345a5fccbdSThierry Reding  */
host1x_cdma_wait_pushbuffer_space(struct host1x * host1x,struct host1x_cdma * cdma,unsigned int needed)23533904487SBen Dooks (Codethink) static int host1x_cdma_wait_pushbuffer_space(struct host1x *host1x,
2365a5fccbdSThierry Reding 					     struct host1x_cdma *cdma,
2375a5fccbdSThierry Reding 					     unsigned int needed)
2385a5fccbdSThierry Reding {
2395a5fccbdSThierry Reding 	while (true) {
2405a5fccbdSThierry Reding 		struct push_buffer *pb = &cdma->push_buffer;
2415a5fccbdSThierry Reding 		unsigned int space;
2425a5fccbdSThierry Reding 
2435a5fccbdSThierry Reding 		space = host1x_pushbuffer_space(pb);
2445a5fccbdSThierry Reding 		if (space >= needed)
2455a5fccbdSThierry Reding 			break;
2465a5fccbdSThierry Reding 
2475a5fccbdSThierry Reding 		trace_host1x_wait_cdma(dev_name(cdma_to_channel(cdma)->dev),
2485a5fccbdSThierry Reding 				       CDMA_EVENT_PUSH_BUFFER_SPACE);
2495a5fccbdSThierry Reding 
2505a5fccbdSThierry Reding 		host1x_hw_cdma_flush(host1x, cdma);
2515a5fccbdSThierry Reding 
2525a5fccbdSThierry Reding 		/* If somebody has managed to already start waiting, yield */
2535a5fccbdSThierry Reding 		if (cdma->event != CDMA_EVENT_NONE) {
2545a5fccbdSThierry Reding 			mutex_unlock(&cdma->lock);
2555a5fccbdSThierry Reding 			schedule();
2565a5fccbdSThierry Reding 			mutex_lock(&cdma->lock);
2575a5fccbdSThierry Reding 			continue;
2585a5fccbdSThierry Reding 		}
2595a5fccbdSThierry Reding 
2605a5fccbdSThierry Reding 		cdma->event = CDMA_EVENT_PUSH_BUFFER_SPACE;
2615a5fccbdSThierry Reding 
2625a5fccbdSThierry Reding 		mutex_unlock(&cdma->lock);
2635a5fccbdSThierry Reding 		wait_for_completion(&cdma->complete);
2645a5fccbdSThierry Reding 		mutex_lock(&cdma->lock);
2655a5fccbdSThierry Reding 	}
2665a5fccbdSThierry Reding 
2675a5fccbdSThierry Reding 	return 0;
2685a5fccbdSThierry Reding }
2695a5fccbdSThierry Reding /*
2706579324aSTerje Bergstrom  * Start timer that tracks the time spent by the job.
2716579324aSTerje Bergstrom  * Must be called with the cdma lock held.
2726579324aSTerje Bergstrom  */
cdma_start_timer_locked(struct host1x_cdma * cdma,struct host1x_job * job)2736579324aSTerje Bergstrom static void cdma_start_timer_locked(struct host1x_cdma *cdma,
2746579324aSTerje Bergstrom 				    struct host1x_job *job)
2756579324aSTerje Bergstrom {
2766579324aSTerje Bergstrom 	if (cdma->timeout.client) {
2776579324aSTerje Bergstrom 		/* timer already started */
2786579324aSTerje Bergstrom 		return;
2796579324aSTerje Bergstrom 	}
2806579324aSTerje Bergstrom 
2816579324aSTerje Bergstrom 	cdma->timeout.client = job->client;
2822aed4f5aSMikko Perttunen 	cdma->timeout.syncpt = job->syncpt;
2836579324aSTerje Bergstrom 	cdma->timeout.syncpt_val = job->syncpt_end;
2846579324aSTerje Bergstrom 	cdma->timeout.start_ktime = ktime_get();
2856579324aSTerje Bergstrom 
2866579324aSTerje Bergstrom 	schedule_delayed_work(&cdma->timeout.wq,
2876579324aSTerje Bergstrom 			      msecs_to_jiffies(job->timeout));
2886579324aSTerje Bergstrom }
2896579324aSTerje Bergstrom 
2906579324aSTerje Bergstrom /*
2916579324aSTerje Bergstrom  * Stop timer when a buffer submission completes.
2926579324aSTerje Bergstrom  * Must be called with the cdma lock held.
2936579324aSTerje Bergstrom  */
stop_cdma_timer_locked(struct host1x_cdma * cdma)2946579324aSTerje Bergstrom static void stop_cdma_timer_locked(struct host1x_cdma *cdma)
2956579324aSTerje Bergstrom {
2966579324aSTerje Bergstrom 	cancel_delayed_work(&cdma->timeout.wq);
297bf3d41ccSThierry Reding 	cdma->timeout.client = NULL;
2986579324aSTerje Bergstrom }
2996579324aSTerje Bergstrom 
3006579324aSTerje Bergstrom /*
3016579324aSTerje Bergstrom  * For all sync queue entries that have already finished according to the
3026579324aSTerje Bergstrom  * current sync point registers:
3036579324aSTerje Bergstrom  *  - unpin & unref their mems
3046579324aSTerje Bergstrom  *  - pop their push buffer slots
3056579324aSTerje Bergstrom  *  - remove them from the sync queue
3066579324aSTerje Bergstrom  * This is normally called from the host code's worker thread, but can be
3076579324aSTerje Bergstrom  * called manually if necessary.
3086579324aSTerje Bergstrom  * Must be called with the cdma lock held.
3096579324aSTerje Bergstrom  */
update_cdma_locked(struct host1x_cdma * cdma)3106579324aSTerje Bergstrom static void update_cdma_locked(struct host1x_cdma *cdma)
3116579324aSTerje Bergstrom {
3126579324aSTerje Bergstrom 	bool signal = false;
3136579324aSTerje Bergstrom 	struct host1x_job *job, *n;
3146579324aSTerje Bergstrom 
3156579324aSTerje Bergstrom 	/*
3166579324aSTerje Bergstrom 	 * Walk the sync queue, reading the sync point registers as necessary,
3176579324aSTerje Bergstrom 	 * to consume as many sync queue entries as possible without blocking
3186579324aSTerje Bergstrom 	 */
3196579324aSTerje Bergstrom 	list_for_each_entry_safe(job, n, &cdma->sync_queue, list) {
3202aed4f5aSMikko Perttunen 		struct host1x_syncpt *sp = job->syncpt;
3216579324aSTerje Bergstrom 
3226579324aSTerje Bergstrom 		/* Check whether this syncpt has completed, and bail if not */
323c78f837aSMikko Perttunen 		if (!host1x_syncpt_is_expired(sp, job->syncpt_end) &&
324c78f837aSMikko Perttunen 		    !job->cancelled) {
3256579324aSTerje Bergstrom 			/* Start timer on next pending syncpt */
3266579324aSTerje Bergstrom 			if (job->timeout)
3276579324aSTerje Bergstrom 				cdma_start_timer_locked(cdma, job);
3280b8070d1SThierry Reding 
3296579324aSTerje Bergstrom 			break;
3306579324aSTerje Bergstrom 		}
3316579324aSTerje Bergstrom 
3326579324aSTerje Bergstrom 		/* Cancel timeout, when a buffer completes */
3336579324aSTerje Bergstrom 		if (cdma->timeout.client)
3346579324aSTerje Bergstrom 			stop_cdma_timer_locked(cdma);
3356579324aSTerje Bergstrom 
3366579324aSTerje Bergstrom 		/* Unpin the memory */
3376579324aSTerje Bergstrom 		host1x_job_unpin(job);
3386579324aSTerje Bergstrom 
3396579324aSTerje Bergstrom 		/* Pop push buffer slots */
3406579324aSTerje Bergstrom 		if (job->num_slots) {
3416579324aSTerje Bergstrom 			struct push_buffer *pb = &cdma->push_buffer;
3426df633d0SThierry Reding 
3436579324aSTerje Bergstrom 			host1x_pushbuffer_pop(pb, job->num_slots);
3440b8070d1SThierry Reding 
3456579324aSTerje Bergstrom 			if (cdma->event == CDMA_EVENT_PUSH_BUFFER_SPACE)
3466579324aSTerje Bergstrom 				signal = true;
3476579324aSTerje Bergstrom 		}
3486579324aSTerje Bergstrom 
3496579324aSTerje Bergstrom 		list_del(&job->list);
3506579324aSTerje Bergstrom 		host1x_job_put(job);
3516579324aSTerje Bergstrom 	}
3526579324aSTerje Bergstrom 
3536579324aSTerje Bergstrom 	if (cdma->event == CDMA_EVENT_SYNC_QUEUE_EMPTY &&
3546579324aSTerje Bergstrom 	    list_empty(&cdma->sync_queue))
3556579324aSTerje Bergstrom 		signal = true;
3566579324aSTerje Bergstrom 
3576579324aSTerje Bergstrom 	if (signal) {
3586579324aSTerje Bergstrom 		cdma->event = CDMA_EVENT_NONE;
3590747a672SArnd Bergmann 		complete(&cdma->complete);
3606579324aSTerje Bergstrom 	}
3616579324aSTerje Bergstrom }
3626579324aSTerje Bergstrom 
host1x_cdma_update_sync_queue(struct host1x_cdma * cdma,struct device * dev)3636579324aSTerje Bergstrom void host1x_cdma_update_sync_queue(struct host1x_cdma *cdma,
3646579324aSTerje Bergstrom 				   struct device *dev)
3656579324aSTerje Bergstrom {
3666579324aSTerje Bergstrom 	struct host1x *host1x = cdma_to_host1x(cdma);
3670b8070d1SThierry Reding 	u32 restart_addr, syncpt_incrs, syncpt_val;
36879930bafSDmitry Osipenko 	struct host1x_job *job, *next_job = NULL;
3696579324aSTerje Bergstrom 
3706579324aSTerje Bergstrom 	syncpt_val = host1x_syncpt_load(cdma->timeout.syncpt);
3716579324aSTerje Bergstrom 
3726579324aSTerje Bergstrom 	dev_dbg(dev, "%s: starting cleanup (thresh %d)\n",
3736579324aSTerje Bergstrom 		__func__, syncpt_val);
3746579324aSTerje Bergstrom 
3756579324aSTerje Bergstrom 	/*
3766579324aSTerje Bergstrom 	 * Move the sync_queue read pointer to the first entry that hasn't
3776579324aSTerje Bergstrom 	 * completed based on the current HW syncpt value. It's likely there
3786579324aSTerje Bergstrom 	 * won't be any (i.e. we're still at the head), but covers the case
3796579324aSTerje Bergstrom 	 * where a syncpt incr happens just prior/during the teardown.
3806579324aSTerje Bergstrom 	 */
3816579324aSTerje Bergstrom 
3826579324aSTerje Bergstrom 	dev_dbg(dev, "%s: skip completed buffers still in sync_queue\n",
3836579324aSTerje Bergstrom 		__func__);
3846579324aSTerje Bergstrom 
3856579324aSTerje Bergstrom 	list_for_each_entry(job, &cdma->sync_queue, list) {
38679930bafSDmitry Osipenko 		if (syncpt_val < job->syncpt_end) {
38779930bafSDmitry Osipenko 
38879930bafSDmitry Osipenko 			if (!list_is_last(&job->list, &cdma->sync_queue))
38979930bafSDmitry Osipenko 				next_job = list_next_entry(job, list);
39079930bafSDmitry Osipenko 
3915d6f0436SDmitry Osipenko 			goto syncpt_incr;
39279930bafSDmitry Osipenko 		}
3936579324aSTerje Bergstrom 
3946579324aSTerje Bergstrom 		host1x_job_dump(dev, job);
3956579324aSTerje Bergstrom 	}
3966579324aSTerje Bergstrom 
3975d6f0436SDmitry Osipenko 	/* all jobs have been completed */
3985d6f0436SDmitry Osipenko 	job = NULL;
3995d6f0436SDmitry Osipenko 
4005d6f0436SDmitry Osipenko syncpt_incr:
4015d6f0436SDmitry Osipenko 
4026579324aSTerje Bergstrom 	/*
403e8bad659SDmitry Osipenko 	 * Increment with CPU the remaining syncpts of a partially executed job.
4046579324aSTerje Bergstrom 	 *
40579930bafSDmitry Osipenko 	 * CDMA will continue execution starting with the next job or will get
40679930bafSDmitry Osipenko 	 * into idle state.
4076579324aSTerje Bergstrom 	 */
40879930bafSDmitry Osipenko 	if (next_job)
40979930bafSDmitry Osipenko 		restart_addr = next_job->first_get;
4106579324aSTerje Bergstrom 	else
4116579324aSTerje Bergstrom 		restart_addr = cdma->last_pos;
4126579324aSTerje Bergstrom 
413c78f837aSMikko Perttunen 	if (!job)
414c78f837aSMikko Perttunen 		goto resume;
415c78f837aSMikko Perttunen 
416e8bad659SDmitry Osipenko 	/* do CPU increments for the remaining syncpts */
417c78f837aSMikko Perttunen 	if (job->syncpt_recovery) {
4185d6f0436SDmitry Osipenko 		dev_dbg(dev, "%s: perform CPU incr on pending buffers\n",
4195d6f0436SDmitry Osipenko 			__func__);
4205d6f0436SDmitry Osipenko 
4216579324aSTerje Bergstrom 		/* won't need a timeout when replayed */
4226579324aSTerje Bergstrom 		job->timeout = 0;
4236579324aSTerje Bergstrom 
4246579324aSTerje Bergstrom 		syncpt_incrs = job->syncpt_end - syncpt_val;
4256579324aSTerje Bergstrom 		dev_dbg(dev, "%s: CPU incr (%d)\n", __func__, syncpt_incrs);
4266579324aSTerje Bergstrom 
4276579324aSTerje Bergstrom 		host1x_job_dump(dev, job);
4286579324aSTerje Bergstrom 
4296579324aSTerje Bergstrom 		/* safe to use CPU to incr syncpts */
4306579324aSTerje Bergstrom 		host1x_hw_cdma_timeout_cpu_incr(host1x, cdma, job->first_get,
4316579324aSTerje Bergstrom 						syncpt_incrs, job->syncpt_end,
4326579324aSTerje Bergstrom 						job->num_slots);
4336579324aSTerje Bergstrom 
4345d6f0436SDmitry Osipenko 		dev_dbg(dev, "%s: finished sync_queue modification\n",
4355d6f0436SDmitry Osipenko 			__func__);
436c78f837aSMikko Perttunen 	} else {
437c78f837aSMikko Perttunen 		struct host1x_job *failed_job = job;
438c78f837aSMikko Perttunen 
439c78f837aSMikko Perttunen 		host1x_job_dump(dev, job);
440c78f837aSMikko Perttunen 
441c78f837aSMikko Perttunen 		host1x_syncpt_set_locked(job->syncpt);
442c78f837aSMikko Perttunen 		failed_job->cancelled = true;
443c78f837aSMikko Perttunen 
444c78f837aSMikko Perttunen 		list_for_each_entry_continue(job, &cdma->sync_queue, list) {
445c78f837aSMikko Perttunen 			unsigned int i;
446c78f837aSMikko Perttunen 
447c78f837aSMikko Perttunen 			if (job->syncpt != failed_job->syncpt)
448c78f837aSMikko Perttunen 				continue;
449c78f837aSMikko Perttunen 
450c78f837aSMikko Perttunen 			for (i = 0; i < job->num_slots; i++) {
451c78f837aSMikko Perttunen 				unsigned int slot = (job->first_get/8 + i) %
452c78f837aSMikko Perttunen 						    HOST1X_PUSHBUFFER_SLOTS;
453c78f837aSMikko Perttunen 				u32 *mapped = cdma->push_buffer.mapped;
454c78f837aSMikko Perttunen 
455c78f837aSMikko Perttunen 				/*
456c78f837aSMikko Perttunen 				 * Overwrite opcodes with 0 word writes
457c78f837aSMikko Perttunen 				 * to offset 0xbad. This does nothing but
458c78f837aSMikko Perttunen 				 * has a easily detected signature in debug
459c78f837aSMikko Perttunen 				 * traces.
4600ae4ae91SMikko Perttunen 				 *
4610ae4ae91SMikko Perttunen 				 * On systems with MLOCK enforcement enabled,
4620ae4ae91SMikko Perttunen 				 * the above 0 word writes would fall foul of
4630ae4ae91SMikko Perttunen 				 * the enforcement. As such, in the first slot
4640ae4ae91SMikko Perttunen 				 * put a RESTART_W opcode to the beginning
4650ae4ae91SMikko Perttunen 				 * of the next job. We don't use this for older
4660ae4ae91SMikko Perttunen 				 * chips since those only support the RESTART
4670ae4ae91SMikko Perttunen 				 * opcode with inconvenient alignment requirements.
468c78f837aSMikko Perttunen 				 */
4690ae4ae91SMikko Perttunen 				if (i == 0 && host1x->info->has_wide_gather) {
4700ae4ae91SMikko Perttunen 					unsigned int next_job = (job->first_get/8 + job->num_slots)
4710ae4ae91SMikko Perttunen 						% HOST1X_PUSHBUFFER_SLOTS;
4720ae4ae91SMikko Perttunen 					mapped[2*slot+0] = (0xd << 28) | (next_job * 2);
4730ae4ae91SMikko Perttunen 					mapped[2*slot+1] = 0x0;
4740ae4ae91SMikko Perttunen 				} else {
475c78f837aSMikko Perttunen 					mapped[2*slot+0] = 0x1bad0000;
476c78f837aSMikko Perttunen 					mapped[2*slot+1] = 0x1bad0000;
4775d6f0436SDmitry Osipenko 				}
4780ae4ae91SMikko Perttunen 			}
4796579324aSTerje Bergstrom 
480c78f837aSMikko Perttunen 			job->cancelled = true;
481c78f837aSMikko Perttunen 		}
482c78f837aSMikko Perttunen 
483c78f837aSMikko Perttunen 		wmb();
484c78f837aSMikko Perttunen 
485c78f837aSMikko Perttunen 		update_cdma_locked(cdma);
486c78f837aSMikko Perttunen 	}
487c78f837aSMikko Perttunen 
488c78f837aSMikko Perttunen resume:
4896579324aSTerje Bergstrom 	/* roll back DMAGET and start up channel again */
4906579324aSTerje Bergstrom 	host1x_hw_cdma_resume(host1x, cdma, restart_addr);
4916579324aSTerje Bergstrom }
4926579324aSTerje Bergstrom 
cdma_update_work(struct work_struct * work)493*c24973edSMikko Perttunen static void cdma_update_work(struct work_struct *work)
494*c24973edSMikko Perttunen {
495*c24973edSMikko Perttunen 	struct host1x_cdma *cdma = container_of(work, struct host1x_cdma, update_work);
496*c24973edSMikko Perttunen 
497*c24973edSMikko Perttunen 	mutex_lock(&cdma->lock);
498*c24973edSMikko Perttunen 	update_cdma_locked(cdma);
499*c24973edSMikko Perttunen 	mutex_unlock(&cdma->lock);
500*c24973edSMikko Perttunen }
501*c24973edSMikko Perttunen 
5026579324aSTerje Bergstrom /*
5036579324aSTerje Bergstrom  * Create a cdma
5046579324aSTerje Bergstrom  */
host1x_cdma_init(struct host1x_cdma * cdma)5056579324aSTerje Bergstrom int host1x_cdma_init(struct host1x_cdma *cdma)
5066579324aSTerje Bergstrom {
5076579324aSTerje Bergstrom 	int err;
5086579324aSTerje Bergstrom 
5096579324aSTerje Bergstrom 	mutex_init(&cdma->lock);
5100747a672SArnd Bergmann 	init_completion(&cdma->complete);
511*c24973edSMikko Perttunen 	INIT_WORK(&cdma->update_work, cdma_update_work);
5126579324aSTerje Bergstrom 
5136579324aSTerje Bergstrom 	INIT_LIST_HEAD(&cdma->sync_queue);
5146579324aSTerje Bergstrom 
5156579324aSTerje Bergstrom 	cdma->event = CDMA_EVENT_NONE;
5166579324aSTerje Bergstrom 	cdma->running = false;
5176579324aSTerje Bergstrom 	cdma->torndown = false;
5186579324aSTerje Bergstrom 
5196579324aSTerje Bergstrom 	err = host1x_pushbuffer_init(&cdma->push_buffer);
5206579324aSTerje Bergstrom 	if (err)
5216579324aSTerje Bergstrom 		return err;
5220b8070d1SThierry Reding 
5236579324aSTerje Bergstrom 	return 0;
5246579324aSTerje Bergstrom }
5256579324aSTerje Bergstrom 
5266579324aSTerje Bergstrom /*
5276579324aSTerje Bergstrom  * Destroy a cdma
5286579324aSTerje Bergstrom  */
host1x_cdma_deinit(struct host1x_cdma * cdma)5296579324aSTerje Bergstrom int host1x_cdma_deinit(struct host1x_cdma *cdma)
5306579324aSTerje Bergstrom {
5316579324aSTerje Bergstrom 	struct push_buffer *pb = &cdma->push_buffer;
5326579324aSTerje Bergstrom 	struct host1x *host1x = cdma_to_host1x(cdma);
5336579324aSTerje Bergstrom 
5346579324aSTerje Bergstrom 	if (cdma->running) {
5356579324aSTerje Bergstrom 		pr_warn("%s: CDMA still running\n", __func__);
5366579324aSTerje Bergstrom 		return -EBUSY;
5376579324aSTerje Bergstrom 	}
5386579324aSTerje Bergstrom 
5396579324aSTerje Bergstrom 	host1x_pushbuffer_destroy(pb);
5406579324aSTerje Bergstrom 	host1x_hw_cdma_timeout_destroy(host1x, cdma);
5416579324aSTerje Bergstrom 
5426579324aSTerje Bergstrom 	return 0;
5436579324aSTerje Bergstrom }
5446579324aSTerje Bergstrom 
5456579324aSTerje Bergstrom /*
5466579324aSTerje Bergstrom  * Begin a cdma submit
5476579324aSTerje Bergstrom  */
host1x_cdma_begin(struct host1x_cdma * cdma,struct host1x_job * job)5486579324aSTerje Bergstrom int host1x_cdma_begin(struct host1x_cdma *cdma, struct host1x_job *job)
5496579324aSTerje Bergstrom {
5506579324aSTerje Bergstrom 	struct host1x *host1x = cdma_to_host1x(cdma);
5516579324aSTerje Bergstrom 
5526579324aSTerje Bergstrom 	mutex_lock(&cdma->lock);
5536579324aSTerje Bergstrom 
554c78f837aSMikko Perttunen 	/*
555c78f837aSMikko Perttunen 	 * Check if syncpoint was locked due to previous job timeout.
556c78f837aSMikko Perttunen 	 * This needs to be done within the cdma lock to avoid a race
557c78f837aSMikko Perttunen 	 * with the timeout handler.
558c78f837aSMikko Perttunen 	 */
559c78f837aSMikko Perttunen 	if (job->syncpt->locked) {
560c78f837aSMikko Perttunen 		mutex_unlock(&cdma->lock);
561c78f837aSMikko Perttunen 		return -EPERM;
562c78f837aSMikko Perttunen 	}
563c78f837aSMikko Perttunen 
5646579324aSTerje Bergstrom 	if (job->timeout) {
5656579324aSTerje Bergstrom 		/* init state on first submit with timeout value */
5666579324aSTerje Bergstrom 		if (!cdma->timeout.initialized) {
5676579324aSTerje Bergstrom 			int err;
5686df633d0SThierry Reding 
5692aed4f5aSMikko Perttunen 			err = host1x_hw_cdma_timeout_init(host1x, cdma);
5706579324aSTerje Bergstrom 			if (err) {
5716579324aSTerje Bergstrom 				mutex_unlock(&cdma->lock);
5726579324aSTerje Bergstrom 				return err;
5736579324aSTerje Bergstrom 			}
5746579324aSTerje Bergstrom 		}
5756579324aSTerje Bergstrom 	}
5760b8070d1SThierry Reding 
5776579324aSTerje Bergstrom 	if (!cdma->running)
5786579324aSTerje Bergstrom 		host1x_hw_cdma_start(host1x, cdma);
5796579324aSTerje Bergstrom 
5806579324aSTerje Bergstrom 	cdma->slots_free = 0;
5816579324aSTerje Bergstrom 	cdma->slots_used = 0;
5826579324aSTerje Bergstrom 	cdma->first_get = cdma->push_buffer.pos;
5836579324aSTerje Bergstrom 
5846579324aSTerje Bergstrom 	trace_host1x_cdma_begin(dev_name(job->channel->dev));
5856579324aSTerje Bergstrom 	return 0;
5866579324aSTerje Bergstrom }
5876579324aSTerje Bergstrom 
5886579324aSTerje Bergstrom /*
5896579324aSTerje Bergstrom  * Push two words into a push buffer slot
5906579324aSTerje Bergstrom  * Blocks as necessary if the push buffer is full.
5916579324aSTerje Bergstrom  */
host1x_cdma_push(struct host1x_cdma * cdma,u32 op1,u32 op2)5926579324aSTerje Bergstrom void host1x_cdma_push(struct host1x_cdma *cdma, u32 op1, u32 op2)
5936579324aSTerje Bergstrom {
5946579324aSTerje Bergstrom 	struct host1x *host1x = cdma_to_host1x(cdma);
5956579324aSTerje Bergstrom 	struct push_buffer *pb = &cdma->push_buffer;
5966579324aSTerje Bergstrom 	u32 slots_free = cdma->slots_free;
5976579324aSTerje Bergstrom 
5986236451dSTerje Bergstrom 	if (host1x_debug_trace_cmdbuf)
5996236451dSTerje Bergstrom 		trace_host1x_cdma_push(dev_name(cdma_to_channel(cdma)->dev),
6006236451dSTerje Bergstrom 				       op1, op2);
6016236451dSTerje Bergstrom 
6026579324aSTerje Bergstrom 	if (slots_free == 0) {
6036579324aSTerje Bergstrom 		host1x_hw_cdma_flush(host1x, cdma);
6046579324aSTerje Bergstrom 		slots_free = host1x_cdma_wait_locked(cdma,
6056579324aSTerje Bergstrom 						CDMA_EVENT_PUSH_BUFFER_SPACE);
6066579324aSTerje Bergstrom 	}
6070b8070d1SThierry Reding 
6086579324aSTerje Bergstrom 	cdma->slots_free = slots_free - 1;
6096579324aSTerje Bergstrom 	cdma->slots_used++;
6106579324aSTerje Bergstrom 	host1x_pushbuffer_push(pb, op1, op2);
6116579324aSTerje Bergstrom }
6126579324aSTerje Bergstrom 
6136579324aSTerje Bergstrom /*
6145a5fccbdSThierry Reding  * Push four words into two consecutive push buffer slots. Note that extra
6155a5fccbdSThierry Reding  * care needs to be taken not to split the two slots across the end of the
6165a5fccbdSThierry Reding  * push buffer. Otherwise the RESTART opcode at the end of the push buffer
6175a5fccbdSThierry Reding  * that ensures processing will restart at the beginning will break up the
6185a5fccbdSThierry Reding  * four words.
6195a5fccbdSThierry Reding  *
6205a5fccbdSThierry Reding  * Blocks as necessary if the push buffer is full.
6215a5fccbdSThierry Reding  */
host1x_cdma_push_wide(struct host1x_cdma * cdma,u32 op1,u32 op2,u32 op3,u32 op4)6225a5fccbdSThierry Reding void host1x_cdma_push_wide(struct host1x_cdma *cdma, u32 op1, u32 op2,
6235a5fccbdSThierry Reding 			   u32 op3, u32 op4)
6245a5fccbdSThierry Reding {
6255a5fccbdSThierry Reding 	struct host1x_channel *channel = cdma_to_channel(cdma);
6265a5fccbdSThierry Reding 	struct host1x *host1x = cdma_to_host1x(cdma);
6275a5fccbdSThierry Reding 	struct push_buffer *pb = &cdma->push_buffer;
6285a5fccbdSThierry Reding 	unsigned int space = cdma->slots_free;
6298c92243dSMikko Perttunen 	unsigned int needed = 2, extra = 0;
6305a5fccbdSThierry Reding 
6315a5fccbdSThierry Reding 	if (host1x_debug_trace_cmdbuf)
6325a5fccbdSThierry Reding 		trace_host1x_cdma_push_wide(dev_name(channel->dev), op1, op2,
6335a5fccbdSThierry Reding 					    op3, op4);
6345a5fccbdSThierry Reding 
6355a5fccbdSThierry Reding 	/* compute number of extra slots needed for padding */
6365a5fccbdSThierry Reding 	if (pb->pos + 16 > pb->size) {
6375a5fccbdSThierry Reding 		extra = (pb->size - pb->pos) / 8;
6385a5fccbdSThierry Reding 		needed += extra;
6395a5fccbdSThierry Reding 	}
6405a5fccbdSThierry Reding 
6415a5fccbdSThierry Reding 	host1x_cdma_wait_pushbuffer_space(host1x, cdma, needed);
6425a5fccbdSThierry Reding 	space = host1x_pushbuffer_space(pb);
6435a5fccbdSThierry Reding 
6445a5fccbdSThierry Reding 	cdma->slots_free = space - needed;
6455a5fccbdSThierry Reding 	cdma->slots_used += needed;
6465a5fccbdSThierry Reding 
6478c92243dSMikko Perttunen 	if (extra > 0) {
6485a5fccbdSThierry Reding 		/*
6498c92243dSMikko Perttunen 		 * If there isn't enough space at the tail of the pushbuffer,
6508c92243dSMikko Perttunen 		 * insert a RESTART(0) here to go back to the beginning.
6518c92243dSMikko Perttunen 		 * The code above adjusted the indexes appropriately.
6525a5fccbdSThierry Reding 		 */
6538c92243dSMikko Perttunen 		host1x_pushbuffer_push(pb, (0x5 << 28), 0xdead0000);
6548c92243dSMikko Perttunen 	}
6555a5fccbdSThierry Reding 
6565a5fccbdSThierry Reding 	host1x_pushbuffer_push(pb, op1, op2);
6575a5fccbdSThierry Reding 	host1x_pushbuffer_push(pb, op3, op4);
6585a5fccbdSThierry Reding }
6595a5fccbdSThierry Reding 
6605a5fccbdSThierry Reding /*
6616579324aSTerje Bergstrom  * End a cdma submit
6626579324aSTerje Bergstrom  * Kick off DMA, add job to the sync queue, and a number of slots to be freed
6636579324aSTerje Bergstrom  * from the pushbuffer. The handles for a submit must all be pinned at the same
6646579324aSTerje Bergstrom  * time, but they can be unpinned in smaller chunks.
6656579324aSTerje Bergstrom  */
host1x_cdma_end(struct host1x_cdma * cdma,struct host1x_job * job)6666579324aSTerje Bergstrom void host1x_cdma_end(struct host1x_cdma *cdma,
6676579324aSTerje Bergstrom 		     struct host1x_job *job)
6686579324aSTerje Bergstrom {
6696579324aSTerje Bergstrom 	struct host1x *host1x = cdma_to_host1x(cdma);
6706579324aSTerje Bergstrom 	bool idle = list_empty(&cdma->sync_queue);
6716579324aSTerje Bergstrom 
6726579324aSTerje Bergstrom 	host1x_hw_cdma_flush(host1x, cdma);
6736579324aSTerje Bergstrom 
6746579324aSTerje Bergstrom 	job->first_get = cdma->first_get;
6756579324aSTerje Bergstrom 	job->num_slots = cdma->slots_used;
6766579324aSTerje Bergstrom 	host1x_job_get(job);
6776579324aSTerje Bergstrom 	list_add_tail(&job->list, &cdma->sync_queue);
6786579324aSTerje Bergstrom 
6796579324aSTerje Bergstrom 	/* start timer on idle -> active transitions */
6806579324aSTerje Bergstrom 	if (job->timeout && idle)
6816579324aSTerje Bergstrom 		cdma_start_timer_locked(cdma, job);
6826579324aSTerje Bergstrom 
6836579324aSTerje Bergstrom 	trace_host1x_cdma_end(dev_name(job->channel->dev));
6846579324aSTerje Bergstrom 	mutex_unlock(&cdma->lock);
6856579324aSTerje Bergstrom }
6866579324aSTerje Bergstrom 
6876579324aSTerje Bergstrom /*
6886579324aSTerje Bergstrom  * Update cdma state according to current sync point values
6896579324aSTerje Bergstrom  */
host1x_cdma_update(struct host1x_cdma * cdma)6906579324aSTerje Bergstrom void host1x_cdma_update(struct host1x_cdma *cdma)
6916579324aSTerje Bergstrom {
692*c24973edSMikko Perttunen 	schedule_work(&cdma->update_work);
6936579324aSTerje Bergstrom }
694