19952f691SThomas Gleixner // SPDX-License-Identifier: GPL-2.0-only
26579324aSTerje Bergstrom /*
36579324aSTerje Bergstrom * Tegra host1x Command DMA
46579324aSTerje Bergstrom *
56579324aSTerje Bergstrom * Copyright (c) 2010-2013, NVIDIA Corporation.
66579324aSTerje Bergstrom */
76579324aSTerje Bergstrom
86579324aSTerje Bergstrom
96579324aSTerje Bergstrom #include <asm/cacheflush.h>
106579324aSTerje Bergstrom #include <linux/device.h>
116579324aSTerje Bergstrom #include <linux/dma-mapping.h>
1235d747a8SThierry Reding #include <linux/host1x.h>
136579324aSTerje Bergstrom #include <linux/interrupt.h>
146579324aSTerje Bergstrom #include <linux/kernel.h>
156579324aSTerje Bergstrom #include <linux/kfifo.h>
166579324aSTerje Bergstrom #include <linux/slab.h>
176579324aSTerje Bergstrom #include <trace/events/host1x.h>
186579324aSTerje Bergstrom
196579324aSTerje Bergstrom #include "cdma.h"
206579324aSTerje Bergstrom #include "channel.h"
216579324aSTerje Bergstrom #include "dev.h"
226579324aSTerje Bergstrom #include "debug.h"
236579324aSTerje Bergstrom #include "job.h"
246579324aSTerje Bergstrom
256579324aSTerje Bergstrom /*
266579324aSTerje Bergstrom * push_buffer
276579324aSTerje Bergstrom *
286579324aSTerje Bergstrom * The push buffer is a circular array of words to be fetched by command DMA.
296579324aSTerje Bergstrom * Note that it works slightly differently to the sync queue; fence == pos
306579324aSTerje Bergstrom * means that the push buffer is full, not empty.
316579324aSTerje Bergstrom */
326579324aSTerje Bergstrom
/*
 * Typically the commands written into the push buffer are a pair of words. We
 * use slots to represent each of these pairs and to simplify things. Note the
 * strange number of slots allocated here. 512 slots will fit exactly within a
 * single memory page. We also need one additional word at the end of the push
 * buffer for the RESTART opcode that will instruct the CDMA to jump back to
 * the beginning of the push buffer. With 512 slots, this means that we'll use
 * 2 memory pages and waste 4092 bytes of the second page that will never be
 * used. Using 511 slots instead keeps the slots plus the trailing RESTART
 * word (4092 bytes in total) within that single page.
 */
43e1f338c0SThierry Reding #define HOST1X_PUSHBUFFER_SLOTS 511
446579324aSTerje Bergstrom
456579324aSTerje Bergstrom /*
466579324aSTerje Bergstrom * Clean up push buffer resources
476579324aSTerje Bergstrom */
host1x_pushbuffer_destroy(struct push_buffer * pb)486579324aSTerje Bergstrom static void host1x_pushbuffer_destroy(struct push_buffer *pb)
496579324aSTerje Bergstrom {
506579324aSTerje Bergstrom struct host1x_cdma *cdma = pb_to_cdma(pb);
516579324aSTerje Bergstrom struct host1x *host1x = cdma_to_host1x(cdma);
526579324aSTerje Bergstrom
532f8a6da8SEmil Goode if (!pb->mapped)
54404bfb78SMikko Perttunen return;
55404bfb78SMikko Perttunen
56404bfb78SMikko Perttunen if (host1x->domain) {
57404bfb78SMikko Perttunen iommu_unmap(host1x->domain, pb->dma, pb->alloc_size);
58404bfb78SMikko Perttunen free_iova(&host1x->iova, iova_pfn(&host1x->iova, pb->dma));
59404bfb78SMikko Perttunen }
60404bfb78SMikko Perttunen
61404bfb78SMikko Perttunen dma_free_wc(host1x->dev, pb->alloc_size, pb->mapped, pb->phys);
626579324aSTerje Bergstrom
636579324aSTerje Bergstrom pb->mapped = NULL;
646579324aSTerje Bergstrom pb->phys = 0;
656579324aSTerje Bergstrom }
666579324aSTerje Bergstrom
676579324aSTerje Bergstrom /*
686579324aSTerje Bergstrom * Init push buffer resources
696579324aSTerje Bergstrom */
host1x_pushbuffer_init(struct push_buffer * pb)706579324aSTerje Bergstrom static int host1x_pushbuffer_init(struct push_buffer *pb)
716579324aSTerje Bergstrom {
726579324aSTerje Bergstrom struct host1x_cdma *cdma = pb_to_cdma(pb);
736579324aSTerje Bergstrom struct host1x *host1x = cdma_to_host1x(cdma);
74404bfb78SMikko Perttunen struct iova *alloc;
75404bfb78SMikko Perttunen u32 size;
76404bfb78SMikko Perttunen int err;
776579324aSTerje Bergstrom
786579324aSTerje Bergstrom pb->mapped = NULL;
796579324aSTerje Bergstrom pb->phys = 0;
80404bfb78SMikko Perttunen pb->size = HOST1X_PUSHBUFFER_SLOTS * 8;
81404bfb78SMikko Perttunen
82404bfb78SMikko Perttunen size = pb->size + 4;
836579324aSTerje Bergstrom
846579324aSTerje Bergstrom /* initialize buffer pointers */
85404bfb78SMikko Perttunen pb->fence = pb->size - 8;
866579324aSTerje Bergstrom pb->pos = 0;
876579324aSTerje Bergstrom
88404bfb78SMikko Perttunen if (host1x->domain) {
89404bfb78SMikko Perttunen unsigned long shift;
90404bfb78SMikko Perttunen
91404bfb78SMikko Perttunen size = iova_align(&host1x->iova, size);
92404bfb78SMikko Perttunen
93404bfb78SMikko Perttunen pb->mapped = dma_alloc_wc(host1x->dev, size, &pb->phys,
94f6e45661SLuis R. Rodriguez GFP_KERNEL);
956579324aSTerje Bergstrom if (!pb->mapped)
96404bfb78SMikko Perttunen return -ENOMEM;
97404bfb78SMikko Perttunen
98404bfb78SMikko Perttunen shift = iova_shift(&host1x->iova);
99404bfb78SMikko Perttunen alloc = alloc_iova(&host1x->iova, size >> shift,
100404bfb78SMikko Perttunen host1x->iova_end >> shift, true);
101404bfb78SMikko Perttunen if (!alloc) {
102404bfb78SMikko Perttunen err = -ENOMEM;
103404bfb78SMikko Perttunen goto iommu_free_mem;
104404bfb78SMikko Perttunen }
105404bfb78SMikko Perttunen
106404bfb78SMikko Perttunen pb->dma = iova_dma_addr(&host1x->iova, alloc);
107404bfb78SMikko Perttunen err = iommu_map(host1x->domain, pb->dma, pb->phys, size,
1081369459bSJason Gunthorpe IOMMU_READ, GFP_KERNEL);
109404bfb78SMikko Perttunen if (err)
110404bfb78SMikko Perttunen goto iommu_free_iova;
111404bfb78SMikko Perttunen } else {
112404bfb78SMikko Perttunen pb->mapped = dma_alloc_wc(host1x->dev, size, &pb->phys,
113404bfb78SMikko Perttunen GFP_KERNEL);
114404bfb78SMikko Perttunen if (!pb->mapped)
115404bfb78SMikko Perttunen return -ENOMEM;
116404bfb78SMikko Perttunen
117404bfb78SMikko Perttunen pb->dma = pb->phys;
118404bfb78SMikko Perttunen }
119404bfb78SMikko Perttunen
120404bfb78SMikko Perttunen pb->alloc_size = size;
1216579324aSTerje Bergstrom
1226579324aSTerje Bergstrom host1x_hw_pushbuffer_init(host1x, pb);
1236579324aSTerje Bergstrom
1246579324aSTerje Bergstrom return 0;
1256579324aSTerje Bergstrom
126404bfb78SMikko Perttunen iommu_free_iova:
127404bfb78SMikko Perttunen __free_iova(&host1x->iova, alloc);
128404bfb78SMikko Perttunen iommu_free_mem:
12927db6a00SDmitry Osipenko dma_free_wc(host1x->dev, size, pb->mapped, pb->phys);
130404bfb78SMikko Perttunen
131404bfb78SMikko Perttunen return err;
1326579324aSTerje Bergstrom }
1336579324aSTerje Bergstrom
1346579324aSTerje Bergstrom /*
1356579324aSTerje Bergstrom * Push two words to the push buffer
1366579324aSTerje Bergstrom * Caller must ensure push buffer is not full
1376579324aSTerje Bergstrom */
host1x_pushbuffer_push(struct push_buffer * pb,u32 op1,u32 op2)1386579324aSTerje Bergstrom static void host1x_pushbuffer_push(struct push_buffer *pb, u32 op1, u32 op2)
1396579324aSTerje Bergstrom {
140ebb2475cSThierry Reding u32 *p = (u32 *)((void *)pb->mapped + pb->pos);
141ebb2475cSThierry Reding
142ebb2475cSThierry Reding WARN_ON(pb->pos == pb->fence);
1436579324aSTerje Bergstrom *(p++) = op1;
1446579324aSTerje Bergstrom *(p++) = op2;
145e1f338c0SThierry Reding pb->pos += 8;
146e1f338c0SThierry Reding
147e1f338c0SThierry Reding if (pb->pos >= pb->size)
148e1f338c0SThierry Reding pb->pos -= pb->size;
1496579324aSTerje Bergstrom }
1506579324aSTerje Bergstrom
1516579324aSTerje Bergstrom /*
1526579324aSTerje Bergstrom * Pop a number of two word slots from the push buffer
1536579324aSTerje Bergstrom * Caller must ensure push buffer is not empty
1546579324aSTerje Bergstrom */
host1x_pushbuffer_pop(struct push_buffer * pb,unsigned int slots)1556579324aSTerje Bergstrom static void host1x_pushbuffer_pop(struct push_buffer *pb, unsigned int slots)
1566579324aSTerje Bergstrom {
1576579324aSTerje Bergstrom /* Advance the next write position */
158e1f338c0SThierry Reding pb->fence += slots * 8;
159e1f338c0SThierry Reding
160e1f338c0SThierry Reding if (pb->fence >= pb->size)
161e1f338c0SThierry Reding pb->fence -= pb->size;
1626579324aSTerje Bergstrom }
1636579324aSTerje Bergstrom
1646579324aSTerje Bergstrom /*
1656579324aSTerje Bergstrom * Return the number of two word slots free in the push buffer
1666579324aSTerje Bergstrom */
host1x_pushbuffer_space(struct push_buffer * pb)1676579324aSTerje Bergstrom static u32 host1x_pushbuffer_space(struct push_buffer *pb)
1686579324aSTerje Bergstrom {
169e1f338c0SThierry Reding unsigned int fence = pb->fence;
170e1f338c0SThierry Reding
171e1f338c0SThierry Reding if (pb->fence < pb->pos)
172e1f338c0SThierry Reding fence += pb->size;
173e1f338c0SThierry Reding
174e1f338c0SThierry Reding return (fence - pb->pos) / 8;
1756579324aSTerje Bergstrom }
1766579324aSTerje Bergstrom
1776579324aSTerje Bergstrom /*
1786579324aSTerje Bergstrom * Sleep (if necessary) until the requested event happens
1796579324aSTerje Bergstrom * - CDMA_EVENT_SYNC_QUEUE_EMPTY : sync queue is completely empty.
1806579324aSTerje Bergstrom * - Returns 1
1816579324aSTerje Bergstrom * - CDMA_EVENT_PUSH_BUFFER_SPACE : there is space in the push buffer
1826579324aSTerje Bergstrom * - Return the amount of space (> 0)
1836579324aSTerje Bergstrom * Must be called with the cdma lock held.
1846579324aSTerje Bergstrom */
host1x_cdma_wait_locked(struct host1x_cdma * cdma,enum cdma_event event)1856579324aSTerje Bergstrom unsigned int host1x_cdma_wait_locked(struct host1x_cdma *cdma,
1866579324aSTerje Bergstrom enum cdma_event event)
1876579324aSTerje Bergstrom {
1886579324aSTerje Bergstrom for (;;) {
1890b8070d1SThierry Reding struct push_buffer *pb = &cdma->push_buffer;
1906579324aSTerje Bergstrom unsigned int space;
1916579324aSTerje Bergstrom
1920b8070d1SThierry Reding switch (event) {
1930b8070d1SThierry Reding case CDMA_EVENT_SYNC_QUEUE_EMPTY:
1946579324aSTerje Bergstrom space = list_empty(&cdma->sync_queue) ? 1 : 0;
1950b8070d1SThierry Reding break;
1960b8070d1SThierry Reding
1970b8070d1SThierry Reding case CDMA_EVENT_PUSH_BUFFER_SPACE:
1986579324aSTerje Bergstrom space = host1x_pushbuffer_space(pb);
1990b8070d1SThierry Reding break;
2000b8070d1SThierry Reding
2010b8070d1SThierry Reding default:
2026579324aSTerje Bergstrom WARN_ON(1);
2036579324aSTerje Bergstrom return -EINVAL;
2046579324aSTerje Bergstrom }
2056579324aSTerje Bergstrom
2066579324aSTerje Bergstrom if (space)
2076579324aSTerje Bergstrom return space;
2086579324aSTerje Bergstrom
2096579324aSTerje Bergstrom trace_host1x_wait_cdma(dev_name(cdma_to_channel(cdma)->dev),
2106579324aSTerje Bergstrom event);
2116579324aSTerje Bergstrom
2126579324aSTerje Bergstrom /* If somebody has managed to already start waiting, yield */
2136579324aSTerje Bergstrom if (cdma->event != CDMA_EVENT_NONE) {
2146579324aSTerje Bergstrom mutex_unlock(&cdma->lock);
2156579324aSTerje Bergstrom schedule();
2166579324aSTerje Bergstrom mutex_lock(&cdma->lock);
2176579324aSTerje Bergstrom continue;
2186579324aSTerje Bergstrom }
2190b8070d1SThierry Reding
2206579324aSTerje Bergstrom cdma->event = event;
2216579324aSTerje Bergstrom
2226579324aSTerje Bergstrom mutex_unlock(&cdma->lock);
2230747a672SArnd Bergmann wait_for_completion(&cdma->complete);
2246579324aSTerje Bergstrom mutex_lock(&cdma->lock);
2256579324aSTerje Bergstrom }
2260b8070d1SThierry Reding
2276579324aSTerje Bergstrom return 0;
2286579324aSTerje Bergstrom }
2296579324aSTerje Bergstrom
2306579324aSTerje Bergstrom /*
2315a5fccbdSThierry Reding * Sleep (if necessary) until the push buffer has enough free space.
2325a5fccbdSThierry Reding *
2335a5fccbdSThierry Reding * Must be called with the cdma lock held.
2345a5fccbdSThierry Reding */
host1x_cdma_wait_pushbuffer_space(struct host1x * host1x,struct host1x_cdma * cdma,unsigned int needed)23533904487SBen Dooks (Codethink) static int host1x_cdma_wait_pushbuffer_space(struct host1x *host1x,
2365a5fccbdSThierry Reding struct host1x_cdma *cdma,
2375a5fccbdSThierry Reding unsigned int needed)
2385a5fccbdSThierry Reding {
2395a5fccbdSThierry Reding while (true) {
2405a5fccbdSThierry Reding struct push_buffer *pb = &cdma->push_buffer;
2415a5fccbdSThierry Reding unsigned int space;
2425a5fccbdSThierry Reding
2435a5fccbdSThierry Reding space = host1x_pushbuffer_space(pb);
2445a5fccbdSThierry Reding if (space >= needed)
2455a5fccbdSThierry Reding break;
2465a5fccbdSThierry Reding
2475a5fccbdSThierry Reding trace_host1x_wait_cdma(dev_name(cdma_to_channel(cdma)->dev),
2485a5fccbdSThierry Reding CDMA_EVENT_PUSH_BUFFER_SPACE);
2495a5fccbdSThierry Reding
2505a5fccbdSThierry Reding host1x_hw_cdma_flush(host1x, cdma);
2515a5fccbdSThierry Reding
2525a5fccbdSThierry Reding /* If somebody has managed to already start waiting, yield */
2535a5fccbdSThierry Reding if (cdma->event != CDMA_EVENT_NONE) {
2545a5fccbdSThierry Reding mutex_unlock(&cdma->lock);
2555a5fccbdSThierry Reding schedule();
2565a5fccbdSThierry Reding mutex_lock(&cdma->lock);
2575a5fccbdSThierry Reding continue;
2585a5fccbdSThierry Reding }
2595a5fccbdSThierry Reding
2605a5fccbdSThierry Reding cdma->event = CDMA_EVENT_PUSH_BUFFER_SPACE;
2615a5fccbdSThierry Reding
2625a5fccbdSThierry Reding mutex_unlock(&cdma->lock);
2635a5fccbdSThierry Reding wait_for_completion(&cdma->complete);
2645a5fccbdSThierry Reding mutex_lock(&cdma->lock);
2655a5fccbdSThierry Reding }
2665a5fccbdSThierry Reding
2675a5fccbdSThierry Reding return 0;
2685a5fccbdSThierry Reding }
2695a5fccbdSThierry Reding /*
2706579324aSTerje Bergstrom * Start timer that tracks the time spent by the job.
2716579324aSTerje Bergstrom * Must be called with the cdma lock held.
2726579324aSTerje Bergstrom */
cdma_start_timer_locked(struct host1x_cdma * cdma,struct host1x_job * job)2736579324aSTerje Bergstrom static void cdma_start_timer_locked(struct host1x_cdma *cdma,
2746579324aSTerje Bergstrom struct host1x_job *job)
2756579324aSTerje Bergstrom {
2766579324aSTerje Bergstrom if (cdma->timeout.client) {
2776579324aSTerje Bergstrom /* timer already started */
2786579324aSTerje Bergstrom return;
2796579324aSTerje Bergstrom }
2806579324aSTerje Bergstrom
2816579324aSTerje Bergstrom cdma->timeout.client = job->client;
2822aed4f5aSMikko Perttunen cdma->timeout.syncpt = job->syncpt;
2836579324aSTerje Bergstrom cdma->timeout.syncpt_val = job->syncpt_end;
2846579324aSTerje Bergstrom cdma->timeout.start_ktime = ktime_get();
2856579324aSTerje Bergstrom
2866579324aSTerje Bergstrom schedule_delayed_work(&cdma->timeout.wq,
2876579324aSTerje Bergstrom msecs_to_jiffies(job->timeout));
2886579324aSTerje Bergstrom }
2896579324aSTerje Bergstrom
2906579324aSTerje Bergstrom /*
2916579324aSTerje Bergstrom * Stop timer when a buffer submission completes.
2926579324aSTerje Bergstrom * Must be called with the cdma lock held.
2936579324aSTerje Bergstrom */
stop_cdma_timer_locked(struct host1x_cdma * cdma)2946579324aSTerje Bergstrom static void stop_cdma_timer_locked(struct host1x_cdma *cdma)
2956579324aSTerje Bergstrom {
2966579324aSTerje Bergstrom cancel_delayed_work(&cdma->timeout.wq);
297bf3d41ccSThierry Reding cdma->timeout.client = NULL;
2986579324aSTerje Bergstrom }
2996579324aSTerje Bergstrom
3006579324aSTerje Bergstrom /*
3016579324aSTerje Bergstrom * For all sync queue entries that have already finished according to the
3026579324aSTerje Bergstrom * current sync point registers:
3036579324aSTerje Bergstrom * - unpin & unref their mems
3046579324aSTerje Bergstrom * - pop their push buffer slots
3056579324aSTerje Bergstrom * - remove them from the sync queue
3066579324aSTerje Bergstrom * This is normally called from the host code's worker thread, but can be
3076579324aSTerje Bergstrom * called manually if necessary.
3086579324aSTerje Bergstrom * Must be called with the cdma lock held.
3096579324aSTerje Bergstrom */
update_cdma_locked(struct host1x_cdma * cdma)3106579324aSTerje Bergstrom static void update_cdma_locked(struct host1x_cdma *cdma)
3116579324aSTerje Bergstrom {
3126579324aSTerje Bergstrom bool signal = false;
3136579324aSTerje Bergstrom struct host1x_job *job, *n;
3146579324aSTerje Bergstrom
3156579324aSTerje Bergstrom /*
3166579324aSTerje Bergstrom * Walk the sync queue, reading the sync point registers as necessary,
3176579324aSTerje Bergstrom * to consume as many sync queue entries as possible without blocking
3186579324aSTerje Bergstrom */
3196579324aSTerje Bergstrom list_for_each_entry_safe(job, n, &cdma->sync_queue, list) {
3202aed4f5aSMikko Perttunen struct host1x_syncpt *sp = job->syncpt;
3216579324aSTerje Bergstrom
3226579324aSTerje Bergstrom /* Check whether this syncpt has completed, and bail if not */
323c78f837aSMikko Perttunen if (!host1x_syncpt_is_expired(sp, job->syncpt_end) &&
324c78f837aSMikko Perttunen !job->cancelled) {
3256579324aSTerje Bergstrom /* Start timer on next pending syncpt */
3266579324aSTerje Bergstrom if (job->timeout)
3276579324aSTerje Bergstrom cdma_start_timer_locked(cdma, job);
3280b8070d1SThierry Reding
3296579324aSTerje Bergstrom break;
3306579324aSTerje Bergstrom }
3316579324aSTerje Bergstrom
3326579324aSTerje Bergstrom /* Cancel timeout, when a buffer completes */
3336579324aSTerje Bergstrom if (cdma->timeout.client)
3346579324aSTerje Bergstrom stop_cdma_timer_locked(cdma);
3356579324aSTerje Bergstrom
3366579324aSTerje Bergstrom /* Unpin the memory */
3376579324aSTerje Bergstrom host1x_job_unpin(job);
3386579324aSTerje Bergstrom
3396579324aSTerje Bergstrom /* Pop push buffer slots */
3406579324aSTerje Bergstrom if (job->num_slots) {
3416579324aSTerje Bergstrom struct push_buffer *pb = &cdma->push_buffer;
3426df633d0SThierry Reding
3436579324aSTerje Bergstrom host1x_pushbuffer_pop(pb, job->num_slots);
3440b8070d1SThierry Reding
3456579324aSTerje Bergstrom if (cdma->event == CDMA_EVENT_PUSH_BUFFER_SPACE)
3466579324aSTerje Bergstrom signal = true;
3476579324aSTerje Bergstrom }
3486579324aSTerje Bergstrom
3496579324aSTerje Bergstrom list_del(&job->list);
3506579324aSTerje Bergstrom host1x_job_put(job);
3516579324aSTerje Bergstrom }
3526579324aSTerje Bergstrom
3536579324aSTerje Bergstrom if (cdma->event == CDMA_EVENT_SYNC_QUEUE_EMPTY &&
3546579324aSTerje Bergstrom list_empty(&cdma->sync_queue))
3556579324aSTerje Bergstrom signal = true;
3566579324aSTerje Bergstrom
3576579324aSTerje Bergstrom if (signal) {
3586579324aSTerje Bergstrom cdma->event = CDMA_EVENT_NONE;
3590747a672SArnd Bergmann complete(&cdma->complete);
3606579324aSTerje Bergstrom }
3616579324aSTerje Bergstrom }
3626579324aSTerje Bergstrom
host1x_cdma_update_sync_queue(struct host1x_cdma * cdma,struct device * dev)3636579324aSTerje Bergstrom void host1x_cdma_update_sync_queue(struct host1x_cdma *cdma,
3646579324aSTerje Bergstrom struct device *dev)
3656579324aSTerje Bergstrom {
3666579324aSTerje Bergstrom struct host1x *host1x = cdma_to_host1x(cdma);
3670b8070d1SThierry Reding u32 restart_addr, syncpt_incrs, syncpt_val;
36879930bafSDmitry Osipenko struct host1x_job *job, *next_job = NULL;
3696579324aSTerje Bergstrom
3706579324aSTerje Bergstrom syncpt_val = host1x_syncpt_load(cdma->timeout.syncpt);
3716579324aSTerje Bergstrom
3726579324aSTerje Bergstrom dev_dbg(dev, "%s: starting cleanup (thresh %d)\n",
3736579324aSTerje Bergstrom __func__, syncpt_val);
3746579324aSTerje Bergstrom
3756579324aSTerje Bergstrom /*
3766579324aSTerje Bergstrom * Move the sync_queue read pointer to the first entry that hasn't
3776579324aSTerje Bergstrom * completed based on the current HW syncpt value. It's likely there
3786579324aSTerje Bergstrom * won't be any (i.e. we're still at the head), but covers the case
3796579324aSTerje Bergstrom * where a syncpt incr happens just prior/during the teardown.
3806579324aSTerje Bergstrom */
3816579324aSTerje Bergstrom
3826579324aSTerje Bergstrom dev_dbg(dev, "%s: skip completed buffers still in sync_queue\n",
3836579324aSTerje Bergstrom __func__);
3846579324aSTerje Bergstrom
3856579324aSTerje Bergstrom list_for_each_entry(job, &cdma->sync_queue, list) {
38679930bafSDmitry Osipenko if (syncpt_val < job->syncpt_end) {
38779930bafSDmitry Osipenko
38879930bafSDmitry Osipenko if (!list_is_last(&job->list, &cdma->sync_queue))
38979930bafSDmitry Osipenko next_job = list_next_entry(job, list);
39079930bafSDmitry Osipenko
3915d6f0436SDmitry Osipenko goto syncpt_incr;
39279930bafSDmitry Osipenko }
3936579324aSTerje Bergstrom
3946579324aSTerje Bergstrom host1x_job_dump(dev, job);
3956579324aSTerje Bergstrom }
3966579324aSTerje Bergstrom
3975d6f0436SDmitry Osipenko /* all jobs have been completed */
3985d6f0436SDmitry Osipenko job = NULL;
3995d6f0436SDmitry Osipenko
4005d6f0436SDmitry Osipenko syncpt_incr:
4015d6f0436SDmitry Osipenko
4026579324aSTerje Bergstrom /*
403e8bad659SDmitry Osipenko * Increment with CPU the remaining syncpts of a partially executed job.
4046579324aSTerje Bergstrom *
40579930bafSDmitry Osipenko * CDMA will continue execution starting with the next job or will get
40679930bafSDmitry Osipenko * into idle state.
4076579324aSTerje Bergstrom */
40879930bafSDmitry Osipenko if (next_job)
40979930bafSDmitry Osipenko restart_addr = next_job->first_get;
4106579324aSTerje Bergstrom else
4116579324aSTerje Bergstrom restart_addr = cdma->last_pos;
4126579324aSTerje Bergstrom
413c78f837aSMikko Perttunen if (!job)
414c78f837aSMikko Perttunen goto resume;
415c78f837aSMikko Perttunen
416e8bad659SDmitry Osipenko /* do CPU increments for the remaining syncpts */
417c78f837aSMikko Perttunen if (job->syncpt_recovery) {
4185d6f0436SDmitry Osipenko dev_dbg(dev, "%s: perform CPU incr on pending buffers\n",
4195d6f0436SDmitry Osipenko __func__);
4205d6f0436SDmitry Osipenko
4216579324aSTerje Bergstrom /* won't need a timeout when replayed */
4226579324aSTerje Bergstrom job->timeout = 0;
4236579324aSTerje Bergstrom
4246579324aSTerje Bergstrom syncpt_incrs = job->syncpt_end - syncpt_val;
4256579324aSTerje Bergstrom dev_dbg(dev, "%s: CPU incr (%d)\n", __func__, syncpt_incrs);
4266579324aSTerje Bergstrom
4276579324aSTerje Bergstrom host1x_job_dump(dev, job);
4286579324aSTerje Bergstrom
4296579324aSTerje Bergstrom /* safe to use CPU to incr syncpts */
4306579324aSTerje Bergstrom host1x_hw_cdma_timeout_cpu_incr(host1x, cdma, job->first_get,
4316579324aSTerje Bergstrom syncpt_incrs, job->syncpt_end,
4326579324aSTerje Bergstrom job->num_slots);
4336579324aSTerje Bergstrom
4345d6f0436SDmitry Osipenko dev_dbg(dev, "%s: finished sync_queue modification\n",
4355d6f0436SDmitry Osipenko __func__);
436c78f837aSMikko Perttunen } else {
437c78f837aSMikko Perttunen struct host1x_job *failed_job = job;
438c78f837aSMikko Perttunen
439c78f837aSMikko Perttunen host1x_job_dump(dev, job);
440c78f837aSMikko Perttunen
441c78f837aSMikko Perttunen host1x_syncpt_set_locked(job->syncpt);
442c78f837aSMikko Perttunen failed_job->cancelled = true;
443c78f837aSMikko Perttunen
444c78f837aSMikko Perttunen list_for_each_entry_continue(job, &cdma->sync_queue, list) {
445c78f837aSMikko Perttunen unsigned int i;
446c78f837aSMikko Perttunen
447c78f837aSMikko Perttunen if (job->syncpt != failed_job->syncpt)
448c78f837aSMikko Perttunen continue;
449c78f837aSMikko Perttunen
450c78f837aSMikko Perttunen for (i = 0; i < job->num_slots; i++) {
451c78f837aSMikko Perttunen unsigned int slot = (job->first_get/8 + i) %
452c78f837aSMikko Perttunen HOST1X_PUSHBUFFER_SLOTS;
453c78f837aSMikko Perttunen u32 *mapped = cdma->push_buffer.mapped;
454c78f837aSMikko Perttunen
455c78f837aSMikko Perttunen /*
456c78f837aSMikko Perttunen * Overwrite opcodes with 0 word writes
457c78f837aSMikko Perttunen * to offset 0xbad. This does nothing but
458c78f837aSMikko Perttunen * has a easily detected signature in debug
459c78f837aSMikko Perttunen * traces.
4600ae4ae91SMikko Perttunen *
4610ae4ae91SMikko Perttunen * On systems with MLOCK enforcement enabled,
4620ae4ae91SMikko Perttunen * the above 0 word writes would fall foul of
4630ae4ae91SMikko Perttunen * the enforcement. As such, in the first slot
4640ae4ae91SMikko Perttunen * put a RESTART_W opcode to the beginning
4650ae4ae91SMikko Perttunen * of the next job. We don't use this for older
4660ae4ae91SMikko Perttunen * chips since those only support the RESTART
4670ae4ae91SMikko Perttunen * opcode with inconvenient alignment requirements.
468c78f837aSMikko Perttunen */
4690ae4ae91SMikko Perttunen if (i == 0 && host1x->info->has_wide_gather) {
4700ae4ae91SMikko Perttunen unsigned int next_job = (job->first_get/8 + job->num_slots)
4710ae4ae91SMikko Perttunen % HOST1X_PUSHBUFFER_SLOTS;
4720ae4ae91SMikko Perttunen mapped[2*slot+0] = (0xd << 28) | (next_job * 2);
4730ae4ae91SMikko Perttunen mapped[2*slot+1] = 0x0;
4740ae4ae91SMikko Perttunen } else {
475c78f837aSMikko Perttunen mapped[2*slot+0] = 0x1bad0000;
476c78f837aSMikko Perttunen mapped[2*slot+1] = 0x1bad0000;
4775d6f0436SDmitry Osipenko }
4780ae4ae91SMikko Perttunen }
4796579324aSTerje Bergstrom
480c78f837aSMikko Perttunen job->cancelled = true;
481c78f837aSMikko Perttunen }
482c78f837aSMikko Perttunen
483c78f837aSMikko Perttunen wmb();
484c78f837aSMikko Perttunen
485c78f837aSMikko Perttunen update_cdma_locked(cdma);
486c78f837aSMikko Perttunen }
487c78f837aSMikko Perttunen
488c78f837aSMikko Perttunen resume:
4896579324aSTerje Bergstrom /* roll back DMAGET and start up channel again */
4906579324aSTerje Bergstrom host1x_hw_cdma_resume(host1x, cdma, restart_addr);
4916579324aSTerje Bergstrom }
4926579324aSTerje Bergstrom
cdma_update_work(struct work_struct * work)493*c24973edSMikko Perttunen static void cdma_update_work(struct work_struct *work)
494*c24973edSMikko Perttunen {
495*c24973edSMikko Perttunen struct host1x_cdma *cdma = container_of(work, struct host1x_cdma, update_work);
496*c24973edSMikko Perttunen
497*c24973edSMikko Perttunen mutex_lock(&cdma->lock);
498*c24973edSMikko Perttunen update_cdma_locked(cdma);
499*c24973edSMikko Perttunen mutex_unlock(&cdma->lock);
500*c24973edSMikko Perttunen }
501*c24973edSMikko Perttunen
5026579324aSTerje Bergstrom /*
5036579324aSTerje Bergstrom * Create a cdma
5046579324aSTerje Bergstrom */
host1x_cdma_init(struct host1x_cdma * cdma)5056579324aSTerje Bergstrom int host1x_cdma_init(struct host1x_cdma *cdma)
5066579324aSTerje Bergstrom {
5076579324aSTerje Bergstrom int err;
5086579324aSTerje Bergstrom
5096579324aSTerje Bergstrom mutex_init(&cdma->lock);
5100747a672SArnd Bergmann init_completion(&cdma->complete);
511*c24973edSMikko Perttunen INIT_WORK(&cdma->update_work, cdma_update_work);
5126579324aSTerje Bergstrom
5136579324aSTerje Bergstrom INIT_LIST_HEAD(&cdma->sync_queue);
5146579324aSTerje Bergstrom
5156579324aSTerje Bergstrom cdma->event = CDMA_EVENT_NONE;
5166579324aSTerje Bergstrom cdma->running = false;
5176579324aSTerje Bergstrom cdma->torndown = false;
5186579324aSTerje Bergstrom
5196579324aSTerje Bergstrom err = host1x_pushbuffer_init(&cdma->push_buffer);
5206579324aSTerje Bergstrom if (err)
5216579324aSTerje Bergstrom return err;
5220b8070d1SThierry Reding
5236579324aSTerje Bergstrom return 0;
5246579324aSTerje Bergstrom }
5256579324aSTerje Bergstrom
5266579324aSTerje Bergstrom /*
5276579324aSTerje Bergstrom * Destroy a cdma
5286579324aSTerje Bergstrom */
host1x_cdma_deinit(struct host1x_cdma * cdma)5296579324aSTerje Bergstrom int host1x_cdma_deinit(struct host1x_cdma *cdma)
5306579324aSTerje Bergstrom {
5316579324aSTerje Bergstrom struct push_buffer *pb = &cdma->push_buffer;
5326579324aSTerje Bergstrom struct host1x *host1x = cdma_to_host1x(cdma);
5336579324aSTerje Bergstrom
5346579324aSTerje Bergstrom if (cdma->running) {
5356579324aSTerje Bergstrom pr_warn("%s: CDMA still running\n", __func__);
5366579324aSTerje Bergstrom return -EBUSY;
5376579324aSTerje Bergstrom }
5386579324aSTerje Bergstrom
5396579324aSTerje Bergstrom host1x_pushbuffer_destroy(pb);
5406579324aSTerje Bergstrom host1x_hw_cdma_timeout_destroy(host1x, cdma);
5416579324aSTerje Bergstrom
5426579324aSTerje Bergstrom return 0;
5436579324aSTerje Bergstrom }
5446579324aSTerje Bergstrom
5456579324aSTerje Bergstrom /*
5466579324aSTerje Bergstrom * Begin a cdma submit
5476579324aSTerje Bergstrom */
host1x_cdma_begin(struct host1x_cdma * cdma,struct host1x_job * job)5486579324aSTerje Bergstrom int host1x_cdma_begin(struct host1x_cdma *cdma, struct host1x_job *job)
5496579324aSTerje Bergstrom {
5506579324aSTerje Bergstrom struct host1x *host1x = cdma_to_host1x(cdma);
5516579324aSTerje Bergstrom
5526579324aSTerje Bergstrom mutex_lock(&cdma->lock);
5536579324aSTerje Bergstrom
554c78f837aSMikko Perttunen /*
555c78f837aSMikko Perttunen * Check if syncpoint was locked due to previous job timeout.
556c78f837aSMikko Perttunen * This needs to be done within the cdma lock to avoid a race
557c78f837aSMikko Perttunen * with the timeout handler.
558c78f837aSMikko Perttunen */
559c78f837aSMikko Perttunen if (job->syncpt->locked) {
560c78f837aSMikko Perttunen mutex_unlock(&cdma->lock);
561c78f837aSMikko Perttunen return -EPERM;
562c78f837aSMikko Perttunen }
563c78f837aSMikko Perttunen
5646579324aSTerje Bergstrom if (job->timeout) {
5656579324aSTerje Bergstrom /* init state on first submit with timeout value */
5666579324aSTerje Bergstrom if (!cdma->timeout.initialized) {
5676579324aSTerje Bergstrom int err;
5686df633d0SThierry Reding
5692aed4f5aSMikko Perttunen err = host1x_hw_cdma_timeout_init(host1x, cdma);
5706579324aSTerje Bergstrom if (err) {
5716579324aSTerje Bergstrom mutex_unlock(&cdma->lock);
5726579324aSTerje Bergstrom return err;
5736579324aSTerje Bergstrom }
5746579324aSTerje Bergstrom }
5756579324aSTerje Bergstrom }
5760b8070d1SThierry Reding
5776579324aSTerje Bergstrom if (!cdma->running)
5786579324aSTerje Bergstrom host1x_hw_cdma_start(host1x, cdma);
5796579324aSTerje Bergstrom
5806579324aSTerje Bergstrom cdma->slots_free = 0;
5816579324aSTerje Bergstrom cdma->slots_used = 0;
5826579324aSTerje Bergstrom cdma->first_get = cdma->push_buffer.pos;
5836579324aSTerje Bergstrom
5846579324aSTerje Bergstrom trace_host1x_cdma_begin(dev_name(job->channel->dev));
5856579324aSTerje Bergstrom return 0;
5866579324aSTerje Bergstrom }
5876579324aSTerje Bergstrom
5886579324aSTerje Bergstrom /*
5896579324aSTerje Bergstrom * Push two words into a push buffer slot
5906579324aSTerje Bergstrom * Blocks as necessary if the push buffer is full.
5916579324aSTerje Bergstrom */
host1x_cdma_push(struct host1x_cdma * cdma,u32 op1,u32 op2)5926579324aSTerje Bergstrom void host1x_cdma_push(struct host1x_cdma *cdma, u32 op1, u32 op2)
5936579324aSTerje Bergstrom {
5946579324aSTerje Bergstrom struct host1x *host1x = cdma_to_host1x(cdma);
5956579324aSTerje Bergstrom struct push_buffer *pb = &cdma->push_buffer;
5966579324aSTerje Bergstrom u32 slots_free = cdma->slots_free;
5976579324aSTerje Bergstrom
5986236451dSTerje Bergstrom if (host1x_debug_trace_cmdbuf)
5996236451dSTerje Bergstrom trace_host1x_cdma_push(dev_name(cdma_to_channel(cdma)->dev),
6006236451dSTerje Bergstrom op1, op2);
6016236451dSTerje Bergstrom
6026579324aSTerje Bergstrom if (slots_free == 0) {
6036579324aSTerje Bergstrom host1x_hw_cdma_flush(host1x, cdma);
6046579324aSTerje Bergstrom slots_free = host1x_cdma_wait_locked(cdma,
6056579324aSTerje Bergstrom CDMA_EVENT_PUSH_BUFFER_SPACE);
6066579324aSTerje Bergstrom }
6070b8070d1SThierry Reding
6086579324aSTerje Bergstrom cdma->slots_free = slots_free - 1;
6096579324aSTerje Bergstrom cdma->slots_used++;
6106579324aSTerje Bergstrom host1x_pushbuffer_push(pb, op1, op2);
6116579324aSTerje Bergstrom }
6126579324aSTerje Bergstrom
6136579324aSTerje Bergstrom /*
6145a5fccbdSThierry Reding * Push four words into two consecutive push buffer slots. Note that extra
6155a5fccbdSThierry Reding * care needs to be taken not to split the two slots across the end of the
6165a5fccbdSThierry Reding * push buffer. Otherwise the RESTART opcode at the end of the push buffer
6175a5fccbdSThierry Reding * that ensures processing will restart at the beginning will break up the
6185a5fccbdSThierry Reding * four words.
6195a5fccbdSThierry Reding *
6205a5fccbdSThierry Reding * Blocks as necessary if the push buffer is full.
6215a5fccbdSThierry Reding */
host1x_cdma_push_wide(struct host1x_cdma * cdma,u32 op1,u32 op2,u32 op3,u32 op4)6225a5fccbdSThierry Reding void host1x_cdma_push_wide(struct host1x_cdma *cdma, u32 op1, u32 op2,
6235a5fccbdSThierry Reding u32 op3, u32 op4)
6245a5fccbdSThierry Reding {
6255a5fccbdSThierry Reding struct host1x_channel *channel = cdma_to_channel(cdma);
6265a5fccbdSThierry Reding struct host1x *host1x = cdma_to_host1x(cdma);
6275a5fccbdSThierry Reding struct push_buffer *pb = &cdma->push_buffer;
6285a5fccbdSThierry Reding unsigned int space = cdma->slots_free;
6298c92243dSMikko Perttunen unsigned int needed = 2, extra = 0;
6305a5fccbdSThierry Reding
6315a5fccbdSThierry Reding if (host1x_debug_trace_cmdbuf)
6325a5fccbdSThierry Reding trace_host1x_cdma_push_wide(dev_name(channel->dev), op1, op2,
6335a5fccbdSThierry Reding op3, op4);
6345a5fccbdSThierry Reding
6355a5fccbdSThierry Reding /* compute number of extra slots needed for padding */
6365a5fccbdSThierry Reding if (pb->pos + 16 > pb->size) {
6375a5fccbdSThierry Reding extra = (pb->size - pb->pos) / 8;
6385a5fccbdSThierry Reding needed += extra;
6395a5fccbdSThierry Reding }
6405a5fccbdSThierry Reding
6415a5fccbdSThierry Reding host1x_cdma_wait_pushbuffer_space(host1x, cdma, needed);
6425a5fccbdSThierry Reding space = host1x_pushbuffer_space(pb);
6435a5fccbdSThierry Reding
6445a5fccbdSThierry Reding cdma->slots_free = space - needed;
6455a5fccbdSThierry Reding cdma->slots_used += needed;
6465a5fccbdSThierry Reding
6478c92243dSMikko Perttunen if (extra > 0) {
6485a5fccbdSThierry Reding /*
6498c92243dSMikko Perttunen * If there isn't enough space at the tail of the pushbuffer,
6508c92243dSMikko Perttunen * insert a RESTART(0) here to go back to the beginning.
6518c92243dSMikko Perttunen * The code above adjusted the indexes appropriately.
6525a5fccbdSThierry Reding */
6538c92243dSMikko Perttunen host1x_pushbuffer_push(pb, (0x5 << 28), 0xdead0000);
6548c92243dSMikko Perttunen }
6555a5fccbdSThierry Reding
6565a5fccbdSThierry Reding host1x_pushbuffer_push(pb, op1, op2);
6575a5fccbdSThierry Reding host1x_pushbuffer_push(pb, op3, op4);
6585a5fccbdSThierry Reding }
6595a5fccbdSThierry Reding
6605a5fccbdSThierry Reding /*
6616579324aSTerje Bergstrom * End a cdma submit
6626579324aSTerje Bergstrom * Kick off DMA, add job to the sync queue, and a number of slots to be freed
6636579324aSTerje Bergstrom * from the pushbuffer. The handles for a submit must all be pinned at the same
6646579324aSTerje Bergstrom * time, but they can be unpinned in smaller chunks.
6656579324aSTerje Bergstrom */
host1x_cdma_end(struct host1x_cdma * cdma,struct host1x_job * job)6666579324aSTerje Bergstrom void host1x_cdma_end(struct host1x_cdma *cdma,
6676579324aSTerje Bergstrom struct host1x_job *job)
6686579324aSTerje Bergstrom {
6696579324aSTerje Bergstrom struct host1x *host1x = cdma_to_host1x(cdma);
6706579324aSTerje Bergstrom bool idle = list_empty(&cdma->sync_queue);
6716579324aSTerje Bergstrom
6726579324aSTerje Bergstrom host1x_hw_cdma_flush(host1x, cdma);
6736579324aSTerje Bergstrom
6746579324aSTerje Bergstrom job->first_get = cdma->first_get;
6756579324aSTerje Bergstrom job->num_slots = cdma->slots_used;
6766579324aSTerje Bergstrom host1x_job_get(job);
6776579324aSTerje Bergstrom list_add_tail(&job->list, &cdma->sync_queue);
6786579324aSTerje Bergstrom
6796579324aSTerje Bergstrom /* start timer on idle -> active transitions */
6806579324aSTerje Bergstrom if (job->timeout && idle)
6816579324aSTerje Bergstrom cdma_start_timer_locked(cdma, job);
6826579324aSTerje Bergstrom
6836579324aSTerje Bergstrom trace_host1x_cdma_end(dev_name(job->channel->dev));
6846579324aSTerje Bergstrom mutex_unlock(&cdma->lock);
6856579324aSTerje Bergstrom }
6866579324aSTerje Bergstrom
6876579324aSTerje Bergstrom /*
6886579324aSTerje Bergstrom * Update cdma state according to current sync point values
6896579324aSTerje Bergstrom */
host1x_cdma_update(struct host1x_cdma * cdma)6906579324aSTerje Bergstrom void host1x_cdma_update(struct host1x_cdma *cdma)
6916579324aSTerje Bergstrom {
692*c24973edSMikko Perttunen schedule_work(&cdma->update_work);
6936579324aSTerje Bergstrom }
694